tic6x: Call _bfd_elf_add_dynamic_tags
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
CommitLineData
b534c6d3 1/* tc-i386.c -- Assemble code for the Intel 80386
b3adc24a 2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
252b5132
RH
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
ec2655a6 8 the Free Software Foundation; either version 3, or (at your option)
252b5132
RH
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
4b4da160
NC
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
252b5132 20
47926f60
KH
21/* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
3e73aa7c 23 x86_64 support by Jan Hubicka (jh@suse.cz)
0f10071e 24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
47926f60
KH
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
252b5132 27
252b5132 28#include "as.h"
3882b010 29#include "safe-ctype.h"
252b5132 30#include "subsegs.h"
316e2c05 31#include "dwarf2dbg.h"
54cfded0 32#include "dw2gencfi.h"
d2b2c203 33#include "elf/x86-64.h"
40fb9820 34#include "opcodes/i386-init.h"
252b5132 35
41fd2579
L
36#ifdef HAVE_LIMITS_H
37#include <limits.h>
38#else
39#ifdef HAVE_SYS_PARAM_H
40#include <sys/param.h>
41#endif
42#ifndef INT_MAX
43#define INT_MAX (int) (((unsigned) (-1)) >> 1)
44#endif
45#endif
46
c3332e24 47#ifndef INFER_ADDR_PREFIX
eecb386c 48#define INFER_ADDR_PREFIX 1
c3332e24
AM
49#endif
50
29b0f896
AM
51#ifndef DEFAULT_ARCH
52#define DEFAULT_ARCH "i386"
246fcdee 53#endif
252b5132 54
edde18a5
AM
55#ifndef INLINE
56#if __GNUC__ >= 2
57#define INLINE __inline__
58#else
59#define INLINE
60#endif
61#endif
62
6305a203
L
63/* Prefixes will be emitted in the order defined below.
64 WAIT_PREFIX must be the first prefix since FWAIT is really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
42164a71 67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
6305a203
L
68#define WAIT_PREFIX 0
69#define SEG_PREFIX 1
70#define ADDR_PREFIX 2
71#define DATA_PREFIX 3
c32fa91d 72#define REP_PREFIX 4
42164a71 73#define HLE_PREFIX REP_PREFIX
7e8b059b 74#define BND_PREFIX REP_PREFIX
c32fa91d 75#define LOCK_PREFIX 5
4e9ac44a
L
76#define REX_PREFIX 6 /* must come last. */
77#define MAX_PREFIXES 7 /* max prefixes per opcode */
6305a203
L
78
79/* we define the syntax here (modulo base,index,scale syntax) */
80#define REGISTER_PREFIX '%'
81#define IMMEDIATE_PREFIX '$'
82#define ABSOLUTE_PREFIX '*'
83
84/* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86#define WORD_MNEM_SUFFIX 'w'
87#define BYTE_MNEM_SUFFIX 'b'
88#define SHORT_MNEM_SUFFIX 's'
89#define LONG_MNEM_SUFFIX 'l'
90#define QWORD_MNEM_SUFFIX 'q'
6305a203
L
91/* Intel Syntax. Use a non-ascii letter since since it never appears
92 in instructions. */
93#define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95#define END_OF_INSN '\0'
96
79dec6b7
JB
97/* This matches the C -> StaticRounding alias in the opcode table. */
98#define commutative staticrounding
99
6305a203
L
100/*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107typedef struct
108{
d3ce72d0
NC
109 const insn_template *start;
110 const insn_template *end;
6305a203
L
111}
112templates;
113
114/* 386 operand encoding bytes: see 386 book for details of this. */
115typedef struct
116{
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120}
121modrm_byte;
122
123/* x86-64 extension prefix. */
124typedef int rex_byte;
125
6305a203
L
126/* 386 opcode byte to code indirect addressing. */
127typedef struct
128{
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132}
133sib_byte;
134
6305a203
L
135/* x86 arch names, types and features */
136typedef struct
137{
138 const char *name; /* arch name */
8a2c8fef 139 unsigned int len; /* arch string length */
6305a203
L
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
8a2c8fef 142 unsigned int skip; /* show_arch should skip this. */
6305a203
L
143}
144arch_entry;
145
293f5f65
L
146/* Used to turn off indicated flags. */
147typedef struct
148{
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152}
153noarch_entry;
154
78f12dd3 155static void update_code_flag (int, int);
e3bb37b5
L
156static void set_code_flag (int);
157static void set_16bit_gcc_code_flag (int);
158static void set_intel_syntax (int);
1efbbeb4 159static void set_intel_mnemonic (int);
db51cc60 160static void set_allow_index_reg (int);
7bab8ab5 161static void set_check (int);
e3bb37b5 162static void set_cpu_arch (int);
6482c264 163#ifdef TE_PE
e3bb37b5 164static void pe_directive_secrel (int);
6482c264 165#endif
e3bb37b5
L
166static void signed_cons (int);
167static char *output_invalid (int c);
ee86248c
JB
168static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
a7619375 172static int i386_att_operand (char *);
e3bb37b5 173static int i386_intel_operand (char *, int);
ee86248c
JB
174static int i386_intel_simplify (expressionS *);
175static int i386_intel_parse_name (const char *, expressionS *);
e3bb37b5
L
176static const reg_entry *parse_register (char *, char **);
177static char *parse_insn (char *, char *);
178static char *parse_operands (char *, const char *);
179static void swap_operands (void);
4d456e3d 180static void swap_2_operands (int, int);
48bcea9f 181static enum flag_code i386_addressing_mode (void);
e3bb37b5
L
182static void optimize_imm (void);
183static void optimize_disp (void);
83b16ac6 184static const insn_template *match_template (char);
e3bb37b5
L
185static int check_string (void);
186static int process_suffix (void);
187static int check_byte_reg (void);
188static int check_long_reg (void);
189static int check_qword_reg (void);
190static int check_word_reg (void);
191static int finalize_imm (void);
192static int process_operands (void);
193static const seg_entry *build_modrm_byte (void);
194static void output_insn (void);
195static void output_imm (fragS *, offsetT);
196static void output_disp (fragS *, offsetT);
29b0f896 197#ifndef I386COFF
e3bb37b5 198static void s_bss (int);
252b5132 199#endif
17d4e2a2
L
200#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201static void handle_large_common (int small ATTRIBUTE_UNUSED);
b4a3a7b4
L
202
203/* GNU_PROPERTY_X86_ISA_1_USED. */
204static unsigned int x86_isa_1_used;
205/* GNU_PROPERTY_X86_FEATURE_2_USED. */
206static unsigned int x86_feature_2_used;
207/* Generate x86 used ISA and feature properties. */
208static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
17d4e2a2 209#endif
252b5132 210
a847613f 211static const char *default_arch = DEFAULT_ARCH;
3e73aa7c 212
8a6fb3f9
JB
213/* parse_register() returns this when a register alias cannot be used. */
214static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
43234a1e
L
217/* This struct describes rounding control and SAE in the instruction. */
218struct RC_Operation
219{
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229};
230
231static struct RC_Operation rc_op;
232
233/* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235 whether merging or zeroing mask is used. */
236struct Mask_Operation
237{
238 const reg_entry *mask;
239 unsigned int zeroing;
240 /* The operand where this operation is associated. */
241 int operand;
242};
243
244static struct Mask_Operation mask_op;
245
246/* The struct describes broadcasting, applied to OPERAND. FACTOR is
247 broadcast factor. */
248struct Broadcast_Operation
249{
8e6e0792 250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
43234a1e
L
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
4a1b91ea
L
255
256 /* Number of bytes to broadcast. */
257 int bytes;
43234a1e
L
258};
259
260static struct Broadcast_Operation broadcast_op;
261
c0f3af97
L
262/* VEX prefix. */
263typedef struct
264{
43234a1e
L
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
c0f3af97
L
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270} vex_prefix;
271
252b5132 272/* 'md_assemble ()' gathers together information and puts it into a
47926f60 273 i386_insn. */
252b5132 274
520dc8e8
AM
275union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
a65babc9
L
282enum i386_error
283 {
86e026a4 284 operand_size_mismatch,
a65babc9
L
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
a65babc9
L
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
6c30d220
L
292 unsupported,
293 invalid_vsib_address,
7bab8ab5 294 invalid_vector_register_set,
43234a1e
L
295 unsupported_vector_index_register,
296 unsupported_broadcast,
43234a1e
L
297 broadcast_needed,
298 unsupported_masking,
299 mask_not_on_destination,
300 no_default_mask,
301 unsupported_rc_sae,
302 rc_sae_operand_not_last_imm,
303 invalid_register_operand,
a65babc9
L
304 };
305
252b5132
RH
306struct _i386_insn
307 {
47926f60 308 /* TM holds the template for the insn were currently assembling. */
d3ce72d0 309 insn_template tm;
252b5132 310
7d5e4556
L
311 /* SUFFIX holds the instruction size suffix for byte, word, dword
312 or qword, if given. */
252b5132
RH
313 char suffix;
314
47926f60 315 /* OPERANDS gives the number of given operands. */
252b5132
RH
316 unsigned int operands;
317
318 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
319 of given register, displacement, memory operands and immediate
47926f60 320 operands. */
252b5132
RH
321 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
322
323 /* TYPES [i] is the type (see above #defines) which tells us how to
520dc8e8 324 use OP[i] for the corresponding operand. */
40fb9820 325 i386_operand_type types[MAX_OPERANDS];
252b5132 326
520dc8e8
AM
327 /* Displacement expression, immediate expression, or register for each
328 operand. */
329 union i386_op op[MAX_OPERANDS];
252b5132 330
3e73aa7c
JH
331 /* Flags for operands. */
332 unsigned int flags[MAX_OPERANDS];
333#define Operand_PCrel 1
c48dadc9 334#define Operand_Mem 2
3e73aa7c 335
252b5132 336 /* Relocation type for operand */
f86103b7 337 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
252b5132 338
252b5132
RH
339 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
340 the base index byte below. */
341 const reg_entry *base_reg;
342 const reg_entry *index_reg;
343 unsigned int log2_scale_factor;
344
345 /* SEG gives the seg_entries of this insn. They are zero unless
47926f60 346 explicit segment overrides are given. */
ce8a8b2f 347 const seg_entry *seg[2];
252b5132 348
8325cc63
JB
349 /* Copied first memory operand string, for re-checking. */
350 char *memop1_string;
351
252b5132
RH
352 /* PREFIX holds all the given prefix opcodes (usually null).
353 PREFIXES is the number of prefix opcodes. */
354 unsigned int prefixes;
355 unsigned char prefix[MAX_PREFIXES];
356
50128d0c
JB
357 /* Register is in low 3 bits of opcode. */
358 bfd_boolean short_form;
359
6f2f06be
JB
360 /* The operand to a branch insn indicates an absolute branch. */
361 bfd_boolean jumpabsolute;
362
b4a3a7b4
L
363 /* Has MMX register operands. */
364 bfd_boolean has_regmmx;
365
366 /* Has XMM register operands. */
367 bfd_boolean has_regxmm;
368
369 /* Has YMM register operands. */
370 bfd_boolean has_regymm;
371
372 /* Has ZMM register operands. */
373 bfd_boolean has_regzmm;
374
e379e5f3
L
375 /* Has GOTPC or TLS relocation. */
376 bfd_boolean has_gotpc_tls_reloc;
377
252b5132 378 /* RM and SIB are the modrm byte and the sib byte where the
c1e679ec 379 addressing modes of this insn are encoded. */
252b5132 380 modrm_byte rm;
3e73aa7c 381 rex_byte rex;
43234a1e 382 rex_byte vrex;
252b5132 383 sib_byte sib;
c0f3af97 384 vex_prefix vex;
b6169b20 385
43234a1e
L
386 /* Masking attributes. */
387 struct Mask_Operation *mask;
388
389 /* Rounding control and SAE attributes. */
390 struct RC_Operation *rounding;
391
392 /* Broadcasting attributes. */
393 struct Broadcast_Operation *broadcast;
394
395 /* Compressed disp8*N attribute. */
396 unsigned int memshift;
397
86fa6981
L
398 /* Prefer load or store in encoding. */
399 enum
400 {
401 dir_encoding_default = 0,
402 dir_encoding_load,
64c49ab3
JB
403 dir_encoding_store,
404 dir_encoding_swap
86fa6981 405 } dir_encoding;
891edac4 406
a501d77e
L
407 /* Prefer 8bit or 32bit displacement in encoding. */
408 enum
409 {
410 disp_encoding_default = 0,
411 disp_encoding_8bit,
412 disp_encoding_32bit
413 } disp_encoding;
f8a5c266 414
6b6b6807
L
415 /* Prefer the REX byte in encoding. */
416 bfd_boolean rex_encoding;
417
b6f8c7c4
L
418 /* Disable instruction size optimization. */
419 bfd_boolean no_optimize;
420
86fa6981
L
421 /* How to encode vector instructions. */
422 enum
423 {
424 vex_encoding_default = 0,
42e04b36 425 vex_encoding_vex,
86fa6981 426 vex_encoding_vex3,
da4977e0
JB
427 vex_encoding_evex,
428 vex_encoding_error
86fa6981
L
429 } vec_encoding;
430
d5de92cf
L
431 /* REP prefix. */
432 const char *rep_prefix;
433
165de32a
L
434 /* HLE prefix. */
435 const char *hle_prefix;
42164a71 436
7e8b059b
L
437 /* Have BND prefix. */
438 const char *bnd_prefix;
439
04ef582a
L
440 /* Have NOTRACK prefix. */
441 const char *notrack_prefix;
442
891edac4 443 /* Error message. */
a65babc9 444 enum i386_error error;
252b5132
RH
445 };
446
447typedef struct _i386_insn i386_insn;
448
43234a1e
L
449/* Link RC type with corresponding string, that'll be looked for in
450 asm. */
451struct RC_name
452{
453 enum rc_type type;
454 const char *name;
455 unsigned int len;
456};
457
458static const struct RC_name RC_NamesTable[] =
459{
460 { rne, STRING_COMMA_LEN ("rn-sae") },
461 { rd, STRING_COMMA_LEN ("rd-sae") },
462 { ru, STRING_COMMA_LEN ("ru-sae") },
463 { rz, STRING_COMMA_LEN ("rz-sae") },
464 { saeonly, STRING_COMMA_LEN ("sae") },
465};
466
252b5132
RH
467/* List of chars besides those in app.c:symbol_chars that can start an
468 operand. Used to prevent the scrubber eating vital white-space. */
86fa6981 469const char extra_symbol_chars[] = "*%-([{}"
252b5132 470#ifdef LEX_AT
32137342
NC
471 "@"
472#endif
473#ifdef LEX_QM
474 "?"
252b5132 475#endif
32137342 476 ;
252b5132 477
29b0f896
AM
478#if (defined (TE_I386AIX) \
479 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
3896cfd5 480 && !defined (TE_GNU) \
29b0f896 481 && !defined (TE_LINUX) \
8d63c93e 482 && !defined (TE_NACL) \
29b0f896 483 && !defined (TE_FreeBSD) \
5b806d27 484 && !defined (TE_DragonFly) \
29b0f896 485 && !defined (TE_NetBSD)))
252b5132 486/* This array holds the chars that always start a comment. If the
b3b91714
AM
487 pre-processor is disabled, these aren't very useful. The option
488 --divide will remove '/' from this list. */
489const char *i386_comment_chars = "#/";
490#define SVR4_COMMENT_CHARS 1
252b5132 491#define PREFIX_SEPARATOR '\\'
252b5132 492
b3b91714
AM
493#else
494const char *i386_comment_chars = "#";
495#define PREFIX_SEPARATOR '/'
496#endif
497
252b5132
RH
498/* This array holds the chars that only start a comment at the beginning of
499 a line. If the line seems to have the form '# 123 filename'
ce8a8b2f
AM
500 .line and .file directives will appear in the pre-processed output.
501 Note that input_file.c hand checks for '#' at the beginning of the
252b5132 502 first line of the input file. This is because the compiler outputs
ce8a8b2f
AM
503 #NO_APP at the beginning of its output.
504 Also note that comments started like this one will always work if
252b5132 505 '/' isn't otherwise defined. */
b3b91714 506const char line_comment_chars[] = "#/";
252b5132 507
63a0b638 508const char line_separator_chars[] = ";";
252b5132 509
ce8a8b2f
AM
510/* Chars that can be used to separate mant from exp in floating point
511 nums. */
252b5132
RH
512const char EXP_CHARS[] = "eE";
513
ce8a8b2f
AM
514/* Chars that mean this number is a floating point constant
515 As in 0f12.456
516 or 0d1.2345e12. */
252b5132
RH
517const char FLT_CHARS[] = "fFdDxX";
518
ce8a8b2f 519/* Tables for lexical analysis. */
252b5132
RH
520static char mnemonic_chars[256];
521static char register_chars[256];
522static char operand_chars[256];
523static char identifier_chars[256];
524static char digit_chars[256];
525
ce8a8b2f 526/* Lexical macros. */
252b5132
RH
527#define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
528#define is_operand_char(x) (operand_chars[(unsigned char) x])
529#define is_register_char(x) (register_chars[(unsigned char) x])
530#define is_space_char(x) ((x) == ' ')
531#define is_identifier_char(x) (identifier_chars[(unsigned char) x])
532#define is_digit_char(x) (digit_chars[(unsigned char) x])
533
0234cb7c 534/* All non-digit non-letter characters that may occur in an operand. */
252b5132
RH
535static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
536
537/* md_assemble() always leaves the strings it's passed unaltered. To
538 effect this we maintain a stack of saved characters that we've smashed
539 with '\0's (indicating end of strings for various sub-fields of the
47926f60 540 assembler instruction). */
252b5132 541static char save_stack[32];
ce8a8b2f 542static char *save_stack_p;
252b5132
RH
543#define END_STRING_AND_SAVE(s) \
544 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
545#define RESTORE_END_STRING(s) \
546 do { *(s) = *--save_stack_p; } while (0)
547
47926f60 548/* The instruction we're assembling. */
252b5132
RH
549static i386_insn i;
550
551/* Possible templates for current insn. */
552static const templates *current_templates;
553
31b2323c
L
554/* Per instruction expressionS buffers: max displacements & immediates. */
555static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
556static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
252b5132 557
47926f60 558/* Current operand we are working on. */
ee86248c 559static int this_operand = -1;
252b5132 560
3e73aa7c
JH
561/* We support four different modes. FLAG_CODE variable is used to distinguish
562 these. */
563
564enum flag_code {
565 CODE_32BIT,
566 CODE_16BIT,
567 CODE_64BIT };
568
569static enum flag_code flag_code;
4fa24527 570static unsigned int object_64bit;
862be3fb 571static unsigned int disallow_64bit_reloc;
3e73aa7c 572static int use_rela_relocations = 0;
e379e5f3
L
573/* __tls_get_addr/___tls_get_addr symbol for TLS. */
574static const char *tls_get_addr;
3e73aa7c 575
7af8ed2d
NC
576#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
577 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
578 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
579
351f65ca
L
580/* The ELF ABI to use. */
581enum x86_elf_abi
582{
583 I386_ABI,
7f56bc95
L
584 X86_64_ABI,
585 X86_64_X32_ABI
351f65ca
L
586};
587
588static enum x86_elf_abi x86_elf_abi = I386_ABI;
7af8ed2d 589#endif
351f65ca 590
167ad85b
TG
591#if defined (TE_PE) || defined (TE_PEP)
592/* Use big object file format. */
593static int use_big_obj = 0;
594#endif
595
8dcea932
L
596#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
597/* 1 if generating code for a shared library. */
598static int shared = 0;
599#endif
600
47926f60
KH
601/* 1 for intel syntax,
602 0 if att syntax. */
603static int intel_syntax = 0;
252b5132 604
4b5aaf5f
L
605static enum x86_64_isa
606{
607 amd64 = 1, /* AMD64 ISA. */
608 intel64 /* Intel64 ISA. */
609} isa64;
e89c5eaa 610
1efbbeb4
L
611/* 1 for intel mnemonic,
612 0 if att mnemonic. */
613static int intel_mnemonic = !SYSV386_COMPAT;
614
a60de03c
JB
615/* 1 if pseudo registers are permitted. */
616static int allow_pseudo_reg = 0;
617
47926f60
KH
618/* 1 if register prefix % not required. */
619static int allow_naked_reg = 0;
252b5132 620
33eaf5de 621/* 1 if the assembler should add BND prefix for all control-transferring
7e8b059b
L
622 instructions supporting it, even if this prefix wasn't specified
623 explicitly. */
624static int add_bnd_prefix = 0;
625
ba104c83 626/* 1 if pseudo index register, eiz/riz, is allowed . */
db51cc60
L
627static int allow_index_reg = 0;
628
d022bddd
IT
629/* 1 if the assembler should ignore LOCK prefix, even if it was
630 specified explicitly. */
631static int omit_lock_prefix = 0;
632
e4e00185
AS
633/* 1 if the assembler should encode lfence, mfence, and sfence as
634 "lock addl $0, (%{re}sp)". */
635static int avoid_fence = 0;
636
ae531041
L
637/* 1 if lfence should be inserted after every load. */
638static int lfence_after_load = 0;
639
640/* Non-zero if lfence should be inserted before indirect branch. */
641static enum lfence_before_indirect_branch_kind
642 {
643 lfence_branch_none = 0,
644 lfence_branch_register,
645 lfence_branch_memory,
646 lfence_branch_all
647 }
648lfence_before_indirect_branch;
649
650/* Non-zero if lfence should be inserted before ret. */
651static enum lfence_before_ret_kind
652 {
653 lfence_before_ret_none = 0,
654 lfence_before_ret_not,
a09f656b 655 lfence_before_ret_or,
656 lfence_before_ret_shl
ae531041
L
657 }
658lfence_before_ret;
659
660/* Types of previous instruction is .byte or prefix. */
e379e5f3
L
661static struct
662 {
663 segT seg;
664 const char *file;
665 const char *name;
666 unsigned int line;
667 enum last_insn_kind
668 {
669 last_insn_other = 0,
670 last_insn_directive,
671 last_insn_prefix
672 } kind;
673 } last_insn;
674
0cb4071e
L
675/* 1 if the assembler should generate relax relocations. */
676
677static int generate_relax_relocations
678 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
679
7bab8ab5 680static enum check_kind
daf50ae7 681 {
7bab8ab5
JB
682 check_none = 0,
683 check_warning,
684 check_error
daf50ae7 685 }
7bab8ab5 686sse_check, operand_check = check_warning;
daf50ae7 687
e379e5f3
L
688/* Non-zero if branches should be aligned within power of 2 boundary. */
689static int align_branch_power = 0;
690
691/* Types of branches to align. */
692enum align_branch_kind
693 {
694 align_branch_none = 0,
695 align_branch_jcc = 1,
696 align_branch_fused = 2,
697 align_branch_jmp = 3,
698 align_branch_call = 4,
699 align_branch_indirect = 5,
700 align_branch_ret = 6
701 };
702
703/* Type bits of branches to align. */
704enum align_branch_bit
705 {
706 align_branch_jcc_bit = 1 << align_branch_jcc,
707 align_branch_fused_bit = 1 << align_branch_fused,
708 align_branch_jmp_bit = 1 << align_branch_jmp,
709 align_branch_call_bit = 1 << align_branch_call,
710 align_branch_indirect_bit = 1 << align_branch_indirect,
711 align_branch_ret_bit = 1 << align_branch_ret
712 };
713
714static unsigned int align_branch = (align_branch_jcc_bit
715 | align_branch_fused_bit
716 | align_branch_jmp_bit);
717
79d72f45
HL
718/* Types of condition jump used by macro-fusion. */
719enum mf_jcc_kind
720 {
721 mf_jcc_jo = 0, /* base opcode 0x70 */
722 mf_jcc_jc, /* base opcode 0x72 */
723 mf_jcc_je, /* base opcode 0x74 */
724 mf_jcc_jna, /* base opcode 0x76 */
725 mf_jcc_js, /* base opcode 0x78 */
726 mf_jcc_jp, /* base opcode 0x7a */
727 mf_jcc_jl, /* base opcode 0x7c */
728 mf_jcc_jle, /* base opcode 0x7e */
729 };
730
731/* Types of compare flag-modifying insntructions used by macro-fusion. */
732enum mf_cmp_kind
733 {
734 mf_cmp_test_and, /* test/cmp */
735 mf_cmp_alu_cmp, /* add/sub/cmp */
736 mf_cmp_incdec /* inc/dec */
737 };
738
e379e5f3
L
739/* The maximum padding size for fused jcc. CMP like instruction can
740 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
741 prefixes. */
742#define MAX_FUSED_JCC_PADDING_SIZE 20
743
744/* The maximum number of prefixes added for an instruction. */
745static unsigned int align_branch_prefix_size = 5;
746
b6f8c7c4
L
747/* Optimization:
748 1. Clear the REX_W bit with register operand if possible.
749 2. Above plus use 128bit vector instruction to clear the full vector
750 register.
751 */
752static int optimize = 0;
753
754/* Optimization:
755 1. Clear the REX_W bit with register operand if possible.
756 2. Above plus use 128bit vector instruction to clear the full vector
757 register.
758 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
759 "testb $imm7,%r8".
760 */
761static int optimize_for_space = 0;
762
2ca3ace5
L
763/* Register prefix used for error message. */
764static const char *register_prefix = "%";
765
47926f60
KH
766/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
767 leave, push, and pop instructions so that gcc has the same stack
768 frame as in 32 bit mode. */
769static char stackop_size = '\0';
eecb386c 770
12b55ccc
L
771/* Non-zero to optimize code alignment. */
772int optimize_align_code = 1;
773
47926f60
KH
774/* Non-zero to quieten some warnings. */
775static int quiet_warnings = 0;
a38cf1db 776
47926f60
KH
777/* CPU name. */
778static const char *cpu_arch_name = NULL;
6305a203 779static char *cpu_sub_arch_name = NULL;
a38cf1db 780
47926f60 781/* CPU feature flags. */
40fb9820
L
782static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
783
ccc9c027
L
784/* If we have selected a cpu we are generating instructions for. */
785static int cpu_arch_tune_set = 0;
786
9103f4f4 787/* Cpu we are generating instructions for. */
fbf3f584 788enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
9103f4f4
L
789
790/* CPU feature flags of cpu we are generating instructions for. */
40fb9820 791static i386_cpu_flags cpu_arch_tune_flags;
9103f4f4 792
ccc9c027 793/* CPU instruction set architecture used. */
fbf3f584 794enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
ccc9c027 795
9103f4f4 796/* CPU feature flags of instruction set architecture used. */
fbf3f584 797i386_cpu_flags cpu_arch_isa_flags;
9103f4f4 798
fddf5b5b
AM
799/* If set, conditional jumps are not automatically promoted to handle
800 larger than a byte offset. */
801static unsigned int no_cond_jump_promotion = 0;
802
c0f3af97
L
803/* Encode SSE instructions with VEX prefix. */
804static unsigned int sse2avx;
805
539f890d
L
806/* Encode scalar AVX instructions with specific vector length. */
807static enum
808 {
809 vex128 = 0,
810 vex256
811 } avxscalar;
812
03751133
L
813/* Encode VEX WIG instructions with specific vex.w. */
814static enum
815 {
816 vexw0 = 0,
817 vexw1
818 } vexwig;
819
43234a1e
L
820/* Encode scalar EVEX LIG instructions with specific vector length. */
821static enum
822 {
823 evexl128 = 0,
824 evexl256,
825 evexl512
826 } evexlig;
827
828/* Encode EVEX WIG instructions with specific evex.w. */
829static enum
830 {
831 evexw0 = 0,
832 evexw1
833 } evexwig;
834
d3d3c6db
IT
835/* Value to encode in EVEX RC bits, for SAE-only instructions. */
836static enum rc_type evexrcig = rne;
837
29b0f896 838/* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
87c245cc 839static symbolS *GOT_symbol;
29b0f896 840
a4447b93
RH
841/* The dwarf2 return column, adjusted for 32 or 64 bit. */
842unsigned int x86_dwarf2_return_column;
843
844/* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
845int x86_cie_data_alignment;
846
252b5132 847/* Interface to relax_segment.
fddf5b5b
AM
848 There are 3 major relax states for 386 jump insns because the
849 different types of jumps add different sizes to frags when we're
e379e5f3
L
850 figuring out what sort of jump to choose to reach a given label.
851
852 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
853 branches which are handled by md_estimate_size_before_relax() and
854 i386_generic_table_relax_frag(). */
252b5132 855
47926f60 856/* Types. */
93c2a809
AM
857#define UNCOND_JUMP 0
858#define COND_JUMP 1
859#define COND_JUMP86 2
e379e5f3
L
860#define BRANCH_PADDING 3
861#define BRANCH_PREFIX 4
862#define FUSED_JCC_PADDING 5
fddf5b5b 863
47926f60 864/* Sizes. */
252b5132
RH
865#define CODE16 1
866#define SMALL 0
29b0f896 867#define SMALL16 (SMALL | CODE16)
252b5132 868#define BIG 2
29b0f896 869#define BIG16 (BIG | CODE16)
252b5132
RH
870
871#ifndef INLINE
872#ifdef __GNUC__
873#define INLINE __inline__
874#else
875#define INLINE
876#endif
877#endif
878
fddf5b5b
AM
879#define ENCODE_RELAX_STATE(type, size) \
880 ((relax_substateT) (((type) << 2) | (size)))
881#define TYPE_FROM_RELAX_STATE(s) \
882 ((s) >> 2)
883#define DISP_SIZE_FROM_RELAX_STATE(s) \
884 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
252b5132
RH
885
886/* This table is used by relax_frag to promote short jumps to long
887 ones where necessary. SMALL (short) jumps may be promoted to BIG
888 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
889 don't allow a short jump in a 32 bit code segment to be promoted to
890 a 16 bit offset jump because it's slower (requires data size
891 prefix), and doesn't work, unless the destination is in the bottom
892 64k of the code segment (The top 16 bits of eip are zeroed). */
893
894const relax_typeS md_relax_table[] =
895{
24eab124
AM
896 /* The fields are:
897 1) most positive reach of this state,
898 2) most negative reach of this state,
93c2a809 899 3) how many bytes this mode will have in the variable part of the frag
ce8a8b2f 900 4) which index into the table to try if we can't fit into this one. */
252b5132 901
fddf5b5b 902 /* UNCOND_JUMP states. */
93c2a809
AM
903 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
904 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
905 /* dword jmp adds 4 bytes to frag:
906 0 extra opcode bytes, 4 displacement bytes. */
252b5132 907 {0, 0, 4, 0},
93c2a809
AM
908 /* word jmp adds 2 byte2 to frag:
909 0 extra opcode bytes, 2 displacement bytes. */
252b5132
RH
910 {0, 0, 2, 0},
911
93c2a809
AM
912 /* COND_JUMP states. */
913 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
914 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
915 /* dword conditionals adds 5 bytes to frag:
916 1 extra opcode byte, 4 displacement bytes. */
917 {0, 0, 5, 0},
fddf5b5b 918 /* word conditionals add 3 bytes to frag:
93c2a809
AM
919 1 extra opcode byte, 2 displacement bytes. */
920 {0, 0, 3, 0},
921
922 /* COND_JUMP86 states. */
923 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
924 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
925 /* dword conditionals adds 5 bytes to frag:
926 1 extra opcode byte, 4 displacement bytes. */
927 {0, 0, 5, 0},
928 /* word conditionals add 4 bytes to frag:
929 1 displacement byte and a 3 byte long branch insn. */
930 {0, 0, 4, 0}
252b5132
RH
931};
932
9103f4f4
L
933static const arch_entry cpu_arch[] =
934{
89507696
JB
935 /* Do not replace the first two entries - i386_target_format()
936 relies on them being there in this order. */
8a2c8fef 937 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
293f5f65 938 CPU_GENERIC32_FLAGS, 0 },
8a2c8fef 939 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
293f5f65 940 CPU_GENERIC64_FLAGS, 0 },
8a2c8fef 941 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
293f5f65 942 CPU_NONE_FLAGS, 0 },
8a2c8fef 943 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
293f5f65 944 CPU_I186_FLAGS, 0 },
8a2c8fef 945 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
293f5f65 946 CPU_I286_FLAGS, 0 },
8a2c8fef 947 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
293f5f65 948 CPU_I386_FLAGS, 0 },
8a2c8fef 949 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
293f5f65 950 CPU_I486_FLAGS, 0 },
8a2c8fef 951 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
293f5f65 952 CPU_I586_FLAGS, 0 },
8a2c8fef 953 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
293f5f65 954 CPU_I686_FLAGS, 0 },
8a2c8fef 955 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
293f5f65 956 CPU_I586_FLAGS, 0 },
8a2c8fef 957 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
293f5f65 958 CPU_PENTIUMPRO_FLAGS, 0 },
8a2c8fef 959 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
293f5f65 960 CPU_P2_FLAGS, 0 },
8a2c8fef 961 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
293f5f65 962 CPU_P3_FLAGS, 0 },
8a2c8fef 963 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
293f5f65 964 CPU_P4_FLAGS, 0 },
8a2c8fef 965 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
293f5f65 966 CPU_CORE_FLAGS, 0 },
8a2c8fef 967 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
293f5f65 968 CPU_NOCONA_FLAGS, 0 },
8a2c8fef 969 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
293f5f65 970 CPU_CORE_FLAGS, 1 },
8a2c8fef 971 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
293f5f65 972 CPU_CORE_FLAGS, 0 },
8a2c8fef 973 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
293f5f65 974 CPU_CORE2_FLAGS, 1 },
8a2c8fef 975 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
293f5f65 976 CPU_CORE2_FLAGS, 0 },
8a2c8fef 977 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
293f5f65 978 CPU_COREI7_FLAGS, 0 },
8a2c8fef 979 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
293f5f65 980 CPU_L1OM_FLAGS, 0 },
7a9068fe 981 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
293f5f65 982 CPU_K1OM_FLAGS, 0 },
81486035 983 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
293f5f65 984 CPU_IAMCU_FLAGS, 0 },
8a2c8fef 985 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
293f5f65 986 CPU_K6_FLAGS, 0 },
8a2c8fef 987 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
293f5f65 988 CPU_K6_2_FLAGS, 0 },
8a2c8fef 989 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
293f5f65 990 CPU_ATHLON_FLAGS, 0 },
8a2c8fef 991 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
293f5f65 992 CPU_K8_FLAGS, 1 },
8a2c8fef 993 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
293f5f65 994 CPU_K8_FLAGS, 0 },
8a2c8fef 995 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
293f5f65 996 CPU_K8_FLAGS, 0 },
8a2c8fef 997 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
293f5f65 998 CPU_AMDFAM10_FLAGS, 0 },
8aedb9fe 999 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
293f5f65 1000 CPU_BDVER1_FLAGS, 0 },
8aedb9fe 1001 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
293f5f65 1002 CPU_BDVER2_FLAGS, 0 },
5e5c50d3 1003 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
293f5f65 1004 CPU_BDVER3_FLAGS, 0 },
c7b0bd56 1005 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
293f5f65 1006 CPU_BDVER4_FLAGS, 0 },
029f3522 1007 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
293f5f65 1008 CPU_ZNVER1_FLAGS, 0 },
a9660a6f
AP
1009 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1010 CPU_ZNVER2_FLAGS, 0 },
7b458c12 1011 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
293f5f65 1012 CPU_BTVER1_FLAGS, 0 },
7b458c12 1013 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
293f5f65 1014 CPU_BTVER2_FLAGS, 0 },
8a2c8fef 1015 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
293f5f65 1016 CPU_8087_FLAGS, 0 },
8a2c8fef 1017 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
293f5f65 1018 CPU_287_FLAGS, 0 },
8a2c8fef 1019 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
293f5f65 1020 CPU_387_FLAGS, 0 },
1848e567
L
1021 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1022 CPU_687_FLAGS, 0 },
d871f3f4
L
1023 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1024 CPU_CMOV_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1026 CPU_FXSR_FLAGS, 0 },
8a2c8fef 1027 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
293f5f65 1028 CPU_MMX_FLAGS, 0 },
8a2c8fef 1029 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
293f5f65 1030 CPU_SSE_FLAGS, 0 },
8a2c8fef 1031 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
293f5f65 1032 CPU_SSE2_FLAGS, 0 },
8a2c8fef 1033 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
293f5f65 1034 CPU_SSE3_FLAGS, 0 },
af5c13b0
L
1035 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1036 CPU_SSE4A_FLAGS, 0 },
8a2c8fef 1037 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
293f5f65 1038 CPU_SSSE3_FLAGS, 0 },
8a2c8fef 1039 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
293f5f65 1040 CPU_SSE4_1_FLAGS, 0 },
8a2c8fef 1041 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
293f5f65 1042 CPU_SSE4_2_FLAGS, 0 },
8a2c8fef 1043 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
293f5f65 1044 CPU_SSE4_2_FLAGS, 0 },
8a2c8fef 1045 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
293f5f65 1046 CPU_AVX_FLAGS, 0 },
6c30d220 1047 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
293f5f65 1048 CPU_AVX2_FLAGS, 0 },
43234a1e 1049 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
293f5f65 1050 CPU_AVX512F_FLAGS, 0 },
43234a1e 1051 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
293f5f65 1052 CPU_AVX512CD_FLAGS, 0 },
43234a1e 1053 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
293f5f65 1054 CPU_AVX512ER_FLAGS, 0 },
43234a1e 1055 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
293f5f65 1056 CPU_AVX512PF_FLAGS, 0 },
1dfc6506 1057 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
293f5f65 1058 CPU_AVX512DQ_FLAGS, 0 },
1dfc6506 1059 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
293f5f65 1060 CPU_AVX512BW_FLAGS, 0 },
1dfc6506 1061 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
293f5f65 1062 CPU_AVX512VL_FLAGS, 0 },
8a2c8fef 1063 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
293f5f65 1064 CPU_VMX_FLAGS, 0 },
8729a6f6 1065 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
293f5f65 1066 CPU_VMFUNC_FLAGS, 0 },
8a2c8fef 1067 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
293f5f65 1068 CPU_SMX_FLAGS, 0 },
8a2c8fef 1069 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
293f5f65 1070 CPU_XSAVE_FLAGS, 0 },
c7b8aa3a 1071 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
293f5f65 1072 CPU_XSAVEOPT_FLAGS, 0 },
1dfc6506 1073 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
293f5f65 1074 CPU_XSAVEC_FLAGS, 0 },
1dfc6506 1075 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
293f5f65 1076 CPU_XSAVES_FLAGS, 0 },
8a2c8fef 1077 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
293f5f65 1078 CPU_AES_FLAGS, 0 },
8a2c8fef 1079 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
293f5f65 1080 CPU_PCLMUL_FLAGS, 0 },
8a2c8fef 1081 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
293f5f65 1082 CPU_PCLMUL_FLAGS, 1 },
c7b8aa3a 1083 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
293f5f65 1084 CPU_FSGSBASE_FLAGS, 0 },
c7b8aa3a 1085 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
293f5f65 1086 CPU_RDRND_FLAGS, 0 },
c7b8aa3a 1087 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
293f5f65 1088 CPU_F16C_FLAGS, 0 },
6c30d220 1089 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
293f5f65 1090 CPU_BMI2_FLAGS, 0 },
8a2c8fef 1091 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
293f5f65 1092 CPU_FMA_FLAGS, 0 },
8a2c8fef 1093 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
293f5f65 1094 CPU_FMA4_FLAGS, 0 },
8a2c8fef 1095 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
293f5f65 1096 CPU_XOP_FLAGS, 0 },
8a2c8fef 1097 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
293f5f65 1098 CPU_LWP_FLAGS, 0 },
8a2c8fef 1099 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
293f5f65 1100 CPU_MOVBE_FLAGS, 0 },
60aa667e 1101 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
293f5f65 1102 CPU_CX16_FLAGS, 0 },
8a2c8fef 1103 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
293f5f65 1104 CPU_EPT_FLAGS, 0 },
6c30d220 1105 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
293f5f65 1106 CPU_LZCNT_FLAGS, 0 },
272a84b1
L
1107 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1108 CPU_POPCNT_FLAGS, 0 },
42164a71 1109 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
293f5f65 1110 CPU_HLE_FLAGS, 0 },
42164a71 1111 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
293f5f65 1112 CPU_RTM_FLAGS, 0 },
6c30d220 1113 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
293f5f65 1114 CPU_INVPCID_FLAGS, 0 },
8a2c8fef 1115 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
293f5f65 1116 CPU_CLFLUSH_FLAGS, 0 },
22109423 1117 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
293f5f65 1118 CPU_NOP_FLAGS, 0 },
8a2c8fef 1119 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
293f5f65 1120 CPU_SYSCALL_FLAGS, 0 },
8a2c8fef 1121 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
293f5f65 1122 CPU_RDTSCP_FLAGS, 0 },
8a2c8fef 1123 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
293f5f65 1124 CPU_3DNOW_FLAGS, 0 },
8a2c8fef 1125 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
293f5f65 1126 CPU_3DNOWA_FLAGS, 0 },
8a2c8fef 1127 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
293f5f65 1128 CPU_PADLOCK_FLAGS, 0 },
8a2c8fef 1129 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
293f5f65 1130 CPU_SVME_FLAGS, 1 },
8a2c8fef 1131 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
293f5f65 1132 CPU_SVME_FLAGS, 0 },
8a2c8fef 1133 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
293f5f65 1134 CPU_SSE4A_FLAGS, 0 },
8a2c8fef 1135 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
293f5f65 1136 CPU_ABM_FLAGS, 0 },
87973e9f 1137 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
293f5f65 1138 CPU_BMI_FLAGS, 0 },
2a2a0f38 1139 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
293f5f65 1140 CPU_TBM_FLAGS, 0 },
e2e1fcde 1141 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
293f5f65 1142 CPU_ADX_FLAGS, 0 },
e2e1fcde 1143 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
293f5f65 1144 CPU_RDSEED_FLAGS, 0 },
e2e1fcde 1145 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
293f5f65 1146 CPU_PRFCHW_FLAGS, 0 },
5c111e37 1147 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
293f5f65 1148 CPU_SMAP_FLAGS, 0 },
7e8b059b 1149 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
293f5f65 1150 CPU_MPX_FLAGS, 0 },
a0046408 1151 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
293f5f65 1152 CPU_SHA_FLAGS, 0 },
963f3586 1153 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
293f5f65 1154 CPU_CLFLUSHOPT_FLAGS, 0 },
dcf893b5 1155 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
293f5f65 1156 CPU_PREFETCHWT1_FLAGS, 0 },
2cf200a4 1157 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
293f5f65 1158 CPU_SE1_FLAGS, 0 },
c5e7287a 1159 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
293f5f65 1160 CPU_CLWB_FLAGS, 0 },
2cc1b5aa 1161 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
293f5f65 1162 CPU_AVX512IFMA_FLAGS, 0 },
14f195c9 1163 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
293f5f65 1164 CPU_AVX512VBMI_FLAGS, 0 },
920d2ddc
IT
1165 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1166 CPU_AVX512_4FMAPS_FLAGS, 0 },
47acf0bd
IT
1167 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1168 CPU_AVX512_4VNNIW_FLAGS, 0 },
620214f7
IT
1169 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1170 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
53467f57
IT
1171 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1172 CPU_AVX512_VBMI2_FLAGS, 0 },
8cfcb765
IT
1173 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1174 CPU_AVX512_VNNI_FLAGS, 0 },
ee6872be
IT
1175 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1176 CPU_AVX512_BITALG_FLAGS, 0 },
029f3522 1177 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
293f5f65 1178 CPU_CLZERO_FLAGS, 0 },
9916071f 1179 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
293f5f65 1180 CPU_MWAITX_FLAGS, 0 },
8eab4136 1181 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
293f5f65 1182 CPU_OSPKE_FLAGS, 0 },
8bc52696 1183 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
293f5f65 1184 CPU_RDPID_FLAGS, 0 },
6b40c462
L
1185 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1186 CPU_PTWRITE_FLAGS, 0 },
d777820b
IT
1187 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1188 CPU_IBT_FLAGS, 0 },
1189 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1190 CPU_SHSTK_FLAGS, 0 },
48521003
IT
1191 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1192 CPU_GFNI_FLAGS, 0 },
8dcf1fad
IT
1193 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1194 CPU_VAES_FLAGS, 0 },
ff1982d5
IT
1195 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1196 CPU_VPCLMULQDQ_FLAGS, 0 },
3233d7d0
IT
1197 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1198 CPU_WBNOINVD_FLAGS, 0 },
be3a8dca
IT
1199 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1200 CPU_PCONFIG_FLAGS, 0 },
de89d0a3
IT
1201 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1202 CPU_WAITPKG_FLAGS, 0 },
c48935d7
IT
1203 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1204 CPU_CLDEMOTE_FLAGS, 0 },
c0a30a9f
L
1205 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1206 CPU_MOVDIRI_FLAGS, 0 },
1207 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1208 CPU_MOVDIR64B_FLAGS, 0 },
d6aab7a1
XG
1209 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1210 CPU_AVX512_BF16_FLAGS, 0 },
9186c494
L
1211 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1212 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
dd455cf5
L
1213 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1214 CPU_ENQCMD_FLAGS, 0 },
4b27d27c
L
1215 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1216 CPU_SERIALIZE_FLAGS, 0 },
142861df
JB
1217 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1218 CPU_RDPRU_FLAGS, 0 },
1219 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1220 CPU_MCOMMIT_FLAGS, 0 },
a847e322
JB
1221 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1222 CPU_SEV_ES_FLAGS, 0 },
bb651e8b
CL
1223 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1224 CPU_TSXLDTRK_FLAGS, 0 },
293f5f65
L
1225};
1226
1227static const noarch_entry cpu_noarch[] =
1228{
1229 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1848e567
L
1230 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1231 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1232 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
d871f3f4
L
1233 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1234 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
293f5f65
L
1235 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1236 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1848e567
L
1237 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1238 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
af5c13b0 1239 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1848e567
L
1240 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1241 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1242 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
af5c13b0 1243 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
293f5f65 1244 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1848e567 1245 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
144b71e2
L
1246 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1247 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1248 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1249 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1250 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1251 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1252 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1253 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1254 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
920d2ddc 1255 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
47acf0bd 1256 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
620214f7 1257 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
53467f57 1258 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
8cfcb765 1259 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
ee6872be 1260 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
d777820b
IT
1261 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1262 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
c0a30a9f
L
1263 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1264 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
d6aab7a1 1265 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
708a2fff
CL
1266 { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1267 CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
dd455cf5 1268 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
4b27d27c 1269 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
bb651e8b 1270 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
e413e4e9
AM
1271};
1272
704209c0 1273#ifdef I386COFF
a6c24e68
NC
1274/* Like s_lcomm_internal in gas/read.c but the alignment string
1275 is allowed to be optional. */
1276
1277static symbolS *
1278pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1279{
1280 addressT align = 0;
1281
1282 SKIP_WHITESPACE ();
1283
7ab9ffdd 1284 if (needs_align
a6c24e68
NC
1285 && *input_line_pointer == ',')
1286 {
1287 align = parse_align (needs_align - 1);
7ab9ffdd 1288
a6c24e68
NC
1289 if (align == (addressT) -1)
1290 return NULL;
1291 }
1292 else
1293 {
1294 if (size >= 8)
1295 align = 3;
1296 else if (size >= 4)
1297 align = 2;
1298 else if (size >= 2)
1299 align = 1;
1300 else
1301 align = 0;
1302 }
1303
1304 bss_alloc (symbolP, size, align);
1305 return symbolP;
1306}
1307
704209c0 1308static void
a6c24e68
NC
1309pe_lcomm (int needs_align)
1310{
1311 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1312}
704209c0 1313#endif
a6c24e68 1314
29b0f896
AM
1315const pseudo_typeS md_pseudo_table[] =
1316{
1317#if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1318 {"align", s_align_bytes, 0},
1319#else
1320 {"align", s_align_ptwo, 0},
1321#endif
1322 {"arch", set_cpu_arch, 0},
1323#ifndef I386COFF
1324 {"bss", s_bss, 0},
a6c24e68
NC
1325#else
1326 {"lcomm", pe_lcomm, 1},
29b0f896
AM
1327#endif
1328 {"ffloat", float_cons, 'f'},
1329 {"dfloat", float_cons, 'd'},
1330 {"tfloat", float_cons, 'x'},
1331 {"value", cons, 2},
d182319b 1332 {"slong", signed_cons, 4},
29b0f896
AM
1333 {"noopt", s_ignore, 0},
1334 {"optim", s_ignore, 0},
1335 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1336 {"code16", set_code_flag, CODE_16BIT},
1337 {"code32", set_code_flag, CODE_32BIT},
da5f19a2 1338#ifdef BFD64
29b0f896 1339 {"code64", set_code_flag, CODE_64BIT},
da5f19a2 1340#endif
29b0f896
AM
1341 {"intel_syntax", set_intel_syntax, 1},
1342 {"att_syntax", set_intel_syntax, 0},
1efbbeb4
L
1343 {"intel_mnemonic", set_intel_mnemonic, 1},
1344 {"att_mnemonic", set_intel_mnemonic, 0},
db51cc60
L
1345 {"allow_index_reg", set_allow_index_reg, 1},
1346 {"disallow_index_reg", set_allow_index_reg, 0},
7bab8ab5
JB
1347 {"sse_check", set_check, 0},
1348 {"operand_check", set_check, 1},
3b22753a
L
1349#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1350 {"largecomm", handle_large_common, 0},
07a53e5c 1351#else
68d20676 1352 {"file", dwarf2_directive_file, 0},
07a53e5c
RH
1353 {"loc", dwarf2_directive_loc, 0},
1354 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
3b22753a 1355#endif
6482c264
NC
1356#ifdef TE_PE
1357 {"secrel32", pe_directive_secrel, 0},
1358#endif
29b0f896
AM
1359 {0, 0, 0}
1360};
1361
1362/* For interface with expression (). */
1363extern char *input_line_pointer;
1364
1365/* Hash table for instruction mnemonic lookup. */
1366static struct hash_control *op_hash;
1367
1368/* Hash table for register lookup. */
1369static struct hash_control *reg_hash;
1370\f
ce8a8b2f
AM
1371 /* Various efficient no-op patterns for aligning code labels.
1372 Note: Don't try to assemble the instructions in the comments.
1373 0L and 0w are not legal. */
62a02d25
L
1374static const unsigned char f32_1[] =
1375 {0x90}; /* nop */
1376static const unsigned char f32_2[] =
1377 {0x66,0x90}; /* xchg %ax,%ax */
1378static const unsigned char f32_3[] =
1379 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1380static const unsigned char f32_4[] =
1381 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
62a02d25
L
1382static const unsigned char f32_6[] =
1383 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1384static const unsigned char f32_7[] =
1385 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
62a02d25 1386static const unsigned char f16_3[] =
3ae729d5 1387 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
62a02d25 1388static const unsigned char f16_4[] =
3ae729d5
L
1389 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1390static const unsigned char jump_disp8[] =
1391 {0xeb}; /* jmp disp8 */
1392static const unsigned char jump32_disp32[] =
1393 {0xe9}; /* jmp disp32 */
1394static const unsigned char jump16_disp32[] =
1395 {0x66,0xe9}; /* jmp disp32 */
62a02d25
L
1396/* 32-bit NOPs patterns. */
1397static const unsigned char *const f32_patt[] = {
3ae729d5 1398 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
62a02d25
L
1399};
1400/* 16-bit NOPs patterns. */
1401static const unsigned char *const f16_patt[] = {
3ae729d5 1402 f32_1, f32_2, f16_3, f16_4
62a02d25
L
1403};
1404/* nopl (%[re]ax) */
1405static const unsigned char alt_3[] =
1406 {0x0f,0x1f,0x00};
1407/* nopl 0(%[re]ax) */
1408static const unsigned char alt_4[] =
1409 {0x0f,0x1f,0x40,0x00};
1410/* nopl 0(%[re]ax,%[re]ax,1) */
1411static const unsigned char alt_5[] =
1412 {0x0f,0x1f,0x44,0x00,0x00};
1413/* nopw 0(%[re]ax,%[re]ax,1) */
1414static const unsigned char alt_6[] =
1415 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1416/* nopl 0L(%[re]ax) */
1417static const unsigned char alt_7[] =
1418 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1419/* nopl 0L(%[re]ax,%[re]ax,1) */
1420static const unsigned char alt_8[] =
1421 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1422/* nopw 0L(%[re]ax,%[re]ax,1) */
1423static const unsigned char alt_9[] =
1424 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1425/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1426static const unsigned char alt_10[] =
1427 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
3ae729d5
L
1428/* data16 nopw %cs:0L(%eax,%eax,1) */
1429static const unsigned char alt_11[] =
1430 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
62a02d25
L
1431/* 32-bit and 64-bit NOPs patterns. */
1432static const unsigned char *const alt_patt[] = {
1433 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
3ae729d5 1434 alt_9, alt_10, alt_11
62a02d25
L
1435};
1436
1437/* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1438 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1439
1440static void
1441i386_output_nops (char *where, const unsigned char *const *patt,
1442 int count, int max_single_nop_size)
1443
1444{
3ae729d5
L
1445 /* Place the longer NOP first. */
1446 int last;
1447 int offset;
3076e594
NC
1448 const unsigned char *nops;
1449
1450 if (max_single_nop_size < 1)
1451 {
1452 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1453 max_single_nop_size);
1454 return;
1455 }
1456
1457 nops = patt[max_single_nop_size - 1];
3ae729d5
L
1458
1459 /* Use the smaller one if the requsted one isn't available. */
1460 if (nops == NULL)
62a02d25 1461 {
3ae729d5
L
1462 max_single_nop_size--;
1463 nops = patt[max_single_nop_size - 1];
62a02d25
L
1464 }
1465
3ae729d5
L
1466 last = count % max_single_nop_size;
1467
1468 count -= last;
1469 for (offset = 0; offset < count; offset += max_single_nop_size)
1470 memcpy (where + offset, nops, max_single_nop_size);
1471
1472 if (last)
1473 {
1474 nops = patt[last - 1];
1475 if (nops == NULL)
1476 {
1477 /* Use the smaller one plus one-byte NOP if the needed one
1478 isn't available. */
1479 last--;
1480 nops = patt[last - 1];
1481 memcpy (where + offset, nops, last);
1482 where[offset + last] = *patt[0];
1483 }
1484 else
1485 memcpy (where + offset, nops, last);
1486 }
62a02d25
L
1487}
1488
3ae729d5
L
1489static INLINE int
1490fits_in_imm7 (offsetT num)
1491{
1492 return (num & 0x7f) == num;
1493}
1494
1495static INLINE int
1496fits_in_imm31 (offsetT num)
1497{
1498 return (num & 0x7fffffff) == num;
1499}
62a02d25
L
1500
1501/* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1502 single NOP instruction LIMIT. */
1503
1504void
3ae729d5 1505i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
62a02d25 1506{
3ae729d5 1507 const unsigned char *const *patt = NULL;
62a02d25 1508 int max_single_nop_size;
3ae729d5
L
1509 /* Maximum number of NOPs before switching to jump over NOPs. */
1510 int max_number_of_nops;
62a02d25 1511
3ae729d5 1512 switch (fragP->fr_type)
62a02d25 1513 {
3ae729d5
L
1514 case rs_fill_nop:
1515 case rs_align_code:
1516 break;
e379e5f3
L
1517 case rs_machine_dependent:
1518 /* Allow NOP padding for jumps and calls. */
1519 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1520 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1521 break;
1522 /* Fall through. */
3ae729d5 1523 default:
62a02d25
L
1524 return;
1525 }
1526
ccc9c027
L
1527 /* We need to decide which NOP sequence to use for 32bit and
1528 64bit. When -mtune= is used:
4eed87de 1529
76bc74dc
L
1530 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1531 PROCESSOR_GENERIC32, f32_patt will be used.
80b8656c
L
1532 2. For the rest, alt_patt will be used.
1533
1534 When -mtune= isn't used, alt_patt will be used if
22109423 1535 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
76bc74dc 1536 be used.
ccc9c027
L
1537
1538 When -march= or .arch is used, we can't use anything beyond
1539 cpu_arch_isa_flags. */
1540
1541 if (flag_code == CODE_16BIT)
1542 {
3ae729d5
L
1543 patt = f16_patt;
1544 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1545 /* Limit number of NOPs to 2 in 16-bit mode. */
1546 max_number_of_nops = 2;
252b5132 1547 }
33fef721 1548 else
ccc9c027 1549 {
fbf3f584 1550 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
ccc9c027
L
1551 {
1552 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1553 switch (cpu_arch_tune)
1554 {
1555 case PROCESSOR_UNKNOWN:
1556 /* We use cpu_arch_isa_flags to check if we SHOULD
22109423
L
1557 optimize with nops. */
1558 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1559 patt = alt_patt;
ccc9c027
L
1560 else
1561 patt = f32_patt;
1562 break;
ccc9c027
L
1563 case PROCESSOR_PENTIUM4:
1564 case PROCESSOR_NOCONA:
ef05d495 1565 case PROCESSOR_CORE:
76bc74dc 1566 case PROCESSOR_CORE2:
bd5295b2 1567 case PROCESSOR_COREI7:
3632d14b 1568 case PROCESSOR_L1OM:
7a9068fe 1569 case PROCESSOR_K1OM:
76bc74dc 1570 case PROCESSOR_GENERIC64:
ccc9c027
L
1571 case PROCESSOR_K6:
1572 case PROCESSOR_ATHLON:
1573 case PROCESSOR_K8:
4eed87de 1574 case PROCESSOR_AMDFAM10:
8aedb9fe 1575 case PROCESSOR_BD:
029f3522 1576 case PROCESSOR_ZNVER:
7b458c12 1577 case PROCESSOR_BT:
80b8656c 1578 patt = alt_patt;
ccc9c027 1579 break;
76bc74dc 1580 case PROCESSOR_I386:
ccc9c027
L
1581 case PROCESSOR_I486:
1582 case PROCESSOR_PENTIUM:
2dde1948 1583 case PROCESSOR_PENTIUMPRO:
81486035 1584 case PROCESSOR_IAMCU:
ccc9c027
L
1585 case PROCESSOR_GENERIC32:
1586 patt = f32_patt;
1587 break;
4eed87de 1588 }
ccc9c027
L
1589 }
1590 else
1591 {
fbf3f584 1592 switch (fragP->tc_frag_data.tune)
ccc9c027
L
1593 {
1594 case PROCESSOR_UNKNOWN:
e6a14101 1595 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
ccc9c027
L
1596 PROCESSOR_UNKNOWN. */
1597 abort ();
1598 break;
1599
76bc74dc 1600 case PROCESSOR_I386:
ccc9c027
L
1601 case PROCESSOR_I486:
1602 case PROCESSOR_PENTIUM:
81486035 1603 case PROCESSOR_IAMCU:
ccc9c027
L
1604 case PROCESSOR_K6:
1605 case PROCESSOR_ATHLON:
1606 case PROCESSOR_K8:
4eed87de 1607 case PROCESSOR_AMDFAM10:
8aedb9fe 1608 case PROCESSOR_BD:
029f3522 1609 case PROCESSOR_ZNVER:
7b458c12 1610 case PROCESSOR_BT:
ccc9c027
L
1611 case PROCESSOR_GENERIC32:
1612 /* We use cpu_arch_isa_flags to check if we CAN optimize
22109423
L
1613 with nops. */
1614 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1615 patt = alt_patt;
ccc9c027
L
1616 else
1617 patt = f32_patt;
1618 break;
76bc74dc
L
1619 case PROCESSOR_PENTIUMPRO:
1620 case PROCESSOR_PENTIUM4:
1621 case PROCESSOR_NOCONA:
1622 case PROCESSOR_CORE:
ef05d495 1623 case PROCESSOR_CORE2:
bd5295b2 1624 case PROCESSOR_COREI7:
3632d14b 1625 case PROCESSOR_L1OM:
7a9068fe 1626 case PROCESSOR_K1OM:
22109423 1627 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1628 patt = alt_patt;
ccc9c027
L
1629 else
1630 patt = f32_patt;
1631 break;
1632 case PROCESSOR_GENERIC64:
80b8656c 1633 patt = alt_patt;
ccc9c027 1634 break;
4eed87de 1635 }
ccc9c027
L
1636 }
1637
76bc74dc
L
1638 if (patt == f32_patt)
1639 {
3ae729d5
L
1640 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1641 /* Limit number of NOPs to 2 for older processors. */
1642 max_number_of_nops = 2;
76bc74dc
L
1643 }
1644 else
1645 {
3ae729d5
L
1646 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1647 /* Limit number of NOPs to 7 for newer processors. */
1648 max_number_of_nops = 7;
1649 }
1650 }
1651
1652 if (limit == 0)
1653 limit = max_single_nop_size;
1654
1655 if (fragP->fr_type == rs_fill_nop)
1656 {
1657 /* Output NOPs for .nop directive. */
1658 if (limit > max_single_nop_size)
1659 {
1660 as_bad_where (fragP->fr_file, fragP->fr_line,
1661 _("invalid single nop size: %d "
1662 "(expect within [0, %d])"),
1663 limit, max_single_nop_size);
1664 return;
1665 }
1666 }
e379e5f3 1667 else if (fragP->fr_type != rs_machine_dependent)
3ae729d5
L
1668 fragP->fr_var = count;
1669
1670 if ((count / max_single_nop_size) > max_number_of_nops)
1671 {
1672 /* Generate jump over NOPs. */
1673 offsetT disp = count - 2;
1674 if (fits_in_imm7 (disp))
1675 {
1676 /* Use "jmp disp8" if possible. */
1677 count = disp;
1678 where[0] = jump_disp8[0];
1679 where[1] = count;
1680 where += 2;
1681 }
1682 else
1683 {
1684 unsigned int size_of_jump;
1685
1686 if (flag_code == CODE_16BIT)
1687 {
1688 where[0] = jump16_disp32[0];
1689 where[1] = jump16_disp32[1];
1690 size_of_jump = 2;
1691 }
1692 else
1693 {
1694 where[0] = jump32_disp32[0];
1695 size_of_jump = 1;
1696 }
1697
1698 count -= size_of_jump + 4;
1699 if (!fits_in_imm31 (count))
1700 {
1701 as_bad_where (fragP->fr_file, fragP->fr_line,
1702 _("jump over nop padding out of range"));
1703 return;
1704 }
1705
1706 md_number_to_chars (where + size_of_jump, count, 4);
1707 where += size_of_jump + 4;
76bc74dc 1708 }
ccc9c027 1709 }
3ae729d5
L
1710
1711 /* Generate multiple NOPs. */
1712 i386_output_nops (where, patt, count, limit);
252b5132
RH
1713}
1714
c6fb90c8 1715static INLINE int
0dfbf9d7 1716operand_type_all_zero (const union i386_operand_type *x)
40fb9820 1717{
0dfbf9d7 1718 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1719 {
1720 case 3:
0dfbf9d7 1721 if (x->array[2])
c6fb90c8 1722 return 0;
1a0670f3 1723 /* Fall through. */
c6fb90c8 1724 case 2:
0dfbf9d7 1725 if (x->array[1])
c6fb90c8 1726 return 0;
1a0670f3 1727 /* Fall through. */
c6fb90c8 1728 case 1:
0dfbf9d7 1729 return !x->array[0];
c6fb90c8
L
1730 default:
1731 abort ();
1732 }
40fb9820
L
1733}
1734
c6fb90c8 1735static INLINE void
0dfbf9d7 1736operand_type_set (union i386_operand_type *x, unsigned int v)
40fb9820 1737{
0dfbf9d7 1738 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1739 {
1740 case 3:
0dfbf9d7 1741 x->array[2] = v;
1a0670f3 1742 /* Fall through. */
c6fb90c8 1743 case 2:
0dfbf9d7 1744 x->array[1] = v;
1a0670f3 1745 /* Fall through. */
c6fb90c8 1746 case 1:
0dfbf9d7 1747 x->array[0] = v;
1a0670f3 1748 /* Fall through. */
c6fb90c8
L
1749 break;
1750 default:
1751 abort ();
1752 }
bab6aec1
JB
1753
1754 x->bitfield.class = ClassNone;
75e5731b 1755 x->bitfield.instance = InstanceNone;
c6fb90c8 1756}
40fb9820 1757
c6fb90c8 1758static INLINE int
0dfbf9d7
L
1759operand_type_equal (const union i386_operand_type *x,
1760 const union i386_operand_type *y)
c6fb90c8 1761{
0dfbf9d7 1762 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1763 {
1764 case 3:
0dfbf9d7 1765 if (x->array[2] != y->array[2])
c6fb90c8 1766 return 0;
1a0670f3 1767 /* Fall through. */
c6fb90c8 1768 case 2:
0dfbf9d7 1769 if (x->array[1] != y->array[1])
c6fb90c8 1770 return 0;
1a0670f3 1771 /* Fall through. */
c6fb90c8 1772 case 1:
0dfbf9d7 1773 return x->array[0] == y->array[0];
c6fb90c8
L
1774 break;
1775 default:
1776 abort ();
1777 }
1778}
40fb9820 1779
0dfbf9d7
L
1780static INLINE int
1781cpu_flags_all_zero (const union i386_cpu_flags *x)
1782{
1783 switch (ARRAY_SIZE(x->array))
1784 {
53467f57
IT
1785 case 4:
1786 if (x->array[3])
1787 return 0;
1788 /* Fall through. */
0dfbf9d7
L
1789 case 3:
1790 if (x->array[2])
1791 return 0;
1a0670f3 1792 /* Fall through. */
0dfbf9d7
L
1793 case 2:
1794 if (x->array[1])
1795 return 0;
1a0670f3 1796 /* Fall through. */
0dfbf9d7
L
1797 case 1:
1798 return !x->array[0];
1799 default:
1800 abort ();
1801 }
1802}
1803
0dfbf9d7
L
1804static INLINE int
1805cpu_flags_equal (const union i386_cpu_flags *x,
1806 const union i386_cpu_flags *y)
1807{
1808 switch (ARRAY_SIZE(x->array))
1809 {
53467f57
IT
1810 case 4:
1811 if (x->array[3] != y->array[3])
1812 return 0;
1813 /* Fall through. */
0dfbf9d7
L
1814 case 3:
1815 if (x->array[2] != y->array[2])
1816 return 0;
1a0670f3 1817 /* Fall through. */
0dfbf9d7
L
1818 case 2:
1819 if (x->array[1] != y->array[1])
1820 return 0;
1a0670f3 1821 /* Fall through. */
0dfbf9d7
L
1822 case 1:
1823 return x->array[0] == y->array[0];
1824 break;
1825 default:
1826 abort ();
1827 }
1828}
c6fb90c8
L
1829
1830static INLINE int
1831cpu_flags_check_cpu64 (i386_cpu_flags f)
1832{
1833 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1834 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
40fb9820
L
1835}
1836
c6fb90c8
L
1837static INLINE i386_cpu_flags
1838cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
40fb9820 1839{
c6fb90c8
L
1840 switch (ARRAY_SIZE (x.array))
1841 {
53467f57
IT
1842 case 4:
1843 x.array [3] &= y.array [3];
1844 /* Fall through. */
c6fb90c8
L
1845 case 3:
1846 x.array [2] &= y.array [2];
1a0670f3 1847 /* Fall through. */
c6fb90c8
L
1848 case 2:
1849 x.array [1] &= y.array [1];
1a0670f3 1850 /* Fall through. */
c6fb90c8
L
1851 case 1:
1852 x.array [0] &= y.array [0];
1853 break;
1854 default:
1855 abort ();
1856 }
1857 return x;
1858}
40fb9820 1859
c6fb90c8
L
1860static INLINE i386_cpu_flags
1861cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
40fb9820 1862{
c6fb90c8 1863 switch (ARRAY_SIZE (x.array))
40fb9820 1864 {
53467f57
IT
1865 case 4:
1866 x.array [3] |= y.array [3];
1867 /* Fall through. */
c6fb90c8
L
1868 case 3:
1869 x.array [2] |= y.array [2];
1a0670f3 1870 /* Fall through. */
c6fb90c8
L
1871 case 2:
1872 x.array [1] |= y.array [1];
1a0670f3 1873 /* Fall through. */
c6fb90c8
L
1874 case 1:
1875 x.array [0] |= y.array [0];
40fb9820
L
1876 break;
1877 default:
1878 abort ();
1879 }
40fb9820
L
1880 return x;
1881}
1882
309d3373
JB
1883static INLINE i386_cpu_flags
1884cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1885{
1886 switch (ARRAY_SIZE (x.array))
1887 {
53467f57
IT
1888 case 4:
1889 x.array [3] &= ~y.array [3];
1890 /* Fall through. */
309d3373
JB
1891 case 3:
1892 x.array [2] &= ~y.array [2];
1a0670f3 1893 /* Fall through. */
309d3373
JB
1894 case 2:
1895 x.array [1] &= ~y.array [1];
1a0670f3 1896 /* Fall through. */
309d3373
JB
1897 case 1:
1898 x.array [0] &= ~y.array [0];
1899 break;
1900 default:
1901 abort ();
1902 }
1903 return x;
1904}
1905
6c0946d0
JB
1906static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1907
c0f3af97
L
1908#define CPU_FLAGS_ARCH_MATCH 0x1
1909#define CPU_FLAGS_64BIT_MATCH 0x2
1910
c0f3af97 1911#define CPU_FLAGS_PERFECT_MATCH \
db12e14e 1912 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
c0f3af97
L
1913
1914/* Return CPU flags match bits. */
3629bb00 1915
40fb9820 1916static int
d3ce72d0 1917cpu_flags_match (const insn_template *t)
40fb9820 1918{
c0f3af97
L
1919 i386_cpu_flags x = t->cpu_flags;
1920 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
40fb9820
L
1921
1922 x.bitfield.cpu64 = 0;
1923 x.bitfield.cpuno64 = 0;
1924
0dfbf9d7 1925 if (cpu_flags_all_zero (&x))
c0f3af97
L
1926 {
1927 /* This instruction is available on all archs. */
db12e14e 1928 match |= CPU_FLAGS_ARCH_MATCH;
c0f3af97 1929 }
3629bb00
L
1930 else
1931 {
c0f3af97 1932 /* This instruction is available only on some archs. */
3629bb00
L
1933 i386_cpu_flags cpu = cpu_arch_flags;
1934
ab592e75
JB
1935 /* AVX512VL is no standalone feature - match it and then strip it. */
1936 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1937 return match;
1938 x.bitfield.cpuavx512vl = 0;
1939
3629bb00 1940 cpu = cpu_flags_and (x, cpu);
c0f3af97
L
1941 if (!cpu_flags_all_zero (&cpu))
1942 {
a5ff0eb2
L
1943 if (x.bitfield.cpuavx)
1944 {
929f69fa 1945 /* We need to check a few extra flags with AVX. */
b9d49817 1946 if (cpu.bitfield.cpuavx
40d231b4
JB
1947 && (!t->opcode_modifier.sse2avx
1948 || (sse2avx && !i.prefix[DATA_PREFIX]))
b9d49817 1949 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
929f69fa 1950 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
b9d49817
JB
1951 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1952 match |= CPU_FLAGS_ARCH_MATCH;
a5ff0eb2 1953 }
929f69fa
JB
1954 else if (x.bitfield.cpuavx512f)
1955 {
1956 /* We need to check a few extra flags with AVX512F. */
1957 if (cpu.bitfield.cpuavx512f
1958 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1959 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1960 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1961 match |= CPU_FLAGS_ARCH_MATCH;
1962 }
a5ff0eb2 1963 else
db12e14e 1964 match |= CPU_FLAGS_ARCH_MATCH;
c0f3af97 1965 }
3629bb00 1966 }
c0f3af97 1967 return match;
40fb9820
L
1968}
1969
c6fb90c8
L
1970static INLINE i386_operand_type
1971operand_type_and (i386_operand_type x, i386_operand_type y)
40fb9820 1972{
bab6aec1
JB
1973 if (x.bitfield.class != y.bitfield.class)
1974 x.bitfield.class = ClassNone;
75e5731b
JB
1975 if (x.bitfield.instance != y.bitfield.instance)
1976 x.bitfield.instance = InstanceNone;
bab6aec1 1977
c6fb90c8
L
1978 switch (ARRAY_SIZE (x.array))
1979 {
1980 case 3:
1981 x.array [2] &= y.array [2];
1a0670f3 1982 /* Fall through. */
c6fb90c8
L
1983 case 2:
1984 x.array [1] &= y.array [1];
1a0670f3 1985 /* Fall through. */
c6fb90c8
L
1986 case 1:
1987 x.array [0] &= y.array [0];
1988 break;
1989 default:
1990 abort ();
1991 }
1992 return x;
40fb9820
L
1993}
1994
73053c1f
JB
1995static INLINE i386_operand_type
1996operand_type_and_not (i386_operand_type x, i386_operand_type y)
1997{
bab6aec1 1998 gas_assert (y.bitfield.class == ClassNone);
75e5731b 1999 gas_assert (y.bitfield.instance == InstanceNone);
bab6aec1 2000
73053c1f
JB
2001 switch (ARRAY_SIZE (x.array))
2002 {
2003 case 3:
2004 x.array [2] &= ~y.array [2];
2005 /* Fall through. */
2006 case 2:
2007 x.array [1] &= ~y.array [1];
2008 /* Fall through. */
2009 case 1:
2010 x.array [0] &= ~y.array [0];
2011 break;
2012 default:
2013 abort ();
2014 }
2015 return x;
2016}
2017
c6fb90c8
L
2018static INLINE i386_operand_type
2019operand_type_or (i386_operand_type x, i386_operand_type y)
40fb9820 2020{
bab6aec1
JB
2021 gas_assert (x.bitfield.class == ClassNone ||
2022 y.bitfield.class == ClassNone ||
2023 x.bitfield.class == y.bitfield.class);
75e5731b
JB
2024 gas_assert (x.bitfield.instance == InstanceNone ||
2025 y.bitfield.instance == InstanceNone ||
2026 x.bitfield.instance == y.bitfield.instance);
bab6aec1 2027
c6fb90c8 2028 switch (ARRAY_SIZE (x.array))
40fb9820 2029 {
c6fb90c8
L
2030 case 3:
2031 x.array [2] |= y.array [2];
1a0670f3 2032 /* Fall through. */
c6fb90c8
L
2033 case 2:
2034 x.array [1] |= y.array [1];
1a0670f3 2035 /* Fall through. */
c6fb90c8
L
2036 case 1:
2037 x.array [0] |= y.array [0];
40fb9820
L
2038 break;
2039 default:
2040 abort ();
2041 }
c6fb90c8
L
2042 return x;
2043}
40fb9820 2044
c6fb90c8
L
2045static INLINE i386_operand_type
2046operand_type_xor (i386_operand_type x, i386_operand_type y)
2047{
bab6aec1 2048 gas_assert (y.bitfield.class == ClassNone);
75e5731b 2049 gas_assert (y.bitfield.instance == InstanceNone);
bab6aec1 2050
c6fb90c8
L
2051 switch (ARRAY_SIZE (x.array))
2052 {
2053 case 3:
2054 x.array [2] ^= y.array [2];
1a0670f3 2055 /* Fall through. */
c6fb90c8
L
2056 case 2:
2057 x.array [1] ^= y.array [1];
1a0670f3 2058 /* Fall through. */
c6fb90c8
L
2059 case 1:
2060 x.array [0] ^= y.array [0];
2061 break;
2062 default:
2063 abort ();
2064 }
40fb9820
L
2065 return x;
2066}
2067
40fb9820
L
2068static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2069static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2070static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2071static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
bab6aec1
JB
2072static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2073static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
40fb9820 2074static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
43234a1e 2075static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
40fb9820
L
2076static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2077static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2078static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2079static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2080static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2081static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2082static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2083static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2084static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2085
2086enum operand_type
2087{
2088 reg,
40fb9820
L
2089 imm,
2090 disp,
2091 anymem
2092};
2093
c6fb90c8 2094static INLINE int
40fb9820
L
2095operand_type_check (i386_operand_type t, enum operand_type c)
2096{
2097 switch (c)
2098 {
2099 case reg:
bab6aec1 2100 return t.bitfield.class == Reg;
40fb9820 2101
40fb9820
L
2102 case imm:
2103 return (t.bitfield.imm8
2104 || t.bitfield.imm8s
2105 || t.bitfield.imm16
2106 || t.bitfield.imm32
2107 || t.bitfield.imm32s
2108 || t.bitfield.imm64);
2109
2110 case disp:
2111 return (t.bitfield.disp8
2112 || t.bitfield.disp16
2113 || t.bitfield.disp32
2114 || t.bitfield.disp32s
2115 || t.bitfield.disp64);
2116
2117 case anymem:
2118 return (t.bitfield.disp8
2119 || t.bitfield.disp16
2120 || t.bitfield.disp32
2121 || t.bitfield.disp32s
2122 || t.bitfield.disp64
2123 || t.bitfield.baseindex);
2124
2125 default:
2126 abort ();
2127 }
2cfe26b6
AM
2128
2129 return 0;
40fb9820
L
2130}
2131
7a54636a
L
2132/* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2133 between operand GIVEN and opeand WANTED for instruction template T. */
5c07affc
L
2134
2135static INLINE int
7a54636a
L
2136match_operand_size (const insn_template *t, unsigned int wanted,
2137 unsigned int given)
5c07affc 2138{
3ac21baa
JB
2139 return !((i.types[given].bitfield.byte
2140 && !t->operand_types[wanted].bitfield.byte)
2141 || (i.types[given].bitfield.word
2142 && !t->operand_types[wanted].bitfield.word)
2143 || (i.types[given].bitfield.dword
2144 && !t->operand_types[wanted].bitfield.dword)
2145 || (i.types[given].bitfield.qword
2146 && !t->operand_types[wanted].bitfield.qword)
2147 || (i.types[given].bitfield.tbyte
2148 && !t->operand_types[wanted].bitfield.tbyte));
5c07affc
L
2149}
2150
dd40ce22
L
2151/* Return 1 if there is no conflict in SIMD register between operand
2152 GIVEN and opeand WANTED for instruction template T. */
1b54b8d7
JB
2153
2154static INLINE int
dd40ce22
L
2155match_simd_size (const insn_template *t, unsigned int wanted,
2156 unsigned int given)
1b54b8d7 2157{
3ac21baa
JB
2158 return !((i.types[given].bitfield.xmmword
2159 && !t->operand_types[wanted].bitfield.xmmword)
2160 || (i.types[given].bitfield.ymmword
2161 && !t->operand_types[wanted].bitfield.ymmword)
2162 || (i.types[given].bitfield.zmmword
2163 && !t->operand_types[wanted].bitfield.zmmword));
1b54b8d7
JB
2164}
2165
7a54636a
L
2166/* Return 1 if there is no conflict in any size between operand GIVEN
2167 and opeand WANTED for instruction template T. */
5c07affc
L
2168
2169static INLINE int
dd40ce22
L
2170match_mem_size (const insn_template *t, unsigned int wanted,
2171 unsigned int given)
5c07affc 2172{
7a54636a 2173 return (match_operand_size (t, wanted, given)
3ac21baa 2174 && !((i.types[given].bitfield.unspecified
af508cb9 2175 && !i.broadcast
3ac21baa
JB
2176 && !t->operand_types[wanted].bitfield.unspecified)
2177 || (i.types[given].bitfield.fword
2178 && !t->operand_types[wanted].bitfield.fword)
1b54b8d7
JB
2179 /* For scalar opcode templates to allow register and memory
2180 operands at the same time, some special casing is needed
d6793fa1
JB
2181 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2182 down-conversion vpmov*. */
3528c362 2183 || ((t->operand_types[wanted].bitfield.class == RegSIMD
bc49bfd8
JB
2184 && t->operand_types[wanted].bitfield.byte
2185 + t->operand_types[wanted].bitfield.word
2186 + t->operand_types[wanted].bitfield.dword
2187 + t->operand_types[wanted].bitfield.qword
2188 > !!t->opcode_modifier.broadcast)
3ac21baa
JB
2189 ? (i.types[given].bitfield.xmmword
2190 || i.types[given].bitfield.ymmword
2191 || i.types[given].bitfield.zmmword)
2192 : !match_simd_size(t, wanted, given))));
5c07affc
L
2193}
2194
3ac21baa
JB
2195/* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2196 operands for instruction template T, and it has MATCH_REVERSE set if there
2197 is no size conflict on any operands for the template with operands reversed
2198 (and the template allows for reversing in the first place). */
5c07affc 2199
3ac21baa
JB
2200#define MATCH_STRAIGHT 1
2201#define MATCH_REVERSE 2
2202
2203static INLINE unsigned int
d3ce72d0 2204operand_size_match (const insn_template *t)
5c07affc 2205{
3ac21baa 2206 unsigned int j, match = MATCH_STRAIGHT;
5c07affc 2207
0cfa3eb3 2208 /* Don't check non-absolute jump instructions. */
5c07affc 2209 if (t->opcode_modifier.jump
0cfa3eb3 2210 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5c07affc
L
2211 return match;
2212
2213 /* Check memory and accumulator operand size. */
2214 for (j = 0; j < i.operands; j++)
2215 {
3528c362
JB
2216 if (i.types[j].bitfield.class != Reg
2217 && i.types[j].bitfield.class != RegSIMD
601e8564 2218 && t->opcode_modifier.anysize)
5c07affc
L
2219 continue;
2220
bab6aec1 2221 if (t->operand_types[j].bitfield.class == Reg
7a54636a 2222 && !match_operand_size (t, j, j))
5c07affc
L
2223 {
2224 match = 0;
2225 break;
2226 }
2227
3528c362 2228 if (t->operand_types[j].bitfield.class == RegSIMD
3ac21baa 2229 && !match_simd_size (t, j, j))
1b54b8d7
JB
2230 {
2231 match = 0;
2232 break;
2233 }
2234
75e5731b 2235 if (t->operand_types[j].bitfield.instance == Accum
7a54636a 2236 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
1b54b8d7
JB
2237 {
2238 match = 0;
2239 break;
2240 }
2241
c48dadc9 2242 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
5c07affc
L
2243 {
2244 match = 0;
2245 break;
2246 }
2247 }
2248
3ac21baa 2249 if (!t->opcode_modifier.d)
891edac4 2250 {
dc1e8a47 2251 mismatch:
3ac21baa
JB
2252 if (!match)
2253 i.error = operand_size_mismatch;
2254 return match;
891edac4 2255 }
5c07affc
L
2256
2257 /* Check reverse. */
f5eb1d70 2258 gas_assert (i.operands >= 2 && i.operands <= 3);
5c07affc 2259
f5eb1d70 2260 for (j = 0; j < i.operands; j++)
5c07affc 2261 {
f5eb1d70
JB
2262 unsigned int given = i.operands - j - 1;
2263
bab6aec1 2264 if (t->operand_types[j].bitfield.class == Reg
f5eb1d70 2265 && !match_operand_size (t, j, given))
891edac4 2266 goto mismatch;
5c07affc 2267
3528c362 2268 if (t->operand_types[j].bitfield.class == RegSIMD
f5eb1d70 2269 && !match_simd_size (t, j, given))
dbbc8b7e
JB
2270 goto mismatch;
2271
75e5731b 2272 if (t->operand_types[j].bitfield.instance == Accum
f5eb1d70
JB
2273 && (!match_operand_size (t, j, given)
2274 || !match_simd_size (t, j, given)))
dbbc8b7e
JB
2275 goto mismatch;
2276
f5eb1d70 2277 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
891edac4 2278 goto mismatch;
5c07affc
L
2279 }
2280
3ac21baa 2281 return match | MATCH_REVERSE;
5c07affc
L
2282}
2283
c6fb90c8 2284static INLINE int
40fb9820
L
2285operand_type_match (i386_operand_type overlap,
2286 i386_operand_type given)
2287{
2288 i386_operand_type temp = overlap;
2289
7d5e4556 2290 temp.bitfield.unspecified = 0;
5c07affc
L
2291 temp.bitfield.byte = 0;
2292 temp.bitfield.word = 0;
2293 temp.bitfield.dword = 0;
2294 temp.bitfield.fword = 0;
2295 temp.bitfield.qword = 0;
2296 temp.bitfield.tbyte = 0;
2297 temp.bitfield.xmmword = 0;
c0f3af97 2298 temp.bitfield.ymmword = 0;
43234a1e 2299 temp.bitfield.zmmword = 0;
0dfbf9d7 2300 if (operand_type_all_zero (&temp))
891edac4 2301 goto mismatch;
40fb9820 2302
6f2f06be 2303 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
891edac4
L
2304 return 1;
2305
dc1e8a47 2306 mismatch:
a65babc9 2307 i.error = operand_type_mismatch;
891edac4 2308 return 0;
40fb9820
L
2309}
2310
7d5e4556 2311/* If given types g0 and g1 are registers they must be of the same type
10c17abd 2312 unless the expected operand type register overlap is null.
5de4d9ef 2313 Some Intel syntax memory operand size checking also happens here. */
40fb9820 2314
c6fb90c8 2315static INLINE int
dc821c5f 2316operand_type_register_match (i386_operand_type g0,
40fb9820 2317 i386_operand_type t0,
40fb9820
L
2318 i386_operand_type g1,
2319 i386_operand_type t1)
2320{
bab6aec1 2321 if (g0.bitfield.class != Reg
3528c362 2322 && g0.bitfield.class != RegSIMD
10c17abd
JB
2323 && (!operand_type_check (g0, anymem)
2324 || g0.bitfield.unspecified
5de4d9ef
JB
2325 || (t0.bitfield.class != Reg
2326 && t0.bitfield.class != RegSIMD)))
40fb9820
L
2327 return 1;
2328
bab6aec1 2329 if (g1.bitfield.class != Reg
3528c362 2330 && g1.bitfield.class != RegSIMD
10c17abd
JB
2331 && (!operand_type_check (g1, anymem)
2332 || g1.bitfield.unspecified
5de4d9ef
JB
2333 || (t1.bitfield.class != Reg
2334 && t1.bitfield.class != RegSIMD)))
40fb9820
L
2335 return 1;
2336
dc821c5f
JB
2337 if (g0.bitfield.byte == g1.bitfield.byte
2338 && g0.bitfield.word == g1.bitfield.word
2339 && g0.bitfield.dword == g1.bitfield.dword
10c17abd
JB
2340 && g0.bitfield.qword == g1.bitfield.qword
2341 && g0.bitfield.xmmword == g1.bitfield.xmmword
2342 && g0.bitfield.ymmword == g1.bitfield.ymmword
2343 && g0.bitfield.zmmword == g1.bitfield.zmmword)
40fb9820
L
2344 return 1;
2345
dc821c5f
JB
2346 if (!(t0.bitfield.byte & t1.bitfield.byte)
2347 && !(t0.bitfield.word & t1.bitfield.word)
2348 && !(t0.bitfield.dword & t1.bitfield.dword)
10c17abd
JB
2349 && !(t0.bitfield.qword & t1.bitfield.qword)
2350 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2351 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2352 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
891edac4
L
2353 return 1;
2354
a65babc9 2355 i.error = register_type_mismatch;
891edac4
L
2356
2357 return 0;
40fb9820
L
2358}
2359
4c692bc7
JB
2360static INLINE unsigned int
2361register_number (const reg_entry *r)
2362{
2363 unsigned int nr = r->reg_num;
2364
2365 if (r->reg_flags & RegRex)
2366 nr += 8;
2367
200cbe0f
L
2368 if (r->reg_flags & RegVRex)
2369 nr += 16;
2370
4c692bc7
JB
2371 return nr;
2372}
2373
252b5132 2374static INLINE unsigned int
40fb9820 2375mode_from_disp_size (i386_operand_type t)
252b5132 2376{
b5014f7a 2377 if (t.bitfield.disp8)
40fb9820
L
2378 return 1;
2379 else if (t.bitfield.disp16
2380 || t.bitfield.disp32
2381 || t.bitfield.disp32s)
2382 return 2;
2383 else
2384 return 0;
252b5132
RH
2385}
2386
2387static INLINE int
65879393 2388fits_in_signed_byte (addressT num)
252b5132 2389{
65879393 2390 return num + 0x80 <= 0xff;
47926f60 2391}
252b5132
RH
2392
2393static INLINE int
65879393 2394fits_in_unsigned_byte (addressT num)
252b5132 2395{
65879393 2396 return num <= 0xff;
47926f60 2397}
252b5132
RH
2398
2399static INLINE int
65879393 2400fits_in_unsigned_word (addressT num)
252b5132 2401{
65879393 2402 return num <= 0xffff;
47926f60 2403}
252b5132
RH
2404
2405static INLINE int
65879393 2406fits_in_signed_word (addressT num)
252b5132 2407{
65879393 2408 return num + 0x8000 <= 0xffff;
47926f60 2409}
2a962e6d 2410
3e73aa7c 2411static INLINE int
65879393 2412fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
3e73aa7c
JH
2413{
2414#ifndef BFD64
2415 return 1;
2416#else
65879393 2417 return num + 0x80000000 <= 0xffffffff;
3e73aa7c
JH
2418#endif
2419} /* fits_in_signed_long() */
2a962e6d 2420
3e73aa7c 2421static INLINE int
65879393 2422fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
3e73aa7c
JH
2423{
2424#ifndef BFD64
2425 return 1;
2426#else
65879393 2427 return num <= 0xffffffff;
3e73aa7c
JH
2428#endif
2429} /* fits_in_unsigned_long() */
252b5132 2430
43234a1e 2431static INLINE int
b5014f7a 2432fits_in_disp8 (offsetT num)
43234a1e
L
2433{
2434 int shift = i.memshift;
2435 unsigned int mask;
2436
2437 if (shift == -1)
2438 abort ();
2439
2440 mask = (1 << shift) - 1;
2441
2442 /* Return 0 if NUM isn't properly aligned. */
2443 if ((num & mask))
2444 return 0;
2445
2446 /* Check if NUM will fit in 8bit after shift. */
2447 return fits_in_signed_byte (num >> shift);
2448}
2449
a683cc34
SP
2450static INLINE int
2451fits_in_imm4 (offsetT num)
2452{
2453 return (num & 0xf) == num;
2454}
2455
40fb9820 2456static i386_operand_type
e3bb37b5 2457smallest_imm_type (offsetT num)
252b5132 2458{
40fb9820 2459 i386_operand_type t;
7ab9ffdd 2460
0dfbf9d7 2461 operand_type_set (&t, 0);
40fb9820
L
2462 t.bitfield.imm64 = 1;
2463
2464 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
e413e4e9
AM
2465 {
2466 /* This code is disabled on the 486 because all the Imm1 forms
2467 in the opcode table are slower on the i486. They're the
2468 versions with the implicitly specified single-position
2469 displacement, which has another syntax if you really want to
2470 use that form. */
40fb9820
L
2471 t.bitfield.imm1 = 1;
2472 t.bitfield.imm8 = 1;
2473 t.bitfield.imm8s = 1;
2474 t.bitfield.imm16 = 1;
2475 t.bitfield.imm32 = 1;
2476 t.bitfield.imm32s = 1;
2477 }
2478 else if (fits_in_signed_byte (num))
2479 {
2480 t.bitfield.imm8 = 1;
2481 t.bitfield.imm8s = 1;
2482 t.bitfield.imm16 = 1;
2483 t.bitfield.imm32 = 1;
2484 t.bitfield.imm32s = 1;
2485 }
2486 else if (fits_in_unsigned_byte (num))
2487 {
2488 t.bitfield.imm8 = 1;
2489 t.bitfield.imm16 = 1;
2490 t.bitfield.imm32 = 1;
2491 t.bitfield.imm32s = 1;
2492 }
2493 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2494 {
2495 t.bitfield.imm16 = 1;
2496 t.bitfield.imm32 = 1;
2497 t.bitfield.imm32s = 1;
2498 }
2499 else if (fits_in_signed_long (num))
2500 {
2501 t.bitfield.imm32 = 1;
2502 t.bitfield.imm32s = 1;
2503 }
2504 else if (fits_in_unsigned_long (num))
2505 t.bitfield.imm32 = 1;
2506
2507 return t;
47926f60 2508}
252b5132 2509
847f7ad4 2510static offsetT
e3bb37b5 2511offset_in_range (offsetT val, int size)
847f7ad4 2512{
508866be 2513 addressT mask;
ba2adb93 2514
847f7ad4
AM
2515 switch (size)
2516 {
508866be
L
2517 case 1: mask = ((addressT) 1 << 8) - 1; break;
2518 case 2: mask = ((addressT) 1 << 16) - 1; break;
3b0ec529 2519 case 4: mask = ((addressT) 2 << 31) - 1; break;
3e73aa7c
JH
2520#ifdef BFD64
2521 case 8: mask = ((addressT) 2 << 63) - 1; break;
2522#endif
47926f60 2523 default: abort ();
847f7ad4
AM
2524 }
2525
9de868bf
L
2526#ifdef BFD64
2527 /* If BFD64, sign extend val for 32bit address mode. */
2528 if (flag_code != CODE_64BIT
2529 || i.prefix[ADDR_PREFIX])
3e73aa7c
JH
2530 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2531 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
fa289fb8 2532#endif
ba2adb93 2533
47926f60 2534 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
847f7ad4
AM
2535 {
2536 char buf1[40], buf2[40];
2537
2538 sprint_value (buf1, val);
2539 sprint_value (buf2, val & mask);
2540 as_warn (_("%s shortened to %s"), buf1, buf2);
2541 }
2542 return val & mask;
2543}
2544
c32fa91d
L
2545enum PREFIX_GROUP
2546{
2547 PREFIX_EXIST = 0,
2548 PREFIX_LOCK,
2549 PREFIX_REP,
04ef582a 2550 PREFIX_DS,
c32fa91d
L
2551 PREFIX_OTHER
2552};
2553
2554/* Returns
2555 a. PREFIX_EXIST if attempting to add a prefix where one from the
2556 same class already exists.
2557 b. PREFIX_LOCK if lock prefix is added.
2558 c. PREFIX_REP if rep/repne prefix is added.
04ef582a
L
2559 d. PREFIX_DS if ds prefix is added.
2560 e. PREFIX_OTHER if other prefix is added.
c32fa91d
L
2561 */
2562
2563static enum PREFIX_GROUP
e3bb37b5 2564add_prefix (unsigned int prefix)
252b5132 2565{
c32fa91d 2566 enum PREFIX_GROUP ret = PREFIX_OTHER;
b1905489 2567 unsigned int q;
252b5132 2568
29b0f896
AM
2569 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2570 && flag_code == CODE_64BIT)
b1905489 2571 {
161a04f6 2572 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
44846f29
JB
2573 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2574 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2575 || (i.prefix[REX_PREFIX] & prefix & REX_B))
c32fa91d 2576 ret = PREFIX_EXIST;
b1905489
JB
2577 q = REX_PREFIX;
2578 }
3e73aa7c 2579 else
b1905489
JB
2580 {
2581 switch (prefix)
2582 {
2583 default:
2584 abort ();
2585
b1905489 2586 case DS_PREFIX_OPCODE:
04ef582a
L
2587 ret = PREFIX_DS;
2588 /* Fall through. */
2589 case CS_PREFIX_OPCODE:
b1905489
JB
2590 case ES_PREFIX_OPCODE:
2591 case FS_PREFIX_OPCODE:
2592 case GS_PREFIX_OPCODE:
2593 case SS_PREFIX_OPCODE:
2594 q = SEG_PREFIX;
2595 break;
2596
2597 case REPNE_PREFIX_OPCODE:
2598 case REPE_PREFIX_OPCODE:
c32fa91d
L
2599 q = REP_PREFIX;
2600 ret = PREFIX_REP;
2601 break;
2602
b1905489 2603 case LOCK_PREFIX_OPCODE:
c32fa91d
L
2604 q = LOCK_PREFIX;
2605 ret = PREFIX_LOCK;
b1905489
JB
2606 break;
2607
2608 case FWAIT_OPCODE:
2609 q = WAIT_PREFIX;
2610 break;
2611
2612 case ADDR_PREFIX_OPCODE:
2613 q = ADDR_PREFIX;
2614 break;
2615
2616 case DATA_PREFIX_OPCODE:
2617 q = DATA_PREFIX;
2618 break;
2619 }
2620 if (i.prefix[q] != 0)
c32fa91d 2621 ret = PREFIX_EXIST;
b1905489 2622 }
252b5132 2623
b1905489 2624 if (ret)
252b5132 2625 {
b1905489
JB
2626 if (!i.prefix[q])
2627 ++i.prefixes;
2628 i.prefix[q] |= prefix;
252b5132 2629 }
b1905489
JB
2630 else
2631 as_bad (_("same type of prefix used twice"));
252b5132 2632
252b5132
RH
2633 return ret;
2634}
2635
2636static void
78f12dd3 2637update_code_flag (int value, int check)
eecb386c 2638{
78f12dd3
L
2639 PRINTF_LIKE ((*as_error));
2640
1e9cc1c2 2641 flag_code = (enum flag_code) value;
40fb9820
L
2642 if (flag_code == CODE_64BIT)
2643 {
2644 cpu_arch_flags.bitfield.cpu64 = 1;
2645 cpu_arch_flags.bitfield.cpuno64 = 0;
40fb9820
L
2646 }
2647 else
2648 {
2649 cpu_arch_flags.bitfield.cpu64 = 0;
2650 cpu_arch_flags.bitfield.cpuno64 = 1;
40fb9820
L
2651 }
2652 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
3e73aa7c 2653 {
78f12dd3
L
2654 if (check)
2655 as_error = as_fatal;
2656 else
2657 as_error = as_bad;
2658 (*as_error) (_("64bit mode not supported on `%s'."),
2659 cpu_arch_name ? cpu_arch_name : default_arch);
3e73aa7c 2660 }
40fb9820 2661 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
3e73aa7c 2662 {
78f12dd3
L
2663 if (check)
2664 as_error = as_fatal;
2665 else
2666 as_error = as_bad;
2667 (*as_error) (_("32bit mode not supported on `%s'."),
2668 cpu_arch_name ? cpu_arch_name : default_arch);
3e73aa7c 2669 }
eecb386c
AM
2670 stackop_size = '\0';
2671}
2672
78f12dd3
L
2673static void
2674set_code_flag (int value)
2675{
2676 update_code_flag (value, 0);
2677}
2678
eecb386c 2679static void
e3bb37b5 2680set_16bit_gcc_code_flag (int new_code_flag)
252b5132 2681{
1e9cc1c2 2682 flag_code = (enum flag_code) new_code_flag;
40fb9820
L
2683 if (flag_code != CODE_16BIT)
2684 abort ();
2685 cpu_arch_flags.bitfield.cpu64 = 0;
2686 cpu_arch_flags.bitfield.cpuno64 = 1;
9306ca4a 2687 stackop_size = LONG_MNEM_SUFFIX;
252b5132
RH
2688}
2689
2690static void
e3bb37b5 2691set_intel_syntax (int syntax_flag)
252b5132
RH
2692{
2693 /* Find out if register prefixing is specified. */
2694 int ask_naked_reg = 0;
2695
2696 SKIP_WHITESPACE ();
29b0f896 2697 if (!is_end_of_line[(unsigned char) *input_line_pointer])
252b5132 2698 {
d02603dc
NC
2699 char *string;
2700 int e = get_symbol_name (&string);
252b5132 2701
47926f60 2702 if (strcmp (string, "prefix") == 0)
252b5132 2703 ask_naked_reg = 1;
47926f60 2704 else if (strcmp (string, "noprefix") == 0)
252b5132
RH
2705 ask_naked_reg = -1;
2706 else
d0b47220 2707 as_bad (_("bad argument to syntax directive."));
d02603dc 2708 (void) restore_line_pointer (e);
252b5132
RH
2709 }
2710 demand_empty_rest_of_line ();
c3332e24 2711
252b5132
RH
2712 intel_syntax = syntax_flag;
2713
2714 if (ask_naked_reg == 0)
f86103b7
AM
2715 allow_naked_reg = (intel_syntax
2716 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
252b5132
RH
2717 else
2718 allow_naked_reg = (ask_naked_reg < 0);
9306ca4a 2719
ee86248c 2720 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
7ab9ffdd 2721
e4a3b5a4 2722 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
9306ca4a 2723 identifier_chars['$'] = intel_syntax ? '$' : 0;
e4a3b5a4 2724 register_prefix = allow_naked_reg ? "" : "%";
252b5132
RH
2725}
2726
1efbbeb4
L
2727static void
2728set_intel_mnemonic (int mnemonic_flag)
2729{
e1d4d893 2730 intel_mnemonic = mnemonic_flag;
1efbbeb4
L
2731}
2732
db51cc60
L
2733static void
2734set_allow_index_reg (int flag)
2735{
2736 allow_index_reg = flag;
2737}
2738
cb19c032 2739static void
7bab8ab5 2740set_check (int what)
cb19c032 2741{
7bab8ab5
JB
2742 enum check_kind *kind;
2743 const char *str;
2744
2745 if (what)
2746 {
2747 kind = &operand_check;
2748 str = "operand";
2749 }
2750 else
2751 {
2752 kind = &sse_check;
2753 str = "sse";
2754 }
2755
cb19c032
L
2756 SKIP_WHITESPACE ();
2757
2758 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2759 {
d02603dc
NC
2760 char *string;
2761 int e = get_symbol_name (&string);
cb19c032
L
2762
2763 if (strcmp (string, "none") == 0)
7bab8ab5 2764 *kind = check_none;
cb19c032 2765 else if (strcmp (string, "warning") == 0)
7bab8ab5 2766 *kind = check_warning;
cb19c032 2767 else if (strcmp (string, "error") == 0)
7bab8ab5 2768 *kind = check_error;
cb19c032 2769 else
7bab8ab5 2770 as_bad (_("bad argument to %s_check directive."), str);
d02603dc 2771 (void) restore_line_pointer (e);
cb19c032
L
2772 }
2773 else
7bab8ab5 2774 as_bad (_("missing argument for %s_check directive"), str);
cb19c032
L
2775
2776 demand_empty_rest_of_line ();
2777}
2778
8a9036a4
L
2779static void
2780check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
1e9cc1c2 2781 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
8a9036a4
L
2782{
2783#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2784 static const char *arch;
2785
2786 /* Intel LIOM is only supported on ELF. */
2787 if (!IS_ELF)
2788 return;
2789
2790 if (!arch)
2791 {
2792 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2793 use default_arch. */
2794 arch = cpu_arch_name;
2795 if (!arch)
2796 arch = default_arch;
2797 }
2798
81486035
L
2799 /* If we are targeting Intel MCU, we must enable it. */
2800 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2801 || new_flag.bitfield.cpuiamcu)
2802 return;
2803
3632d14b 2804 /* If we are targeting Intel L1OM, we must enable it. */
8a9036a4 2805 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
1e9cc1c2 2806 || new_flag.bitfield.cpul1om)
8a9036a4 2807 return;
76ba9986 2808
7a9068fe
L
2809 /* If we are targeting Intel K1OM, we must enable it. */
2810 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2811 || new_flag.bitfield.cpuk1om)
2812 return;
2813
8a9036a4
L
2814 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2815#endif
2816}
2817
e413e4e9 2818static void
e3bb37b5 2819set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
e413e4e9 2820{
47926f60 2821 SKIP_WHITESPACE ();
e413e4e9 2822
29b0f896 2823 if (!is_end_of_line[(unsigned char) *input_line_pointer])
e413e4e9 2824 {
d02603dc
NC
2825 char *string;
2826 int e = get_symbol_name (&string);
91d6fa6a 2827 unsigned int j;
40fb9820 2828 i386_cpu_flags flags;
e413e4e9 2829
91d6fa6a 2830 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
e413e4e9 2831 {
91d6fa6a 2832 if (strcmp (string, cpu_arch[j].name) == 0)
e413e4e9 2833 {
91d6fa6a 2834 check_cpu_arch_compatible (string, cpu_arch[j].flags);
8a9036a4 2835
5c6af06e
JB
2836 if (*string != '.')
2837 {
91d6fa6a 2838 cpu_arch_name = cpu_arch[j].name;
5c6af06e 2839 cpu_sub_arch_name = NULL;
91d6fa6a 2840 cpu_arch_flags = cpu_arch[j].flags;
40fb9820
L
2841 if (flag_code == CODE_64BIT)
2842 {
2843 cpu_arch_flags.bitfield.cpu64 = 1;
2844 cpu_arch_flags.bitfield.cpuno64 = 0;
2845 }
2846 else
2847 {
2848 cpu_arch_flags.bitfield.cpu64 = 0;
2849 cpu_arch_flags.bitfield.cpuno64 = 1;
2850 }
91d6fa6a
NC
2851 cpu_arch_isa = cpu_arch[j].type;
2852 cpu_arch_isa_flags = cpu_arch[j].flags;
ccc9c027
L
2853 if (!cpu_arch_tune_set)
2854 {
2855 cpu_arch_tune = cpu_arch_isa;
2856 cpu_arch_tune_flags = cpu_arch_isa_flags;
2857 }
5c6af06e
JB
2858 break;
2859 }
40fb9820 2860
293f5f65
L
2861 flags = cpu_flags_or (cpu_arch_flags,
2862 cpu_arch[j].flags);
81486035 2863
5b64d091 2864 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
5c6af06e 2865 {
6305a203
L
2866 if (cpu_sub_arch_name)
2867 {
2868 char *name = cpu_sub_arch_name;
2869 cpu_sub_arch_name = concat (name,
91d6fa6a 2870 cpu_arch[j].name,
1bf57e9f 2871 (const char *) NULL);
6305a203
L
2872 free (name);
2873 }
2874 else
91d6fa6a 2875 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
40fb9820 2876 cpu_arch_flags = flags;
a586129e 2877 cpu_arch_isa_flags = flags;
5c6af06e 2878 }
0089dace
L
2879 else
2880 cpu_arch_isa_flags
2881 = cpu_flags_or (cpu_arch_isa_flags,
2882 cpu_arch[j].flags);
d02603dc 2883 (void) restore_line_pointer (e);
5c6af06e
JB
2884 demand_empty_rest_of_line ();
2885 return;
e413e4e9
AM
2886 }
2887 }
293f5f65
L
2888
2889 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2890 {
33eaf5de 2891 /* Disable an ISA extension. */
293f5f65
L
2892 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2893 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2894 {
2895 flags = cpu_flags_and_not (cpu_arch_flags,
2896 cpu_noarch[j].flags);
2897 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2898 {
2899 if (cpu_sub_arch_name)
2900 {
2901 char *name = cpu_sub_arch_name;
2902 cpu_sub_arch_name = concat (name, string,
2903 (const char *) NULL);
2904 free (name);
2905 }
2906 else
2907 cpu_sub_arch_name = xstrdup (string);
2908 cpu_arch_flags = flags;
2909 cpu_arch_isa_flags = flags;
2910 }
2911 (void) restore_line_pointer (e);
2912 demand_empty_rest_of_line ();
2913 return;
2914 }
2915
2916 j = ARRAY_SIZE (cpu_arch);
2917 }
2918
91d6fa6a 2919 if (j >= ARRAY_SIZE (cpu_arch))
e413e4e9
AM
2920 as_bad (_("no such architecture: `%s'"), string);
2921
2922 *input_line_pointer = e;
2923 }
2924 else
2925 as_bad (_("missing cpu architecture"));
2926
fddf5b5b
AM
2927 no_cond_jump_promotion = 0;
2928 if (*input_line_pointer == ','
29b0f896 2929 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
fddf5b5b 2930 {
d02603dc
NC
2931 char *string;
2932 char e;
2933
2934 ++input_line_pointer;
2935 e = get_symbol_name (&string);
fddf5b5b
AM
2936
2937 if (strcmp (string, "nojumps") == 0)
2938 no_cond_jump_promotion = 1;
2939 else if (strcmp (string, "jumps") == 0)
2940 ;
2941 else
2942 as_bad (_("no such architecture modifier: `%s'"), string);
2943
d02603dc 2944 (void) restore_line_pointer (e);
fddf5b5b
AM
2945 }
2946
e413e4e9
AM
2947 demand_empty_rest_of_line ();
2948}
2949
8a9036a4
L
2950enum bfd_architecture
2951i386_arch (void)
2952{
3632d14b 2953 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4
L
2954 {
2955 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2956 || flag_code != CODE_64BIT)
2957 as_fatal (_("Intel L1OM is 64bit ELF only"));
2958 return bfd_arch_l1om;
2959 }
7a9068fe
L
2960 else if (cpu_arch_isa == PROCESSOR_K1OM)
2961 {
2962 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2963 || flag_code != CODE_64BIT)
2964 as_fatal (_("Intel K1OM is 64bit ELF only"));
2965 return bfd_arch_k1om;
2966 }
81486035
L
2967 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2968 {
2969 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2970 || flag_code == CODE_64BIT)
2971 as_fatal (_("Intel MCU is 32bit ELF only"));
2972 return bfd_arch_iamcu;
2973 }
8a9036a4
L
2974 else
2975 return bfd_arch_i386;
2976}
2977
b9d79e03 2978unsigned long
7016a5d5 2979i386_mach (void)
b9d79e03 2980{
351f65ca 2981 if (!strncmp (default_arch, "x86_64", 6))
8a9036a4 2982 {
3632d14b 2983 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4 2984 {
351f65ca
L
2985 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986 || default_arch[6] != '\0')
8a9036a4
L
2987 as_fatal (_("Intel L1OM is 64bit ELF only"));
2988 return bfd_mach_l1om;
2989 }
7a9068fe
L
2990 else if (cpu_arch_isa == PROCESSOR_K1OM)
2991 {
2992 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2993 || default_arch[6] != '\0')
2994 as_fatal (_("Intel K1OM is 64bit ELF only"));
2995 return bfd_mach_k1om;
2996 }
351f65ca 2997 else if (default_arch[6] == '\0')
8a9036a4 2998 return bfd_mach_x86_64;
351f65ca
L
2999 else
3000 return bfd_mach_x64_32;
8a9036a4 3001 }
5197d474
L
3002 else if (!strcmp (default_arch, "i386")
3003 || !strcmp (default_arch, "iamcu"))
81486035
L
3004 {
3005 if (cpu_arch_isa == PROCESSOR_IAMCU)
3006 {
3007 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3008 as_fatal (_("Intel MCU is 32bit ELF only"));
3009 return bfd_mach_i386_iamcu;
3010 }
3011 else
3012 return bfd_mach_i386_i386;
3013 }
b9d79e03 3014 else
2b5d6a91 3015 as_fatal (_("unknown architecture"));
b9d79e03 3016}
b9d79e03 3017\f
252b5132 3018void
7016a5d5 3019md_begin (void)
252b5132
RH
3020{
3021 const char *hash_err;
3022
86fa6981
L
3023 /* Support pseudo prefixes like {disp32}. */
3024 lex_type ['{'] = LEX_BEGIN_NAME;
3025
47926f60 3026 /* Initialize op_hash hash table. */
252b5132
RH
3027 op_hash = hash_new ();
3028
3029 {
d3ce72d0 3030 const insn_template *optab;
29b0f896 3031 templates *core_optab;
252b5132 3032
47926f60
KH
3033 /* Setup for loop. */
3034 optab = i386_optab;
add39d23 3035 core_optab = XNEW (templates);
252b5132
RH
3036 core_optab->start = optab;
3037
3038 while (1)
3039 {
3040 ++optab;
3041 if (optab->name == NULL
3042 || strcmp (optab->name, (optab - 1)->name) != 0)
3043 {
3044 /* different name --> ship out current template list;
47926f60 3045 add to hash table; & begin anew. */
252b5132
RH
3046 core_optab->end = optab;
3047 hash_err = hash_insert (op_hash,
3048 (optab - 1)->name,
5a49b8ac 3049 (void *) core_optab);
252b5132
RH
3050 if (hash_err)
3051 {
b37df7c4 3052 as_fatal (_("can't hash %s: %s"),
252b5132
RH
3053 (optab - 1)->name,
3054 hash_err);
3055 }
3056 if (optab->name == NULL)
3057 break;
add39d23 3058 core_optab = XNEW (templates);
252b5132
RH
3059 core_optab->start = optab;
3060 }
3061 }
3062 }
3063
47926f60 3064 /* Initialize reg_hash hash table. */
252b5132
RH
3065 reg_hash = hash_new ();
3066 {
29b0f896 3067 const reg_entry *regtab;
c3fe08fa 3068 unsigned int regtab_size = i386_regtab_size;
252b5132 3069
c3fe08fa 3070 for (regtab = i386_regtab; regtab_size--; regtab++)
252b5132 3071 {
5a49b8ac 3072 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
252b5132 3073 if (hash_err)
b37df7c4 3074 as_fatal (_("can't hash %s: %s"),
3e73aa7c
JH
3075 regtab->reg_name,
3076 hash_err);
252b5132
RH
3077 }
3078 }
3079
47926f60 3080 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
252b5132 3081 {
29b0f896
AM
3082 int c;
3083 char *p;
252b5132
RH
3084
3085 for (c = 0; c < 256; c++)
3086 {
3882b010 3087 if (ISDIGIT (c))
252b5132
RH
3088 {
3089 digit_chars[c] = c;
3090 mnemonic_chars[c] = c;
3091 register_chars[c] = c;
3092 operand_chars[c] = c;
3093 }
3882b010 3094 else if (ISLOWER (c))
252b5132
RH
3095 {
3096 mnemonic_chars[c] = c;
3097 register_chars[c] = c;
3098 operand_chars[c] = c;
3099 }
3882b010 3100 else if (ISUPPER (c))
252b5132 3101 {
3882b010 3102 mnemonic_chars[c] = TOLOWER (c);
252b5132
RH
3103 register_chars[c] = mnemonic_chars[c];
3104 operand_chars[c] = c;
3105 }
43234a1e 3106 else if (c == '{' || c == '}')
86fa6981
L
3107 {
3108 mnemonic_chars[c] = c;
3109 operand_chars[c] = c;
3110 }
252b5132 3111
3882b010 3112 if (ISALPHA (c) || ISDIGIT (c))
252b5132
RH
3113 identifier_chars[c] = c;
3114 else if (c >= 128)
3115 {
3116 identifier_chars[c] = c;
3117 operand_chars[c] = c;
3118 }
3119 }
3120
3121#ifdef LEX_AT
3122 identifier_chars['@'] = '@';
32137342
NC
3123#endif
3124#ifdef LEX_QM
3125 identifier_chars['?'] = '?';
3126 operand_chars['?'] = '?';
252b5132 3127#endif
252b5132 3128 digit_chars['-'] = '-';
c0f3af97 3129 mnemonic_chars['_'] = '_';
791fe849 3130 mnemonic_chars['-'] = '-';
0003779b 3131 mnemonic_chars['.'] = '.';
252b5132
RH
3132 identifier_chars['_'] = '_';
3133 identifier_chars['.'] = '.';
3134
3135 for (p = operand_special_chars; *p != '\0'; p++)
3136 operand_chars[(unsigned char) *p] = *p;
3137 }
3138
a4447b93
RH
3139 if (flag_code == CODE_64BIT)
3140 {
ca19b261
KT
3141#if defined (OBJ_COFF) && defined (TE_PE)
3142 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3143 ? 32 : 16);
3144#else
a4447b93 3145 x86_dwarf2_return_column = 16;
ca19b261 3146#endif
61ff971f 3147 x86_cie_data_alignment = -8;
a4447b93
RH
3148 }
3149 else
3150 {
3151 x86_dwarf2_return_column = 8;
3152 x86_cie_data_alignment = -4;
3153 }
e379e5f3
L
3154
3155 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3156 can be turned into BRANCH_PREFIX frag. */
3157 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3158 abort ();
252b5132
RH
3159}
3160
3161void
e3bb37b5 3162i386_print_statistics (FILE *file)
252b5132
RH
3163{
3164 hash_print_statistics (file, "i386 opcode", op_hash);
3165 hash_print_statistics (file, "i386 register", reg_hash);
3166}
3167\f
252b5132
RH
3168#ifdef DEBUG386
3169
ce8a8b2f 3170/* Debugging routines for md_assemble. */
d3ce72d0 3171static void pte (insn_template *);
40fb9820 3172static void pt (i386_operand_type);
e3bb37b5
L
3173static void pe (expressionS *);
3174static void ps (symbolS *);
252b5132
RH
3175
3176static void
2c703856 3177pi (const char *line, i386_insn *x)
252b5132 3178{
09137c09 3179 unsigned int j;
252b5132
RH
3180
3181 fprintf (stdout, "%s: template ", line);
3182 pte (&x->tm);
09f131f2
JH
3183 fprintf (stdout, " address: base %s index %s scale %x\n",
3184 x->base_reg ? x->base_reg->reg_name : "none",
3185 x->index_reg ? x->index_reg->reg_name : "none",
3186 x->log2_scale_factor);
3187 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
252b5132 3188 x->rm.mode, x->rm.reg, x->rm.regmem);
09f131f2
JH
3189 fprintf (stdout, " sib: base %x index %x scale %x\n",
3190 x->sib.base, x->sib.index, x->sib.scale);
3191 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
161a04f6
L
3192 (x->rex & REX_W) != 0,
3193 (x->rex & REX_R) != 0,
3194 (x->rex & REX_X) != 0,
3195 (x->rex & REX_B) != 0);
09137c09 3196 for (j = 0; j < x->operands; j++)
252b5132 3197 {
09137c09
SP
3198 fprintf (stdout, " #%d: ", j + 1);
3199 pt (x->types[j]);
252b5132 3200 fprintf (stdout, "\n");
bab6aec1 3201 if (x->types[j].bitfield.class == Reg
3528c362
JB
3202 || x->types[j].bitfield.class == RegMMX
3203 || x->types[j].bitfield.class == RegSIMD
dd6b8a0b 3204 || x->types[j].bitfield.class == RegMask
00cee14f 3205 || x->types[j].bitfield.class == SReg
4a5c67ed
JB
3206 || x->types[j].bitfield.class == RegCR
3207 || x->types[j].bitfield.class == RegDR
dd6b8a0b
JB
3208 || x->types[j].bitfield.class == RegTR
3209 || x->types[j].bitfield.class == RegBND)
09137c09
SP
3210 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3211 if (operand_type_check (x->types[j], imm))
3212 pe (x->op[j].imms);
3213 if (operand_type_check (x->types[j], disp))
3214 pe (x->op[j].disps);
252b5132
RH
3215 }
3216}
3217
3218static void
d3ce72d0 3219pte (insn_template *t)
252b5132 3220{
09137c09 3221 unsigned int j;
252b5132 3222 fprintf (stdout, " %d operands ", t->operands);
47926f60 3223 fprintf (stdout, "opcode %x ", t->base_opcode);
252b5132
RH
3224 if (t->extension_opcode != None)
3225 fprintf (stdout, "ext %x ", t->extension_opcode);
40fb9820 3226 if (t->opcode_modifier.d)
252b5132 3227 fprintf (stdout, "D");
40fb9820 3228 if (t->opcode_modifier.w)
252b5132
RH
3229 fprintf (stdout, "W");
3230 fprintf (stdout, "\n");
09137c09 3231 for (j = 0; j < t->operands; j++)
252b5132 3232 {
09137c09
SP
3233 fprintf (stdout, " #%d type ", j + 1);
3234 pt (t->operand_types[j]);
252b5132
RH
3235 fprintf (stdout, "\n");
3236 }
3237}
3238
3239static void
e3bb37b5 3240pe (expressionS *e)
252b5132 3241{
24eab124 3242 fprintf (stdout, " operation %d\n", e->X_op);
b77ad1d4
AM
3243 fprintf (stdout, " add_number %ld (%lx)\n",
3244 (long) e->X_add_number, (long) e->X_add_number);
252b5132
RH
3245 if (e->X_add_symbol)
3246 {
3247 fprintf (stdout, " add_symbol ");
3248 ps (e->X_add_symbol);
3249 fprintf (stdout, "\n");
3250 }
3251 if (e->X_op_symbol)
3252 {
3253 fprintf (stdout, " op_symbol ");
3254 ps (e->X_op_symbol);
3255 fprintf (stdout, "\n");
3256 }
3257}
3258
3259static void
e3bb37b5 3260ps (symbolS *s)
252b5132
RH
3261{
3262 fprintf (stdout, "%s type %s%s",
3263 S_GET_NAME (s),
3264 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3265 segment_name (S_GET_SEGMENT (s)));
3266}
3267
7b81dfbb 3268static struct type_name
252b5132 3269 {
40fb9820
L
3270 i386_operand_type mask;
3271 const char *name;
252b5132 3272 }
7b81dfbb 3273const type_names[] =
252b5132 3274{
40fb9820
L
3275 { OPERAND_TYPE_REG8, "r8" },
3276 { OPERAND_TYPE_REG16, "r16" },
3277 { OPERAND_TYPE_REG32, "r32" },
3278 { OPERAND_TYPE_REG64, "r64" },
2c703856
JB
3279 { OPERAND_TYPE_ACC8, "acc8" },
3280 { OPERAND_TYPE_ACC16, "acc16" },
3281 { OPERAND_TYPE_ACC32, "acc32" },
3282 { OPERAND_TYPE_ACC64, "acc64" },
40fb9820
L
3283 { OPERAND_TYPE_IMM8, "i8" },
3284 { OPERAND_TYPE_IMM8, "i8s" },
3285 { OPERAND_TYPE_IMM16, "i16" },
3286 { OPERAND_TYPE_IMM32, "i32" },
3287 { OPERAND_TYPE_IMM32S, "i32s" },
3288 { OPERAND_TYPE_IMM64, "i64" },
3289 { OPERAND_TYPE_IMM1, "i1" },
3290 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3291 { OPERAND_TYPE_DISP8, "d8" },
3292 { OPERAND_TYPE_DISP16, "d16" },
3293 { OPERAND_TYPE_DISP32, "d32" },
3294 { OPERAND_TYPE_DISP32S, "d32s" },
3295 { OPERAND_TYPE_DISP64, "d64" },
3296 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3297 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3298 { OPERAND_TYPE_CONTROL, "control reg" },
3299 { OPERAND_TYPE_TEST, "test reg" },
3300 { OPERAND_TYPE_DEBUG, "debug reg" },
3301 { OPERAND_TYPE_FLOATREG, "FReg" },
3302 { OPERAND_TYPE_FLOATACC, "FAcc" },
21df382b 3303 { OPERAND_TYPE_SREG, "SReg" },
40fb9820
L
3304 { OPERAND_TYPE_REGMMX, "rMMX" },
3305 { OPERAND_TYPE_REGXMM, "rXMM" },
0349dc08 3306 { OPERAND_TYPE_REGYMM, "rYMM" },
43234a1e
L
3307 { OPERAND_TYPE_REGZMM, "rZMM" },
3308 { OPERAND_TYPE_REGMASK, "Mask reg" },
252b5132
RH
3309};
3310
3311static void
40fb9820 3312pt (i386_operand_type t)
252b5132 3313{
40fb9820 3314 unsigned int j;
c6fb90c8 3315 i386_operand_type a;
252b5132 3316
40fb9820 3317 for (j = 0; j < ARRAY_SIZE (type_names); j++)
c6fb90c8
L
3318 {
3319 a = operand_type_and (t, type_names[j].mask);
2c703856 3320 if (operand_type_equal (&a, &type_names[j].mask))
c6fb90c8
L
3321 fprintf (stdout, "%s, ", type_names[j].name);
3322 }
252b5132
RH
3323 fflush (stdout);
3324}
3325
3326#endif /* DEBUG386 */
3327\f
252b5132 3328static bfd_reloc_code_real_type
3956db08 3329reloc (unsigned int size,
64e74474
AM
3330 int pcrel,
3331 int sign,
3332 bfd_reloc_code_real_type other)
252b5132 3333{
47926f60 3334 if (other != NO_RELOC)
3956db08 3335 {
91d6fa6a 3336 reloc_howto_type *rel;
3956db08
JB
3337
3338 if (size == 8)
3339 switch (other)
3340 {
64e74474
AM
3341 case BFD_RELOC_X86_64_GOT32:
3342 return BFD_RELOC_X86_64_GOT64;
3343 break;
553d1284
L
3344 case BFD_RELOC_X86_64_GOTPLT64:
3345 return BFD_RELOC_X86_64_GOTPLT64;
3346 break;
64e74474
AM
3347 case BFD_RELOC_X86_64_PLTOFF64:
3348 return BFD_RELOC_X86_64_PLTOFF64;
3349 break;
3350 case BFD_RELOC_X86_64_GOTPC32:
3351 other = BFD_RELOC_X86_64_GOTPC64;
3352 break;
3353 case BFD_RELOC_X86_64_GOTPCREL:
3354 other = BFD_RELOC_X86_64_GOTPCREL64;
3355 break;
3356 case BFD_RELOC_X86_64_TPOFF32:
3357 other = BFD_RELOC_X86_64_TPOFF64;
3358 break;
3359 case BFD_RELOC_X86_64_DTPOFF32:
3360 other = BFD_RELOC_X86_64_DTPOFF64;
3361 break;
3362 default:
3363 break;
3956db08 3364 }
e05278af 3365
8ce3d284 3366#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
3367 if (other == BFD_RELOC_SIZE32)
3368 {
3369 if (size == 8)
1ab668bf 3370 other = BFD_RELOC_SIZE64;
8fd4256d 3371 if (pcrel)
1ab668bf
AM
3372 {
3373 as_bad (_("there are no pc-relative size relocations"));
3374 return NO_RELOC;
3375 }
8fd4256d 3376 }
8ce3d284 3377#endif
8fd4256d 3378
e05278af 3379 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
f2d8a97c 3380 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
e05278af
JB
3381 sign = -1;
3382
91d6fa6a
NC
3383 rel = bfd_reloc_type_lookup (stdoutput, other);
3384 if (!rel)
3956db08 3385 as_bad (_("unknown relocation (%u)"), other);
91d6fa6a 3386 else if (size != bfd_get_reloc_size (rel))
3956db08 3387 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
91d6fa6a 3388 bfd_get_reloc_size (rel),
3956db08 3389 size);
91d6fa6a 3390 else if (pcrel && !rel->pc_relative)
3956db08 3391 as_bad (_("non-pc-relative relocation for pc-relative field"));
91d6fa6a 3392 else if ((rel->complain_on_overflow == complain_overflow_signed
3956db08 3393 && !sign)
91d6fa6a 3394 || (rel->complain_on_overflow == complain_overflow_unsigned
64e74474 3395 && sign > 0))
3956db08
JB
3396 as_bad (_("relocated field and relocation type differ in signedness"));
3397 else
3398 return other;
3399 return NO_RELOC;
3400 }
252b5132
RH
3401
3402 if (pcrel)
3403 {
3e73aa7c 3404 if (!sign)
3956db08 3405 as_bad (_("there are no unsigned pc-relative relocations"));
252b5132
RH
3406 switch (size)
3407 {
3408 case 1: return BFD_RELOC_8_PCREL;
3409 case 2: return BFD_RELOC_16_PCREL;
d258b828 3410 case 4: return BFD_RELOC_32_PCREL;
d6ab8113 3411 case 8: return BFD_RELOC_64_PCREL;
252b5132 3412 }
3956db08 3413 as_bad (_("cannot do %u byte pc-relative relocation"), size);
252b5132
RH
3414 }
3415 else
3416 {
3956db08 3417 if (sign > 0)
e5cb08ac 3418 switch (size)
3e73aa7c
JH
3419 {
3420 case 4: return BFD_RELOC_X86_64_32S;
3421 }
3422 else
3423 switch (size)
3424 {
3425 case 1: return BFD_RELOC_8;
3426 case 2: return BFD_RELOC_16;
3427 case 4: return BFD_RELOC_32;
3428 case 8: return BFD_RELOC_64;
3429 }
3956db08
JB
3430 as_bad (_("cannot do %s %u byte relocation"),
3431 sign > 0 ? "signed" : "unsigned", size);
252b5132
RH
3432 }
3433
0cc9e1d3 3434 return NO_RELOC;
252b5132
RH
3435}
3436
47926f60
KH
3437/* Here we decide which fixups can be adjusted to make them relative to
3438 the beginning of the section instead of the symbol. Basically we need
3439 to make sure that the dynamic relocations are done correctly, so in
3440 some cases we force the original symbol to be used. */
3441
252b5132 3442int
e3bb37b5 3443tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
252b5132 3444{
6d249963 3445#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 3446 if (!IS_ELF)
31312f95
AM
3447 return 1;
3448
a161fe53
AM
3449 /* Don't adjust pc-relative references to merge sections in 64-bit
3450 mode. */
3451 if (use_rela_relocations
3452 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3453 && fixP->fx_pcrel)
252b5132 3454 return 0;
31312f95 3455
8d01d9a9
AJ
3456 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3457 and changed later by validate_fix. */
3458 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3459 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3460 return 0;
3461
8fd4256d
L
3462 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3463 for size relocations. */
3464 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3465 || fixP->fx_r_type == BFD_RELOC_SIZE64
3466 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
252b5132 3467 || fixP->fx_r_type == BFD_RELOC_386_GOT32
02a86693 3468 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
13ae64f3
JJ
3469 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3470 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3471 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3472 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
37e55690
JJ
3473 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3474 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
13ae64f3
JJ
3475 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3476 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
67a4f2b7
AO
3477 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3478 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3e73aa7c 3479 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
80b3ee89 3480 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
56ceb5b5
L
3481 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3482 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
bffbf940
JJ
3483 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3484 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3485 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
d6ab8113 3486 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
bffbf940
JJ
3487 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3488 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
d6ab8113
JB
3489 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3490 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
67a4f2b7
AO
3491 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3492 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
252b5132
RH
3493 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3494 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3495 return 0;
31312f95 3496#endif
252b5132
RH
3497 return 1;
3498}
252b5132 3499
b4cac588 3500static int
e3bb37b5 3501intel_float_operand (const char *mnemonic)
252b5132 3502{
9306ca4a
JB
3503 /* Note that the value returned is meaningful only for opcodes with (memory)
3504 operands, hence the code here is free to improperly handle opcodes that
3505 have no operands (for better performance and smaller code). */
3506
3507 if (mnemonic[0] != 'f')
3508 return 0; /* non-math */
3509
3510 switch (mnemonic[1])
3511 {
3512 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3513 the fs segment override prefix not currently handled because no
3514 call path can make opcodes without operands get here */
3515 case 'i':
3516 return 2 /* integer op */;
3517 case 'l':
3518 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3519 return 3; /* fldcw/fldenv */
3520 break;
3521 case 'n':
3522 if (mnemonic[2] != 'o' /* fnop */)
3523 return 3; /* non-waiting control op */
3524 break;
3525 case 'r':
3526 if (mnemonic[2] == 's')
3527 return 3; /* frstor/frstpm */
3528 break;
3529 case 's':
3530 if (mnemonic[2] == 'a')
3531 return 3; /* fsave */
3532 if (mnemonic[2] == 't')
3533 {
3534 switch (mnemonic[3])
3535 {
3536 case 'c': /* fstcw */
3537 case 'd': /* fstdw */
3538 case 'e': /* fstenv */
3539 case 's': /* fsts[gw] */
3540 return 3;
3541 }
3542 }
3543 break;
3544 case 'x':
3545 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3546 return 0; /* fxsave/fxrstor are not really math ops */
3547 break;
3548 }
252b5132 3549
9306ca4a 3550 return 1;
252b5132
RH
3551}
3552
c0f3af97
L
3553/* Build the VEX prefix. */
3554
3555static void
d3ce72d0 3556build_vex_prefix (const insn_template *t)
c0f3af97
L
3557{
3558 unsigned int register_specifier;
3559 unsigned int implied_prefix;
3560 unsigned int vector_length;
03751133 3561 unsigned int w;
c0f3af97
L
3562
3563 /* Check register specifier. */
3564 if (i.vex.register_specifier)
43234a1e
L
3565 {
3566 register_specifier =
3567 ~register_number (i.vex.register_specifier) & 0xf;
3568 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3569 }
c0f3af97
L
3570 else
3571 register_specifier = 0xf;
3572
79f0fa25
L
3573 /* Use 2-byte VEX prefix by swapping destination and source operand
3574 if there are more than 1 register operand. */
3575 if (i.reg_operands > 1
3576 && i.vec_encoding != vex_encoding_vex3
86fa6981 3577 && i.dir_encoding == dir_encoding_default
fa99fab2 3578 && i.operands == i.reg_operands
dbbc8b7e 3579 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
7f399153 3580 && i.tm.opcode_modifier.vexopcode == VEX0F
dbbc8b7e 3581 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
fa99fab2
L
3582 && i.rex == REX_B)
3583 {
3584 unsigned int xchg = i.operands - 1;
3585 union i386_op temp_op;
3586 i386_operand_type temp_type;
3587
3588 temp_type = i.types[xchg];
3589 i.types[xchg] = i.types[0];
3590 i.types[0] = temp_type;
3591 temp_op = i.op[xchg];
3592 i.op[xchg] = i.op[0];
3593 i.op[0] = temp_op;
3594
9c2799c2 3595 gas_assert (i.rm.mode == 3);
fa99fab2
L
3596
3597 i.rex = REX_R;
3598 xchg = i.rm.regmem;
3599 i.rm.regmem = i.rm.reg;
3600 i.rm.reg = xchg;
3601
dbbc8b7e
JB
3602 if (i.tm.opcode_modifier.d)
3603 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3604 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3605 else /* Use the next insn. */
3606 i.tm = t[1];
fa99fab2
L
3607 }
3608
79dec6b7
JB
3609 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3610 are no memory operands and at least 3 register ones. */
3611 if (i.reg_operands >= 3
3612 && i.vec_encoding != vex_encoding_vex3
3613 && i.reg_operands == i.operands - i.imm_operands
3614 && i.tm.opcode_modifier.vex
3615 && i.tm.opcode_modifier.commutative
3616 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3617 && i.rex == REX_B
3618 && i.vex.register_specifier
3619 && !(i.vex.register_specifier->reg_flags & RegRex))
3620 {
3621 unsigned int xchg = i.operands - i.reg_operands;
3622 union i386_op temp_op;
3623 i386_operand_type temp_type;
3624
3625 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3626 gas_assert (!i.tm.opcode_modifier.sae);
3627 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3628 &i.types[i.operands - 3]));
3629 gas_assert (i.rm.mode == 3);
3630
3631 temp_type = i.types[xchg];
3632 i.types[xchg] = i.types[xchg + 1];
3633 i.types[xchg + 1] = temp_type;
3634 temp_op = i.op[xchg];
3635 i.op[xchg] = i.op[xchg + 1];
3636 i.op[xchg + 1] = temp_op;
3637
3638 i.rex = 0;
3639 xchg = i.rm.regmem | 8;
3640 i.rm.regmem = ~register_specifier & 0xf;
3641 gas_assert (!(i.rm.regmem & 8));
3642 i.vex.register_specifier += xchg - i.rm.regmem;
3643 register_specifier = ~xchg & 0xf;
3644 }
3645
539f890d
L
3646 if (i.tm.opcode_modifier.vex == VEXScalar)
3647 vector_length = avxscalar;
10c17abd
JB
3648 else if (i.tm.opcode_modifier.vex == VEX256)
3649 vector_length = 1;
539f890d 3650 else
10c17abd 3651 {
56522fc5 3652 unsigned int op;
10c17abd 3653
c7213af9
L
3654 /* Determine vector length from the last multi-length vector
3655 operand. */
10c17abd 3656 vector_length = 0;
56522fc5 3657 for (op = t->operands; op--;)
10c17abd
JB
3658 if (t->operand_types[op].bitfield.xmmword
3659 && t->operand_types[op].bitfield.ymmword
3660 && i.types[op].bitfield.ymmword)
3661 {
3662 vector_length = 1;
3663 break;
3664 }
3665 }
c0f3af97
L
3666
3667 switch ((i.tm.base_opcode >> 8) & 0xff)
3668 {
3669 case 0:
3670 implied_prefix = 0;
3671 break;
3672 case DATA_PREFIX_OPCODE:
3673 implied_prefix = 1;
3674 break;
3675 case REPE_PREFIX_OPCODE:
3676 implied_prefix = 2;
3677 break;
3678 case REPNE_PREFIX_OPCODE:
3679 implied_prefix = 3;
3680 break;
3681 default:
3682 abort ();
3683 }
3684
03751133
L
3685 /* Check the REX.W bit and VEXW. */
3686 if (i.tm.opcode_modifier.vexw == VEXWIG)
3687 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3688 else if (i.tm.opcode_modifier.vexw)
3689 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3690 else
931d03b7 3691 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
03751133 3692
c0f3af97 3693 /* Use 2-byte VEX prefix if possible. */
03751133
L
3694 if (w == 0
3695 && i.vec_encoding != vex_encoding_vex3
86fa6981 3696 && i.tm.opcode_modifier.vexopcode == VEX0F
c0f3af97
L
3697 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3698 {
3699 /* 2-byte VEX prefix. */
3700 unsigned int r;
3701
3702 i.vex.length = 2;
3703 i.vex.bytes[0] = 0xc5;
3704
3705 /* Check the REX.R bit. */
3706 r = (i.rex & REX_R) ? 0 : 1;
3707 i.vex.bytes[1] = (r << 7
3708 | register_specifier << 3
3709 | vector_length << 2
3710 | implied_prefix);
3711 }
3712 else
3713 {
3714 /* 3-byte VEX prefix. */
03751133 3715 unsigned int m;
c0f3af97 3716
f88c9eb0 3717 i.vex.length = 3;
f88c9eb0 3718
7f399153 3719 switch (i.tm.opcode_modifier.vexopcode)
5dd85c99 3720 {
7f399153
L
3721 case VEX0F:
3722 m = 0x1;
80de6e00 3723 i.vex.bytes[0] = 0xc4;
7f399153
L
3724 break;
3725 case VEX0F38:
3726 m = 0x2;
80de6e00 3727 i.vex.bytes[0] = 0xc4;
7f399153
L
3728 break;
3729 case VEX0F3A:
3730 m = 0x3;
80de6e00 3731 i.vex.bytes[0] = 0xc4;
7f399153
L
3732 break;
3733 case XOP08:
5dd85c99
SP
3734 m = 0x8;
3735 i.vex.bytes[0] = 0x8f;
7f399153
L
3736 break;
3737 case XOP09:
f88c9eb0
SP
3738 m = 0x9;
3739 i.vex.bytes[0] = 0x8f;
7f399153
L
3740 break;
3741 case XOP0A:
f88c9eb0
SP
3742 m = 0xa;
3743 i.vex.bytes[0] = 0x8f;
7f399153
L
3744 break;
3745 default:
3746 abort ();
f88c9eb0 3747 }
c0f3af97 3748
c0f3af97
L
3749 /* The high 3 bits of the second VEX byte are 1's compliment
3750 of RXB bits from REX. */
3751 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3752
c0f3af97
L
3753 i.vex.bytes[2] = (w << 7
3754 | register_specifier << 3
3755 | vector_length << 2
3756 | implied_prefix);
3757 }
3758}
3759
e771e7c9
JB
3760static INLINE bfd_boolean
3761is_evex_encoding (const insn_template *t)
3762{
7091c612 3763 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
e771e7c9 3764 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
a80195f1 3765 || t->opcode_modifier.sae;
e771e7c9
JB
3766}
3767
7a8655d2
JB
3768static INLINE bfd_boolean
3769is_any_vex_encoding (const insn_template *t)
3770{
3771 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3772 || is_evex_encoding (t);
3773}
3774
43234a1e
L
3775/* Build the EVEX prefix. */
3776
3777static void
3778build_evex_prefix (void)
3779{
3780 unsigned int register_specifier;
3781 unsigned int implied_prefix;
3782 unsigned int m, w;
3783 rex_byte vrex_used = 0;
3784
3785 /* Check register specifier. */
3786 if (i.vex.register_specifier)
3787 {
3788 gas_assert ((i.vrex & REX_X) == 0);
3789
3790 register_specifier = i.vex.register_specifier->reg_num;
3791 if ((i.vex.register_specifier->reg_flags & RegRex))
3792 register_specifier += 8;
3793 /* The upper 16 registers are encoded in the fourth byte of the
3794 EVEX prefix. */
3795 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3796 i.vex.bytes[3] = 0x8;
3797 register_specifier = ~register_specifier & 0xf;
3798 }
3799 else
3800 {
3801 register_specifier = 0xf;
3802
3803 /* Encode upper 16 vector index register in the fourth byte of
3804 the EVEX prefix. */
3805 if (!(i.vrex & REX_X))
3806 i.vex.bytes[3] = 0x8;
3807 else
3808 vrex_used |= REX_X;
3809 }
3810
3811 switch ((i.tm.base_opcode >> 8) & 0xff)
3812 {
3813 case 0:
3814 implied_prefix = 0;
3815 break;
3816 case DATA_PREFIX_OPCODE:
3817 implied_prefix = 1;
3818 break;
3819 case REPE_PREFIX_OPCODE:
3820 implied_prefix = 2;
3821 break;
3822 case REPNE_PREFIX_OPCODE:
3823 implied_prefix = 3;
3824 break;
3825 default:
3826 abort ();
3827 }
3828
3829 /* 4 byte EVEX prefix. */
3830 i.vex.length = 4;
3831 i.vex.bytes[0] = 0x62;
3832
3833 /* mmmm bits. */
3834 switch (i.tm.opcode_modifier.vexopcode)
3835 {
3836 case VEX0F:
3837 m = 1;
3838 break;
3839 case VEX0F38:
3840 m = 2;
3841 break;
3842 case VEX0F3A:
3843 m = 3;
3844 break;
3845 default:
3846 abort ();
3847 break;
3848 }
3849
3850 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3851 bits from REX. */
3852 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3853
3854 /* The fifth bit of the second EVEX byte is 1's compliment of the
3855 REX_R bit in VREX. */
3856 if (!(i.vrex & REX_R))
3857 i.vex.bytes[1] |= 0x10;
3858 else
3859 vrex_used |= REX_R;
3860
3861 if ((i.reg_operands + i.imm_operands) == i.operands)
3862 {
3863 /* When all operands are registers, the REX_X bit in REX is not
3864 used. We reuse it to encode the upper 16 registers, which is
3865 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3866 as 1's compliment. */
3867 if ((i.vrex & REX_B))
3868 {
3869 vrex_used |= REX_B;
3870 i.vex.bytes[1] &= ~0x40;
3871 }
3872 }
3873
3874 /* EVEX instructions shouldn't need the REX prefix. */
3875 i.vrex &= ~vrex_used;
3876 gas_assert (i.vrex == 0);
3877
6865c043
L
3878 /* Check the REX.W bit and VEXW. */
3879 if (i.tm.opcode_modifier.vexw == VEXWIG)
3880 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3881 else if (i.tm.opcode_modifier.vexw)
3882 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3883 else
931d03b7 3884 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
43234a1e
L
3885
3886 /* Encode the U bit. */
3887 implied_prefix |= 0x4;
3888
3889 /* The third byte of the EVEX prefix. */
3890 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3891
3892 /* The fourth byte of the EVEX prefix. */
3893 /* The zeroing-masking bit. */
3894 if (i.mask && i.mask->zeroing)
3895 i.vex.bytes[3] |= 0x80;
3896
3897 /* Don't always set the broadcast bit if there is no RC. */
3898 if (!i.rounding)
3899 {
3900 /* Encode the vector length. */
3901 unsigned int vec_length;
3902
e771e7c9
JB
3903 if (!i.tm.opcode_modifier.evex
3904 || i.tm.opcode_modifier.evex == EVEXDYN)
3905 {
56522fc5 3906 unsigned int op;
e771e7c9 3907
c7213af9
L
3908 /* Determine vector length from the last multi-length vector
3909 operand. */
56522fc5 3910 for (op = i.operands; op--;)
e771e7c9
JB
3911 if (i.tm.operand_types[op].bitfield.xmmword
3912 + i.tm.operand_types[op].bitfield.ymmword
3913 + i.tm.operand_types[op].bitfield.zmmword > 1)
3914 {
3915 if (i.types[op].bitfield.zmmword)
c7213af9
L
3916 {
3917 i.tm.opcode_modifier.evex = EVEX512;
3918 break;
3919 }
e771e7c9 3920 else if (i.types[op].bitfield.ymmword)
c7213af9
L
3921 {
3922 i.tm.opcode_modifier.evex = EVEX256;
3923 break;
3924 }
e771e7c9 3925 else if (i.types[op].bitfield.xmmword)
c7213af9
L
3926 {
3927 i.tm.opcode_modifier.evex = EVEX128;
3928 break;
3929 }
625cbd7a
JB
3930 else if (i.broadcast && (int) op == i.broadcast->operand)
3931 {
4a1b91ea 3932 switch (i.broadcast->bytes)
625cbd7a
JB
3933 {
3934 case 64:
3935 i.tm.opcode_modifier.evex = EVEX512;
3936 break;
3937 case 32:
3938 i.tm.opcode_modifier.evex = EVEX256;
3939 break;
3940 case 16:
3941 i.tm.opcode_modifier.evex = EVEX128;
3942 break;
3943 default:
c7213af9 3944 abort ();
625cbd7a 3945 }
c7213af9 3946 break;
625cbd7a 3947 }
e771e7c9 3948 }
c7213af9 3949
56522fc5 3950 if (op >= MAX_OPERANDS)
c7213af9 3951 abort ();
e771e7c9
JB
3952 }
3953
43234a1e
L
3954 switch (i.tm.opcode_modifier.evex)
3955 {
3956 case EVEXLIG: /* LL' is ignored */
3957 vec_length = evexlig << 5;
3958 break;
3959 case EVEX128:
3960 vec_length = 0 << 5;
3961 break;
3962 case EVEX256:
3963 vec_length = 1 << 5;
3964 break;
3965 case EVEX512:
3966 vec_length = 2 << 5;
3967 break;
3968 default:
3969 abort ();
3970 break;
3971 }
3972 i.vex.bytes[3] |= vec_length;
3973 /* Encode the broadcast bit. */
3974 if (i.broadcast)
3975 i.vex.bytes[3] |= 0x10;
3976 }
3977 else
3978 {
3979 if (i.rounding->type != saeonly)
3980 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3981 else
d3d3c6db 3982 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
43234a1e
L
3983 }
3984
3985 if (i.mask && i.mask->mask)
3986 i.vex.bytes[3] |= i.mask->mask->reg_num;
3987}
3988
65da13b5
L
3989static void
3990process_immext (void)
3991{
3992 expressionS *exp;
3993
c0f3af97 3994 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
65da13b5
L
3995 which is coded in the same place as an 8-bit immediate field
3996 would be. Here we fake an 8-bit immediate operand from the
3997 opcode suffix stored in tm.extension_opcode.
3998
c1e679ec 3999 AVX instructions also use this encoding, for some of
c0f3af97 4000 3 argument instructions. */
65da13b5 4001
43234a1e 4002 gas_assert (i.imm_operands <= 1
7ab9ffdd 4003 && (i.operands <= 2
7a8655d2 4004 || (is_any_vex_encoding (&i.tm)
7ab9ffdd 4005 && i.operands <= 4)));
65da13b5
L
4006
4007 exp = &im_expressions[i.imm_operands++];
4008 i.op[i.operands].imms = exp;
4009 i.types[i.operands] = imm8;
4010 i.operands++;
4011 exp->X_op = O_constant;
4012 exp->X_add_number = i.tm.extension_opcode;
4013 i.tm.extension_opcode = None;
4014}
4015
42164a71
L
4016
4017static int
4018check_hle (void)
4019{
4020 switch (i.tm.opcode_modifier.hleprefixok)
4021 {
4022 default:
4023 abort ();
82c2def5 4024 case HLEPrefixNone:
165de32a
L
4025 as_bad (_("invalid instruction `%s' after `%s'"),
4026 i.tm.name, i.hle_prefix);
42164a71 4027 return 0;
82c2def5 4028 case HLEPrefixLock:
42164a71
L
4029 if (i.prefix[LOCK_PREFIX])
4030 return 1;
165de32a 4031 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
42164a71 4032 return 0;
82c2def5 4033 case HLEPrefixAny:
42164a71 4034 return 1;
82c2def5 4035 case HLEPrefixRelease:
42164a71
L
4036 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4037 {
4038 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4039 i.tm.name);
4040 return 0;
4041 }
8dc0818e 4042 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
42164a71
L
4043 {
4044 as_bad (_("memory destination needed for instruction `%s'"
4045 " after `xrelease'"), i.tm.name);
4046 return 0;
4047 }
4048 return 1;
4049 }
4050}
4051
b6f8c7c4
L
4052/* Try the shortest encoding by shortening operand size. */
4053
4054static void
4055optimize_encoding (void)
4056{
a0a1771e 4057 unsigned int j;
b6f8c7c4
L
4058
4059 if (optimize_for_space
72aea328 4060 && !is_any_vex_encoding (&i.tm)
b6f8c7c4
L
4061 && i.reg_operands == 1
4062 && i.imm_operands == 1
4063 && !i.types[1].bitfield.byte
4064 && i.op[0].imms->X_op == O_constant
4065 && fits_in_imm7 (i.op[0].imms->X_add_number)
72aea328 4066 && (i.tm.base_opcode == 0xa8
b6f8c7c4
L
4067 || (i.tm.base_opcode == 0xf6
4068 && i.tm.extension_opcode == 0x0)))
4069 {
4070 /* Optimize: -Os:
4071 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4072 */
4073 unsigned int base_regnum = i.op[1].regs->reg_num;
4074 if (flag_code == CODE_64BIT || base_regnum < 4)
4075 {
4076 i.types[1].bitfield.byte = 1;
4077 /* Ignore the suffix. */
4078 i.suffix = 0;
7697afb6
JB
4079 /* Convert to byte registers. */
4080 if (i.types[1].bitfield.word)
4081 j = 16;
4082 else if (i.types[1].bitfield.dword)
4083 j = 32;
4084 else
4085 j = 48;
4086 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4087 j += 8;
4088 i.op[1].regs -= j;
b6f8c7c4
L
4089 }
4090 }
4091 else if (flag_code == CODE_64BIT
72aea328 4092 && !is_any_vex_encoding (&i.tm)
d3d50934
L
4093 && ((i.types[1].bitfield.qword
4094 && i.reg_operands == 1
b6f8c7c4
L
4095 && i.imm_operands == 1
4096 && i.op[0].imms->X_op == O_constant
507916b8 4097 && ((i.tm.base_opcode == 0xb8
b6f8c7c4
L
4098 && i.tm.extension_opcode == None
4099 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4100 || (fits_in_imm31 (i.op[0].imms->X_add_number)
72aea328
JB
4101 && ((i.tm.base_opcode == 0x24
4102 || i.tm.base_opcode == 0xa8)
b6f8c7c4
L
4103 || (i.tm.base_opcode == 0x80
4104 && i.tm.extension_opcode == 0x4)
4105 || ((i.tm.base_opcode == 0xf6
507916b8 4106 || (i.tm.base_opcode | 1) == 0xc7)
b8364fa7
JB
4107 && i.tm.extension_opcode == 0x0)))
4108 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4109 && i.tm.base_opcode == 0x83
4110 && i.tm.extension_opcode == 0x4)))
d3d50934
L
4111 || (i.types[0].bitfield.qword
4112 && ((i.reg_operands == 2
4113 && i.op[0].regs == i.op[1].regs
72aea328
JB
4114 && (i.tm.base_opcode == 0x30
4115 || i.tm.base_opcode == 0x28))
d3d50934
L
4116 || (i.reg_operands == 1
4117 && i.operands == 1
72aea328 4118 && i.tm.base_opcode == 0x30)))))
b6f8c7c4
L
4119 {
4120 /* Optimize: -O:
4121 andq $imm31, %r64 -> andl $imm31, %r32
b8364fa7 4122 andq $imm7, %r64 -> andl $imm7, %r32
b6f8c7c4
L
4123 testq $imm31, %r64 -> testl $imm31, %r32
4124 xorq %r64, %r64 -> xorl %r32, %r32
4125 subq %r64, %r64 -> subl %r32, %r32
4126 movq $imm31, %r64 -> movl $imm31, %r32
4127 movq $imm32, %r64 -> movl $imm32, %r32
4128 */
4129 i.tm.opcode_modifier.norex64 = 1;
507916b8 4130 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
b6f8c7c4
L
4131 {
4132 /* Handle
4133 movq $imm31, %r64 -> movl $imm31, %r32
4134 movq $imm32, %r64 -> movl $imm32, %r32
4135 */
4136 i.tm.operand_types[0].bitfield.imm32 = 1;
4137 i.tm.operand_types[0].bitfield.imm32s = 0;
4138 i.tm.operand_types[0].bitfield.imm64 = 0;
4139 i.types[0].bitfield.imm32 = 1;
4140 i.types[0].bitfield.imm32s = 0;
4141 i.types[0].bitfield.imm64 = 0;
4142 i.types[1].bitfield.dword = 1;
4143 i.types[1].bitfield.qword = 0;
507916b8 4144 if ((i.tm.base_opcode | 1) == 0xc7)
b6f8c7c4
L
4145 {
4146 /* Handle
4147 movq $imm31, %r64 -> movl $imm31, %r32
4148 */
507916b8 4149 i.tm.base_opcode = 0xb8;
b6f8c7c4 4150 i.tm.extension_opcode = None;
507916b8 4151 i.tm.opcode_modifier.w = 0;
b6f8c7c4
L
4152 i.tm.opcode_modifier.modrm = 0;
4153 }
4154 }
4155 }
5641ec01
JB
4156 else if (optimize > 1
4157 && !optimize_for_space
72aea328 4158 && !is_any_vex_encoding (&i.tm)
5641ec01
JB
4159 && i.reg_operands == 2
4160 && i.op[0].regs == i.op[1].regs
4161 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4162 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4163 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4164 {
4165 /* Optimize: -O2:
4166 andb %rN, %rN -> testb %rN, %rN
4167 andw %rN, %rN -> testw %rN, %rN
4168 andq %rN, %rN -> testq %rN, %rN
4169 orb %rN, %rN -> testb %rN, %rN
4170 orw %rN, %rN -> testw %rN, %rN
4171 orq %rN, %rN -> testq %rN, %rN
4172
4173 and outside of 64-bit mode
4174
4175 andl %rN, %rN -> testl %rN, %rN
4176 orl %rN, %rN -> testl %rN, %rN
4177 */
4178 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4179 }
99112332 4180 else if (i.reg_operands == 3
b6f8c7c4
L
4181 && i.op[0].regs == i.op[1].regs
4182 && !i.types[2].bitfield.xmmword
4183 && (i.tm.opcode_modifier.vex
7a69eac3 4184 || ((!i.mask || i.mask->zeroing)
b6f8c7c4 4185 && !i.rounding
e771e7c9 4186 && is_evex_encoding (&i.tm)
80c34c38 4187 && (i.vec_encoding != vex_encoding_evex
dd22218c 4188 || cpu_arch_isa_flags.bitfield.cpuavx512vl
80c34c38 4189 || i.tm.cpu_flags.bitfield.cpuavx512vl
7091c612 4190 || (i.tm.operand_types[2].bitfield.zmmword
dd22218c 4191 && i.types[2].bitfield.ymmword))))
b6f8c7c4
L
4192 && ((i.tm.base_opcode == 0x55
4193 || i.tm.base_opcode == 0x6655
4194 || i.tm.base_opcode == 0x66df
4195 || i.tm.base_opcode == 0x57
4196 || i.tm.base_opcode == 0x6657
8305403a
L
4197 || i.tm.base_opcode == 0x66ef
4198 || i.tm.base_opcode == 0x66f8
4199 || i.tm.base_opcode == 0x66f9
4200 || i.tm.base_opcode == 0x66fa
1424ad86
JB
4201 || i.tm.base_opcode == 0x66fb
4202 || i.tm.base_opcode == 0x42
4203 || i.tm.base_opcode == 0x6642
4204 || i.tm.base_opcode == 0x47
4205 || i.tm.base_opcode == 0x6647)
b6f8c7c4
L
4206 && i.tm.extension_opcode == None))
4207 {
99112332 4208 /* Optimize: -O1:
8305403a
L
4209 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4210 vpsubq and vpsubw:
b6f8c7c4
L
4211 EVEX VOP %zmmM, %zmmM, %zmmN
4212 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4213 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4214 EVEX VOP %ymmM, %ymmM, %ymmN
4215 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4216 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4217 VEX VOP %ymmM, %ymmM, %ymmN
4218 -> VEX VOP %xmmM, %xmmM, %xmmN
4219 VOP, one of vpandn and vpxor:
4220 VEX VOP %ymmM, %ymmM, %ymmN
4221 -> VEX VOP %xmmM, %xmmM, %xmmN
4222 VOP, one of vpandnd and vpandnq:
4223 EVEX VOP %zmmM, %zmmM, %zmmN
4224 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4225 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4226 EVEX VOP %ymmM, %ymmM, %ymmN
4227 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4228 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4229 VOP, one of vpxord and vpxorq:
4230 EVEX VOP %zmmM, %zmmM, %zmmN
4231 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4232 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4233 EVEX VOP %ymmM, %ymmM, %ymmN
4234 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4235 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
1424ad86
JB
4236 VOP, one of kxord and kxorq:
4237 VEX VOP %kM, %kM, %kN
4238 -> VEX kxorw %kM, %kM, %kN
4239 VOP, one of kandnd and kandnq:
4240 VEX VOP %kM, %kM, %kN
4241 -> VEX kandnw %kM, %kM, %kN
b6f8c7c4 4242 */
e771e7c9 4243 if (is_evex_encoding (&i.tm))
b6f8c7c4 4244 {
7b1d7ca1 4245 if (i.vec_encoding != vex_encoding_evex)
b6f8c7c4
L
4246 {
4247 i.tm.opcode_modifier.vex = VEX128;
4248 i.tm.opcode_modifier.vexw = VEXW0;
4249 i.tm.opcode_modifier.evex = 0;
4250 }
7b1d7ca1 4251 else if (optimize > 1)
dd22218c
L
4252 i.tm.opcode_modifier.evex = EVEX128;
4253 else
4254 return;
b6f8c7c4 4255 }
f74a6307 4256 else if (i.tm.operand_types[0].bitfield.class == RegMask)
1424ad86
JB
4257 {
4258 i.tm.base_opcode &= 0xff;
4259 i.tm.opcode_modifier.vexw = VEXW0;
4260 }
b6f8c7c4
L
4261 else
4262 i.tm.opcode_modifier.vex = VEX128;
4263
4264 if (i.tm.opcode_modifier.vex)
4265 for (j = 0; j < 3; j++)
4266 {
4267 i.types[j].bitfield.xmmword = 1;
4268 i.types[j].bitfield.ymmword = 0;
4269 }
4270 }
392a5972 4271 else if (i.vec_encoding != vex_encoding_evex
97ed31ae 4272 && !i.types[0].bitfield.zmmword
392a5972 4273 && !i.types[1].bitfield.zmmword
97ed31ae 4274 && !i.mask
a0a1771e 4275 && !i.broadcast
97ed31ae 4276 && is_evex_encoding (&i.tm)
392a5972
L
4277 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4278 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
a0a1771e
JB
4279 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4280 || (i.tm.base_opcode & ~4) == 0x66db
4281 || (i.tm.base_opcode & ~4) == 0x66eb)
97ed31ae
L
4282 && i.tm.extension_opcode == None)
4283 {
4284 /* Optimize: -O1:
4285 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4286 vmovdqu32 and vmovdqu64:
4287 EVEX VOP %xmmM, %xmmN
4288 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4289 EVEX VOP %ymmM, %ymmN
4290 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4291 EVEX VOP %xmmM, mem
4292 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4293 EVEX VOP %ymmM, mem
4294 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4295 EVEX VOP mem, %xmmN
4296 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4297 EVEX VOP mem, %ymmN
4298 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
a0a1771e
JB
4299 VOP, one of vpand, vpandn, vpor, vpxor:
4300 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4301 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4302 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4303 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4304 EVEX VOP{d,q} mem, %xmmM, %xmmN
4305 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4306 EVEX VOP{d,q} mem, %ymmM, %ymmN
4307 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
97ed31ae 4308 */
a0a1771e 4309 for (j = 0; j < i.operands; j++)
392a5972
L
4310 if (operand_type_check (i.types[j], disp)
4311 && i.op[j].disps->X_op == O_constant)
4312 {
4313 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4314 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4315 bytes, we choose EVEX Disp8 over VEX Disp32. */
4316 int evex_disp8, vex_disp8;
4317 unsigned int memshift = i.memshift;
4318 offsetT n = i.op[j].disps->X_add_number;
4319
4320 evex_disp8 = fits_in_disp8 (n);
4321 i.memshift = 0;
4322 vex_disp8 = fits_in_disp8 (n);
4323 if (evex_disp8 != vex_disp8)
4324 {
4325 i.memshift = memshift;
4326 return;
4327 }
4328
4329 i.types[j].bitfield.disp8 = vex_disp8;
4330 break;
4331 }
4332 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4333 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
97ed31ae
L
4334 i.tm.opcode_modifier.vex
4335 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4336 i.tm.opcode_modifier.vexw = VEXW0;
79dec6b7
JB
4337 /* VPAND, VPOR, and VPXOR are commutative. */
4338 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4339 i.tm.opcode_modifier.commutative = 1;
97ed31ae
L
4340 i.tm.opcode_modifier.evex = 0;
4341 i.tm.opcode_modifier.masking = 0;
a0a1771e 4342 i.tm.opcode_modifier.broadcast = 0;
97ed31ae
L
4343 i.tm.opcode_modifier.disp8memshift = 0;
4344 i.memshift = 0;
a0a1771e
JB
4345 if (j < i.operands)
4346 i.types[j].bitfield.disp8
4347 = fits_in_disp8 (i.op[j].disps->X_add_number);
97ed31ae 4348 }
b6f8c7c4
L
4349}
4350
ae531041
L
4351/* Return non-zero for load instruction. */
4352
4353static int
4354load_insn_p (void)
4355{
4356 unsigned int dest;
4357 int any_vex_p = is_any_vex_encoding (&i.tm);
4358 unsigned int base_opcode = i.tm.base_opcode | 1;
4359
4360 if (!any_vex_p)
4361 {
a09f656b 4362 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4363 prefetcht1, prefetcht2, prefetchtw, bndmk, bndcl, bndcu, bndcn,
4364 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4365 if (i.tm.opcode_modifier.anysize)
ae531041
L
4366 return 0;
4367
a09f656b 4368 /* pop, popf, popa. */
4369 if (strcmp (i.tm.name, "pop") == 0
4370 || i.tm.base_opcode == 0x9d
4371 || i.tm.base_opcode == 0x61)
ae531041
L
4372 return 1;
4373
4374 /* movs, cmps, lods, scas. */
4375 if ((i.tm.base_opcode | 0xb) == 0xaf)
4376 return 1;
4377
a09f656b 4378 /* outs, xlatb. */
4379 if (base_opcode == 0x6f
4380 || i.tm.base_opcode == 0xd7)
ae531041 4381 return 1;
a09f656b 4382 /* NB: For AMD-specific insns with implicit memory operands,
4383 they're intentionally not covered. */
ae531041
L
4384 }
4385
4386 /* No memory operand. */
4387 if (!i.mem_operands)
4388 return 0;
4389
4390 if (any_vex_p)
4391 {
4392 /* vldmxcsr. */
4393 if (i.tm.base_opcode == 0xae
4394 && i.tm.opcode_modifier.vex
4395 && i.tm.opcode_modifier.vexopcode == VEX0F
4396 && i.tm.extension_opcode == 2)
4397 return 1;
4398 }
4399 else
4400 {
4401 /* test, not, neg, mul, imul, div, idiv. */
4402 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4403 && i.tm.extension_opcode != 1)
4404 return 1;
4405
4406 /* inc, dec. */
4407 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4408 return 1;
4409
4410 /* add, or, adc, sbb, and, sub, xor, cmp. */
4411 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4412 return 1;
4413
4414 /* bt, bts, btr, btc. */
4415 if (i.tm.base_opcode == 0xfba
4416 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4417 return 1;
4418
4419 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4420 if ((base_opcode == 0xc1
4421 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4422 && i.tm.extension_opcode != 6)
4423 return 1;
4424
4425 /* cmpxchg8b, cmpxchg16b, xrstors. */
4426 if (i.tm.base_opcode == 0xfc7
4427 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4428 return 1;
4429
4430 /* fxrstor, ldmxcsr, xrstor. */
4431 if (i.tm.base_opcode == 0xfae
4432 && (i.tm.extension_opcode == 1
4433 || i.tm.extension_opcode == 2
4434 || i.tm.extension_opcode == 5))
4435 return 1;
4436
4437 /* lgdt, lidt, lmsw. */
4438 if (i.tm.base_opcode == 0xf01
4439 && (i.tm.extension_opcode == 2
4440 || i.tm.extension_opcode == 3
4441 || i.tm.extension_opcode == 6))
4442 return 1;
4443
4444 /* vmptrld */
4445 if (i.tm.base_opcode == 0xfc7
4446 && i.tm.extension_opcode == 6)
4447 return 1;
4448
4449 /* Check for x87 instructions. */
4450 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4451 {
4452 /* Skip fst, fstp, fstenv, fstcw. */
4453 if (i.tm.base_opcode == 0xd9
4454 && (i.tm.extension_opcode == 2
4455 || i.tm.extension_opcode == 3
4456 || i.tm.extension_opcode == 6
4457 || i.tm.extension_opcode == 7))
4458 return 0;
4459
4460 /* Skip fisttp, fist, fistp, fstp. */
4461 if (i.tm.base_opcode == 0xdb
4462 && (i.tm.extension_opcode == 1
4463 || i.tm.extension_opcode == 2
4464 || i.tm.extension_opcode == 3
4465 || i.tm.extension_opcode == 7))
4466 return 0;
4467
4468 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4469 if (i.tm.base_opcode == 0xdd
4470 && (i.tm.extension_opcode == 1
4471 || i.tm.extension_opcode == 2
4472 || i.tm.extension_opcode == 3
4473 || i.tm.extension_opcode == 6
4474 || i.tm.extension_opcode == 7))
4475 return 0;
4476
4477 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4478 if (i.tm.base_opcode == 0xdf
4479 && (i.tm.extension_opcode == 1
4480 || i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 6
4483 || i.tm.extension_opcode == 7))
4484 return 0;
4485
4486 return 1;
4487 }
4488 }
4489
4490 dest = i.operands - 1;
4491
4492 /* Check fake imm8 operand and 3 source operands. */
4493 if ((i.tm.opcode_modifier.immext
4494 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4495 && i.types[dest].bitfield.imm8)
4496 dest--;
4497
4498 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4499 if (!any_vex_p
4500 && (base_opcode == 0x1
4501 || base_opcode == 0x9
4502 || base_opcode == 0x11
4503 || base_opcode == 0x19
4504 || base_opcode == 0x21
4505 || base_opcode == 0x29
4506 || base_opcode == 0x31
4507 || base_opcode == 0x39
4508 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4509 || base_opcode == 0xfc1))
4510 return 1;
4511
4512 /* Check for load instruction. */
4513 return (i.types[dest].bitfield.class != ClassNone
4514 || i.types[dest].bitfield.instance == Accum);
4515}
4516
4517/* Output lfence, 0xfaee8, after instruction. */
4518
4519static void
4520insert_lfence_after (void)
4521{
4522 if (lfence_after_load && load_insn_p ())
4523 {
a09f656b 4524 /* There are also two REP string instructions that require
4525 special treatment. Specifically, the compare string (CMPS)
4526 and scan string (SCAS) instructions set EFLAGS in a manner
4527 that depends on the data being compared/scanned. When used
4528 with a REP prefix, the number of iterations may therefore
4529 vary depending on this data. If the data is a program secret
4530 chosen by the adversary using an LVI method,
4531 then this data-dependent behavior may leak some aspect
4532 of the secret. */
4533 if (((i.tm.base_opcode | 0x1) == 0xa7
4534 || (i.tm.base_opcode | 0x1) == 0xaf)
4535 && i.prefix[REP_PREFIX])
4536 {
4537 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4538 i.tm.name);
4539 }
ae531041
L
4540 char *p = frag_more (3);
4541 *p++ = 0xf;
4542 *p++ = 0xae;
4543 *p = 0xe8;
4544 }
4545}
4546
4547/* Output lfence, 0xfaee8, before instruction. */
4548
4549static void
4550insert_lfence_before (void)
4551{
4552 char *p;
4553
4554 if (is_any_vex_encoding (&i.tm))
4555 return;
4556
4557 if (i.tm.base_opcode == 0xff
4558 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4559 {
4560 /* Insert lfence before indirect branch if needed. */
4561
4562 if (lfence_before_indirect_branch == lfence_branch_none)
4563 return;
4564
4565 if (i.operands != 1)
4566 abort ();
4567
4568 if (i.reg_operands == 1)
4569 {
4570 /* Indirect branch via register. Don't insert lfence with
4571 -mlfence-after-load=yes. */
4572 if (lfence_after_load
4573 || lfence_before_indirect_branch == lfence_branch_memory)
4574 return;
4575 }
4576 else if (i.mem_operands == 1
4577 && lfence_before_indirect_branch != lfence_branch_register)
4578 {
4579 as_warn (_("indirect `%s` with memory operand should be avoided"),
4580 i.tm.name);
4581 return;
4582 }
4583 else
4584 return;
4585
4586 if (last_insn.kind != last_insn_other
4587 && last_insn.seg == now_seg)
4588 {
4589 as_warn_where (last_insn.file, last_insn.line,
4590 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4591 last_insn.name, i.tm.name);
4592 return;
4593 }
4594
4595 p = frag_more (3);
4596 *p++ = 0xf;
4597 *p++ = 0xae;
4598 *p = 0xe8;
4599 return;
4600 }
4601
503648e4 4602 /* Output or/not/shl and lfence before near ret. */
ae531041
L
4603 if (lfence_before_ret != lfence_before_ret_none
4604 && (i.tm.base_opcode == 0xc2
503648e4 4605 || i.tm.base_opcode == 0xc3))
ae531041
L
4606 {
4607 if (last_insn.kind != last_insn_other
4608 && last_insn.seg == now_seg)
4609 {
4610 as_warn_where (last_insn.file, last_insn.line,
4611 _("`%s` skips -mlfence-before-ret on `%s`"),
4612 last_insn.name, i.tm.name);
4613 return;
4614 }
a09f656b 4615
a09f656b 4616 /* Near ret ingore operand size override under CPU64. */
503648e4 4617 char prefix = flag_code == CODE_64BIT
4618 ? 0x48
4619 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
a09f656b 4620
4621 if (lfence_before_ret == lfence_before_ret_not)
4622 {
4623 /* not: 0xf71424, may add prefix
4624 for operand size override or 64-bit code. */
4625 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4626 if (prefix)
4627 *p++ = prefix;
ae531041
L
4628 *p++ = 0xf7;
4629 *p++ = 0x14;
4630 *p++ = 0x24;
a09f656b 4631 if (prefix)
4632 *p++ = prefix;
ae531041
L
4633 *p++ = 0xf7;
4634 *p++ = 0x14;
4635 *p++ = 0x24;
4636 }
a09f656b 4637 else
4638 {
4639 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4640 if (prefix)
4641 *p++ = prefix;
4642 if (lfence_before_ret == lfence_before_ret_or)
4643 {
4644 /* or: 0x830c2400, may add prefix
4645 for operand size override or 64-bit code. */
4646 *p++ = 0x83;
4647 *p++ = 0x0c;
4648 }
4649 else
4650 {
4651 /* shl: 0xc1242400, may add prefix
4652 for operand size override or 64-bit code. */
4653 *p++ = 0xc1;
4654 *p++ = 0x24;
4655 }
4656
4657 *p++ = 0x24;
4658 *p++ = 0x0;
4659 }
4660
ae531041
L
4661 *p++ = 0xf;
4662 *p++ = 0xae;
4663 *p = 0xe8;
4664 }
4665}
4666
252b5132
RH
4667/* This is the guts of the machine-dependent assembler. LINE points to a
4668 machine dependent instruction. This function is supposed to emit
4669 the frags/bytes it assembles to. */
4670
4671void
65da13b5 4672md_assemble (char *line)
252b5132 4673{
40fb9820 4674 unsigned int j;
83b16ac6 4675 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
d3ce72d0 4676 const insn_template *t;
252b5132 4677
47926f60 4678 /* Initialize globals. */
252b5132
RH
4679 memset (&i, '\0', sizeof (i));
4680 for (j = 0; j < MAX_OPERANDS; j++)
1ae12ab7 4681 i.reloc[j] = NO_RELOC;
252b5132
RH
4682 memset (disp_expressions, '\0', sizeof (disp_expressions));
4683 memset (im_expressions, '\0', sizeof (im_expressions));
ce8a8b2f 4684 save_stack_p = save_stack;
252b5132
RH
4685
4686 /* First parse an instruction mnemonic & call i386_operand for the operands.
4687 We assume that the scrubber has arranged it so that line[0] is the valid
47926f60 4688 start of a (possibly prefixed) mnemonic. */
252b5132 4689
29b0f896
AM
4690 line = parse_insn (line, mnemonic);
4691 if (line == NULL)
4692 return;
83b16ac6 4693 mnem_suffix = i.suffix;
252b5132 4694
29b0f896 4695 line = parse_operands (line, mnemonic);
ee86248c 4696 this_operand = -1;
8325cc63
JB
4697 xfree (i.memop1_string);
4698 i.memop1_string = NULL;
29b0f896
AM
4699 if (line == NULL)
4700 return;
252b5132 4701
29b0f896
AM
4702 /* Now we've parsed the mnemonic into a set of templates, and have the
4703 operands at hand. */
4704
b630c145
JB
4705 /* All Intel opcodes have reversed operands except for "bound", "enter",
4706 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4707 intersegment "jmp" and "call" instructions with 2 immediate operands so
4708 that the immediate segment precedes the offset, as it does when in AT&T
4709 mode. */
4d456e3d
L
4710 if (intel_syntax
4711 && i.operands > 1
29b0f896 4712 && (strcmp (mnemonic, "bound") != 0)
30123838 4713 && (strcmp (mnemonic, "invlpga") != 0)
eedb0f2c
JB
4714 && (strncmp (mnemonic, "monitor", 7) != 0)
4715 && (strncmp (mnemonic, "mwait", 5) != 0)
b630c145
JB
4716 && (strcmp (mnemonic, "tpause") != 0)
4717 && (strcmp (mnemonic, "umwait") != 0)
40fb9820
L
4718 && !(operand_type_check (i.types[0], imm)
4719 && operand_type_check (i.types[1], imm)))
29b0f896
AM
4720 swap_operands ();
4721
ec56d5c0
JB
4722 /* The order of the immediates should be reversed
4723 for 2 immediates extrq and insertq instructions */
4724 if (i.imm_operands == 2
4725 && (strcmp (mnemonic, "extrq") == 0
4726 || strcmp (mnemonic, "insertq") == 0))
4727 swap_2_operands (0, 1);
4728
29b0f896
AM
4729 if (i.imm_operands)
4730 optimize_imm ();
4731
b300c311
L
4732 /* Don't optimize displacement for movabs since it only takes 64bit
4733 displacement. */
4734 if (i.disp_operands
a501d77e 4735 && i.disp_encoding != disp_encoding_32bit
862be3fb
L
4736 && (flag_code != CODE_64BIT
4737 || strcmp (mnemonic, "movabs") != 0))
4738 optimize_disp ();
29b0f896
AM
4739
4740 /* Next, we find a template that matches the given insn,
4741 making sure the overlap of the given operands types is consistent
4742 with the template operand types. */
252b5132 4743
83b16ac6 4744 if (!(t = match_template (mnem_suffix)))
29b0f896 4745 return;
252b5132 4746
7bab8ab5 4747 if (sse_check != check_none
81f8a913 4748 && !i.tm.opcode_modifier.noavx
6e3e5c9e 4749 && !i.tm.cpu_flags.bitfield.cpuavx
569d50f1 4750 && !i.tm.cpu_flags.bitfield.cpuavx512f
daf50ae7
L
4751 && (i.tm.cpu_flags.bitfield.cpusse
4752 || i.tm.cpu_flags.bitfield.cpusse2
4753 || i.tm.cpu_flags.bitfield.cpusse3
4754 || i.tm.cpu_flags.bitfield.cpussse3
4755 || i.tm.cpu_flags.bitfield.cpusse4_1
6e3e5c9e
JB
4756 || i.tm.cpu_flags.bitfield.cpusse4_2
4757 || i.tm.cpu_flags.bitfield.cpupclmul
4758 || i.tm.cpu_flags.bitfield.cpuaes
569d50f1 4759 || i.tm.cpu_flags.bitfield.cpusha
6e3e5c9e 4760 || i.tm.cpu_flags.bitfield.cpugfni))
daf50ae7 4761 {
7bab8ab5 4762 (sse_check == check_warning
daf50ae7
L
4763 ? as_warn
4764 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4765 }
4766
40fb9820 4767 if (i.tm.opcode_modifier.fwait)
29b0f896
AM
4768 if (!add_prefix (FWAIT_OPCODE))
4769 return;
252b5132 4770
d5de92cf
L
4771 /* Check if REP prefix is OK. */
4772 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4773 {
4774 as_bad (_("invalid instruction `%s' after `%s'"),
4775 i.tm.name, i.rep_prefix);
4776 return;
4777 }
4778
c1ba0266
L
4779 /* Check for lock without a lockable instruction. Destination operand
4780 must be memory unless it is xchg (0x86). */
c32fa91d
L
4781 if (i.prefix[LOCK_PREFIX]
4782 && (!i.tm.opcode_modifier.islockable
c1ba0266
L
4783 || i.mem_operands == 0
4784 || (i.tm.base_opcode != 0x86
8dc0818e 4785 && !(i.flags[i.operands - 1] & Operand_Mem))))
c32fa91d
L
4786 {
4787 as_bad (_("expecting lockable instruction after `lock'"));
4788 return;
4789 }
4790
40d231b4
JB
4791 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4792 if (i.prefix[DATA_PREFIX]
4793 && (is_any_vex_encoding (&i.tm)
4794 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4795 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
7a8655d2
JB
4796 {
4797 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4798 return;
4799 }
4800
42164a71 4801 /* Check if HLE prefix is OK. */
165de32a 4802 if (i.hle_prefix && !check_hle ())
42164a71
L
4803 return;
4804
7e8b059b
L
4805 /* Check BND prefix. */
4806 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4807 as_bad (_("expecting valid branch instruction after `bnd'"));
4808
04ef582a 4809 /* Check NOTRACK prefix. */
9fef80d6
L
4810 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4811 as_bad (_("expecting indirect branch instruction after `notrack'"));
04ef582a 4812
327e8c42
JB
4813 if (i.tm.cpu_flags.bitfield.cpumpx)
4814 {
4815 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4816 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4817 else if (flag_code != CODE_16BIT
4818 ? i.prefix[ADDR_PREFIX]
4819 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4820 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4821 }
7e8b059b
L
4822
4823 /* Insert BND prefix. */
76d3a78a
JB
4824 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4825 {
4826 if (!i.prefix[BND_PREFIX])
4827 add_prefix (BND_PREFIX_OPCODE);
4828 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4829 {
4830 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4831 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4832 }
4833 }
7e8b059b 4834
29b0f896 4835 /* Check string instruction segment overrides. */
51c8edf6 4836 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
29b0f896 4837 {
51c8edf6 4838 gas_assert (i.mem_operands);
29b0f896 4839 if (!check_string ())
5dd0794d 4840 return;
fc0763e6 4841 i.disp_operands = 0;
29b0f896 4842 }
5dd0794d 4843
b6f8c7c4
L
4844 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4845 optimize_encoding ();
4846
29b0f896
AM
4847 if (!process_suffix ())
4848 return;
e413e4e9 4849
bc0844ae
L
4850 /* Update operand types. */
4851 for (j = 0; j < i.operands; j++)
4852 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4853
29b0f896
AM
4854 /* Make still unresolved immediate matches conform to size of immediate
4855 given in i.suffix. */
4856 if (!finalize_imm ())
4857 return;
252b5132 4858
40fb9820 4859 if (i.types[0].bitfield.imm1)
29b0f896 4860 i.imm_operands = 0; /* kludge for shift insns. */
252b5132 4861
9afe6eb8
L
4862 /* We only need to check those implicit registers for instructions
4863 with 3 operands or less. */
4864 if (i.operands <= 3)
4865 for (j = 0; j < i.operands; j++)
75e5731b
JB
4866 if (i.types[j].bitfield.instance != InstanceNone
4867 && !i.types[j].bitfield.xmmword)
9afe6eb8 4868 i.reg_operands--;
40fb9820 4869
29b0f896
AM
4870 /* For insns with operands there are more diddles to do to the opcode. */
4871 if (i.operands)
4872 {
4873 if (!process_operands ())
4874 return;
4875 }
b6cd5d10 4876 else
29b0f896 4877 {
b6cd5d10
L
4878 if (i.tm.opcode_modifier.immext)
4879 process_immext ();
4880
4881 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
29b0f896
AM
4882 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4883 as_warn (_("translating to `%sp'"), i.tm.name);
4884 }
252b5132 4885
7a8655d2 4886 if (is_any_vex_encoding (&i.tm))
9e5e5283 4887 {
c1dc7af5 4888 if (!cpu_arch_flags.bitfield.cpui286)
9e5e5283 4889 {
c1dc7af5 4890 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
9e5e5283
L
4891 i.tm.name);
4892 return;
4893 }
c0f3af97 4894
0b9404fd
JB
4895 /* Check for explicit REX prefix. */
4896 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4897 {
4898 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4899 return;
4900 }
4901
9e5e5283
L
4902 if (i.tm.opcode_modifier.vex)
4903 build_vex_prefix (t);
4904 else
4905 build_evex_prefix ();
0b9404fd
JB
4906
4907 /* The individual REX.RXBW bits got consumed. */
4908 i.rex &= REX_OPCODE;
9e5e5283 4909 }
43234a1e 4910
5dd85c99
SP
4911 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4912 instructions may define INT_OPCODE as well, so avoid this corner
4913 case for those instructions that use MODRM. */
4914 if (i.tm.base_opcode == INT_OPCODE
a6461c02
SP
4915 && !i.tm.opcode_modifier.modrm
4916 && i.op[0].imms->X_add_number == 3)
29b0f896
AM
4917 {
4918 i.tm.base_opcode = INT3_OPCODE;
4919 i.imm_operands = 0;
4920 }
252b5132 4921
0cfa3eb3
JB
4922 if ((i.tm.opcode_modifier.jump == JUMP
4923 || i.tm.opcode_modifier.jump == JUMP_BYTE
4924 || i.tm.opcode_modifier.jump == JUMP_DWORD)
29b0f896
AM
4925 && i.op[0].disps->X_op == O_constant)
4926 {
4927 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4928 the absolute address given by the constant. Since ix86 jumps and
4929 calls are pc relative, we need to generate a reloc. */
4930 i.op[0].disps->X_add_symbol = &abs_symbol;
4931 i.op[0].disps->X_op = O_symbol;
4932 }
252b5132 4933
29b0f896
AM
4934 /* For 8 bit registers we need an empty rex prefix. Also if the
4935 instruction already has a prefix, we need to convert old
4936 registers to new ones. */
773f551c 4937
bab6aec1 4938 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
29b0f896 4939 && (i.op[0].regs->reg_flags & RegRex64) != 0)
bab6aec1 4940 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
29b0f896 4941 && (i.op[1].regs->reg_flags & RegRex64) != 0)
bab6aec1
JB
4942 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4943 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
29b0f896
AM
4944 && i.rex != 0))
4945 {
4946 int x;
726c5dcd 4947
29b0f896
AM
4948 i.rex |= REX_OPCODE;
4949 for (x = 0; x < 2; x++)
4950 {
4951 /* Look for 8 bit operand that uses old registers. */
bab6aec1 4952 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
29b0f896 4953 && (i.op[x].regs->reg_flags & RegRex64) == 0)
773f551c 4954 {
3f93af61 4955 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
29b0f896
AM
4956 /* In case it is "hi" register, give up. */
4957 if (i.op[x].regs->reg_num > 3)
a540244d 4958 as_bad (_("can't encode register '%s%s' in an "
4eed87de 4959 "instruction requiring REX prefix."),
a540244d 4960 register_prefix, i.op[x].regs->reg_name);
773f551c 4961
29b0f896
AM
4962 /* Otherwise it is equivalent to the extended register.
4963 Since the encoding doesn't change this is merely
4964 cosmetic cleanup for debug output. */
4965
4966 i.op[x].regs = i.op[x].regs + 8;
773f551c 4967 }
29b0f896
AM
4968 }
4969 }
773f551c 4970
6b6b6807
L
4971 if (i.rex == 0 && i.rex_encoding)
4972 {
4973 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
3f93af61 4974 that uses legacy register. If it is "hi" register, don't add
6b6b6807
L
4975 the REX_OPCODE byte. */
4976 int x;
4977 for (x = 0; x < 2; x++)
bab6aec1 4978 if (i.types[x].bitfield.class == Reg
6b6b6807
L
4979 && i.types[x].bitfield.byte
4980 && (i.op[x].regs->reg_flags & RegRex64) == 0
4981 && i.op[x].regs->reg_num > 3)
4982 {
3f93af61 4983 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
6b6b6807
L
4984 i.rex_encoding = FALSE;
4985 break;
4986 }
4987
4988 if (i.rex_encoding)
4989 i.rex = REX_OPCODE;
4990 }
4991
7ab9ffdd 4992 if (i.rex != 0)
29b0f896
AM
4993 add_prefix (REX_OPCODE | i.rex);
4994
ae531041
L
4995 insert_lfence_before ();
4996
29b0f896
AM
4997 /* We are ready to output the insn. */
4998 output_insn ();
e379e5f3 4999
ae531041
L
5000 insert_lfence_after ();
5001
e379e5f3
L
5002 last_insn.seg = now_seg;
5003
5004 if (i.tm.opcode_modifier.isprefix)
5005 {
5006 last_insn.kind = last_insn_prefix;
5007 last_insn.name = i.tm.name;
5008 last_insn.file = as_where (&last_insn.line);
5009 }
5010 else
5011 last_insn.kind = last_insn_other;
29b0f896
AM
5012}
5013
5014static char *
e3bb37b5 5015parse_insn (char *line, char *mnemonic)
29b0f896
AM
5016{
5017 char *l = line;
5018 char *token_start = l;
5019 char *mnem_p;
5c6af06e 5020 int supported;
d3ce72d0 5021 const insn_template *t;
b6169b20 5022 char *dot_p = NULL;
29b0f896 5023
29b0f896
AM
5024 while (1)
5025 {
5026 mnem_p = mnemonic;
5027 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5028 {
b6169b20
L
5029 if (*mnem_p == '.')
5030 dot_p = mnem_p;
29b0f896
AM
5031 mnem_p++;
5032 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
45288df1 5033 {
29b0f896
AM
5034 as_bad (_("no such instruction: `%s'"), token_start);
5035 return NULL;
5036 }
5037 l++;
5038 }
5039 if (!is_space_char (*l)
5040 && *l != END_OF_INSN
e44823cf
JB
5041 && (intel_syntax
5042 || (*l != PREFIX_SEPARATOR
5043 && *l != ',')))
29b0f896
AM
5044 {
5045 as_bad (_("invalid character %s in mnemonic"),
5046 output_invalid (*l));
5047 return NULL;
5048 }
5049 if (token_start == l)
5050 {
e44823cf 5051 if (!intel_syntax && *l == PREFIX_SEPARATOR)
29b0f896
AM
5052 as_bad (_("expecting prefix; got nothing"));
5053 else
5054 as_bad (_("expecting mnemonic; got nothing"));
5055 return NULL;
5056 }
45288df1 5057
29b0f896 5058 /* Look up instruction (or prefix) via hash table. */
d3ce72d0 5059 current_templates = (const templates *) hash_find (op_hash, mnemonic);
47926f60 5060
29b0f896
AM
5061 if (*l != END_OF_INSN
5062 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5063 && current_templates
40fb9820 5064 && current_templates->start->opcode_modifier.isprefix)
29b0f896 5065 {
c6fb90c8 5066 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
2dd88dca
JB
5067 {
5068 as_bad ((flag_code != CODE_64BIT
5069 ? _("`%s' is only supported in 64-bit mode")
5070 : _("`%s' is not supported in 64-bit mode")),
5071 current_templates->start->name);
5072 return NULL;
5073 }
29b0f896
AM
5074 /* If we are in 16-bit mode, do not allow addr16 or data16.
5075 Similarly, in 32-bit mode, do not allow addr32 or data32. */
673fe0f0
JB
5076 if ((current_templates->start->opcode_modifier.size == SIZE16
5077 || current_templates->start->opcode_modifier.size == SIZE32)
29b0f896 5078 && flag_code != CODE_64BIT
673fe0f0 5079 && ((current_templates->start->opcode_modifier.size == SIZE32)
29b0f896
AM
5080 ^ (flag_code == CODE_16BIT)))
5081 {
5082 as_bad (_("redundant %s prefix"),
5083 current_templates->start->name);
5084 return NULL;
45288df1 5085 }
86fa6981 5086 if (current_templates->start->opcode_length == 0)
29b0f896 5087 {
86fa6981
L
5088 /* Handle pseudo prefixes. */
5089 switch (current_templates->start->base_opcode)
5090 {
5091 case 0x0:
5092 /* {disp8} */
5093 i.disp_encoding = disp_encoding_8bit;
5094 break;
5095 case 0x1:
5096 /* {disp32} */
5097 i.disp_encoding = disp_encoding_32bit;
5098 break;
5099 case 0x2:
5100 /* {load} */
5101 i.dir_encoding = dir_encoding_load;
5102 break;
5103 case 0x3:
5104 /* {store} */
5105 i.dir_encoding = dir_encoding_store;
5106 break;
5107 case 0x4:
42e04b36
L
5108 /* {vex} */
5109 i.vec_encoding = vex_encoding_vex;
86fa6981
L
5110 break;
5111 case 0x5:
5112 /* {vex3} */
5113 i.vec_encoding = vex_encoding_vex3;
5114 break;
5115 case 0x6:
5116 /* {evex} */
5117 i.vec_encoding = vex_encoding_evex;
5118 break;
6b6b6807
L
5119 case 0x7:
5120 /* {rex} */
5121 i.rex_encoding = TRUE;
5122 break;
b6f8c7c4
L
5123 case 0x8:
5124 /* {nooptimize} */
5125 i.no_optimize = TRUE;
5126 break;
86fa6981
L
5127 default:
5128 abort ();
5129 }
5130 }
5131 else
5132 {
5133 /* Add prefix, checking for repeated prefixes. */
4e9ac44a 5134 switch (add_prefix (current_templates->start->base_opcode))
86fa6981 5135 {
4e9ac44a
L
5136 case PREFIX_EXIST:
5137 return NULL;
5138 case PREFIX_DS:
d777820b 5139 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4e9ac44a
L
5140 i.notrack_prefix = current_templates->start->name;
5141 break;
5142 case PREFIX_REP:
5143 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5144 i.hle_prefix = current_templates->start->name;
5145 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5146 i.bnd_prefix = current_templates->start->name;
5147 else
5148 i.rep_prefix = current_templates->start->name;
5149 break;
5150 default:
5151 break;
86fa6981 5152 }
29b0f896
AM
5153 }
5154 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5155 token_start = ++l;
5156 }
5157 else
5158 break;
5159 }
45288df1 5160
30a55f88 5161 if (!current_templates)
b6169b20 5162 {
07d5e953
JB
5163 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5164 Check if we should swap operand or force 32bit displacement in
f8a5c266 5165 encoding. */
30a55f88 5166 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
64c49ab3 5167 i.dir_encoding = dir_encoding_swap;
8d63c93e 5168 else if (mnem_p - 3 == dot_p
a501d77e
L
5169 && dot_p[1] == 'd'
5170 && dot_p[2] == '8')
5171 i.disp_encoding = disp_encoding_8bit;
8d63c93e 5172 else if (mnem_p - 4 == dot_p
f8a5c266
L
5173 && dot_p[1] == 'd'
5174 && dot_p[2] == '3'
5175 && dot_p[3] == '2')
a501d77e 5176 i.disp_encoding = disp_encoding_32bit;
30a55f88
L
5177 else
5178 goto check_suffix;
5179 mnem_p = dot_p;
5180 *dot_p = '\0';
d3ce72d0 5181 current_templates = (const templates *) hash_find (op_hash, mnemonic);
b6169b20
L
5182 }
5183
29b0f896
AM
5184 if (!current_templates)
5185 {
dc1e8a47 5186 check_suffix:
1c529385 5187 if (mnem_p > mnemonic)
29b0f896 5188 {
1c529385
LH
5189 /* See if we can get a match by trimming off a suffix. */
5190 switch (mnem_p[-1])
29b0f896 5191 {
1c529385
LH
5192 case WORD_MNEM_SUFFIX:
5193 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
29b0f896
AM
5194 i.suffix = SHORT_MNEM_SUFFIX;
5195 else
1c529385
LH
5196 /* Fall through. */
5197 case BYTE_MNEM_SUFFIX:
5198 case QWORD_MNEM_SUFFIX:
5199 i.suffix = mnem_p[-1];
29b0f896 5200 mnem_p[-1] = '\0';
d3ce72d0 5201 current_templates = (const templates *) hash_find (op_hash,
1c529385
LH
5202 mnemonic);
5203 break;
5204 case SHORT_MNEM_SUFFIX:
5205 case LONG_MNEM_SUFFIX:
5206 if (!intel_syntax)
5207 {
5208 i.suffix = mnem_p[-1];
5209 mnem_p[-1] = '\0';
5210 current_templates = (const templates *) hash_find (op_hash,
5211 mnemonic);
5212 }
5213 break;
5214
5215 /* Intel Syntax. */
5216 case 'd':
5217 if (intel_syntax)
5218 {
5219 if (intel_float_operand (mnemonic) == 1)
5220 i.suffix = SHORT_MNEM_SUFFIX;
5221 else
5222 i.suffix = LONG_MNEM_SUFFIX;
5223 mnem_p[-1] = '\0';
5224 current_templates = (const templates *) hash_find (op_hash,
5225 mnemonic);
5226 }
5227 break;
29b0f896 5228 }
29b0f896 5229 }
1c529385 5230
29b0f896
AM
5231 if (!current_templates)
5232 {
5233 as_bad (_("no such instruction: `%s'"), token_start);
5234 return NULL;
5235 }
5236 }
252b5132 5237
0cfa3eb3
JB
5238 if (current_templates->start->opcode_modifier.jump == JUMP
5239 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
29b0f896
AM
5240 {
5241 /* Check for a branch hint. We allow ",pt" and ",pn" for
5242 predict taken and predict not taken respectively.
5243 I'm not sure that branch hints actually do anything on loop
5244 and jcxz insns (JumpByte) for current Pentium4 chips. They
5245 may work in the future and it doesn't hurt to accept them
5246 now. */
5247 if (l[0] == ',' && l[1] == 'p')
5248 {
5249 if (l[2] == 't')
5250 {
5251 if (!add_prefix (DS_PREFIX_OPCODE))
5252 return NULL;
5253 l += 3;
5254 }
5255 else if (l[2] == 'n')
5256 {
5257 if (!add_prefix (CS_PREFIX_OPCODE))
5258 return NULL;
5259 l += 3;
5260 }
5261 }
5262 }
5263 /* Any other comma loses. */
5264 if (*l == ',')
5265 {
5266 as_bad (_("invalid character %s in mnemonic"),
5267 output_invalid (*l));
5268 return NULL;
5269 }
252b5132 5270
29b0f896 5271 /* Check if instruction is supported on specified architecture. */
5c6af06e
JB
5272 supported = 0;
5273 for (t = current_templates->start; t < current_templates->end; ++t)
5274 {
c0f3af97
L
5275 supported |= cpu_flags_match (t);
5276 if (supported == CPU_FLAGS_PERFECT_MATCH)
548d0ee6
JB
5277 {
5278 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5279 as_warn (_("use .code16 to ensure correct addressing mode"));
3629bb00 5280
548d0ee6
JB
5281 return l;
5282 }
29b0f896 5283 }
3629bb00 5284
548d0ee6
JB
5285 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5286 as_bad (flag_code == CODE_64BIT
5287 ? _("`%s' is not supported in 64-bit mode")
5288 : _("`%s' is only supported in 64-bit mode"),
5289 current_templates->start->name);
5290 else
5291 as_bad (_("`%s' is not supported on `%s%s'"),
5292 current_templates->start->name,
5293 cpu_arch_name ? cpu_arch_name : default_arch,
5294 cpu_sub_arch_name ? cpu_sub_arch_name : "");
252b5132 5295
548d0ee6 5296 return NULL;
29b0f896 5297}
252b5132 5298
29b0f896 5299static char *
e3bb37b5 5300parse_operands (char *l, const char *mnemonic)
29b0f896
AM
5301{
5302 char *token_start;
3138f287 5303
29b0f896
AM
5304 /* 1 if operand is pending after ','. */
5305 unsigned int expecting_operand = 0;
252b5132 5306
29b0f896
AM
5307 /* Non-zero if operand parens not balanced. */
5308 unsigned int paren_not_balanced;
5309
5310 while (*l != END_OF_INSN)
5311 {
5312 /* Skip optional white space before operand. */
5313 if (is_space_char (*l))
5314 ++l;
d02603dc 5315 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
29b0f896
AM
5316 {
5317 as_bad (_("invalid character %s before operand %d"),
5318 output_invalid (*l),
5319 i.operands + 1);
5320 return NULL;
5321 }
d02603dc 5322 token_start = l; /* After white space. */
29b0f896
AM
5323 paren_not_balanced = 0;
5324 while (paren_not_balanced || *l != ',')
5325 {
5326 if (*l == END_OF_INSN)
5327 {
5328 if (paren_not_balanced)
5329 {
5330 if (!intel_syntax)
5331 as_bad (_("unbalanced parenthesis in operand %d."),
5332 i.operands + 1);
5333 else
5334 as_bad (_("unbalanced brackets in operand %d."),
5335 i.operands + 1);
5336 return NULL;
5337 }
5338 else
5339 break; /* we are done */
5340 }
d02603dc 5341 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
29b0f896
AM
5342 {
5343 as_bad (_("invalid character %s in operand %d"),
5344 output_invalid (*l),
5345 i.operands + 1);
5346 return NULL;
5347 }
5348 if (!intel_syntax)
5349 {
5350 if (*l == '(')
5351 ++paren_not_balanced;
5352 if (*l == ')')
5353 --paren_not_balanced;
5354 }
5355 else
5356 {
5357 if (*l == '[')
5358 ++paren_not_balanced;
5359 if (*l == ']')
5360 --paren_not_balanced;
5361 }
5362 l++;
5363 }
5364 if (l != token_start)
5365 { /* Yes, we've read in another operand. */
5366 unsigned int operand_ok;
5367 this_operand = i.operands++;
5368 if (i.operands > MAX_OPERANDS)
5369 {
5370 as_bad (_("spurious operands; (%d operands/instruction max)"),
5371 MAX_OPERANDS);
5372 return NULL;
5373 }
9d46ce34 5374 i.types[this_operand].bitfield.unspecified = 1;
29b0f896
AM
5375 /* Now parse operand adding info to 'i' as we go along. */
5376 END_STRING_AND_SAVE (l);
5377
1286ab78
L
5378 if (i.mem_operands > 1)
5379 {
5380 as_bad (_("too many memory references for `%s'"),
5381 mnemonic);
5382 return 0;
5383 }
5384
29b0f896
AM
5385 if (intel_syntax)
5386 operand_ok =
5387 i386_intel_operand (token_start,
5388 intel_float_operand (mnemonic));
5389 else
a7619375 5390 operand_ok = i386_att_operand (token_start);
29b0f896
AM
5391
5392 RESTORE_END_STRING (l);
5393 if (!operand_ok)
5394 return NULL;
5395 }
5396 else
5397 {
5398 if (expecting_operand)
5399 {
5400 expecting_operand_after_comma:
5401 as_bad (_("expecting operand after ','; got nothing"));
5402 return NULL;
5403 }
5404 if (*l == ',')
5405 {
5406 as_bad (_("expecting operand before ','; got nothing"));
5407 return NULL;
5408 }
5409 }
7f3f1ea2 5410
29b0f896
AM
5411 /* Now *l must be either ',' or END_OF_INSN. */
5412 if (*l == ',')
5413 {
5414 if (*++l == END_OF_INSN)
5415 {
5416 /* Just skip it, if it's \n complain. */
5417 goto expecting_operand_after_comma;
5418 }
5419 expecting_operand = 1;
5420 }
5421 }
5422 return l;
5423}
7f3f1ea2 5424
050dfa73 5425static void
4d456e3d 5426swap_2_operands (int xchg1, int xchg2)
050dfa73
MM
5427{
5428 union i386_op temp_op;
40fb9820 5429 i386_operand_type temp_type;
c48dadc9 5430 unsigned int temp_flags;
050dfa73 5431 enum bfd_reloc_code_real temp_reloc;
4eed87de 5432
050dfa73
MM
5433 temp_type = i.types[xchg2];
5434 i.types[xchg2] = i.types[xchg1];
5435 i.types[xchg1] = temp_type;
c48dadc9
JB
5436
5437 temp_flags = i.flags[xchg2];
5438 i.flags[xchg2] = i.flags[xchg1];
5439 i.flags[xchg1] = temp_flags;
5440
050dfa73
MM
5441 temp_op = i.op[xchg2];
5442 i.op[xchg2] = i.op[xchg1];
5443 i.op[xchg1] = temp_op;
c48dadc9 5444
050dfa73
MM
5445 temp_reloc = i.reloc[xchg2];
5446 i.reloc[xchg2] = i.reloc[xchg1];
5447 i.reloc[xchg1] = temp_reloc;
43234a1e
L
5448
5449 if (i.mask)
5450 {
5451 if (i.mask->operand == xchg1)
5452 i.mask->operand = xchg2;
5453 else if (i.mask->operand == xchg2)
5454 i.mask->operand = xchg1;
5455 }
5456 if (i.broadcast)
5457 {
5458 if (i.broadcast->operand == xchg1)
5459 i.broadcast->operand = xchg2;
5460 else if (i.broadcast->operand == xchg2)
5461 i.broadcast->operand = xchg1;
5462 }
5463 if (i.rounding)
5464 {
5465 if (i.rounding->operand == xchg1)
5466 i.rounding->operand = xchg2;
5467 else if (i.rounding->operand == xchg2)
5468 i.rounding->operand = xchg1;
5469 }
050dfa73
MM
5470}
5471
29b0f896 5472static void
e3bb37b5 5473swap_operands (void)
29b0f896 5474{
b7c61d9a 5475 switch (i.operands)
050dfa73 5476 {
c0f3af97 5477 case 5:
b7c61d9a 5478 case 4:
4d456e3d 5479 swap_2_operands (1, i.operands - 2);
1a0670f3 5480 /* Fall through. */
b7c61d9a
L
5481 case 3:
5482 case 2:
4d456e3d 5483 swap_2_operands (0, i.operands - 1);
b7c61d9a
L
5484 break;
5485 default:
5486 abort ();
29b0f896 5487 }
29b0f896
AM
5488
5489 if (i.mem_operands == 2)
5490 {
5491 const seg_entry *temp_seg;
5492 temp_seg = i.seg[0];
5493 i.seg[0] = i.seg[1];
5494 i.seg[1] = temp_seg;
5495 }
5496}
252b5132 5497
29b0f896
AM
5498/* Try to ensure constant immediates are represented in the smallest
5499 opcode possible. */
5500static void
e3bb37b5 5501optimize_imm (void)
29b0f896
AM
5502{
5503 char guess_suffix = 0;
5504 int op;
252b5132 5505
29b0f896
AM
5506 if (i.suffix)
5507 guess_suffix = i.suffix;
5508 else if (i.reg_operands)
5509 {
5510 /* Figure out a suffix from the last register operand specified.
75e5731b
JB
5511 We can't do this properly yet, i.e. excluding special register
5512 instances, but the following works for instructions with
5513 immediates. In any case, we can't set i.suffix yet. */
29b0f896 5514 for (op = i.operands; --op >= 0;)
bab6aec1
JB
5515 if (i.types[op].bitfield.class != Reg)
5516 continue;
5517 else if (i.types[op].bitfield.byte)
7ab9ffdd 5518 {
40fb9820
L
5519 guess_suffix = BYTE_MNEM_SUFFIX;
5520 break;
5521 }
bab6aec1 5522 else if (i.types[op].bitfield.word)
252b5132 5523 {
40fb9820
L
5524 guess_suffix = WORD_MNEM_SUFFIX;
5525 break;
5526 }
bab6aec1 5527 else if (i.types[op].bitfield.dword)
40fb9820
L
5528 {
5529 guess_suffix = LONG_MNEM_SUFFIX;
5530 break;
5531 }
bab6aec1 5532 else if (i.types[op].bitfield.qword)
40fb9820
L
5533 {
5534 guess_suffix = QWORD_MNEM_SUFFIX;
29b0f896 5535 break;
252b5132 5536 }
29b0f896
AM
5537 }
5538 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5539 guess_suffix = WORD_MNEM_SUFFIX;
5540
5541 for (op = i.operands; --op >= 0;)
40fb9820 5542 if (operand_type_check (i.types[op], imm))
29b0f896
AM
5543 {
5544 switch (i.op[op].imms->X_op)
252b5132 5545 {
29b0f896
AM
5546 case O_constant:
5547 /* If a suffix is given, this operand may be shortened. */
5548 switch (guess_suffix)
252b5132 5549 {
29b0f896 5550 case LONG_MNEM_SUFFIX:
40fb9820
L
5551 i.types[op].bitfield.imm32 = 1;
5552 i.types[op].bitfield.imm64 = 1;
29b0f896
AM
5553 break;
5554 case WORD_MNEM_SUFFIX:
40fb9820
L
5555 i.types[op].bitfield.imm16 = 1;
5556 i.types[op].bitfield.imm32 = 1;
5557 i.types[op].bitfield.imm32s = 1;
5558 i.types[op].bitfield.imm64 = 1;
29b0f896
AM
5559 break;
5560 case BYTE_MNEM_SUFFIX:
40fb9820
L
5561 i.types[op].bitfield.imm8 = 1;
5562 i.types[op].bitfield.imm8s = 1;
5563 i.types[op].bitfield.imm16 = 1;
5564 i.types[op].bitfield.imm32 = 1;
5565 i.types[op].bitfield.imm32s = 1;
5566 i.types[op].bitfield.imm64 = 1;
29b0f896 5567 break;
252b5132 5568 }
252b5132 5569
29b0f896
AM
5570 /* If this operand is at most 16 bits, convert it
5571 to a signed 16 bit number before trying to see
5572 whether it will fit in an even smaller size.
5573 This allows a 16-bit operand such as $0xffe0 to
5574 be recognised as within Imm8S range. */
40fb9820 5575 if ((i.types[op].bitfield.imm16)
29b0f896 5576 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
252b5132 5577 {
29b0f896
AM
5578 i.op[op].imms->X_add_number =
5579 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5580 }
a28def75
L
5581#ifdef BFD64
5582 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
40fb9820 5583 if ((i.types[op].bitfield.imm32)
29b0f896
AM
5584 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5585 == 0))
5586 {
5587 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5588 ^ ((offsetT) 1 << 31))
5589 - ((offsetT) 1 << 31));
5590 }
a28def75 5591#endif
40fb9820 5592 i.types[op]
c6fb90c8
L
5593 = operand_type_or (i.types[op],
5594 smallest_imm_type (i.op[op].imms->X_add_number));
252b5132 5595
29b0f896
AM
5596 /* We must avoid matching of Imm32 templates when 64bit
5597 only immediate is available. */
5598 if (guess_suffix == QWORD_MNEM_SUFFIX)
40fb9820 5599 i.types[op].bitfield.imm32 = 0;
29b0f896 5600 break;
252b5132 5601
29b0f896
AM
5602 case O_absent:
5603 case O_register:
5604 abort ();
5605
5606 /* Symbols and expressions. */
5607 default:
9cd96992
JB
5608 /* Convert symbolic operand to proper sizes for matching, but don't
5609 prevent matching a set of insns that only supports sizes other
5610 than those matching the insn suffix. */
5611 {
40fb9820 5612 i386_operand_type mask, allowed;
d3ce72d0 5613 const insn_template *t;
9cd96992 5614
0dfbf9d7
L
5615 operand_type_set (&mask, 0);
5616 operand_type_set (&allowed, 0);
40fb9820 5617
4eed87de
AM
5618 for (t = current_templates->start;
5619 t < current_templates->end;
5620 ++t)
bab6aec1
JB
5621 {
5622 allowed = operand_type_or (allowed, t->operand_types[op]);
5623 allowed = operand_type_and (allowed, anyimm);
5624 }
9cd96992
JB
5625 switch (guess_suffix)
5626 {
5627 case QWORD_MNEM_SUFFIX:
40fb9820
L
5628 mask.bitfield.imm64 = 1;
5629 mask.bitfield.imm32s = 1;
9cd96992
JB
5630 break;
5631 case LONG_MNEM_SUFFIX:
40fb9820 5632 mask.bitfield.imm32 = 1;
9cd96992
JB
5633 break;
5634 case WORD_MNEM_SUFFIX:
40fb9820 5635 mask.bitfield.imm16 = 1;
9cd96992
JB
5636 break;
5637 case BYTE_MNEM_SUFFIX:
40fb9820 5638 mask.bitfield.imm8 = 1;
9cd96992
JB
5639 break;
5640 default:
9cd96992
JB
5641 break;
5642 }
c6fb90c8 5643 allowed = operand_type_and (mask, allowed);
0dfbf9d7 5644 if (!operand_type_all_zero (&allowed))
c6fb90c8 5645 i.types[op] = operand_type_and (i.types[op], mask);
9cd96992 5646 }
29b0f896 5647 break;
252b5132 5648 }
29b0f896
AM
5649 }
5650}
47926f60 5651
29b0f896
AM
5652/* Try to use the smallest displacement type too. */
5653static void
e3bb37b5 5654optimize_disp (void)
29b0f896
AM
5655{
5656 int op;
3e73aa7c 5657
29b0f896 5658 for (op = i.operands; --op >= 0;)
40fb9820 5659 if (operand_type_check (i.types[op], disp))
252b5132 5660 {
b300c311 5661 if (i.op[op].disps->X_op == O_constant)
252b5132 5662 {
91d6fa6a 5663 offsetT op_disp = i.op[op].disps->X_add_number;
29b0f896 5664
40fb9820 5665 if (i.types[op].bitfield.disp16
91d6fa6a 5666 && (op_disp & ~(offsetT) 0xffff) == 0)
b300c311
L
5667 {
5668 /* If this operand is at most 16 bits, convert
5669 to a signed 16 bit number and don't use 64bit
5670 displacement. */
91d6fa6a 5671 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
40fb9820 5672 i.types[op].bitfield.disp64 = 0;
b300c311 5673 }
a28def75
L
5674#ifdef BFD64
5675 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
40fb9820 5676 if (i.types[op].bitfield.disp32
91d6fa6a 5677 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
b300c311
L
5678 {
5679 /* If this operand is at most 32 bits, convert
5680 to a signed 32 bit number and don't use 64bit
5681 displacement. */
91d6fa6a
NC
5682 op_disp &= (((offsetT) 2 << 31) - 1);
5683 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
40fb9820 5684 i.types[op].bitfield.disp64 = 0;
b300c311 5685 }
a28def75 5686#endif
91d6fa6a 5687 if (!op_disp && i.types[op].bitfield.baseindex)
b300c311 5688 {
40fb9820
L
5689 i.types[op].bitfield.disp8 = 0;
5690 i.types[op].bitfield.disp16 = 0;
5691 i.types[op].bitfield.disp32 = 0;
5692 i.types[op].bitfield.disp32s = 0;
5693 i.types[op].bitfield.disp64 = 0;
b300c311
L
5694 i.op[op].disps = 0;
5695 i.disp_operands--;
5696 }
5697 else if (flag_code == CODE_64BIT)
5698 {
91d6fa6a 5699 if (fits_in_signed_long (op_disp))
28a9d8f5 5700 {
40fb9820
L
5701 i.types[op].bitfield.disp64 = 0;
5702 i.types[op].bitfield.disp32s = 1;
28a9d8f5 5703 }
0e1147d9 5704 if (i.prefix[ADDR_PREFIX]
91d6fa6a 5705 && fits_in_unsigned_long (op_disp))
40fb9820 5706 i.types[op].bitfield.disp32 = 1;
b300c311 5707 }
40fb9820
L
5708 if ((i.types[op].bitfield.disp32
5709 || i.types[op].bitfield.disp32s
5710 || i.types[op].bitfield.disp16)
b5014f7a 5711 && fits_in_disp8 (op_disp))
40fb9820 5712 i.types[op].bitfield.disp8 = 1;
252b5132 5713 }
67a4f2b7
AO
5714 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5715 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5716 {
5717 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5718 i.op[op].disps, 0, i.reloc[op]);
40fb9820
L
5719 i.types[op].bitfield.disp8 = 0;
5720 i.types[op].bitfield.disp16 = 0;
5721 i.types[op].bitfield.disp32 = 0;
5722 i.types[op].bitfield.disp32s = 0;
5723 i.types[op].bitfield.disp64 = 0;
67a4f2b7
AO
5724 }
5725 else
b300c311 5726 /* We only support 64bit displacement on constants. */
40fb9820 5727 i.types[op].bitfield.disp64 = 0;
252b5132 5728 }
29b0f896
AM
5729}
5730
4a1b91ea
L
5731/* Return 1 if there is a match in broadcast bytes between operand
5732 GIVEN and instruction template T. */
5733
5734static INLINE int
5735match_broadcast_size (const insn_template *t, unsigned int given)
5736{
5737 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5738 && i.types[given].bitfield.byte)
5739 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5740 && i.types[given].bitfield.word)
5741 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5742 && i.types[given].bitfield.dword)
5743 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5744 && i.types[given].bitfield.qword));
5745}
5746
6c30d220
L
5747/* Check if operands are valid for the instruction. */
5748
5749static int
5750check_VecOperands (const insn_template *t)
5751{
43234a1e 5752 unsigned int op;
e2195274 5753 i386_cpu_flags cpu;
e2195274
JB
5754
5755 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5756 any one operand are implicity requiring AVX512VL support if the actual
5757 operand size is YMMword or XMMword. Since this function runs after
5758 template matching, there's no need to check for YMMword/XMMword in
5759 the template. */
5760 cpu = cpu_flags_and (t->cpu_flags, avx512);
5761 if (!cpu_flags_all_zero (&cpu)
5762 && !t->cpu_flags.bitfield.cpuavx512vl
5763 && !cpu_arch_flags.bitfield.cpuavx512vl)
5764 {
5765 for (op = 0; op < t->operands; ++op)
5766 {
5767 if (t->operand_types[op].bitfield.zmmword
5768 && (i.types[op].bitfield.ymmword
5769 || i.types[op].bitfield.xmmword))
5770 {
5771 i.error = unsupported;
5772 return 1;
5773 }
5774 }
5775 }
43234a1e 5776
6c30d220 5777 /* Without VSIB byte, we can't have a vector register for index. */
63112cd6 5778 if (!t->opcode_modifier.sib
6c30d220 5779 && i.index_reg
1b54b8d7
JB
5780 && (i.index_reg->reg_type.bitfield.xmmword
5781 || i.index_reg->reg_type.bitfield.ymmword
5782 || i.index_reg->reg_type.bitfield.zmmword))
6c30d220
L
5783 {
5784 i.error = unsupported_vector_index_register;
5785 return 1;
5786 }
5787
ad8ecc81
MZ
5788 /* Check if default mask is allowed. */
5789 if (t->opcode_modifier.nodefmask
5790 && (!i.mask || i.mask->mask->reg_num == 0))
5791 {
5792 i.error = no_default_mask;
5793 return 1;
5794 }
5795
7bab8ab5
JB
5796 /* For VSIB byte, we need a vector register for index, and all vector
5797 registers must be distinct. */
63112cd6 5798 if (t->opcode_modifier.sib)
7bab8ab5
JB
5799 {
5800 if (!i.index_reg
63112cd6 5801 || !((t->opcode_modifier.sib == VECSIB128
1b54b8d7 5802 && i.index_reg->reg_type.bitfield.xmmword)
63112cd6 5803 || (t->opcode_modifier.sib == VECSIB256
1b54b8d7 5804 && i.index_reg->reg_type.bitfield.ymmword)
63112cd6 5805 || (t->opcode_modifier.sib == VECSIB512
1b54b8d7 5806 && i.index_reg->reg_type.bitfield.zmmword)))
7bab8ab5
JB
5807 {
5808 i.error = invalid_vsib_address;
5809 return 1;
5810 }
5811
43234a1e
L
5812 gas_assert (i.reg_operands == 2 || i.mask);
5813 if (i.reg_operands == 2 && !i.mask)
5814 {
3528c362 5815 gas_assert (i.types[0].bitfield.class == RegSIMD);
1b54b8d7
JB
5816 gas_assert (i.types[0].bitfield.xmmword
5817 || i.types[0].bitfield.ymmword);
3528c362 5818 gas_assert (i.types[2].bitfield.class == RegSIMD);
1b54b8d7
JB
5819 gas_assert (i.types[2].bitfield.xmmword
5820 || i.types[2].bitfield.ymmword);
43234a1e
L
5821 if (operand_check == check_none)
5822 return 0;
5823 if (register_number (i.op[0].regs)
5824 != register_number (i.index_reg)
5825 && register_number (i.op[2].regs)
5826 != register_number (i.index_reg)
5827 && register_number (i.op[0].regs)
5828 != register_number (i.op[2].regs))
5829 return 0;
5830 if (operand_check == check_error)
5831 {
5832 i.error = invalid_vector_register_set;
5833 return 1;
5834 }
5835 as_warn (_("mask, index, and destination registers should be distinct"));
5836 }
8444f82a
MZ
5837 else if (i.reg_operands == 1 && i.mask)
5838 {
3528c362 5839 if (i.types[1].bitfield.class == RegSIMD
1b54b8d7
JB
5840 && (i.types[1].bitfield.xmmword
5841 || i.types[1].bitfield.ymmword
5842 || i.types[1].bitfield.zmmword)
8444f82a
MZ
5843 && (register_number (i.op[1].regs)
5844 == register_number (i.index_reg)))
5845 {
5846 if (operand_check == check_error)
5847 {
5848 i.error = invalid_vector_register_set;
5849 return 1;
5850 }
5851 if (operand_check != check_none)
5852 as_warn (_("index and destination registers should be distinct"));
5853 }
5854 }
43234a1e 5855 }
7bab8ab5 5856
43234a1e
L
5857 /* Check if broadcast is supported by the instruction and is applied
5858 to the memory operand. */
5859 if (i.broadcast)
5860 {
8e6e0792 5861 i386_operand_type type, overlap;
43234a1e
L
5862
5863 /* Check if specified broadcast is supported in this instruction,
4a1b91ea 5864 and its broadcast bytes match the memory operand. */
32546502 5865 op = i.broadcast->operand;
8e6e0792 5866 if (!t->opcode_modifier.broadcast
c48dadc9 5867 || !(i.flags[op] & Operand_Mem)
c39e5b26 5868 || (!i.types[op].bitfield.unspecified
4a1b91ea 5869 && !match_broadcast_size (t, op)))
43234a1e
L
5870 {
5871 bad_broadcast:
5872 i.error = unsupported_broadcast;
5873 return 1;
5874 }
8e6e0792 5875
4a1b91ea
L
5876 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5877 * i.broadcast->type);
8e6e0792 5878 operand_type_set (&type, 0);
4a1b91ea 5879 switch (i.broadcast->bytes)
8e6e0792 5880 {
4a1b91ea
L
5881 case 2:
5882 type.bitfield.word = 1;
5883 break;
5884 case 4:
5885 type.bitfield.dword = 1;
5886 break;
8e6e0792
JB
5887 case 8:
5888 type.bitfield.qword = 1;
5889 break;
5890 case 16:
5891 type.bitfield.xmmword = 1;
5892 break;
5893 case 32:
5894 type.bitfield.ymmword = 1;
5895 break;
5896 case 64:
5897 type.bitfield.zmmword = 1;
5898 break;
5899 default:
5900 goto bad_broadcast;
5901 }
5902
5903 overlap = operand_type_and (type, t->operand_types[op]);
bc49bfd8
JB
5904 if (t->operand_types[op].bitfield.class == RegSIMD
5905 && t->operand_types[op].bitfield.byte
5906 + t->operand_types[op].bitfield.word
5907 + t->operand_types[op].bitfield.dword
5908 + t->operand_types[op].bitfield.qword > 1)
5909 {
5910 overlap.bitfield.xmmword = 0;
5911 overlap.bitfield.ymmword = 0;
5912 overlap.bitfield.zmmword = 0;
5913 }
8e6e0792
JB
5914 if (operand_type_all_zero (&overlap))
5915 goto bad_broadcast;
5916
5917 if (t->opcode_modifier.checkregsize)
5918 {
5919 unsigned int j;
5920
e2195274 5921 type.bitfield.baseindex = 1;
8e6e0792
JB
5922 for (j = 0; j < i.operands; ++j)
5923 {
5924 if (j != op
5925 && !operand_type_register_match(i.types[j],
5926 t->operand_types[j],
5927 type,
5928 t->operand_types[op]))
5929 goto bad_broadcast;
5930 }
5931 }
43234a1e
L
5932 }
5933 /* If broadcast is supported in this instruction, we need to check if
5934 operand of one-element size isn't specified without broadcast. */
5935 else if (t->opcode_modifier.broadcast && i.mem_operands)
5936 {
5937 /* Find memory operand. */
5938 for (op = 0; op < i.operands; op++)
8dc0818e 5939 if (i.flags[op] & Operand_Mem)
43234a1e
L
5940 break;
5941 gas_assert (op < i.operands);
5942 /* Check size of the memory operand. */
4a1b91ea 5943 if (match_broadcast_size (t, op))
43234a1e
L
5944 {
5945 i.error = broadcast_needed;
5946 return 1;
5947 }
5948 }
c39e5b26
JB
5949 else
5950 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
43234a1e
L
5951
5952 /* Check if requested masking is supported. */
ae2387fe 5953 if (i.mask)
43234a1e 5954 {
ae2387fe
JB
5955 switch (t->opcode_modifier.masking)
5956 {
5957 case BOTH_MASKING:
5958 break;
5959 case MERGING_MASKING:
5960 if (i.mask->zeroing)
5961 {
5962 case 0:
5963 i.error = unsupported_masking;
5964 return 1;
5965 }
5966 break;
5967 case DYNAMIC_MASKING:
5968 /* Memory destinations allow only merging masking. */
5969 if (i.mask->zeroing && i.mem_operands)
5970 {
5971 /* Find memory operand. */
5972 for (op = 0; op < i.operands; op++)
c48dadc9 5973 if (i.flags[op] & Operand_Mem)
ae2387fe
JB
5974 break;
5975 gas_assert (op < i.operands);
5976 if (op == i.operands - 1)
5977 {
5978 i.error = unsupported_masking;
5979 return 1;
5980 }
5981 }
5982 break;
5983 default:
5984 abort ();
5985 }
43234a1e
L
5986 }
5987
5988 /* Check if masking is applied to dest operand. */
5989 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5990 {
5991 i.error = mask_not_on_destination;
5992 return 1;
5993 }
5994
43234a1e
L
5995 /* Check RC/SAE. */
5996 if (i.rounding)
5997 {
a80195f1
JB
5998 if (!t->opcode_modifier.sae
5999 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
43234a1e
L
6000 {
6001 i.error = unsupported_rc_sae;
6002 return 1;
6003 }
6004 /* If the instruction has several immediate operands and one of
6005 them is rounding, the rounding operand should be the last
6006 immediate operand. */
6007 if (i.imm_operands > 1
6008 && i.rounding->operand != (int) (i.imm_operands - 1))
7bab8ab5 6009 {
43234a1e 6010 i.error = rc_sae_operand_not_last_imm;
7bab8ab5
JB
6011 return 1;
6012 }
6c30d220
L
6013 }
6014
da4977e0
JB
6015 /* Check the special Imm4 cases; must be the first operand. */
6016 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6017 {
6018 if (i.op[0].imms->X_op != O_constant
6019 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6020 {
6021 i.error = bad_imm4;
6022 return 1;
6023 }
6024
6025 /* Turn off Imm<N> so that update_imm won't complain. */
6026 operand_type_set (&i.types[0], 0);
6027 }
6028
43234a1e 6029 /* Check vector Disp8 operand. */
b5014f7a
JB
6030 if (t->opcode_modifier.disp8memshift
6031 && i.disp_encoding != disp_encoding_32bit)
43234a1e
L
6032 {
6033 if (i.broadcast)
4a1b91ea 6034 i.memshift = t->opcode_modifier.broadcast - 1;
7091c612 6035 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
43234a1e 6036 i.memshift = t->opcode_modifier.disp8memshift;
7091c612
JB
6037 else
6038 {
6039 const i386_operand_type *type = NULL;
6040
6041 i.memshift = 0;
6042 for (op = 0; op < i.operands; op++)
8dc0818e 6043 if (i.flags[op] & Operand_Mem)
7091c612 6044 {
4174bfff
JB
6045 if (t->opcode_modifier.evex == EVEXLIG)
6046 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6047 else if (t->operand_types[op].bitfield.xmmword
6048 + t->operand_types[op].bitfield.ymmword
6049 + t->operand_types[op].bitfield.zmmword <= 1)
7091c612
JB
6050 type = &t->operand_types[op];
6051 else if (!i.types[op].bitfield.unspecified)
6052 type = &i.types[op];
6053 }
3528c362 6054 else if (i.types[op].bitfield.class == RegSIMD
4174bfff 6055 && t->opcode_modifier.evex != EVEXLIG)
7091c612
JB
6056 {
6057 if (i.types[op].bitfield.zmmword)
6058 i.memshift = 6;
6059 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6060 i.memshift = 5;
6061 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6062 i.memshift = 4;
6063 }
6064
6065 if (type)
6066 {
6067 if (type->bitfield.zmmword)
6068 i.memshift = 6;
6069 else if (type->bitfield.ymmword)
6070 i.memshift = 5;
6071 else if (type->bitfield.xmmword)
6072 i.memshift = 4;
6073 }
6074
6075 /* For the check in fits_in_disp8(). */
6076 if (i.memshift == 0)
6077 i.memshift = -1;
6078 }
43234a1e
L
6079
6080 for (op = 0; op < i.operands; op++)
6081 if (operand_type_check (i.types[op], disp)
6082 && i.op[op].disps->X_op == O_constant)
6083 {
b5014f7a 6084 if (fits_in_disp8 (i.op[op].disps->X_add_number))
43234a1e 6085 {
b5014f7a
JB
6086 i.types[op].bitfield.disp8 = 1;
6087 return 0;
43234a1e 6088 }
b5014f7a 6089 i.types[op].bitfield.disp8 = 0;
43234a1e
L
6090 }
6091 }
b5014f7a
JB
6092
6093 i.memshift = 0;
43234a1e 6094
6c30d220
L
6095 return 0;
6096}
6097
da4977e0 6098/* Check if encoding requirements are met by the instruction. */
a683cc34
SP
6099
6100static int
da4977e0 6101VEX_check_encoding (const insn_template *t)
a683cc34 6102{
da4977e0
JB
6103 if (i.vec_encoding == vex_encoding_error)
6104 {
6105 i.error = unsupported;
6106 return 1;
6107 }
6108
86fa6981 6109 if (i.vec_encoding == vex_encoding_evex)
43234a1e 6110 {
86fa6981 6111 /* This instruction must be encoded with EVEX prefix. */
e771e7c9 6112 if (!is_evex_encoding (t))
86fa6981
L
6113 {
6114 i.error = unsupported;
6115 return 1;
6116 }
6117 return 0;
43234a1e
L
6118 }
6119
a683cc34 6120 if (!t->opcode_modifier.vex)
86fa6981
L
6121 {
6122 /* This instruction template doesn't have VEX prefix. */
6123 if (i.vec_encoding != vex_encoding_default)
6124 {
6125 i.error = unsupported;
6126 return 1;
6127 }
6128 return 0;
6129 }
a683cc34 6130
a683cc34
SP
6131 return 0;
6132}
6133
d3ce72d0 6134static const insn_template *
83b16ac6 6135match_template (char mnem_suffix)
29b0f896
AM
6136{
6137 /* Points to template once we've found it. */
d3ce72d0 6138 const insn_template *t;
40fb9820 6139 i386_operand_type overlap0, overlap1, overlap2, overlap3;
c0f3af97 6140 i386_operand_type overlap4;
29b0f896 6141 unsigned int found_reverse_match;
dc2be329 6142 i386_opcode_modifier suffix_check;
40fb9820 6143 i386_operand_type operand_types [MAX_OPERANDS];
539e75ad 6144 int addr_prefix_disp;
45a4bb20 6145 unsigned int j, size_match, check_register;
5614d22c 6146 enum i386_error specific_error = 0;
29b0f896 6147
c0f3af97
L
6148#if MAX_OPERANDS != 5
6149# error "MAX_OPERANDS must be 5."
f48ff2ae
L
6150#endif
6151
29b0f896 6152 found_reverse_match = 0;
539e75ad 6153 addr_prefix_disp = -1;
40fb9820 6154
dc2be329 6155 /* Prepare for mnemonic suffix check. */
40fb9820 6156 memset (&suffix_check, 0, sizeof (suffix_check));
dc2be329
L
6157 switch (mnem_suffix)
6158 {
6159 case BYTE_MNEM_SUFFIX:
6160 suffix_check.no_bsuf = 1;
6161 break;
6162 case WORD_MNEM_SUFFIX:
6163 suffix_check.no_wsuf = 1;
6164 break;
6165 case SHORT_MNEM_SUFFIX:
6166 suffix_check.no_ssuf = 1;
6167 break;
6168 case LONG_MNEM_SUFFIX:
6169 suffix_check.no_lsuf = 1;
6170 break;
6171 case QWORD_MNEM_SUFFIX:
6172 suffix_check.no_qsuf = 1;
6173 break;
6174 default:
6175 /* NB: In Intel syntax, normally we can check for memory operand
6176 size when there is no mnemonic suffix. But jmp and call have
6177 2 different encodings with Dword memory operand size, one with
6178 No_ldSuf and the other without. i.suffix is set to
6179 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6180 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6181 suffix_check.no_ldsuf = 1;
83b16ac6
JB
6182 }
6183
01559ecc
L
6184 /* Must have right number of operands. */
6185 i.error = number_of_operands_mismatch;
6186
45aa61fe 6187 for (t = current_templates->start; t < current_templates->end; t++)
29b0f896 6188 {
539e75ad 6189 addr_prefix_disp = -1;
dbbc8b7e 6190 found_reverse_match = 0;
539e75ad 6191
29b0f896
AM
6192 if (i.operands != t->operands)
6193 continue;
6194
50aecf8c 6195 /* Check processor support. */
a65babc9 6196 i.error = unsupported;
45a4bb20 6197 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
50aecf8c
L
6198 continue;
6199
e1d4d893 6200 /* Check AT&T mnemonic. */
a65babc9 6201 i.error = unsupported_with_intel_mnemonic;
e1d4d893 6202 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
1efbbeb4
L
6203 continue;
6204
4b5aaf5f 6205 /* Check AT&T/Intel syntax. */
a65babc9 6206 i.error = unsupported_syntax;
5c07affc 6207 if ((intel_syntax && t->opcode_modifier.attsyntax)
4b5aaf5f 6208 || (!intel_syntax && t->opcode_modifier.intelsyntax))
1efbbeb4
L
6209 continue;
6210
4b5aaf5f
L
6211 /* Check Intel64/AMD64 ISA. */
6212 switch (isa64)
6213 {
6214 default:
6215 /* Default: Don't accept Intel64. */
6216 if (t->opcode_modifier.isa64 == INTEL64)
6217 continue;
6218 break;
6219 case amd64:
6220 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6221 if (t->opcode_modifier.isa64 >= INTEL64)
6222 continue;
6223 break;
6224 case intel64:
6225 /* -mintel64: Don't accept AMD64. */
5990e377 6226 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
4b5aaf5f
L
6227 continue;
6228 break;
6229 }
6230
dc2be329 6231 /* Check the suffix. */
a65babc9 6232 i.error = invalid_instruction_suffix;
dc2be329
L
6233 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6234 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6235 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6236 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6237 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6238 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
83b16ac6 6239 continue;
29b0f896 6240
3ac21baa
JB
6241 size_match = operand_size_match (t);
6242 if (!size_match)
7d5e4556 6243 continue;
539e75ad 6244
6f2f06be
JB
6245 /* This is intentionally not
6246
0cfa3eb3 6247 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6f2f06be
JB
6248
6249 as the case of a missing * on the operand is accepted (perhaps with
6250 a warning, issued further down). */
0cfa3eb3 6251 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6f2f06be
JB
6252 {
6253 i.error = operand_type_mismatch;
6254 continue;
6255 }
6256
5c07affc
L
6257 for (j = 0; j < MAX_OPERANDS; j++)
6258 operand_types[j] = t->operand_types[j];
6259
e365e234
JB
6260 /* In general, don't allow
6261 - 64-bit operands outside of 64-bit mode,
6262 - 32-bit operands on pre-386. */
4873e243 6263 j = i.imm_operands + (t->operands > i.imm_operands + 1);
e365e234
JB
6264 if (((i.suffix == QWORD_MNEM_SUFFIX
6265 && flag_code != CODE_64BIT
6266 && (t->base_opcode != 0x0fc7
6267 || t->extension_opcode != 1 /* cmpxchg8b */))
6268 || (i.suffix == LONG_MNEM_SUFFIX
6269 && !cpu_arch_flags.bitfield.cpui386))
45aa61fe 6270 && (intel_syntax
3cd7f3e3 6271 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
45aa61fe
AM
6272 && !intel_float_operand (t->name))
6273 : intel_float_operand (t->name) != 2)
4873e243
JB
6274 && (t->operands == i.imm_operands
6275 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6276 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6277 && operand_types[i.imm_operands].bitfield.class != RegMask)
6278 || (operand_types[j].bitfield.class != RegMMX
6279 && operand_types[j].bitfield.class != RegSIMD
6280 && operand_types[j].bitfield.class != RegMask))
63112cd6 6281 && !t->opcode_modifier.sib)
192dc9c6
JB
6282 continue;
6283
29b0f896 6284 /* Do not verify operands when there are none. */
e365e234 6285 if (!t->operands)
da4977e0
JB
6286 {
6287 if (VEX_check_encoding (t))
6288 {
6289 specific_error = i.error;
6290 continue;
6291 }
6292
6293 /* We've found a match; break out of loop. */
6294 break;
6295 }
252b5132 6296
48bcea9f
JB
6297 if (!t->opcode_modifier.jump
6298 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6299 {
6300 /* There should be only one Disp operand. */
6301 for (j = 0; j < MAX_OPERANDS; j++)
6302 if (operand_type_check (operand_types[j], disp))
539e75ad 6303 break;
48bcea9f
JB
6304 if (j < MAX_OPERANDS)
6305 {
6306 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6307
6308 addr_prefix_disp = j;
6309
6310 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6311 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6312 switch (flag_code)
40fb9820 6313 {
48bcea9f
JB
6314 case CODE_16BIT:
6315 override = !override;
6316 /* Fall through. */
6317 case CODE_32BIT:
6318 if (operand_types[j].bitfield.disp32
6319 && operand_types[j].bitfield.disp16)
40fb9820 6320 {
48bcea9f
JB
6321 operand_types[j].bitfield.disp16 = override;
6322 operand_types[j].bitfield.disp32 = !override;
40fb9820 6323 }
48bcea9f
JB
6324 operand_types[j].bitfield.disp32s = 0;
6325 operand_types[j].bitfield.disp64 = 0;
6326 break;
6327
6328 case CODE_64BIT:
6329 if (operand_types[j].bitfield.disp32s
6330 || operand_types[j].bitfield.disp64)
40fb9820 6331 {
48bcea9f
JB
6332 operand_types[j].bitfield.disp64 &= !override;
6333 operand_types[j].bitfield.disp32s &= !override;
6334 operand_types[j].bitfield.disp32 = override;
40fb9820 6335 }
48bcea9f
JB
6336 operand_types[j].bitfield.disp16 = 0;
6337 break;
40fb9820 6338 }
539e75ad 6339 }
48bcea9f 6340 }
539e75ad 6341
02a86693
L
6342 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6343 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6344 continue;
6345
56ffb741 6346 /* We check register size if needed. */
e2195274
JB
6347 if (t->opcode_modifier.checkregsize)
6348 {
6349 check_register = (1 << t->operands) - 1;
6350 if (i.broadcast)
6351 check_register &= ~(1 << i.broadcast->operand);
6352 }
6353 else
6354 check_register = 0;
6355
c6fb90c8 6356 overlap0 = operand_type_and (i.types[0], operand_types[0]);
29b0f896
AM
6357 switch (t->operands)
6358 {
6359 case 1:
40fb9820 6360 if (!operand_type_match (overlap0, i.types[0]))
29b0f896
AM
6361 continue;
6362 break;
6363 case 2:
33eaf5de 6364 /* xchg %eax, %eax is a special case. It is an alias for nop
8b38ad71
L
6365 only in 32bit mode and we can use opcode 0x90. In 64bit
6366 mode, we can't use 0x90 for xchg %eax, %eax since it should
6367 zero-extend %eax to %rax. */
6368 if (flag_code == CODE_64BIT
6369 && t->base_opcode == 0x90
75e5731b
JB
6370 && i.types[0].bitfield.instance == Accum
6371 && i.types[0].bitfield.dword
6372 && i.types[1].bitfield.instance == Accum
6373 && i.types[1].bitfield.dword)
8b38ad71 6374 continue;
1212781b
JB
6375 /* xrelease mov %eax, <disp> is another special case. It must not
6376 match the accumulator-only encoding of mov. */
6377 if (flag_code != CODE_64BIT
6378 && i.hle_prefix
6379 && t->base_opcode == 0xa0
75e5731b 6380 && i.types[0].bitfield.instance == Accum
8dc0818e 6381 && (i.flags[1] & Operand_Mem))
1212781b 6382 continue;
f5eb1d70
JB
6383 /* Fall through. */
6384
6385 case 3:
3ac21baa
JB
6386 if (!(size_match & MATCH_STRAIGHT))
6387 goto check_reverse;
64c49ab3
JB
6388 /* Reverse direction of operands if swapping is possible in the first
6389 place (operands need to be symmetric) and
6390 - the load form is requested, and the template is a store form,
6391 - the store form is requested, and the template is a load form,
6392 - the non-default (swapped) form is requested. */
6393 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
f5eb1d70 6394 if (t->opcode_modifier.d && i.reg_operands == i.operands
64c49ab3
JB
6395 && !operand_type_all_zero (&overlap1))
6396 switch (i.dir_encoding)
6397 {
6398 case dir_encoding_load:
6399 if (operand_type_check (operand_types[i.operands - 1], anymem)
dfd69174 6400 || t->opcode_modifier.regmem)
64c49ab3
JB
6401 goto check_reverse;
6402 break;
6403
6404 case dir_encoding_store:
6405 if (!operand_type_check (operand_types[i.operands - 1], anymem)
dfd69174 6406 && !t->opcode_modifier.regmem)
64c49ab3
JB
6407 goto check_reverse;
6408 break;
6409
6410 case dir_encoding_swap:
6411 goto check_reverse;
6412
6413 case dir_encoding_default:
6414 break;
6415 }
86fa6981 6416 /* If we want store form, we skip the current load. */
64c49ab3
JB
6417 if ((i.dir_encoding == dir_encoding_store
6418 || i.dir_encoding == dir_encoding_swap)
86fa6981
L
6419 && i.mem_operands == 0
6420 && t->opcode_modifier.load)
fa99fab2 6421 continue;
1a0670f3 6422 /* Fall through. */
f48ff2ae 6423 case 4:
c0f3af97 6424 case 5:
c6fb90c8 6425 overlap1 = operand_type_and (i.types[1], operand_types[1]);
40fb9820
L
6426 if (!operand_type_match (overlap0, i.types[0])
6427 || !operand_type_match (overlap1, i.types[1])
e2195274 6428 || ((check_register & 3) == 3
dc821c5f 6429 && !operand_type_register_match (i.types[0],
40fb9820 6430 operand_types[0],
dc821c5f 6431 i.types[1],
40fb9820 6432 operand_types[1])))
29b0f896
AM
6433 {
6434 /* Check if other direction is valid ... */
38e314eb 6435 if (!t->opcode_modifier.d)
29b0f896
AM
6436 continue;
6437
dc1e8a47 6438 check_reverse:
3ac21baa
JB
6439 if (!(size_match & MATCH_REVERSE))
6440 continue;
29b0f896 6441 /* Try reversing direction of operands. */
f5eb1d70
JB
6442 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6443 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
40fb9820 6444 if (!operand_type_match (overlap0, i.types[0])
f5eb1d70 6445 || !operand_type_match (overlap1, i.types[i.operands - 1])
45664ddb 6446 || (check_register
dc821c5f 6447 && !operand_type_register_match (i.types[0],
f5eb1d70
JB
6448 operand_types[i.operands - 1],
6449 i.types[i.operands - 1],
45664ddb 6450 operand_types[0])))
29b0f896
AM
6451 {
6452 /* Does not match either direction. */
6453 continue;
6454 }
38e314eb 6455 /* found_reverse_match holds which of D or FloatR
29b0f896 6456 we've found. */
38e314eb
JB
6457 if (!t->opcode_modifier.d)
6458 found_reverse_match = 0;
6459 else if (operand_types[0].bitfield.tbyte)
8a2ed489 6460 found_reverse_match = Opcode_FloatD;
dbbc8b7e 6461 else if (operand_types[0].bitfield.xmmword
f5eb1d70 6462 || operand_types[i.operands - 1].bitfield.xmmword
3528c362
JB
6463 || operand_types[0].bitfield.class == RegMMX
6464 || operand_types[i.operands - 1].bitfield.class == RegMMX
dbbc8b7e
JB
6465 || is_any_vex_encoding(t))
6466 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6467 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
8a2ed489 6468 else
38e314eb 6469 found_reverse_match = Opcode_D;
40fb9820 6470 if (t->opcode_modifier.floatr)
8a2ed489 6471 found_reverse_match |= Opcode_FloatR;
29b0f896 6472 }
f48ff2ae 6473 else
29b0f896 6474 {
f48ff2ae 6475 /* Found a forward 2 operand match here. */
d1cbb4db
L
6476 switch (t->operands)
6477 {
c0f3af97
L
6478 case 5:
6479 overlap4 = operand_type_and (i.types[4],
6480 operand_types[4]);
1a0670f3 6481 /* Fall through. */
d1cbb4db 6482 case 4:
c6fb90c8
L
6483 overlap3 = operand_type_and (i.types[3],
6484 operand_types[3]);
1a0670f3 6485 /* Fall through. */
d1cbb4db 6486 case 3:
c6fb90c8
L
6487 overlap2 = operand_type_and (i.types[2],
6488 operand_types[2]);
d1cbb4db
L
6489 break;
6490 }
29b0f896 6491
f48ff2ae
L
6492 switch (t->operands)
6493 {
c0f3af97
L
6494 case 5:
6495 if (!operand_type_match (overlap4, i.types[4])
dc821c5f 6496 || !operand_type_register_match (i.types[3],
c0f3af97 6497 operand_types[3],
c0f3af97
L
6498 i.types[4],
6499 operand_types[4]))
6500 continue;
1a0670f3 6501 /* Fall through. */
f48ff2ae 6502 case 4:
40fb9820 6503 if (!operand_type_match (overlap3, i.types[3])
e2195274
JB
6504 || ((check_register & 0xa) == 0xa
6505 && !operand_type_register_match (i.types[1],
f7768225
JB
6506 operand_types[1],
6507 i.types[3],
e2195274
JB
6508 operand_types[3]))
6509 || ((check_register & 0xc) == 0xc
6510 && !operand_type_register_match (i.types[2],
6511 operand_types[2],
6512 i.types[3],
6513 operand_types[3])))
f48ff2ae 6514 continue;
1a0670f3 6515 /* Fall through. */
f48ff2ae
L
6516 case 3:
6517 /* Here we make use of the fact that there are no
23e42951 6518 reverse match 3 operand instructions. */
40fb9820 6519 if (!operand_type_match (overlap2, i.types[2])
e2195274
JB
6520 || ((check_register & 5) == 5
6521 && !operand_type_register_match (i.types[0],
23e42951
JB
6522 operand_types[0],
6523 i.types[2],
e2195274
JB
6524 operand_types[2]))
6525 || ((check_register & 6) == 6
6526 && !operand_type_register_match (i.types[1],
6527 operand_types[1],
6528 i.types[2],
6529 operand_types[2])))
f48ff2ae
L
6530 continue;
6531 break;
6532 }
29b0f896 6533 }
f48ff2ae 6534 /* Found either forward/reverse 2, 3 or 4 operand match here:
29b0f896
AM
6535 slip through to break. */
6536 }
c0f3af97 6537
da4977e0
JB
6538 /* Check if vector operands are valid. */
6539 if (check_VecOperands (t))
6540 {
6541 specific_error = i.error;
6542 continue;
6543 }
6544
6545 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6546 if (VEX_check_encoding (t))
5614d22c
JB
6547 {
6548 specific_error = i.error;
6549 continue;
6550 }
a683cc34 6551
29b0f896
AM
6552 /* We've found a match; break out of loop. */
6553 break;
6554 }
6555
6556 if (t == current_templates->end)
6557 {
6558 /* We found no match. */
a65babc9 6559 const char *err_msg;
5614d22c 6560 switch (specific_error ? specific_error : i.error)
a65babc9
L
6561 {
6562 default:
6563 abort ();
86e026a4 6564 case operand_size_mismatch:
a65babc9
L
6565 err_msg = _("operand size mismatch");
6566 break;
6567 case operand_type_mismatch:
6568 err_msg = _("operand type mismatch");
6569 break;
6570 case register_type_mismatch:
6571 err_msg = _("register type mismatch");
6572 break;
6573 case number_of_operands_mismatch:
6574 err_msg = _("number of operands mismatch");
6575 break;
6576 case invalid_instruction_suffix:
6577 err_msg = _("invalid instruction suffix");
6578 break;
6579 case bad_imm4:
4a2608e3 6580 err_msg = _("constant doesn't fit in 4 bits");
a65babc9 6581 break;
a65babc9
L
6582 case unsupported_with_intel_mnemonic:
6583 err_msg = _("unsupported with Intel mnemonic");
6584 break;
6585 case unsupported_syntax:
6586 err_msg = _("unsupported syntax");
6587 break;
6588 case unsupported:
35262a23 6589 as_bad (_("unsupported instruction `%s'"),
10efe3f6
L
6590 current_templates->start->name);
6591 return NULL;
6c30d220
L
6592 case invalid_vsib_address:
6593 err_msg = _("invalid VSIB address");
6594 break;
7bab8ab5
JB
6595 case invalid_vector_register_set:
6596 err_msg = _("mask, index, and destination registers must be distinct");
6597 break;
6c30d220
L
6598 case unsupported_vector_index_register:
6599 err_msg = _("unsupported vector index register");
6600 break;
43234a1e
L
6601 case unsupported_broadcast:
6602 err_msg = _("unsupported broadcast");
6603 break;
43234a1e
L
6604 case broadcast_needed:
6605 err_msg = _("broadcast is needed for operand of such type");
6606 break;
6607 case unsupported_masking:
6608 err_msg = _("unsupported masking");
6609 break;
6610 case mask_not_on_destination:
6611 err_msg = _("mask not on destination operand");
6612 break;
6613 case no_default_mask:
6614 err_msg = _("default mask isn't allowed");
6615 break;
6616 case unsupported_rc_sae:
6617 err_msg = _("unsupported static rounding/sae");
6618 break;
6619 case rc_sae_operand_not_last_imm:
6620 if (intel_syntax)
6621 err_msg = _("RC/SAE operand must precede immediate operands");
6622 else
6623 err_msg = _("RC/SAE operand must follow immediate operands");
6624 break;
6625 case invalid_register_operand:
6626 err_msg = _("invalid register operand");
6627 break;
a65babc9
L
6628 }
6629 as_bad (_("%s for `%s'"), err_msg,
891edac4 6630 current_templates->start->name);
fa99fab2 6631 return NULL;
29b0f896 6632 }
252b5132 6633
29b0f896
AM
6634 if (!quiet_warnings)
6635 {
6636 if (!intel_syntax
0cfa3eb3 6637 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6f2f06be 6638 as_warn (_("indirect %s without `*'"), t->name);
29b0f896 6639
40fb9820 6640 if (t->opcode_modifier.isprefix
3cd7f3e3 6641 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
29b0f896
AM
6642 {
6643 /* Warn them that a data or address size prefix doesn't
6644 affect assembly of the next line of code. */
6645 as_warn (_("stand-alone `%s' prefix"), t->name);
6646 }
6647 }
6648
6649 /* Copy the template we found. */
6650 i.tm = *t;
539e75ad
L
6651
6652 if (addr_prefix_disp != -1)
6653 i.tm.operand_types[addr_prefix_disp]
6654 = operand_types[addr_prefix_disp];
6655
29b0f896
AM
6656 if (found_reverse_match)
6657 {
dfd69174
JB
6658 /* If we found a reverse match we must alter the opcode direction
6659 bit and clear/flip the regmem modifier one. found_reverse_match
6660 holds bits to change (different for int & float insns). */
29b0f896
AM
6661
6662 i.tm.base_opcode ^= found_reverse_match;
6663
f5eb1d70
JB
6664 i.tm.operand_types[0] = operand_types[i.operands - 1];
6665 i.tm.operand_types[i.operands - 1] = operand_types[0];
dfd69174
JB
6666
6667 /* Certain SIMD insns have their load forms specified in the opcode
6668 table, and hence we need to _set_ RegMem instead of clearing it.
6669 We need to avoid setting the bit though on insns like KMOVW. */
6670 i.tm.opcode_modifier.regmem
6671 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6672 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6673 && !i.tm.opcode_modifier.regmem;
29b0f896
AM
6674 }
6675
fa99fab2 6676 return t;
29b0f896
AM
6677}
6678
6679static int
e3bb37b5 6680check_string (void)
29b0f896 6681{
51c8edf6
JB
6682 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6683 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
8dc0818e 6684
51c8edf6 6685 if (i.seg[op] != NULL && i.seg[op] != &es)
29b0f896 6686 {
51c8edf6
JB
6687 as_bad (_("`%s' operand %u must use `%ses' segment"),
6688 i.tm.name,
6689 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6690 register_prefix);
6691 return 0;
29b0f896 6692 }
51c8edf6
JB
6693
6694 /* There's only ever one segment override allowed per instruction.
6695 This instruction possibly has a legal segment override on the
6696 second operand, so copy the segment to where non-string
6697 instructions store it, allowing common code. */
6698 i.seg[op] = i.seg[1];
6699
29b0f896
AM
6700 return 1;
6701}
6702
6703static int
543613e9 6704process_suffix (void)
29b0f896
AM
6705{
6706 /* If matched instruction specifies an explicit instruction mnemonic
6707 suffix, use it. */
673fe0f0 6708 if (i.tm.opcode_modifier.size == SIZE16)
40fb9820 6709 i.suffix = WORD_MNEM_SUFFIX;
673fe0f0 6710 else if (i.tm.opcode_modifier.size == SIZE32)
40fb9820 6711 i.suffix = LONG_MNEM_SUFFIX;
673fe0f0 6712 else if (i.tm.opcode_modifier.size == SIZE64)
40fb9820 6713 i.suffix = QWORD_MNEM_SUFFIX;
13e600d0 6714 else if (i.reg_operands
c8f8eebc
JB
6715 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6716 && !i.tm.opcode_modifier.addrprefixopreg)
29b0f896 6717 {
65fca059
JB
6718 unsigned int numop = i.operands;
6719
6720 /* movsx/movzx want only their source operand considered here, for the
6721 ambiguity checking below. The suffix will be replaced afterwards
6722 to represent the destination (register). */
6723 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6724 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6725 --i.operands;
6726
643bb870
JB
6727 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6728 if (i.tm.base_opcode == 0xf20f38f0
6729 && i.tm.operand_types[1].bitfield.qword)
6730 i.rex |= REX_W;
6731
29b0f896 6732 /* If there's no instruction mnemonic suffix we try to invent one
13e600d0 6733 based on GPR operands. */
29b0f896
AM
6734 if (!i.suffix)
6735 {
6736 /* We take i.suffix from the last register operand specified,
6737 Destination register type is more significant than source
381d071f
L
6738 register type. crc32 in SSE4.2 prefers source register
6739 type. */
1a035124 6740 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
20592a94 6741
1a035124
JB
6742 while (op--)
6743 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6744 || i.tm.operand_types[op].bitfield.instance == Accum)
6745 {
6746 if (i.types[op].bitfield.class != Reg)
6747 continue;
6748 if (i.types[op].bitfield.byte)
6749 i.suffix = BYTE_MNEM_SUFFIX;
6750 else if (i.types[op].bitfield.word)
6751 i.suffix = WORD_MNEM_SUFFIX;
6752 else if (i.types[op].bitfield.dword)
6753 i.suffix = LONG_MNEM_SUFFIX;
6754 else if (i.types[op].bitfield.qword)
6755 i.suffix = QWORD_MNEM_SUFFIX;
6756 else
6757 continue;
6758 break;
6759 }
65fca059
JB
6760
6761 /* As an exception, movsx/movzx silently default to a byte source
6762 in AT&T mode. */
6763 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6764 && !i.suffix && !intel_syntax)
6765 i.suffix = BYTE_MNEM_SUFFIX;
29b0f896
AM
6766 }
6767 else if (i.suffix == BYTE_MNEM_SUFFIX)
6768 {
2eb952a4 6769 if (intel_syntax
3cd7f3e3 6770 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
2eb952a4
L
6771 && i.tm.opcode_modifier.no_bsuf)
6772 i.suffix = 0;
6773 else if (!check_byte_reg ())
29b0f896
AM
6774 return 0;
6775 }
6776 else if (i.suffix == LONG_MNEM_SUFFIX)
6777 {
2eb952a4 6778 if (intel_syntax
3cd7f3e3 6779 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
9f123b91
JB
6780 && i.tm.opcode_modifier.no_lsuf
6781 && !i.tm.opcode_modifier.todword
6782 && !i.tm.opcode_modifier.toqword)
2eb952a4
L
6783 i.suffix = 0;
6784 else if (!check_long_reg ())
29b0f896
AM
6785 return 0;
6786 }
6787 else if (i.suffix == QWORD_MNEM_SUFFIX)
6788 {
955e1e6a 6789 if (intel_syntax
3cd7f3e3 6790 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
9f123b91
JB
6791 && i.tm.opcode_modifier.no_qsuf
6792 && !i.tm.opcode_modifier.todword
6793 && !i.tm.opcode_modifier.toqword)
955e1e6a
L
6794 i.suffix = 0;
6795 else if (!check_qword_reg ())
29b0f896
AM
6796 return 0;
6797 }
6798 else if (i.suffix == WORD_MNEM_SUFFIX)
6799 {
2eb952a4 6800 if (intel_syntax
3cd7f3e3 6801 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
2eb952a4
L
6802 && i.tm.opcode_modifier.no_wsuf)
6803 i.suffix = 0;
6804 else if (!check_word_reg ())
29b0f896
AM
6805 return 0;
6806 }
3cd7f3e3
L
6807 else if (intel_syntax
6808 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
29b0f896
AM
6809 /* Do nothing if the instruction is going to ignore the prefix. */
6810 ;
6811 else
6812 abort ();
65fca059
JB
6813
6814 /* Undo the movsx/movzx change done above. */
6815 i.operands = numop;
29b0f896 6816 }
3cd7f3e3
L
6817 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6818 && !i.suffix)
29b0f896 6819 {
13e600d0
JB
6820 i.suffix = stackop_size;
6821 if (stackop_size == LONG_MNEM_SUFFIX)
06f74c5c
L
6822 {
6823 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6824 .code16gcc directive to support 16-bit mode with
6825 32-bit address. For IRET without a suffix, generate
6826 16-bit IRET (opcode 0xcf) to return from an interrupt
6827 handler. */
13e600d0
JB
6828 if (i.tm.base_opcode == 0xcf)
6829 {
6830 i.suffix = WORD_MNEM_SUFFIX;
6831 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6832 }
6833 /* Warn about changed behavior for segment register push/pop. */
6834 else if ((i.tm.base_opcode | 1) == 0x07)
6835 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6836 i.tm.name);
06f74c5c 6837 }
29b0f896 6838 }
c006a730 6839 else if (!i.suffix
0cfa3eb3
JB
6840 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6841 || i.tm.opcode_modifier.jump == JUMP_BYTE
6842 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
64e74474
AM
6843 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6844 && i.tm.extension_opcode <= 3)))
9306ca4a
JB
6845 {
6846 switch (flag_code)
6847 {
6848 case CODE_64BIT:
40fb9820 6849 if (!i.tm.opcode_modifier.no_qsuf)
9306ca4a 6850 {
828c2a25
JB
6851 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6852 || i.tm.opcode_modifier.no_lsuf)
6853 i.suffix = QWORD_MNEM_SUFFIX;
9306ca4a
JB
6854 break;
6855 }
1a0670f3 6856 /* Fall through. */
9306ca4a 6857 case CODE_32BIT:
40fb9820 6858 if (!i.tm.opcode_modifier.no_lsuf)
9306ca4a
JB
6859 i.suffix = LONG_MNEM_SUFFIX;
6860 break;
6861 case CODE_16BIT:
40fb9820 6862 if (!i.tm.opcode_modifier.no_wsuf)
9306ca4a
JB
6863 i.suffix = WORD_MNEM_SUFFIX;
6864 break;
6865 }
6866 }
252b5132 6867
c006a730 6868 if (!i.suffix
3cd7f3e3 6869 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
873494c8
JB
6870 /* Also cover lret/retf/iret in 64-bit mode. */
6871 || (flag_code == CODE_64BIT
6872 && !i.tm.opcode_modifier.no_lsuf
6873 && !i.tm.opcode_modifier.no_qsuf))
3cd7f3e3 6874 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
8bbb3ad8
JB
6875 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6876 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
62b3f548
JB
6877 /* Accept FLDENV et al without suffix. */
6878 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
29b0f896 6879 {
6c0946d0 6880 unsigned int suffixes, evex = 0;
c006a730
JB
6881
6882 suffixes = !i.tm.opcode_modifier.no_bsuf;
6883 if (!i.tm.opcode_modifier.no_wsuf)
6884 suffixes |= 1 << 1;
6885 if (!i.tm.opcode_modifier.no_lsuf)
6886 suffixes |= 1 << 2;
6887 if (!i.tm.opcode_modifier.no_ldsuf)
6888 suffixes |= 1 << 3;
6889 if (!i.tm.opcode_modifier.no_ssuf)
6890 suffixes |= 1 << 4;
6891 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6892 suffixes |= 1 << 5;
6893
6c0946d0
JB
6894 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6895 also suitable for AT&T syntax mode, it was requested that this be
6896 restricted to just Intel syntax. */
b9915cbc 6897 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6c0946d0 6898 {
b9915cbc 6899 unsigned int op;
6c0946d0 6900
b9915cbc 6901 for (op = 0; op < i.tm.operands; ++op)
6c0946d0 6902 {
b9915cbc
JB
6903 if (is_evex_encoding (&i.tm)
6904 && !cpu_arch_flags.bitfield.cpuavx512vl)
6c0946d0 6905 {
b9915cbc
JB
6906 if (i.tm.operand_types[op].bitfield.ymmword)
6907 i.tm.operand_types[op].bitfield.xmmword = 0;
6908 if (i.tm.operand_types[op].bitfield.zmmword)
6909 i.tm.operand_types[op].bitfield.ymmword = 0;
6910 if (!i.tm.opcode_modifier.evex
6911 || i.tm.opcode_modifier.evex == EVEXDYN)
6912 i.tm.opcode_modifier.evex = EVEX512;
6913 }
6c0946d0 6914
b9915cbc
JB
6915 if (i.tm.operand_types[op].bitfield.xmmword
6916 + i.tm.operand_types[op].bitfield.ymmword
6917 + i.tm.operand_types[op].bitfield.zmmword < 2)
6918 continue;
6c0946d0 6919
b9915cbc
JB
6920 /* Any properly sized operand disambiguates the insn. */
6921 if (i.types[op].bitfield.xmmword
6922 || i.types[op].bitfield.ymmword
6923 || i.types[op].bitfield.zmmword)
6924 {
6925 suffixes &= ~(7 << 6);
6926 evex = 0;
6927 break;
6928 }
6c0946d0 6929
b9915cbc
JB
6930 if ((i.flags[op] & Operand_Mem)
6931 && i.tm.operand_types[op].bitfield.unspecified)
6932 {
6933 if (i.tm.operand_types[op].bitfield.xmmword)
6934 suffixes |= 1 << 6;
6935 if (i.tm.operand_types[op].bitfield.ymmword)
6936 suffixes |= 1 << 7;
6937 if (i.tm.operand_types[op].bitfield.zmmword)
6938 suffixes |= 1 << 8;
6939 if (is_evex_encoding (&i.tm))
6940 evex = EVEX512;
6c0946d0
JB
6941 }
6942 }
6943 }
6944
6945 /* Are multiple suffixes / operand sizes allowed? */
c006a730 6946 if (suffixes & (suffixes - 1))
9306ca4a 6947 {
873494c8 6948 if (intel_syntax
3cd7f3e3 6949 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
873494c8 6950 || operand_check == check_error))
9306ca4a 6951 {
c006a730 6952 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
9306ca4a
JB
6953 return 0;
6954 }
c006a730 6955 if (operand_check == check_error)
9306ca4a 6956 {
c006a730
JB
6957 as_bad (_("no instruction mnemonic suffix given and "
6958 "no register operands; can't size `%s'"), i.tm.name);
9306ca4a
JB
6959 return 0;
6960 }
c006a730 6961 if (operand_check == check_warning)
873494c8
JB
6962 as_warn (_("%s; using default for `%s'"),
6963 intel_syntax
6964 ? _("ambiguous operand size")
6965 : _("no instruction mnemonic suffix given and "
6966 "no register operands"),
6967 i.tm.name);
c006a730
JB
6968
6969 if (i.tm.opcode_modifier.floatmf)
6970 i.suffix = SHORT_MNEM_SUFFIX;
65fca059
JB
6971 else if ((i.tm.base_opcode | 8) == 0xfbe
6972 || (i.tm.base_opcode == 0x63
6973 && i.tm.cpu_flags.bitfield.cpu64))
6974 /* handled below */;
6c0946d0
JB
6975 else if (evex)
6976 i.tm.opcode_modifier.evex = evex;
c006a730
JB
6977 else if (flag_code == CODE_16BIT)
6978 i.suffix = WORD_MNEM_SUFFIX;
1a035124 6979 else if (!i.tm.opcode_modifier.no_lsuf)
c006a730 6980 i.suffix = LONG_MNEM_SUFFIX;
1a035124
JB
6981 else
6982 i.suffix = QWORD_MNEM_SUFFIX;
9306ca4a 6983 }
29b0f896 6984 }
252b5132 6985
65fca059
JB
6986 if ((i.tm.base_opcode | 8) == 0xfbe
6987 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6988 {
6989 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6990 In AT&T syntax, if there is no suffix (warned about above), the default
6991 will be byte extension. */
6992 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6993 i.tm.base_opcode |= 1;
6994
6995 /* For further processing, the suffix should represent the destination
6996 (register). This is already the case when one was used with
6997 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6998 no suffix to begin with. */
6999 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7000 {
7001 if (i.types[1].bitfield.word)
7002 i.suffix = WORD_MNEM_SUFFIX;
7003 else if (i.types[1].bitfield.qword)
7004 i.suffix = QWORD_MNEM_SUFFIX;
7005 else
7006 i.suffix = LONG_MNEM_SUFFIX;
7007
7008 i.tm.opcode_modifier.w = 0;
7009 }
7010 }
7011
50128d0c
JB
7012 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7013 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7014 != (i.tm.operand_types[1].bitfield.class == Reg);
7015
d2224064
JB
7016 /* Change the opcode based on the operand size given by i.suffix. */
7017 switch (i.suffix)
29b0f896 7018 {
d2224064
JB
7019 /* Size floating point instruction. */
7020 case LONG_MNEM_SUFFIX:
7021 if (i.tm.opcode_modifier.floatmf)
7022 {
7023 i.tm.base_opcode ^= 4;
7024 break;
7025 }
7026 /* fall through */
7027 case WORD_MNEM_SUFFIX:
7028 case QWORD_MNEM_SUFFIX:
29b0f896 7029 /* It's not a byte, select word/dword operation. */
40fb9820 7030 if (i.tm.opcode_modifier.w)
29b0f896 7031 {
50128d0c 7032 if (i.short_form)
29b0f896
AM
7033 i.tm.base_opcode |= 8;
7034 else
7035 i.tm.base_opcode |= 1;
7036 }
d2224064
JB
7037 /* fall through */
7038 case SHORT_MNEM_SUFFIX:
29b0f896
AM
7039 /* Now select between word & dword operations via the operand
7040 size prefix, except for instructions that will ignore this
7041 prefix anyway. */
c8f8eebc 7042 if (i.suffix != QWORD_MNEM_SUFFIX
3cd7f3e3 7043 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
c8f8eebc
JB
7044 && !i.tm.opcode_modifier.floatmf
7045 && !is_any_vex_encoding (&i.tm)
7046 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7047 || (flag_code == CODE_64BIT
7048 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
24eab124
AM
7049 {
7050 unsigned int prefix = DATA_PREFIX_OPCODE;
543613e9 7051
0cfa3eb3 7052 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
29b0f896 7053 prefix = ADDR_PREFIX_OPCODE;
252b5132 7054
29b0f896
AM
7055 if (!add_prefix (prefix))
7056 return 0;
24eab124 7057 }
252b5132 7058
29b0f896
AM
7059 /* Set mode64 for an operand. */
7060 if (i.suffix == QWORD_MNEM_SUFFIX
9146926a 7061 && flag_code == CODE_64BIT
d2224064 7062 && !i.tm.opcode_modifier.norex64
4ed21b58 7063 && !i.tm.opcode_modifier.vexw
46e883c5 7064 /* Special case for xchg %rax,%rax. It is NOP and doesn't
d2224064
JB
7065 need rex64. */
7066 && ! (i.operands == 2
7067 && i.tm.base_opcode == 0x90
7068 && i.tm.extension_opcode == None
75e5731b
JB
7069 && i.types[0].bitfield.instance == Accum
7070 && i.types[0].bitfield.qword
7071 && i.types[1].bitfield.instance == Accum
7072 && i.types[1].bitfield.qword))
d2224064 7073 i.rex |= REX_W;
3e73aa7c 7074
d2224064 7075 break;
8bbb3ad8
JB
7076
7077 case 0:
7078 /* Select word/dword/qword operation with explict data sizing prefix
7079 when there are no suitable register operands. */
7080 if (i.tm.opcode_modifier.w
7081 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7082 && (!i.reg_operands
7083 || (i.reg_operands == 1
7084 /* ShiftCount */
7085 && (i.tm.operand_types[0].bitfield.instance == RegC
7086 /* InOutPortReg */
7087 || i.tm.operand_types[0].bitfield.instance == RegD
7088 || i.tm.operand_types[1].bitfield.instance == RegD
7089 /* CRC32 */
7090 || i.tm.base_opcode == 0xf20f38f0))))
7091 i.tm.base_opcode |= 1;
7092 break;
29b0f896 7093 }
7ecd2f8b 7094
c8f8eebc 7095 if (i.tm.opcode_modifier.addrprefixopreg)
c0a30a9f 7096 {
c8f8eebc
JB
7097 gas_assert (!i.suffix);
7098 gas_assert (i.reg_operands);
c0a30a9f 7099
c8f8eebc
JB
7100 if (i.tm.operand_types[0].bitfield.instance == Accum
7101 || i.operands == 1)
7102 {
7103 /* The address size override prefix changes the size of the
7104 first operand. */
7105 if (flag_code == CODE_64BIT
7106 && i.op[0].regs->reg_type.bitfield.word)
7107 {
7108 as_bad (_("16-bit addressing unavailable for `%s'"),
7109 i.tm.name);
7110 return 0;
7111 }
7112
7113 if ((flag_code == CODE_32BIT
7114 ? i.op[0].regs->reg_type.bitfield.word
7115 : i.op[0].regs->reg_type.bitfield.dword)
7116 && !add_prefix (ADDR_PREFIX_OPCODE))
7117 return 0;
7118 }
c0a30a9f
L
7119 else
7120 {
c8f8eebc
JB
7121 /* Check invalid register operand when the address size override
7122 prefix changes the size of register operands. */
7123 unsigned int op;
7124 enum { need_word, need_dword, need_qword } need;
7125
7126 if (flag_code == CODE_32BIT)
7127 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7128 else if (i.prefix[ADDR_PREFIX])
c0a30a9f
L
7129 need = need_dword;
7130 else
7131 need = flag_code == CODE_64BIT ? need_qword : need_word;
c0a30a9f 7132
c8f8eebc
JB
7133 for (op = 0; op < i.operands; op++)
7134 {
7135 if (i.types[op].bitfield.class != Reg)
7136 continue;
7137
7138 switch (need)
7139 {
7140 case need_word:
7141 if (i.op[op].regs->reg_type.bitfield.word)
7142 continue;
7143 break;
7144 case need_dword:
7145 if (i.op[op].regs->reg_type.bitfield.dword)
7146 continue;
7147 break;
7148 case need_qword:
7149 if (i.op[op].regs->reg_type.bitfield.qword)
7150 continue;
7151 break;
7152 }
7153
7154 as_bad (_("invalid register operand size for `%s'"),
7155 i.tm.name);
7156 return 0;
7157 }
7158 }
c0a30a9f
L
7159 }
7160
29b0f896
AM
7161 return 1;
7162}
3e73aa7c 7163
29b0f896 7164static int
543613e9 7165check_byte_reg (void)
29b0f896
AM
7166{
7167 int op;
543613e9 7168
29b0f896
AM
7169 for (op = i.operands; --op >= 0;)
7170 {
dc821c5f 7171 /* Skip non-register operands. */
bab6aec1 7172 if (i.types[op].bitfield.class != Reg)
dc821c5f
JB
7173 continue;
7174
29b0f896
AM
7175 /* If this is an eight bit register, it's OK. If it's the 16 or
7176 32 bit version of an eight bit register, we will just use the
7177 low portion, and that's OK too. */
dc821c5f 7178 if (i.types[op].bitfield.byte)
29b0f896
AM
7179 continue;
7180
5a819eb9 7181 /* I/O port address operands are OK too. */
75e5731b
JB
7182 if (i.tm.operand_types[op].bitfield.instance == RegD
7183 && i.tm.operand_types[op].bitfield.word)
5a819eb9
JB
7184 continue;
7185
9706160a
JB
7186 /* crc32 only wants its source operand checked here. */
7187 if (i.tm.base_opcode == 0xf20f38f0 && op)
9344ff29
L
7188 continue;
7189
29b0f896 7190 /* Any other register is bad. */
73c76375
JB
7191 as_bad (_("`%s%s' not allowed with `%s%c'"),
7192 register_prefix, i.op[op].regs->reg_name,
7193 i.tm.name, i.suffix);
7194 return 0;
29b0f896
AM
7195 }
7196 return 1;
7197}
7198
7199static int
e3bb37b5 7200check_long_reg (void)
29b0f896
AM
7201{
7202 int op;
7203
7204 for (op = i.operands; --op >= 0;)
dc821c5f 7205 /* Skip non-register operands. */
bab6aec1 7206 if (i.types[op].bitfield.class != Reg)
dc821c5f 7207 continue;
29b0f896
AM
7208 /* Reject eight bit registers, except where the template requires
7209 them. (eg. movzb) */
dc821c5f 7210 else if (i.types[op].bitfield.byte
bab6aec1 7211 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7212 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7213 && (i.tm.operand_types[op].bitfield.word
7214 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7215 {
a540244d
L
7216 as_bad (_("`%s%s' not allowed with `%s%c'"),
7217 register_prefix,
29b0f896
AM
7218 i.op[op].regs->reg_name,
7219 i.tm.name,
7220 i.suffix);
7221 return 0;
7222 }
be4c5e58
L
7223 /* Error if the e prefix on a general reg is missing. */
7224 else if (i.types[op].bitfield.word
bab6aec1 7225 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7226 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7227 && i.tm.operand_types[op].bitfield.dword)
29b0f896 7228 {
be4c5e58
L
7229 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7230 register_prefix, i.op[op].regs->reg_name,
7231 i.suffix);
7232 return 0;
252b5132 7233 }
e4630f71 7234 /* Warn if the r prefix on a general reg is present. */
dc821c5f 7235 else if (i.types[op].bitfield.qword
bab6aec1 7236 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7237 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7238 && i.tm.operand_types[op].bitfield.dword)
252b5132 7239 {
34828aad 7240 if (intel_syntax
65fca059 7241 && i.tm.opcode_modifier.toqword
3528c362 7242 && i.types[0].bitfield.class != RegSIMD)
34828aad 7243 {
ca61edf2 7244 /* Convert to QWORD. We want REX byte. */
34828aad
L
7245 i.suffix = QWORD_MNEM_SUFFIX;
7246 }
7247 else
7248 {
2b5d6a91 7249 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
34828aad
L
7250 register_prefix, i.op[op].regs->reg_name,
7251 i.suffix);
7252 return 0;
7253 }
29b0f896
AM
7254 }
7255 return 1;
7256}
252b5132 7257
29b0f896 7258static int
e3bb37b5 7259check_qword_reg (void)
29b0f896
AM
7260{
7261 int op;
252b5132 7262
29b0f896 7263 for (op = i.operands; --op >= 0; )
dc821c5f 7264 /* Skip non-register operands. */
bab6aec1 7265 if (i.types[op].bitfield.class != Reg)
dc821c5f 7266 continue;
29b0f896
AM
7267 /* Reject eight bit registers, except where the template requires
7268 them. (eg. movzb) */
dc821c5f 7269 else if (i.types[op].bitfield.byte
bab6aec1 7270 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7271 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7272 && (i.tm.operand_types[op].bitfield.word
7273 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7274 {
a540244d
L
7275 as_bad (_("`%s%s' not allowed with `%s%c'"),
7276 register_prefix,
29b0f896
AM
7277 i.op[op].regs->reg_name,
7278 i.tm.name,
7279 i.suffix);
7280 return 0;
7281 }
e4630f71 7282 /* Warn if the r prefix on a general reg is missing. */
dc821c5f
JB
7283 else if ((i.types[op].bitfield.word
7284 || i.types[op].bitfield.dword)
bab6aec1 7285 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7286 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7287 && i.tm.operand_types[op].bitfield.qword)
29b0f896
AM
7288 {
7289 /* Prohibit these changes in the 64bit mode, since the
7290 lowering is more complicated. */
34828aad 7291 if (intel_syntax
ca61edf2 7292 && i.tm.opcode_modifier.todword
3528c362 7293 && i.types[0].bitfield.class != RegSIMD)
34828aad 7294 {
ca61edf2 7295 /* Convert to DWORD. We don't want REX byte. */
34828aad
L
7296 i.suffix = LONG_MNEM_SUFFIX;
7297 }
7298 else
7299 {
2b5d6a91 7300 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
34828aad
L
7301 register_prefix, i.op[op].regs->reg_name,
7302 i.suffix);
7303 return 0;
7304 }
252b5132 7305 }
29b0f896
AM
7306 return 1;
7307}
252b5132 7308
29b0f896 7309static int
e3bb37b5 7310check_word_reg (void)
29b0f896
AM
7311{
7312 int op;
7313 for (op = i.operands; --op >= 0;)
dc821c5f 7314 /* Skip non-register operands. */
bab6aec1 7315 if (i.types[op].bitfield.class != Reg)
dc821c5f 7316 continue;
29b0f896
AM
7317 /* Reject eight bit registers, except where the template requires
7318 them. (eg. movzb) */
dc821c5f 7319 else if (i.types[op].bitfield.byte
bab6aec1 7320 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7321 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7322 && (i.tm.operand_types[op].bitfield.word
7323 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7324 {
a540244d
L
7325 as_bad (_("`%s%s' not allowed with `%s%c'"),
7326 register_prefix,
29b0f896
AM
7327 i.op[op].regs->reg_name,
7328 i.tm.name,
7329 i.suffix);
7330 return 0;
7331 }
9706160a
JB
7332 /* Error if the e or r prefix on a general reg is present. */
7333 else if ((i.types[op].bitfield.dword
dc821c5f 7334 || i.types[op].bitfield.qword)
bab6aec1 7335 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7336 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7337 && i.tm.operand_types[op].bitfield.word)
252b5132 7338 {
9706160a
JB
7339 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7340 register_prefix, i.op[op].regs->reg_name,
7341 i.suffix);
7342 return 0;
29b0f896
AM
7343 }
7344 return 1;
7345}
252b5132 7346
29b0f896 7347static int
40fb9820 7348update_imm (unsigned int j)
29b0f896 7349{
bc0844ae 7350 i386_operand_type overlap = i.types[j];
40fb9820
L
7351 if ((overlap.bitfield.imm8
7352 || overlap.bitfield.imm8s
7353 || overlap.bitfield.imm16
7354 || overlap.bitfield.imm32
7355 || overlap.bitfield.imm32s
7356 || overlap.bitfield.imm64)
0dfbf9d7
L
7357 && !operand_type_equal (&overlap, &imm8)
7358 && !operand_type_equal (&overlap, &imm8s)
7359 && !operand_type_equal (&overlap, &imm16)
7360 && !operand_type_equal (&overlap, &imm32)
7361 && !operand_type_equal (&overlap, &imm32s)
7362 && !operand_type_equal (&overlap, &imm64))
29b0f896
AM
7363 {
7364 if (i.suffix)
7365 {
40fb9820
L
7366 i386_operand_type temp;
7367
0dfbf9d7 7368 operand_type_set (&temp, 0);
7ab9ffdd 7369 if (i.suffix == BYTE_MNEM_SUFFIX)
40fb9820
L
7370 {
7371 temp.bitfield.imm8 = overlap.bitfield.imm8;
7372 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7373 }
7374 else if (i.suffix == WORD_MNEM_SUFFIX)
7375 temp.bitfield.imm16 = overlap.bitfield.imm16;
7376 else if (i.suffix == QWORD_MNEM_SUFFIX)
7377 {
7378 temp.bitfield.imm64 = overlap.bitfield.imm64;
7379 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7380 }
7381 else
7382 temp.bitfield.imm32 = overlap.bitfield.imm32;
7383 overlap = temp;
29b0f896 7384 }
0dfbf9d7
L
7385 else if (operand_type_equal (&overlap, &imm16_32_32s)
7386 || operand_type_equal (&overlap, &imm16_32)
7387 || operand_type_equal (&overlap, &imm16_32s))
29b0f896 7388 {
40fb9820 7389 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
65da13b5 7390 overlap = imm16;
40fb9820 7391 else
65da13b5 7392 overlap = imm32s;
29b0f896 7393 }
8bbb3ad8
JB
7394 else if (i.prefix[REX_PREFIX] & REX_W)
7395 overlap = operand_type_and (overlap, imm32s);
7396 else if (i.prefix[DATA_PREFIX])
7397 overlap = operand_type_and (overlap,
7398 flag_code != CODE_16BIT ? imm16 : imm32);
0dfbf9d7
L
7399 if (!operand_type_equal (&overlap, &imm8)
7400 && !operand_type_equal (&overlap, &imm8s)
7401 && !operand_type_equal (&overlap, &imm16)
7402 && !operand_type_equal (&overlap, &imm32)
7403 && !operand_type_equal (&overlap, &imm32s)
7404 && !operand_type_equal (&overlap, &imm64))
29b0f896 7405 {
4eed87de
AM
7406 as_bad (_("no instruction mnemonic suffix given; "
7407 "can't determine immediate size"));
29b0f896
AM
7408 return 0;
7409 }
7410 }
40fb9820 7411 i.types[j] = overlap;
29b0f896 7412
40fb9820
L
7413 return 1;
7414}
7415
7416static int
7417finalize_imm (void)
7418{
bc0844ae 7419 unsigned int j, n;
29b0f896 7420
bc0844ae
L
7421 /* Update the first 2 immediate operands. */
7422 n = i.operands > 2 ? 2 : i.operands;
7423 if (n)
7424 {
7425 for (j = 0; j < n; j++)
7426 if (update_imm (j) == 0)
7427 return 0;
40fb9820 7428
bc0844ae
L
7429 /* The 3rd operand can't be immediate operand. */
7430 gas_assert (operand_type_check (i.types[2], imm) == 0);
7431 }
29b0f896
AM
7432
7433 return 1;
7434}
7435
7436static int
e3bb37b5 7437process_operands (void)
29b0f896
AM
7438{
7439 /* Default segment register this instruction will use for memory
7440 accesses. 0 means unknown. This is only for optimizing out
7441 unnecessary segment overrides. */
7442 const seg_entry *default_seg = 0;
7443
a5aeccd9
JB
7444 if (i.tm.opcode_modifier.sse2avx)
7445 {
7446 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7447 need converting. */
7448 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7449 i.prefix[REX_PREFIX] = 0;
7450 i.rex_encoding = 0;
7451 }
c423d21a
JB
7452 /* ImmExt should be processed after SSE2AVX. */
7453 else if (i.tm.opcode_modifier.immext)
7454 process_immext ();
a5aeccd9 7455
2426c15f 7456 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
29b0f896 7457 {
91d6fa6a
NC
7458 unsigned int dupl = i.operands;
7459 unsigned int dest = dupl - 1;
9fcfb3d7
L
7460 unsigned int j;
7461
c0f3af97 7462 /* The destination must be an xmm register. */
9c2799c2 7463 gas_assert (i.reg_operands
91d6fa6a 7464 && MAX_OPERANDS > dupl
7ab9ffdd 7465 && operand_type_equal (&i.types[dest], &regxmm));
c0f3af97 7466
75e5731b 7467 if (i.tm.operand_types[0].bitfield.instance == Accum
1b54b8d7 7468 && i.tm.operand_types[0].bitfield.xmmword)
e2ec9d29 7469 {
8cd7925b 7470 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
c0f3af97
L
7471 {
7472 /* Keep xmm0 for instructions with VEX prefix and 3
7473 sources. */
75e5731b 7474 i.tm.operand_types[0].bitfield.instance = InstanceNone;
3528c362 7475 i.tm.operand_types[0].bitfield.class = RegSIMD;
c0f3af97
L
7476 goto duplicate;
7477 }
e2ec9d29 7478 else
c0f3af97
L
7479 {
7480 /* We remove the first xmm0 and keep the number of
7481 operands unchanged, which in fact duplicates the
7482 destination. */
7483 for (j = 1; j < i.operands; j++)
7484 {
7485 i.op[j - 1] = i.op[j];
7486 i.types[j - 1] = i.types[j];
7487 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
8dc0818e 7488 i.flags[j - 1] = i.flags[j];
c0f3af97
L
7489 }
7490 }
7491 }
7492 else if (i.tm.opcode_modifier.implicit1stxmm0)
7ab9ffdd 7493 {
91d6fa6a 7494 gas_assert ((MAX_OPERANDS - 1) > dupl
8cd7925b
L
7495 && (i.tm.opcode_modifier.vexsources
7496 == VEX3SOURCES));
c0f3af97
L
7497
7498 /* Add the implicit xmm0 for instructions with VEX prefix
7499 and 3 sources. */
7500 for (j = i.operands; j > 0; j--)
7501 {
7502 i.op[j] = i.op[j - 1];
7503 i.types[j] = i.types[j - 1];
7504 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
8dc0818e 7505 i.flags[j] = i.flags[j - 1];
c0f3af97
L
7506 }
7507 i.op[0].regs
7508 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7ab9ffdd 7509 i.types[0] = regxmm;
c0f3af97
L
7510 i.tm.operand_types[0] = regxmm;
7511
7512 i.operands += 2;
7513 i.reg_operands += 2;
7514 i.tm.operands += 2;
7515
91d6fa6a 7516 dupl++;
c0f3af97 7517 dest++;
91d6fa6a
NC
7518 i.op[dupl] = i.op[dest];
7519 i.types[dupl] = i.types[dest];
7520 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8dc0818e 7521 i.flags[dupl] = i.flags[dest];
e2ec9d29 7522 }
c0f3af97
L
7523 else
7524 {
dc1e8a47 7525 duplicate:
c0f3af97
L
7526 i.operands++;
7527 i.reg_operands++;
7528 i.tm.operands++;
7529
91d6fa6a
NC
7530 i.op[dupl] = i.op[dest];
7531 i.types[dupl] = i.types[dest];
7532 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8dc0818e 7533 i.flags[dupl] = i.flags[dest];
c0f3af97
L
7534 }
7535
7536 if (i.tm.opcode_modifier.immext)
7537 process_immext ();
7538 }
75e5731b 7539 else if (i.tm.operand_types[0].bitfield.instance == Accum
1b54b8d7 7540 && i.tm.operand_types[0].bitfield.xmmword)
c0f3af97
L
7541 {
7542 unsigned int j;
7543
9fcfb3d7
L
7544 for (j = 1; j < i.operands; j++)
7545 {
7546 i.op[j - 1] = i.op[j];
7547 i.types[j - 1] = i.types[j];
7548
7549 /* We need to adjust fields in i.tm since they are used by
7550 build_modrm_byte. */
7551 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
8dc0818e
JB
7552
7553 i.flags[j - 1] = i.flags[j];
9fcfb3d7
L
7554 }
7555
e2ec9d29
L
7556 i.operands--;
7557 i.reg_operands--;
e2ec9d29
L
7558 i.tm.operands--;
7559 }
920d2ddc
IT
7560 else if (i.tm.opcode_modifier.implicitquadgroup)
7561 {
a477a8c4
JB
7562 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7563
920d2ddc 7564 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
3528c362 7565 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
a477a8c4
JB
7566 regnum = register_number (i.op[1].regs);
7567 first_reg_in_group = regnum & ~3;
7568 last_reg_in_group = first_reg_in_group + 3;
7569 if (regnum != first_reg_in_group)
7570 as_warn (_("source register `%s%s' implicitly denotes"
7571 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7572 register_prefix, i.op[1].regs->reg_name,
7573 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7574 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7575 i.tm.name);
7576 }
e2ec9d29
L
7577 else if (i.tm.opcode_modifier.regkludge)
7578 {
7579 /* The imul $imm, %reg instruction is converted into
7580 imul $imm, %reg, %reg, and the clr %reg instruction
7581 is converted into xor %reg, %reg. */
7582
7583 unsigned int first_reg_op;
7584
7585 if (operand_type_check (i.types[0], reg))
7586 first_reg_op = 0;
7587 else
7588 first_reg_op = 1;
7589 /* Pretend we saw the extra register operand. */
9c2799c2 7590 gas_assert (i.reg_operands == 1
7ab9ffdd 7591 && i.op[first_reg_op + 1].regs == 0);
e2ec9d29
L
7592 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7593 i.types[first_reg_op + 1] = i.types[first_reg_op];
7594 i.operands++;
7595 i.reg_operands++;
29b0f896
AM
7596 }
7597
85b80b0f 7598 if (i.tm.opcode_modifier.modrm)
29b0f896
AM
7599 {
7600 /* The opcode is completed (modulo i.tm.extension_opcode which
52271982
AM
7601 must be put into the modrm byte). Now, we make the modrm and
7602 index base bytes based on all the info we've collected. */
29b0f896
AM
7603
7604 default_seg = build_modrm_byte ();
7605 }
00cee14f 7606 else if (i.types[0].bitfield.class == SReg)
85b80b0f
JB
7607 {
7608 if (flag_code != CODE_64BIT
7609 ? i.tm.base_opcode == POP_SEG_SHORT
7610 && i.op[0].regs->reg_num == 1
7611 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7612 && i.op[0].regs->reg_num < 4)
7613 {
7614 as_bad (_("you can't `%s %s%s'"),
7615 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7616 return 0;
7617 }
7618 if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7619 {
7620 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7621 i.tm.opcode_length = 2;
7622 }
7623 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7624 }
8a2ed489 7625 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
29b0f896
AM
7626 {
7627 default_seg = &ds;
7628 }
40fb9820 7629 else if (i.tm.opcode_modifier.isstring)
29b0f896
AM
7630 {
7631 /* For the string instructions that allow a segment override
7632 on one of their operands, the default segment is ds. */
7633 default_seg = &ds;
7634 }
50128d0c 7635 else if (i.short_form)
85b80b0f
JB
7636 {
7637 /* The register or float register operand is in operand
7638 0 or 1. */
bab6aec1 7639 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
85b80b0f
JB
7640
7641 /* Register goes in low 3 bits of opcode. */
7642 i.tm.base_opcode |= i.op[op].regs->reg_num;
7643 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7644 i.rex |= REX_B;
7645 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7646 {
7647 /* Warn about some common errors, but press on regardless.
7648 The first case can be generated by gcc (<= 2.8.1). */
7649 if (i.operands == 2)
7650 {
7651 /* Reversed arguments on faddp, fsubp, etc. */
7652 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7653 register_prefix, i.op[!intel_syntax].regs->reg_name,
7654 register_prefix, i.op[intel_syntax].regs->reg_name);
7655 }
7656 else
7657 {
7658 /* Extraneous `l' suffix on fp insn. */
7659 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7660 register_prefix, i.op[0].regs->reg_name);
7661 }
7662 }
7663 }
29b0f896 7664
514a8bb0 7665 if ((i.seg[0] || i.prefix[SEG_PREFIX])
514a8bb0
JB
7666 && i.tm.base_opcode == 0x8d /* lea */
7667 && !is_any_vex_encoding(&i.tm))
92334ad2
JB
7668 {
7669 if (!quiet_warnings)
7670 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7671 if (optimize)
7672 {
7673 i.seg[0] = NULL;
7674 i.prefix[SEG_PREFIX] = 0;
7675 }
7676 }
52271982
AM
7677
7678 /* If a segment was explicitly specified, and the specified segment
b6773884
JB
7679 is neither the default nor the one already recorded from a prefix,
7680 use an opcode prefix to select it. If we never figured out what
7681 the default segment is, then default_seg will be zero at this
7682 point, and the specified segment prefix will always be used. */
7683 if (i.seg[0]
7684 && i.seg[0] != default_seg
7685 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
29b0f896
AM
7686 {
7687 if (!add_prefix (i.seg[0]->seg_prefix))
7688 return 0;
7689 }
7690 return 1;
7691}
7692
a5aeccd9
JB
7693static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7694 bfd_boolean do_sse2avx)
7695{
7696 if (r->reg_flags & RegRex)
7697 {
7698 if (i.rex & rex_bit)
7699 as_bad (_("same type of prefix used twice"));
7700 i.rex |= rex_bit;
7701 }
7702 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7703 {
7704 gas_assert (i.vex.register_specifier == r);
7705 i.vex.register_specifier += 8;
7706 }
7707
7708 if (r->reg_flags & RegVRex)
7709 i.vrex |= rex_bit;
7710}
7711
29b0f896 7712static const seg_entry *
e3bb37b5 7713build_modrm_byte (void)
29b0f896
AM
7714{
7715 const seg_entry *default_seg = 0;
c0f3af97 7716 unsigned int source, dest;
8cd7925b 7717 int vex_3_sources;
c0f3af97 7718
8cd7925b 7719 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
c0f3af97
L
7720 if (vex_3_sources)
7721 {
91d6fa6a 7722 unsigned int nds, reg_slot;
4c2c6516 7723 expressionS *exp;
c0f3af97 7724
6b8d3588 7725 dest = i.operands - 1;
c0f3af97 7726 nds = dest - 1;
922d8de8 7727
a683cc34 7728 /* There are 2 kinds of instructions:
bed3d976 7729 1. 5 operands: 4 register operands or 3 register operands
9d3bf266 7730 plus 1 memory operand plus one Imm4 operand, VexXDS, and
bed3d976 7731 VexW0 or VexW1. The destination must be either XMM, YMM or
43234a1e 7732 ZMM register.
bed3d976 7733 2. 4 operands: 4 register operands or 3 register operands
2f1bada2 7734 plus 1 memory operand, with VexXDS. */
922d8de8 7735 gas_assert ((i.reg_operands == 4
bed3d976
JB
7736 || (i.reg_operands == 3 && i.mem_operands == 1))
7737 && i.tm.opcode_modifier.vexvvvv == VEXXDS
dcd7e323 7738 && i.tm.opcode_modifier.vexw
3528c362 7739 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
a683cc34 7740
48db9223
JB
7741 /* If VexW1 is set, the first non-immediate operand is the source and
7742 the second non-immediate one is encoded in the immediate operand. */
7743 if (i.tm.opcode_modifier.vexw == VEXW1)
7744 {
7745 source = i.imm_operands;
7746 reg_slot = i.imm_operands + 1;
7747 }
7748 else
7749 {
7750 source = i.imm_operands + 1;
7751 reg_slot = i.imm_operands;
7752 }
7753
a683cc34 7754 if (i.imm_operands == 0)
bed3d976
JB
7755 {
7756 /* When there is no immediate operand, generate an 8bit
7757 immediate operand to encode the first operand. */
7758 exp = &im_expressions[i.imm_operands++];
7759 i.op[i.operands].imms = exp;
7760 i.types[i.operands] = imm8;
7761 i.operands++;
7762
3528c362 7763 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
bed3d976
JB
7764 exp->X_op = O_constant;
7765 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
43234a1e
L
7766 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7767 }
922d8de8 7768 else
bed3d976 7769 {
9d3bf266
JB
7770 gas_assert (i.imm_operands == 1);
7771 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7772 gas_assert (!i.tm.opcode_modifier.immext);
a683cc34 7773
9d3bf266
JB
7774 /* Turn on Imm8 again so that output_imm will generate it. */
7775 i.types[0].bitfield.imm8 = 1;
bed3d976 7776
3528c362 7777 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
9d3bf266 7778 i.op[0].imms->X_add_number
bed3d976 7779 |= register_number (i.op[reg_slot].regs) << 4;
43234a1e 7780 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
bed3d976 7781 }
a683cc34 7782
3528c362 7783 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
dae39acc 7784 i.vex.register_specifier = i.op[nds].regs;
c0f3af97
L
7785 }
7786 else
7787 source = dest = 0;
29b0f896
AM
7788
7789 /* i.reg_operands MUST be the number of real register operands;
c0f3af97
L
7790 implicit registers do not count. If there are 3 register
7791 operands, it must be a instruction with VexNDS. For a
7792 instruction with VexNDD, the destination register is encoded
7793 in VEX prefix. If there are 4 register operands, it must be
7794 a instruction with VEX prefix and 3 sources. */
7ab9ffdd
L
7795 if (i.mem_operands == 0
7796 && ((i.reg_operands == 2
2426c15f 7797 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7ab9ffdd 7798 || (i.reg_operands == 3
2426c15f 7799 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7ab9ffdd 7800 || (i.reg_operands == 4 && vex_3_sources)))
29b0f896 7801 {
cab737b9
L
7802 switch (i.operands)
7803 {
7804 case 2:
7805 source = 0;
7806 break;
7807 case 3:
c81128dc
L
7808 /* When there are 3 operands, one of them may be immediate,
7809 which may be the first or the last operand. Otherwise,
c0f3af97
L
7810 the first operand must be shift count register (cl) or it
7811 is an instruction with VexNDS. */
9c2799c2 7812 gas_assert (i.imm_operands == 1
7ab9ffdd 7813 || (i.imm_operands == 0
2426c15f 7814 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
75e5731b
JB
7815 || (i.types[0].bitfield.instance == RegC
7816 && i.types[0].bitfield.byte))));
40fb9820 7817 if (operand_type_check (i.types[0], imm)
75e5731b
JB
7818 || (i.types[0].bitfield.instance == RegC
7819 && i.types[0].bitfield.byte))
40fb9820
L
7820 source = 1;
7821 else
7822 source = 0;
cab737b9
L
7823 break;
7824 case 4:
368d64cc
L
7825 /* When there are 4 operands, the first two must be 8bit
7826 immediate operands. The source operand will be the 3rd
c0f3af97
L
7827 one.
7828
7829 For instructions with VexNDS, if the first operand
7830 an imm8, the source operand is the 2nd one. If the last
7831 operand is imm8, the source operand is the first one. */
9c2799c2 7832 gas_assert ((i.imm_operands == 2
7ab9ffdd
L
7833 && i.types[0].bitfield.imm8
7834 && i.types[1].bitfield.imm8)
2426c15f 7835 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7ab9ffdd
L
7836 && i.imm_operands == 1
7837 && (i.types[0].bitfield.imm8
43234a1e
L
7838 || i.types[i.operands - 1].bitfield.imm8
7839 || i.rounding)));
9f2670f2
L
7840 if (i.imm_operands == 2)
7841 source = 2;
7842 else
c0f3af97
L
7843 {
7844 if (i.types[0].bitfield.imm8)
7845 source = 1;
7846 else
7847 source = 0;
7848 }
c0f3af97
L
7849 break;
7850 case 5:
e771e7c9 7851 if (is_evex_encoding (&i.tm))
43234a1e
L
7852 {
7853 /* For EVEX instructions, when there are 5 operands, the
7854 first one must be immediate operand. If the second one
7855 is immediate operand, the source operand is the 3th
7856 one. If the last one is immediate operand, the source
7857 operand is the 2nd one. */
7858 gas_assert (i.imm_operands == 2
7859 && i.tm.opcode_modifier.sae
7860 && operand_type_check (i.types[0], imm));
7861 if (operand_type_check (i.types[1], imm))
7862 source = 2;
7863 else if (operand_type_check (i.types[4], imm))
7864 source = 1;
7865 else
7866 abort ();
7867 }
cab737b9
L
7868 break;
7869 default:
7870 abort ();
7871 }
7872
c0f3af97
L
7873 if (!vex_3_sources)
7874 {
7875 dest = source + 1;
7876
43234a1e
L
7877 /* RC/SAE operand could be between DEST and SRC. That happens
7878 when one operand is GPR and the other one is XMM/YMM/ZMM
7879 register. */
7880 if (i.rounding && i.rounding->operand == (int) dest)
7881 dest++;
7882
2426c15f 7883 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
c0f3af97 7884 {
43234a1e 7885 /* For instructions with VexNDS, the register-only source
c5d0745b 7886 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
dfd69174 7887 register. It is encoded in VEX prefix. */
f12dc422
L
7888
7889 i386_operand_type op;
7890 unsigned int vvvv;
7891
7892 /* Check register-only source operand when two source
7893 operands are swapped. */
7894 if (!i.tm.operand_types[source].bitfield.baseindex
7895 && i.tm.operand_types[dest].bitfield.baseindex)
7896 {
7897 vvvv = source;
7898 source = dest;
7899 }
7900 else
7901 vvvv = dest;
7902
7903 op = i.tm.operand_types[vvvv];
c0f3af97 7904 if ((dest + 1) >= i.operands
bab6aec1 7905 || ((op.bitfield.class != Reg
dc821c5f 7906 || (!op.bitfield.dword && !op.bitfield.qword))
3528c362 7907 && op.bitfield.class != RegSIMD
43234a1e 7908 && !operand_type_equal (&op, &regmask)))
c0f3af97 7909 abort ();
f12dc422 7910 i.vex.register_specifier = i.op[vvvv].regs;
c0f3af97
L
7911 dest++;
7912 }
7913 }
29b0f896
AM
7914
7915 i.rm.mode = 3;
dfd69174
JB
7916 /* One of the register operands will be encoded in the i.rm.reg
7917 field, the other in the combined i.rm.mode and i.rm.regmem
29b0f896
AM
7918 fields. If no form of this instruction supports a memory
7919 destination operand, then we assume the source operand may
7920 sometimes be a memory operand and so we need to store the
7921 destination in the i.rm.reg field. */
dfd69174 7922 if (!i.tm.opcode_modifier.regmem
40fb9820 7923 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
29b0f896
AM
7924 {
7925 i.rm.reg = i.op[dest].regs->reg_num;
7926 i.rm.regmem = i.op[source].regs->reg_num;
3528c362
JB
7927 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7928 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
b4a3a7b4 7929 i.has_regmmx = TRUE;
3528c362
JB
7930 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7931 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
b4a3a7b4
L
7932 {
7933 if (i.types[dest].bitfield.zmmword
7934 || i.types[source].bitfield.zmmword)
7935 i.has_regzmm = TRUE;
7936 else if (i.types[dest].bitfield.ymmword
7937 || i.types[source].bitfield.ymmword)
7938 i.has_regymm = TRUE;
7939 else
7940 i.has_regxmm = TRUE;
7941 }
a5aeccd9
JB
7942 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7943 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
29b0f896
AM
7944 }
7945 else
7946 {
7947 i.rm.reg = i.op[source].regs->reg_num;
7948 i.rm.regmem = i.op[dest].regs->reg_num;
a5aeccd9
JB
7949 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
7950 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
29b0f896 7951 }
e0c7f900 7952 if (flag_code != CODE_64BIT && (i.rex & REX_R))
c4a530c5 7953 {
4a5c67ed 7954 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
c4a530c5 7955 abort ();
e0c7f900 7956 i.rex &= ~REX_R;
c4a530c5
JB
7957 add_prefix (LOCK_PREFIX_OPCODE);
7958 }
29b0f896
AM
7959 }
7960 else
7961 { /* If it's not 2 reg operands... */
c0f3af97
L
7962 unsigned int mem;
7963
29b0f896
AM
7964 if (i.mem_operands)
7965 {
7966 unsigned int fake_zero_displacement = 0;
99018f42 7967 unsigned int op;
4eed87de 7968
7ab9ffdd 7969 for (op = 0; op < i.operands; op++)
8dc0818e 7970 if (i.flags[op] & Operand_Mem)
7ab9ffdd 7971 break;
7ab9ffdd 7972 gas_assert (op < i.operands);
29b0f896 7973
63112cd6 7974 if (i.tm.opcode_modifier.sib)
6c30d220 7975 {
e968fc9b 7976 if (i.index_reg->reg_num == RegIZ)
6c30d220
L
7977 abort ();
7978
7979 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7980 if (!i.base_reg)
7981 {
7982 i.sib.base = NO_BASE_REGISTER;
7983 i.sib.scale = i.log2_scale_factor;
7984 i.types[op].bitfield.disp8 = 0;
7985 i.types[op].bitfield.disp16 = 0;
7986 i.types[op].bitfield.disp64 = 0;
43083a50 7987 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
6c30d220
L
7988 {
7989 /* Must be 32 bit */
7990 i.types[op].bitfield.disp32 = 1;
7991 i.types[op].bitfield.disp32s = 0;
7992 }
7993 else
7994 {
7995 i.types[op].bitfield.disp32 = 0;
7996 i.types[op].bitfield.disp32s = 1;
7997 }
7998 }
7999 i.sib.index = i.index_reg->reg_num;
a5aeccd9 8000 set_rex_vrex (i.index_reg, REX_X, FALSE);
6c30d220
L
8001 }
8002
29b0f896
AM
8003 default_seg = &ds;
8004
8005 if (i.base_reg == 0)
8006 {
8007 i.rm.mode = 0;
8008 if (!i.disp_operands)
9bb129e8 8009 fake_zero_displacement = 1;
29b0f896
AM
8010 if (i.index_reg == 0)
8011 {
73053c1f
JB
8012 i386_operand_type newdisp;
8013
63112cd6 8014 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896 8015 /* Operand is just <disp> */
20f0a1fc 8016 if (flag_code == CODE_64BIT)
29b0f896
AM
8017 {
8018 /* 64bit mode overwrites the 32bit absolute
8019 addressing by RIP relative addressing and
8020 absolute addressing is encoded by one of the
8021 redundant SIB forms. */
8022 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8023 i.sib.base = NO_BASE_REGISTER;
8024 i.sib.index = NO_INDEX_REGISTER;
73053c1f 8025 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
20f0a1fc 8026 }
fc225355
L
8027 else if ((flag_code == CODE_16BIT)
8028 ^ (i.prefix[ADDR_PREFIX] != 0))
20f0a1fc
NC
8029 {
8030 i.rm.regmem = NO_BASE_REGISTER_16;
73053c1f 8031 newdisp = disp16;
20f0a1fc
NC
8032 }
8033 else
8034 {
8035 i.rm.regmem = NO_BASE_REGISTER;
73053c1f 8036 newdisp = disp32;
29b0f896 8037 }
73053c1f
JB
8038 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8039 i.types[op] = operand_type_or (i.types[op], newdisp);
29b0f896 8040 }
63112cd6 8041 else if (!i.tm.opcode_modifier.sib)
29b0f896 8042 {
6c30d220 8043 /* !i.base_reg && i.index_reg */
e968fc9b 8044 if (i.index_reg->reg_num == RegIZ)
db51cc60
L
8045 i.sib.index = NO_INDEX_REGISTER;
8046 else
8047 i.sib.index = i.index_reg->reg_num;
29b0f896
AM
8048 i.sib.base = NO_BASE_REGISTER;
8049 i.sib.scale = i.log2_scale_factor;
8050 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
40fb9820
L
8051 i.types[op].bitfield.disp8 = 0;
8052 i.types[op].bitfield.disp16 = 0;
8053 i.types[op].bitfield.disp64 = 0;
43083a50 8054 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
40fb9820
L
8055 {
8056 /* Must be 32 bit */
8057 i.types[op].bitfield.disp32 = 1;
8058 i.types[op].bitfield.disp32s = 0;
8059 }
29b0f896 8060 else
40fb9820
L
8061 {
8062 i.types[op].bitfield.disp32 = 0;
8063 i.types[op].bitfield.disp32s = 1;
8064 }
29b0f896 8065 if ((i.index_reg->reg_flags & RegRex) != 0)
161a04f6 8066 i.rex |= REX_X;
29b0f896
AM
8067 }
8068 }
8069 /* RIP addressing for 64bit mode. */
e968fc9b 8070 else if (i.base_reg->reg_num == RegIP)
29b0f896 8071 {
63112cd6 8072 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896 8073 i.rm.regmem = NO_BASE_REGISTER;
40fb9820
L
8074 i.types[op].bitfield.disp8 = 0;
8075 i.types[op].bitfield.disp16 = 0;
8076 i.types[op].bitfield.disp32 = 0;
8077 i.types[op].bitfield.disp32s = 1;
8078 i.types[op].bitfield.disp64 = 0;
71903a11 8079 i.flags[op] |= Operand_PCrel;
20f0a1fc
NC
8080 if (! i.disp_operands)
8081 fake_zero_displacement = 1;
29b0f896 8082 }
dc821c5f 8083 else if (i.base_reg->reg_type.bitfield.word)
29b0f896 8084 {
63112cd6 8085 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896
AM
8086 switch (i.base_reg->reg_num)
8087 {
8088 case 3: /* (%bx) */
8089 if (i.index_reg == 0)
8090 i.rm.regmem = 7;
8091 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8092 i.rm.regmem = i.index_reg->reg_num - 6;
8093 break;
8094 case 5: /* (%bp) */
8095 default_seg = &ss;
8096 if (i.index_reg == 0)
8097 {
8098 i.rm.regmem = 6;
40fb9820 8099 if (operand_type_check (i.types[op], disp) == 0)
29b0f896
AM
8100 {
8101 /* fake (%bp) into 0(%bp) */
b5014f7a 8102 i.types[op].bitfield.disp8 = 1;
252b5132 8103 fake_zero_displacement = 1;
29b0f896
AM
8104 }
8105 }
8106 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8107 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8108 break;
8109 default: /* (%si) -> 4 or (%di) -> 5 */
8110 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8111 }
8112 i.rm.mode = mode_from_disp_size (i.types[op]);
8113 }
8114 else /* i.base_reg and 32/64 bit mode */
8115 {
8116 if (flag_code == CODE_64BIT
40fb9820
L
8117 && operand_type_check (i.types[op], disp))
8118 {
73053c1f
JB
8119 i.types[op].bitfield.disp16 = 0;
8120 i.types[op].bitfield.disp64 = 0;
40fb9820 8121 if (i.prefix[ADDR_PREFIX] == 0)
73053c1f
JB
8122 {
8123 i.types[op].bitfield.disp32 = 0;
8124 i.types[op].bitfield.disp32s = 1;
8125 }
40fb9820 8126 else
73053c1f
JB
8127 {
8128 i.types[op].bitfield.disp32 = 1;
8129 i.types[op].bitfield.disp32s = 0;
8130 }
40fb9820 8131 }
20f0a1fc 8132
63112cd6 8133 if (!i.tm.opcode_modifier.sib)
6c30d220 8134 i.rm.regmem = i.base_reg->reg_num;
29b0f896 8135 if ((i.base_reg->reg_flags & RegRex) != 0)
161a04f6 8136 i.rex |= REX_B;
29b0f896
AM
8137 i.sib.base = i.base_reg->reg_num;
8138 /* x86-64 ignores REX prefix bit here to avoid decoder
8139 complications. */
848930b2
JB
8140 if (!(i.base_reg->reg_flags & RegRex)
8141 && (i.base_reg->reg_num == EBP_REG_NUM
8142 || i.base_reg->reg_num == ESP_REG_NUM))
29b0f896 8143 default_seg = &ss;
848930b2 8144 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
29b0f896 8145 {
848930b2 8146 fake_zero_displacement = 1;
b5014f7a 8147 i.types[op].bitfield.disp8 = 1;
29b0f896
AM
8148 }
8149 i.sib.scale = i.log2_scale_factor;
8150 if (i.index_reg == 0)
8151 {
63112cd6 8152 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896
AM
8153 /* <disp>(%esp) becomes two byte modrm with no index
8154 register. We've already stored the code for esp
8155 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8156 Any base register besides %esp will not use the
8157 extra modrm byte. */
8158 i.sib.index = NO_INDEX_REGISTER;
29b0f896 8159 }
63112cd6 8160 else if (!i.tm.opcode_modifier.sib)
29b0f896 8161 {
e968fc9b 8162 if (i.index_reg->reg_num == RegIZ)
db51cc60
L
8163 i.sib.index = NO_INDEX_REGISTER;
8164 else
8165 i.sib.index = i.index_reg->reg_num;
29b0f896
AM
8166 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8167 if ((i.index_reg->reg_flags & RegRex) != 0)
161a04f6 8168 i.rex |= REX_X;
29b0f896 8169 }
67a4f2b7
AO
8170
8171 if (i.disp_operands
8172 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8173 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8174 i.rm.mode = 0;
8175 else
a501d77e
L
8176 {
8177 if (!fake_zero_displacement
8178 && !i.disp_operands
8179 && i.disp_encoding)
8180 {
8181 fake_zero_displacement = 1;
8182 if (i.disp_encoding == disp_encoding_8bit)
8183 i.types[op].bitfield.disp8 = 1;
8184 else
8185 i.types[op].bitfield.disp32 = 1;
8186 }
8187 i.rm.mode = mode_from_disp_size (i.types[op]);
8188 }
29b0f896 8189 }
252b5132 8190
29b0f896
AM
8191 if (fake_zero_displacement)
8192 {
8193 /* Fakes a zero displacement assuming that i.types[op]
8194 holds the correct displacement size. */
8195 expressionS *exp;
8196
9c2799c2 8197 gas_assert (i.op[op].disps == 0);
29b0f896
AM
8198 exp = &disp_expressions[i.disp_operands++];
8199 i.op[op].disps = exp;
8200 exp->X_op = O_constant;
8201 exp->X_add_number = 0;
8202 exp->X_add_symbol = (symbolS *) 0;
8203 exp->X_op_symbol = (symbolS *) 0;
8204 }
c0f3af97
L
8205
8206 mem = op;
29b0f896 8207 }
c0f3af97
L
8208 else
8209 mem = ~0;
252b5132 8210
8c43a48b 8211 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
5dd85c99
SP
8212 {
8213 if (operand_type_check (i.types[0], imm))
8214 i.vex.register_specifier = NULL;
8215 else
8216 {
8217 /* VEX.vvvv encodes one of the sources when the first
8218 operand is not an immediate. */
1ef99a7b 8219 if (i.tm.opcode_modifier.vexw == VEXW0)
5dd85c99
SP
8220 i.vex.register_specifier = i.op[0].regs;
8221 else
8222 i.vex.register_specifier = i.op[1].regs;
8223 }
8224
8225 /* Destination is a XMM register encoded in the ModRM.reg
8226 and VEX.R bit. */
8227 i.rm.reg = i.op[2].regs->reg_num;
8228 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8229 i.rex |= REX_R;
8230
8231 /* ModRM.rm and VEX.B encodes the other source. */
8232 if (!i.mem_operands)
8233 {
8234 i.rm.mode = 3;
8235
1ef99a7b 8236 if (i.tm.opcode_modifier.vexw == VEXW0)
5dd85c99
SP
8237 i.rm.regmem = i.op[1].regs->reg_num;
8238 else
8239 i.rm.regmem = i.op[0].regs->reg_num;
8240
8241 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8242 i.rex |= REX_B;
8243 }
8244 }
2426c15f 8245 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
f88c9eb0
SP
8246 {
8247 i.vex.register_specifier = i.op[2].regs;
8248 if (!i.mem_operands)
8249 {
8250 i.rm.mode = 3;
8251 i.rm.regmem = i.op[1].regs->reg_num;
8252 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8253 i.rex |= REX_B;
8254 }
8255 }
29b0f896
AM
8256 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8257 (if any) based on i.tm.extension_opcode. Again, we must be
8258 careful to make sure that segment/control/debug/test/MMX
8259 registers are coded into the i.rm.reg field. */
f88c9eb0 8260 else if (i.reg_operands)
29b0f896 8261 {
99018f42 8262 unsigned int op;
7ab9ffdd
L
8263 unsigned int vex_reg = ~0;
8264
8265 for (op = 0; op < i.operands; op++)
b4a3a7b4 8266 {
bab6aec1 8267 if (i.types[op].bitfield.class == Reg
f74a6307
JB
8268 || i.types[op].bitfield.class == RegBND
8269 || i.types[op].bitfield.class == RegMask
00cee14f 8270 || i.types[op].bitfield.class == SReg
4a5c67ed
JB
8271 || i.types[op].bitfield.class == RegCR
8272 || i.types[op].bitfield.class == RegDR
8273 || i.types[op].bitfield.class == RegTR)
b4a3a7b4 8274 break;
3528c362 8275 if (i.types[op].bitfield.class == RegSIMD)
b4a3a7b4
L
8276 {
8277 if (i.types[op].bitfield.zmmword)
8278 i.has_regzmm = TRUE;
8279 else if (i.types[op].bitfield.ymmword)
8280 i.has_regymm = TRUE;
8281 else
8282 i.has_regxmm = TRUE;
8283 break;
8284 }
3528c362 8285 if (i.types[op].bitfield.class == RegMMX)
b4a3a7b4
L
8286 {
8287 i.has_regmmx = TRUE;
8288 break;
8289 }
8290 }
c0209578 8291
7ab9ffdd
L
8292 if (vex_3_sources)
8293 op = dest;
2426c15f 8294 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7ab9ffdd
L
8295 {
8296 /* For instructions with VexNDS, the register-only
8297 source operand is encoded in VEX prefix. */
8298 gas_assert (mem != (unsigned int) ~0);
c0f3af97 8299
7ab9ffdd 8300 if (op > mem)
c0f3af97 8301 {
7ab9ffdd
L
8302 vex_reg = op++;
8303 gas_assert (op < i.operands);
c0f3af97
L
8304 }
8305 else
c0f3af97 8306 {
f12dc422
L
8307 /* Check register-only source operand when two source
8308 operands are swapped. */
8309 if (!i.tm.operand_types[op].bitfield.baseindex
8310 && i.tm.operand_types[op + 1].bitfield.baseindex)
8311 {
8312 vex_reg = op;
8313 op += 2;
8314 gas_assert (mem == (vex_reg + 1)
8315 && op < i.operands);
8316 }
8317 else
8318 {
8319 vex_reg = op + 1;
8320 gas_assert (vex_reg < i.operands);
8321 }
c0f3af97 8322 }
7ab9ffdd 8323 }
2426c15f 8324 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7ab9ffdd 8325 {
f12dc422 8326 /* For instructions with VexNDD, the register destination
7ab9ffdd 8327 is encoded in VEX prefix. */
f12dc422
L
8328 if (i.mem_operands == 0)
8329 {
8330 /* There is no memory operand. */
8331 gas_assert ((op + 2) == i.operands);
8332 vex_reg = op + 1;
8333 }
8334 else
8d63c93e 8335 {
ed438a93
JB
8336 /* There are only 2 non-immediate operands. */
8337 gas_assert (op < i.imm_operands + 2
8338 && i.operands == i.imm_operands + 2);
8339 vex_reg = i.imm_operands + 1;
f12dc422 8340 }
7ab9ffdd
L
8341 }
8342 else
8343 gas_assert (op < i.operands);
99018f42 8344
7ab9ffdd
L
8345 if (vex_reg != (unsigned int) ~0)
8346 {
f12dc422 8347 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7ab9ffdd 8348
bab6aec1 8349 if ((type->bitfield.class != Reg
dc821c5f 8350 || (!type->bitfield.dword && !type->bitfield.qword))
3528c362 8351 && type->bitfield.class != RegSIMD
43234a1e 8352 && !operand_type_equal (type, &regmask))
7ab9ffdd 8353 abort ();
f88c9eb0 8354
7ab9ffdd
L
8355 i.vex.register_specifier = i.op[vex_reg].regs;
8356 }
8357
1b9f0c97
L
8358 /* Don't set OP operand twice. */
8359 if (vex_reg != op)
7ab9ffdd 8360 {
1b9f0c97
L
8361 /* If there is an extension opcode to put here, the
8362 register number must be put into the regmem field. */
8363 if (i.tm.extension_opcode != None)
8364 {
8365 i.rm.regmem = i.op[op].regs->reg_num;
a5aeccd9
JB
8366 set_rex_vrex (i.op[op].regs, REX_B,
8367 i.tm.opcode_modifier.sse2avx);
1b9f0c97
L
8368 }
8369 else
8370 {
8371 i.rm.reg = i.op[op].regs->reg_num;
a5aeccd9
JB
8372 set_rex_vrex (i.op[op].regs, REX_R,
8373 i.tm.opcode_modifier.sse2avx);
1b9f0c97 8374 }
7ab9ffdd 8375 }
252b5132 8376
29b0f896
AM
8377 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8378 must set it to 3 to indicate this is a register operand
8379 in the regmem field. */
8380 if (!i.mem_operands)
8381 i.rm.mode = 3;
8382 }
252b5132 8383
29b0f896 8384 /* Fill in i.rm.reg field with extension opcode (if any). */
c1e679ec 8385 if (i.tm.extension_opcode != None)
29b0f896
AM
8386 i.rm.reg = i.tm.extension_opcode;
8387 }
8388 return default_seg;
8389}
252b5132 8390
376cd056
JB
8391static unsigned int
8392flip_code16 (unsigned int code16)
8393{
8394 gas_assert (i.tm.operands == 1);
8395
8396 return !(i.prefix[REX_PREFIX] & REX_W)
8397 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8398 || i.tm.operand_types[0].bitfield.disp32s
8399 : i.tm.operand_types[0].bitfield.disp16)
8400 ? CODE16 : 0;
8401}
8402
29b0f896 8403static void
e3bb37b5 8404output_branch (void)
29b0f896
AM
8405{
8406 char *p;
f8a5c266 8407 int size;
29b0f896
AM
8408 int code16;
8409 int prefix;
8410 relax_substateT subtype;
8411 symbolS *sym;
8412 offsetT off;
8413
f8a5c266 8414 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
a501d77e 8415 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
29b0f896
AM
8416
8417 prefix = 0;
8418 if (i.prefix[DATA_PREFIX] != 0)
252b5132 8419 {
29b0f896
AM
8420 prefix = 1;
8421 i.prefixes -= 1;
376cd056 8422 code16 ^= flip_code16(code16);
252b5132 8423 }
29b0f896
AM
8424 /* Pentium4 branch hints. */
8425 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8426 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
2f66722d 8427 {
29b0f896
AM
8428 prefix++;
8429 i.prefixes--;
8430 }
8431 if (i.prefix[REX_PREFIX] != 0)
8432 {
8433 prefix++;
8434 i.prefixes--;
2f66722d
AM
8435 }
8436
7e8b059b
L
8437 /* BND prefixed jump. */
8438 if (i.prefix[BND_PREFIX] != 0)
8439 {
6cb0a70e
JB
8440 prefix++;
8441 i.prefixes--;
7e8b059b
L
8442 }
8443
f2810fe0
JB
8444 if (i.prefixes != 0)
8445 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
29b0f896
AM
8446
8447 /* It's always a symbol; End frag & setup for relax.
8448 Make sure there is enough room in this frag for the largest
8449 instruction we may generate in md_convert_frag. This is 2
8450 bytes for the opcode and room for the prefix and largest
8451 displacement. */
8452 frag_grow (prefix + 2 + 4);
8453 /* Prefix and 1 opcode byte go in fr_fix. */
8454 p = frag_more (prefix + 1);
8455 if (i.prefix[DATA_PREFIX] != 0)
8456 *p++ = DATA_PREFIX_OPCODE;
8457 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8458 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8459 *p++ = i.prefix[SEG_PREFIX];
6cb0a70e
JB
8460 if (i.prefix[BND_PREFIX] != 0)
8461 *p++ = BND_PREFIX_OPCODE;
29b0f896
AM
8462 if (i.prefix[REX_PREFIX] != 0)
8463 *p++ = i.prefix[REX_PREFIX];
8464 *p = i.tm.base_opcode;
8465
8466 if ((unsigned char) *p == JUMP_PC_RELATIVE)
f8a5c266 8467 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
40fb9820 8468 else if (cpu_arch_flags.bitfield.cpui386)
f8a5c266 8469 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
29b0f896 8470 else
f8a5c266 8471 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
29b0f896 8472 subtype |= code16;
3e73aa7c 8473
29b0f896
AM
8474 sym = i.op[0].disps->X_add_symbol;
8475 off = i.op[0].disps->X_add_number;
3e73aa7c 8476
29b0f896
AM
8477 if (i.op[0].disps->X_op != O_constant
8478 && i.op[0].disps->X_op != O_symbol)
3e73aa7c 8479 {
29b0f896
AM
8480 /* Handle complex expressions. */
8481 sym = make_expr_symbol (i.op[0].disps);
8482 off = 0;
8483 }
3e73aa7c 8484
29b0f896
AM
8485 /* 1 possible extra opcode + 4 byte displacement go in var part.
8486 Pass reloc in fr_var. */
d258b828 8487 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
29b0f896 8488}
3e73aa7c 8489
bd7ab16b
L
8490#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8491/* Return TRUE iff PLT32 relocation should be used for branching to
8492 symbol S. */
8493
8494static bfd_boolean
8495need_plt32_p (symbolS *s)
8496{
8497 /* PLT32 relocation is ELF only. */
8498 if (!IS_ELF)
8499 return FALSE;
8500
a5def729
RO
8501#ifdef TE_SOLARIS
8502 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8503 krtld support it. */
8504 return FALSE;
8505#endif
8506
bd7ab16b
L
8507 /* Since there is no need to prepare for PLT branch on x86-64, we
8508 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8509 be used as a marker for 32-bit PC-relative branches. */
8510 if (!object_64bit)
8511 return FALSE;
8512
8513 /* Weak or undefined symbol need PLT32 relocation. */
8514 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8515 return TRUE;
8516
8517 /* Non-global symbol doesn't need PLT32 relocation. */
8518 if (! S_IS_EXTERNAL (s))
8519 return FALSE;
8520
8521 /* Other global symbols need PLT32 relocation. NB: Symbol with
8522 non-default visibilities are treated as normal global symbol
8523 so that PLT32 relocation can be used as a marker for 32-bit
8524 PC-relative branches. It is useful for linker relaxation. */
8525 return TRUE;
8526}
8527#endif
8528
29b0f896 8529static void
e3bb37b5 8530output_jump (void)
29b0f896
AM
8531{
8532 char *p;
8533 int size;
3e02c1cc 8534 fixS *fixP;
bd7ab16b 8535 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
29b0f896 8536
0cfa3eb3 8537 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
29b0f896
AM
8538 {
8539 /* This is a loop or jecxz type instruction. */
8540 size = 1;
8541 if (i.prefix[ADDR_PREFIX] != 0)
8542 {
8543 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8544 i.prefixes -= 1;
8545 }
8546 /* Pentium4 branch hints. */
8547 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8548 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8549 {
8550 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8551 i.prefixes--;
3e73aa7c
JH
8552 }
8553 }
29b0f896
AM
8554 else
8555 {
8556 int code16;
3e73aa7c 8557
29b0f896
AM
8558 code16 = 0;
8559 if (flag_code == CODE_16BIT)
8560 code16 = CODE16;
3e73aa7c 8561
29b0f896
AM
8562 if (i.prefix[DATA_PREFIX] != 0)
8563 {
8564 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8565 i.prefixes -= 1;
376cd056 8566 code16 ^= flip_code16(code16);
29b0f896 8567 }
252b5132 8568
29b0f896
AM
8569 size = 4;
8570 if (code16)
8571 size = 2;
8572 }
9fcc94b6 8573
6cb0a70e
JB
8574 /* BND prefixed jump. */
8575 if (i.prefix[BND_PREFIX] != 0)
29b0f896 8576 {
6cb0a70e 8577 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
29b0f896
AM
8578 i.prefixes -= 1;
8579 }
252b5132 8580
6cb0a70e 8581 if (i.prefix[REX_PREFIX] != 0)
7e8b059b 8582 {
6cb0a70e 8583 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7e8b059b
L
8584 i.prefixes -= 1;
8585 }
8586
f2810fe0
JB
8587 if (i.prefixes != 0)
8588 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
e0890092 8589
42164a71
L
8590 p = frag_more (i.tm.opcode_length + size);
8591 switch (i.tm.opcode_length)
8592 {
8593 case 2:
8594 *p++ = i.tm.base_opcode >> 8;
1a0670f3 8595 /* Fall through. */
42164a71
L
8596 case 1:
8597 *p++ = i.tm.base_opcode;
8598 break;
8599 default:
8600 abort ();
8601 }
e0890092 8602
bd7ab16b
L
8603#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8604 if (size == 4
8605 && jump_reloc == NO_RELOC
8606 && need_plt32_p (i.op[0].disps->X_add_symbol))
8607 jump_reloc = BFD_RELOC_X86_64_PLT32;
8608#endif
8609
8610 jump_reloc = reloc (size, 1, 1, jump_reloc);
8611
3e02c1cc 8612 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
bd7ab16b 8613 i.op[0].disps, 1, jump_reloc);
3e02c1cc
AM
8614
8615 /* All jumps handled here are signed, but don't use a signed limit
8616 check for 32 and 16 bit jumps as we want to allow wrap around at
8617 4G and 64k respectively. */
8618 if (size == 1)
8619 fixP->fx_signed = 1;
29b0f896 8620}
e0890092 8621
29b0f896 8622static void
e3bb37b5 8623output_interseg_jump (void)
29b0f896
AM
8624{
8625 char *p;
8626 int size;
8627 int prefix;
8628 int code16;
252b5132 8629
29b0f896
AM
8630 code16 = 0;
8631 if (flag_code == CODE_16BIT)
8632 code16 = CODE16;
a217f122 8633
29b0f896
AM
8634 prefix = 0;
8635 if (i.prefix[DATA_PREFIX] != 0)
8636 {
8637 prefix = 1;
8638 i.prefixes -= 1;
8639 code16 ^= CODE16;
8640 }
6cb0a70e
JB
8641
8642 gas_assert (!i.prefix[REX_PREFIX]);
252b5132 8643
29b0f896
AM
8644 size = 4;
8645 if (code16)
8646 size = 2;
252b5132 8647
f2810fe0
JB
8648 if (i.prefixes != 0)
8649 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
252b5132 8650
29b0f896
AM
8651 /* 1 opcode; 2 segment; offset */
8652 p = frag_more (prefix + 1 + 2 + size);
3e73aa7c 8653
29b0f896
AM
8654 if (i.prefix[DATA_PREFIX] != 0)
8655 *p++ = DATA_PREFIX_OPCODE;
252b5132 8656
29b0f896
AM
8657 if (i.prefix[REX_PREFIX] != 0)
8658 *p++ = i.prefix[REX_PREFIX];
252b5132 8659
29b0f896
AM
8660 *p++ = i.tm.base_opcode;
8661 if (i.op[1].imms->X_op == O_constant)
8662 {
8663 offsetT n = i.op[1].imms->X_add_number;
252b5132 8664
29b0f896
AM
8665 if (size == 2
8666 && !fits_in_unsigned_word (n)
8667 && !fits_in_signed_word (n))
8668 {
8669 as_bad (_("16-bit jump out of range"));
8670 return;
8671 }
8672 md_number_to_chars (p, n, size);
8673 }
8674 else
8675 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
d258b828 8676 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
29b0f896
AM
8677 if (i.op[0].imms->X_op != O_constant)
8678 as_bad (_("can't handle non absolute segment in `%s'"),
8679 i.tm.name);
8680 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8681}
a217f122 8682
b4a3a7b4
L
8683#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8684void
8685x86_cleanup (void)
8686{
8687 char *p;
8688 asection *seg = now_seg;
8689 subsegT subseg = now_subseg;
8690 asection *sec;
8691 unsigned int alignment, align_size_1;
8692 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8693 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8694 unsigned int padding;
8695
8696 if (!IS_ELF || !x86_used_note)
8697 return;
8698
b4a3a7b4
L
8699 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8700
8701 /* The .note.gnu.property section layout:
8702
8703 Field Length Contents
8704 ---- ---- ----
8705 n_namsz 4 4
8706 n_descsz 4 The note descriptor size
8707 n_type 4 NT_GNU_PROPERTY_TYPE_0
8708 n_name 4 "GNU"
8709 n_desc n_descsz The program property array
8710 .... .... ....
8711 */
8712
8713 /* Create the .note.gnu.property section. */
8714 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
fd361982 8715 bfd_set_section_flags (sec,
b4a3a7b4
L
8716 (SEC_ALLOC
8717 | SEC_LOAD
8718 | SEC_DATA
8719 | SEC_HAS_CONTENTS
8720 | SEC_READONLY));
8721
8722 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8723 {
8724 align_size_1 = 7;
8725 alignment = 3;
8726 }
8727 else
8728 {
8729 align_size_1 = 3;
8730 alignment = 2;
8731 }
8732
fd361982 8733 bfd_set_section_alignment (sec, alignment);
b4a3a7b4
L
8734 elf_section_type (sec) = SHT_NOTE;
8735
8736 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8737 + 4-byte data */
8738 isa_1_descsz_raw = 4 + 4 + 4;
8739 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8740 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8741
8742 feature_2_descsz_raw = isa_1_descsz;
8743 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8744 + 4-byte data */
8745 feature_2_descsz_raw += 4 + 4 + 4;
8746 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8747 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8748 & ~align_size_1);
8749
8750 descsz = feature_2_descsz;
8751 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8752 p = frag_more (4 + 4 + 4 + 4 + descsz);
8753
8754 /* Write n_namsz. */
8755 md_number_to_chars (p, (valueT) 4, 4);
8756
8757 /* Write n_descsz. */
8758 md_number_to_chars (p + 4, (valueT) descsz, 4);
8759
8760 /* Write n_type. */
8761 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8762
8763 /* Write n_name. */
8764 memcpy (p + 4 * 3, "GNU", 4);
8765
8766 /* Write 4-byte type. */
8767 md_number_to_chars (p + 4 * 4,
8768 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8769
8770 /* Write 4-byte data size. */
8771 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8772
8773 /* Write 4-byte data. */
8774 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8775
8776 /* Zero out paddings. */
8777 padding = isa_1_descsz - isa_1_descsz_raw;
8778 if (padding)
8779 memset (p + 4 * 7, 0, padding);
8780
8781 /* Write 4-byte type. */
8782 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8783 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8784
8785 /* Write 4-byte data size. */
8786 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8787
8788 /* Write 4-byte data. */
8789 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8790 (valueT) x86_feature_2_used, 4);
8791
8792 /* Zero out paddings. */
8793 padding = feature_2_descsz - feature_2_descsz_raw;
8794 if (padding)
8795 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8796
8797 /* We probably can't restore the current segment, for there likely
8798 isn't one yet... */
8799 if (seg && subseg)
8800 subseg_set (seg, subseg);
8801}
8802#endif
8803
9c33702b
JB
8804static unsigned int
8805encoding_length (const fragS *start_frag, offsetT start_off,
8806 const char *frag_now_ptr)
8807{
8808 unsigned int len = 0;
8809
8810 if (start_frag != frag_now)
8811 {
8812 const fragS *fr = start_frag;
8813
8814 do {
8815 len += fr->fr_fix;
8816 fr = fr->fr_next;
8817 } while (fr && fr != frag_now);
8818 }
8819
8820 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8821}
8822
e379e5f3 8823/* Return 1 for test, and, cmp, add, sub, inc and dec which may
79d72f45
HL
8824 be macro-fused with conditional jumps.
8825 NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
8826 or is one of the following format:
8827
8828 cmp m, imm
8829 add m, imm
8830 sub m, imm
8831 test m, imm
8832 and m, imm
8833 inc m
8834 dec m
8835
8836 it is unfusible. */
e379e5f3
L
8837
8838static int
79d72f45 8839maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
e379e5f3
L
8840{
8841 /* No RIP address. */
8842 if (i.base_reg && i.base_reg->reg_num == RegIP)
8843 return 0;
8844
8845 /* No VEX/EVEX encoding. */
8846 if (is_any_vex_encoding (&i.tm))
8847 return 0;
8848
79d72f45
HL
8849 /* add, sub without add/sub m, imm. */
8850 if (i.tm.base_opcode <= 5
e379e5f3
L
8851 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8852 || ((i.tm.base_opcode | 3) == 0x83
79d72f45 8853 && (i.tm.extension_opcode == 0x5
e379e5f3 8854 || i.tm.extension_opcode == 0x0)))
79d72f45
HL
8855 {
8856 *mf_cmp_p = mf_cmp_alu_cmp;
8857 return !(i.mem_operands && i.imm_operands);
8858 }
e379e5f3 8859
79d72f45
HL
8860 /* and without and m, imm. */
8861 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8862 || ((i.tm.base_opcode | 3) == 0x83
8863 && i.tm.extension_opcode == 0x4))
8864 {
8865 *mf_cmp_p = mf_cmp_test_and;
8866 return !(i.mem_operands && i.imm_operands);
8867 }
8868
8869 /* test without test m imm. */
e379e5f3
L
8870 if ((i.tm.base_opcode | 1) == 0x85
8871 || (i.tm.base_opcode | 1) == 0xa9
8872 || ((i.tm.base_opcode | 1) == 0xf7
79d72f45
HL
8873 && i.tm.extension_opcode == 0))
8874 {
8875 *mf_cmp_p = mf_cmp_test_and;
8876 return !(i.mem_operands && i.imm_operands);
8877 }
8878
8879 /* cmp without cmp m, imm. */
8880 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
e379e5f3
L
8881 || ((i.tm.base_opcode | 3) == 0x83
8882 && (i.tm.extension_opcode == 0x7)))
79d72f45
HL
8883 {
8884 *mf_cmp_p = mf_cmp_alu_cmp;
8885 return !(i.mem_operands && i.imm_operands);
8886 }
e379e5f3 8887
79d72f45 8888 /* inc, dec without inc/dec m. */
e379e5f3
L
8889 if ((i.tm.cpu_flags.bitfield.cpuno64
8890 && (i.tm.base_opcode | 0xf) == 0x4f)
8891 || ((i.tm.base_opcode | 1) == 0xff
8892 && i.tm.extension_opcode <= 0x1))
79d72f45
HL
8893 {
8894 *mf_cmp_p = mf_cmp_incdec;
8895 return !i.mem_operands;
8896 }
e379e5f3
L
8897
8898 return 0;
8899}
8900
8901/* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8902
8903static int
79d72f45 8904add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
e379e5f3
L
8905{
8906 /* NB: Don't work with COND_JUMP86 without i386. */
8907 if (!align_branch_power
8908 || now_seg == absolute_section
8909 || !cpu_arch_flags.bitfield.cpui386
8910 || !(align_branch & align_branch_fused_bit))
8911 return 0;
8912
79d72f45 8913 if (maybe_fused_with_jcc_p (mf_cmp_p))
e379e5f3
L
8914 {
8915 if (last_insn.kind == last_insn_other
8916 || last_insn.seg != now_seg)
8917 return 1;
8918 if (flag_debug)
8919 as_warn_where (last_insn.file, last_insn.line,
8920 _("`%s` skips -malign-branch-boundary on `%s`"),
8921 last_insn.name, i.tm.name);
8922 }
8923
8924 return 0;
8925}
8926
8927/* Return 1 if a BRANCH_PREFIX frag should be generated. */
8928
8929static int
8930add_branch_prefix_frag_p (void)
8931{
8932 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
8933 to PadLock instructions since they include prefixes in opcode. */
8934 if (!align_branch_power
8935 || !align_branch_prefix_size
8936 || now_seg == absolute_section
8937 || i.tm.cpu_flags.bitfield.cpupadlock
8938 || !cpu_arch_flags.bitfield.cpui386)
8939 return 0;
8940
8941 /* Don't add prefix if it is a prefix or there is no operand in case
8942 that segment prefix is special. */
8943 if (!i.operands || i.tm.opcode_modifier.isprefix)
8944 return 0;
8945
8946 if (last_insn.kind == last_insn_other
8947 || last_insn.seg != now_seg)
8948 return 1;
8949
8950 if (flag_debug)
8951 as_warn_where (last_insn.file, last_insn.line,
8952 _("`%s` skips -malign-branch-boundary on `%s`"),
8953 last_insn.name, i.tm.name);
8954
8955 return 0;
8956}
8957
8958/* Return 1 if a BRANCH_PADDING frag should be generated. */
8959
8960static int
79d72f45
HL
8961add_branch_padding_frag_p (enum align_branch_kind *branch_p,
8962 enum mf_jcc_kind *mf_jcc_p)
e379e5f3
L
8963{
8964 int add_padding;
8965
8966 /* NB: Don't work with COND_JUMP86 without i386. */
8967 if (!align_branch_power
8968 || now_seg == absolute_section
8969 || !cpu_arch_flags.bitfield.cpui386)
8970 return 0;
8971
8972 add_padding = 0;
8973
8974 /* Check for jcc and direct jmp. */
8975 if (i.tm.opcode_modifier.jump == JUMP)
8976 {
8977 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8978 {
8979 *branch_p = align_branch_jmp;
8980 add_padding = align_branch & align_branch_jmp_bit;
8981 }
8982 else
8983 {
79d72f45
HL
8984 /* Because J<cc> and JN<cc> share same group in macro-fusible table,
8985 igore the lowest bit. */
8986 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
e379e5f3
L
8987 *branch_p = align_branch_jcc;
8988 if ((align_branch & align_branch_jcc_bit))
8989 add_padding = 1;
8990 }
8991 }
8992 else if (is_any_vex_encoding (&i.tm))
8993 return 0;
8994 else if ((i.tm.base_opcode | 1) == 0xc3)
8995 {
8996 /* Near ret. */
8997 *branch_p = align_branch_ret;
8998 if ((align_branch & align_branch_ret_bit))
8999 add_padding = 1;
9000 }
9001 else
9002 {
9003 /* Check for indirect jmp, direct and indirect calls. */
9004 if (i.tm.base_opcode == 0xe8)
9005 {
9006 /* Direct call. */
9007 *branch_p = align_branch_call;
9008 if ((align_branch & align_branch_call_bit))
9009 add_padding = 1;
9010 }
9011 else if (i.tm.base_opcode == 0xff
9012 && (i.tm.extension_opcode == 2
9013 || i.tm.extension_opcode == 4))
9014 {
9015 /* Indirect call and jmp. */
9016 *branch_p = align_branch_indirect;
9017 if ((align_branch & align_branch_indirect_bit))
9018 add_padding = 1;
9019 }
9020
9021 if (add_padding
9022 && i.disp_operands
9023 && tls_get_addr
9024 && (i.op[0].disps->X_op == O_symbol
9025 || (i.op[0].disps->X_op == O_subtract
9026 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9027 {
9028 symbolS *s = i.op[0].disps->X_add_symbol;
9029 /* No padding to call to global or undefined tls_get_addr. */
9030 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9031 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9032 return 0;
9033 }
9034 }
9035
9036 if (add_padding
9037 && last_insn.kind != last_insn_other
9038 && last_insn.seg == now_seg)
9039 {
9040 if (flag_debug)
9041 as_warn_where (last_insn.file, last_insn.line,
9042 _("`%s` skips -malign-branch-boundary on `%s`"),
9043 last_insn.name, i.tm.name);
9044 return 0;
9045 }
9046
9047 return add_padding;
9048}
9049
29b0f896 9050static void
e3bb37b5 9051output_insn (void)
29b0f896 9052{
2bbd9c25
JJ
9053 fragS *insn_start_frag;
9054 offsetT insn_start_off;
e379e5f3
L
9055 fragS *fragP = NULL;
9056 enum align_branch_kind branch = align_branch_none;
79d72f45
HL
9057 /* The initializer is arbitrary just to avoid uninitialized error.
9058 it's actually either assigned in add_branch_padding_frag_p
9059 or never be used. */
9060 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
2bbd9c25 9061
b4a3a7b4
L
9062#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9063 if (IS_ELF && x86_used_note)
9064 {
9065 if (i.tm.cpu_flags.bitfield.cpucmov)
9066 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9067 if (i.tm.cpu_flags.bitfield.cpusse)
9068 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9069 if (i.tm.cpu_flags.bitfield.cpusse2)
9070 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9071 if (i.tm.cpu_flags.bitfield.cpusse3)
9072 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9073 if (i.tm.cpu_flags.bitfield.cpussse3)
9074 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9075 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9076 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9077 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9078 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9079 if (i.tm.cpu_flags.bitfield.cpuavx)
9080 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9081 if (i.tm.cpu_flags.bitfield.cpuavx2)
9082 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9083 if (i.tm.cpu_flags.bitfield.cpufma)
9084 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9085 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9086 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9087 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9088 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9089 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9090 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9091 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9092 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9093 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9094 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9095 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9096 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9097 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9098 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9099 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9100 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9101 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9102 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9103 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9104 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9105 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9106 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9107 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9108 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9109 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9110 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9111 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9112 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
462cac58
L
9113 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9114 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
b4a3a7b4
L
9115
9116 if (i.tm.cpu_flags.bitfield.cpu8087
9117 || i.tm.cpu_flags.bitfield.cpu287
9118 || i.tm.cpu_flags.bitfield.cpu387
9119 || i.tm.cpu_flags.bitfield.cpu687
9120 || i.tm.cpu_flags.bitfield.cpufisttp)
9121 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
319ff62c
JB
9122 if (i.has_regmmx
9123 || i.tm.base_opcode == 0xf77 /* emms */
a7e12755
L
9124 || i.tm.base_opcode == 0xf0e /* femms */
9125 || i.tm.base_opcode == 0xf2a /* cvtpi2ps */
9126 || i.tm.base_opcode == 0x660f2a /* cvtpi2pd */)
b4a3a7b4
L
9127 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9128 if (i.has_regxmm)
9129 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9130 if (i.has_regymm)
9131 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9132 if (i.has_regzmm)
9133 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9134 if (i.tm.cpu_flags.bitfield.cpufxsr)
9135 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9136 if (i.tm.cpu_flags.bitfield.cpuxsave)
9137 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9138 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9139 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9140 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9141 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9142 }
9143#endif
9144
29b0f896
AM
9145 /* Tie dwarf2 debug info to the address at the start of the insn.
9146 We can't do this after the insn has been output as the current
9147 frag may have been closed off. eg. by frag_var. */
9148 dwarf2_emit_insn (0);
9149
2bbd9c25
JJ
9150 insn_start_frag = frag_now;
9151 insn_start_off = frag_now_fix ();
9152
79d72f45 9153 if (add_branch_padding_frag_p (&branch, &mf_jcc))
e379e5f3
L
9154 {
9155 char *p;
9156 /* Branch can be 8 bytes. Leave some room for prefixes. */
9157 unsigned int max_branch_padding_size = 14;
9158
9159 /* Align section to boundary. */
9160 record_alignment (now_seg, align_branch_power);
9161
9162 /* Make room for padding. */
9163 frag_grow (max_branch_padding_size);
9164
9165 /* Start of the padding. */
9166 p = frag_more (0);
9167
9168 fragP = frag_now;
9169
9170 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9171 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9172 NULL, 0, p);
9173
79d72f45 9174 fragP->tc_frag_data.mf_type = mf_jcc;
e379e5f3
L
9175 fragP->tc_frag_data.branch_type = branch;
9176 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9177 }
9178
29b0f896 9179 /* Output jumps. */
0cfa3eb3 9180 if (i.tm.opcode_modifier.jump == JUMP)
29b0f896 9181 output_branch ();
0cfa3eb3
JB
9182 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9183 || i.tm.opcode_modifier.jump == JUMP_DWORD)
29b0f896 9184 output_jump ();
0cfa3eb3 9185 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
29b0f896
AM
9186 output_interseg_jump ();
9187 else
9188 {
9189 /* Output normal instructions here. */
9190 char *p;
9191 unsigned char *q;
47465058 9192 unsigned int j;
331d2d0d 9193 unsigned int prefix;
79d72f45 9194 enum mf_cmp_kind mf_cmp;
4dffcebc 9195
e4e00185 9196 if (avoid_fence
c3949f43
JB
9197 && (i.tm.base_opcode == 0xfaee8
9198 || i.tm.base_opcode == 0xfaef0
9199 || i.tm.base_opcode == 0xfaef8))
e4e00185
AS
9200 {
9201 /* Encode lfence, mfence, and sfence as
9202 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9203 offsetT val = 0x240483f0ULL;
9204 p = frag_more (5);
9205 md_number_to_chars (p, val, 5);
9206 return;
9207 }
9208
d022bddd
IT
9209 /* Some processors fail on LOCK prefix. This options makes
9210 assembler ignore LOCK prefix and serves as a workaround. */
9211 if (omit_lock_prefix)
9212 {
9213 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9214 return;
9215 i.prefix[LOCK_PREFIX] = 0;
9216 }
9217
e379e5f3
L
9218 if (branch)
9219 /* Skip if this is a branch. */
9220 ;
79d72f45 9221 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
e379e5f3
L
9222 {
9223 /* Make room for padding. */
9224 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9225 p = frag_more (0);
9226
9227 fragP = frag_now;
9228
9229 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9230 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9231 NULL, 0, p);
9232
79d72f45 9233 fragP->tc_frag_data.mf_type = mf_cmp;
e379e5f3
L
9234 fragP->tc_frag_data.branch_type = align_branch_fused;
9235 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9236 }
9237 else if (add_branch_prefix_frag_p ())
9238 {
9239 unsigned int max_prefix_size = align_branch_prefix_size;
9240
9241 /* Make room for padding. */
9242 frag_grow (max_prefix_size);
9243 p = frag_more (0);
9244
9245 fragP = frag_now;
9246
9247 frag_var (rs_machine_dependent, max_prefix_size, 0,
9248 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9249 NULL, 0, p);
9250
9251 fragP->tc_frag_data.max_bytes = max_prefix_size;
9252 }
9253
43234a1e
L
9254 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9255 don't need the explicit prefix. */
9256 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
bc4bd9ab 9257 {
c0f3af97 9258 switch (i.tm.opcode_length)
bc4bd9ab 9259 {
c0f3af97
L
9260 case 3:
9261 if (i.tm.base_opcode & 0xff000000)
4dffcebc 9262 {
c0f3af97 9263 prefix = (i.tm.base_opcode >> 24) & 0xff;
c3949f43
JB
9264 if (!i.tm.cpu_flags.bitfield.cpupadlock
9265 || prefix != REPE_PREFIX_OPCODE
9266 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9267 add_prefix (prefix);
c0f3af97
L
9268 }
9269 break;
9270 case 2:
9271 if ((i.tm.base_opcode & 0xff0000) != 0)
9272 {
9273 prefix = (i.tm.base_opcode >> 16) & 0xff;
c3949f43 9274 add_prefix (prefix);
4dffcebc 9275 }
c0f3af97
L
9276 break;
9277 case 1:
9278 break;
390c91cf
L
9279 case 0:
9280 /* Check for pseudo prefixes. */
9281 as_bad_where (insn_start_frag->fr_file,
9282 insn_start_frag->fr_line,
9283 _("pseudo prefix without instruction"));
9284 return;
c0f3af97
L
9285 default:
9286 abort ();
bc4bd9ab 9287 }
c0f3af97 9288
6d19a37a 9289#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
cf61b747
L
9290 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9291 R_X86_64_GOTTPOFF relocation so that linker can safely
14470f07
L
9292 perform IE->LE optimization. A dummy REX_OPCODE prefix
9293 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9294 relocation for GDesc -> IE/LE optimization. */
cf61b747
L
9295 if (x86_elf_abi == X86_64_X32_ABI
9296 && i.operands == 2
14470f07
L
9297 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9298 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
cf61b747
L
9299 && i.prefix[REX_PREFIX] == 0)
9300 add_prefix (REX_OPCODE);
6d19a37a 9301#endif
cf61b747 9302
c0f3af97
L
9303 /* The prefix bytes. */
9304 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9305 if (*q)
9306 FRAG_APPEND_1_CHAR (*q);
0f10071e 9307 }
ae5c1c7b 9308 else
c0f3af97
L
9309 {
9310 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9311 if (*q)
9312 switch (j)
9313 {
c0f3af97
L
9314 case SEG_PREFIX:
9315 case ADDR_PREFIX:
9316 FRAG_APPEND_1_CHAR (*q);
9317 break;
9318 default:
9319 /* There should be no other prefixes for instructions
9320 with VEX prefix. */
9321 abort ();
9322 }
9323
43234a1e
L
9324 /* For EVEX instructions i.vrex should become 0 after
9325 build_evex_prefix. For VEX instructions upper 16 registers
9326 aren't available, so VREX should be 0. */
9327 if (i.vrex)
9328 abort ();
c0f3af97
L
9329 /* Now the VEX prefix. */
9330 p = frag_more (i.vex.length);
9331 for (j = 0; j < i.vex.length; j++)
9332 p[j] = i.vex.bytes[j];
9333 }
252b5132 9334
29b0f896 9335 /* Now the opcode; be careful about word order here! */
4dffcebc 9336 if (i.tm.opcode_length == 1)
29b0f896
AM
9337 {
9338 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9339 }
9340 else
9341 {
4dffcebc 9342 switch (i.tm.opcode_length)
331d2d0d 9343 {
43234a1e
L
9344 case 4:
9345 p = frag_more (4);
9346 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9347 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9348 break;
4dffcebc 9349 case 3:
331d2d0d
L
9350 p = frag_more (3);
9351 *p++ = (i.tm.base_opcode >> 16) & 0xff;
4dffcebc
L
9352 break;
9353 case 2:
9354 p = frag_more (2);
9355 break;
9356 default:
9357 abort ();
9358 break;
331d2d0d 9359 }
0f10071e 9360
29b0f896
AM
9361 /* Put out high byte first: can't use md_number_to_chars! */
9362 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9363 *p = i.tm.base_opcode & 0xff;
9364 }
3e73aa7c 9365
29b0f896 9366 /* Now the modrm byte and sib byte (if present). */
40fb9820 9367 if (i.tm.opcode_modifier.modrm)
29b0f896 9368 {
4a3523fa
L
9369 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
9370 | i.rm.reg << 3
9371 | i.rm.mode << 6));
29b0f896
AM
9372 /* If i.rm.regmem == ESP (4)
9373 && i.rm.mode != (Register mode)
9374 && not 16 bit
9375 ==> need second modrm byte. */
9376 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9377 && i.rm.mode != 3
dc821c5f 9378 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
4a3523fa
L
9379 FRAG_APPEND_1_CHAR ((i.sib.base << 0
9380 | i.sib.index << 3
9381 | i.sib.scale << 6));
29b0f896 9382 }
3e73aa7c 9383
29b0f896 9384 if (i.disp_operands)
2bbd9c25 9385 output_disp (insn_start_frag, insn_start_off);
3e73aa7c 9386
29b0f896 9387 if (i.imm_operands)
2bbd9c25 9388 output_imm (insn_start_frag, insn_start_off);
9c33702b
JB
9389
9390 /*
9391 * frag_now_fix () returning plain abs_section_offset when we're in the
9392 * absolute section, and abs_section_offset not getting updated as data
9393 * gets added to the frag breaks the logic below.
9394 */
9395 if (now_seg != absolute_section)
9396 {
9397 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9398 if (j > 15)
9399 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9400 j);
e379e5f3
L
9401 else if (fragP)
9402 {
9403 /* NB: Don't add prefix with GOTPC relocation since
9404 output_disp() above depends on the fixed encoding
9405 length. Can't add prefix with TLS relocation since
9406 it breaks TLS linker optimization. */
9407 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9408 /* Prefix count on the current instruction. */
9409 unsigned int count = i.vex.length;
9410 unsigned int k;
9411 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9412 /* REX byte is encoded in VEX/EVEX prefix. */
9413 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9414 count++;
9415
9416 /* Count prefixes for extended opcode maps. */
9417 if (!i.vex.length)
9418 switch (i.tm.opcode_length)
9419 {
9420 case 3:
9421 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9422 {
9423 count++;
9424 switch ((i.tm.base_opcode >> 8) & 0xff)
9425 {
9426 case 0x38:
9427 case 0x3a:
9428 count++;
9429 break;
9430 default:
9431 break;
9432 }
9433 }
9434 break;
9435 case 2:
9436 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9437 count++;
9438 break;
9439 case 1:
9440 break;
9441 default:
9442 abort ();
9443 }
9444
9445 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9446 == BRANCH_PREFIX)
9447 {
9448 /* Set the maximum prefix size in BRANCH_PREFIX
9449 frag. */
9450 if (fragP->tc_frag_data.max_bytes > max)
9451 fragP->tc_frag_data.max_bytes = max;
9452 if (fragP->tc_frag_data.max_bytes > count)
9453 fragP->tc_frag_data.max_bytes -= count;
9454 else
9455 fragP->tc_frag_data.max_bytes = 0;
9456 }
9457 else
9458 {
9459 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9460 frag. */
9461 unsigned int max_prefix_size;
9462 if (align_branch_prefix_size > max)
9463 max_prefix_size = max;
9464 else
9465 max_prefix_size = align_branch_prefix_size;
9466 if (max_prefix_size > count)
9467 fragP->tc_frag_data.max_prefix_length
9468 = max_prefix_size - count;
9469 }
9470
9471 /* Use existing segment prefix if possible. Use CS
9472 segment prefix in 64-bit mode. In 32-bit mode, use SS
9473 segment prefix with ESP/EBP base register and use DS
9474 segment prefix without ESP/EBP base register. */
9475 if (i.prefix[SEG_PREFIX])
9476 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9477 else if (flag_code == CODE_64BIT)
9478 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9479 else if (i.base_reg
9480 && (i.base_reg->reg_num == 4
9481 || i.base_reg->reg_num == 5))
9482 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9483 else
9484 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9485 }
9c33702b 9486 }
29b0f896 9487 }
252b5132 9488
e379e5f3
L
9489 /* NB: Don't work with COND_JUMP86 without i386. */
9490 if (align_branch_power
9491 && now_seg != absolute_section
9492 && cpu_arch_flags.bitfield.cpui386)
9493 {
9494 /* Terminate each frag so that we can add prefix and check for
9495 fused jcc. */
9496 frag_wane (frag_now);
9497 frag_new (0);
9498 }
9499
29b0f896
AM
9500#ifdef DEBUG386
9501 if (flag_debug)
9502 {
7b81dfbb 9503 pi ("" /*line*/, &i);
29b0f896
AM
9504 }
9505#endif /* DEBUG386 */
9506}
252b5132 9507
e205caa7
L
9508/* Return the size of the displacement operand N. */
9509
9510static int
9511disp_size (unsigned int n)
9512{
9513 int size = 4;
43234a1e 9514
b5014f7a 9515 if (i.types[n].bitfield.disp64)
40fb9820
L
9516 size = 8;
9517 else if (i.types[n].bitfield.disp8)
9518 size = 1;
9519 else if (i.types[n].bitfield.disp16)
9520 size = 2;
e205caa7
L
9521 return size;
9522}
9523
9524/* Return the size of the immediate operand N. */
9525
9526static int
9527imm_size (unsigned int n)
9528{
9529 int size = 4;
40fb9820
L
9530 if (i.types[n].bitfield.imm64)
9531 size = 8;
9532 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9533 size = 1;
9534 else if (i.types[n].bitfield.imm16)
9535 size = 2;
e205caa7
L
9536 return size;
9537}
9538
29b0f896 9539static void
64e74474 9540output_disp (fragS *insn_start_frag, offsetT insn_start_off)
29b0f896
AM
9541{
9542 char *p;
9543 unsigned int n;
252b5132 9544
29b0f896
AM
9545 for (n = 0; n < i.operands; n++)
9546 {
b5014f7a 9547 if (operand_type_check (i.types[n], disp))
29b0f896
AM
9548 {
9549 if (i.op[n].disps->X_op == O_constant)
9550 {
e205caa7 9551 int size = disp_size (n);
43234a1e 9552 offsetT val = i.op[n].disps->X_add_number;
252b5132 9553
629cfaf1
JB
9554 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9555 size);
29b0f896
AM
9556 p = frag_more (size);
9557 md_number_to_chars (p, val, size);
9558 }
9559 else
9560 {
f86103b7 9561 enum bfd_reloc_code_real reloc_type;
e205caa7 9562 int size = disp_size (n);
40fb9820 9563 int sign = i.types[n].bitfield.disp32s;
29b0f896 9564 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
02a86693 9565 fixS *fixP;
29b0f896 9566
e205caa7 9567 /* We can't have 8 bit displacement here. */
9c2799c2 9568 gas_assert (!i.types[n].bitfield.disp8);
e205caa7 9569
29b0f896
AM
9570 /* The PC relative address is computed relative
9571 to the instruction boundary, so in case immediate
9572 fields follows, we need to adjust the value. */
9573 if (pcrel && i.imm_operands)
9574 {
29b0f896 9575 unsigned int n1;
e205caa7 9576 int sz = 0;
252b5132 9577
29b0f896 9578 for (n1 = 0; n1 < i.operands; n1++)
40fb9820 9579 if (operand_type_check (i.types[n1], imm))
252b5132 9580 {
e205caa7
L
9581 /* Only one immediate is allowed for PC
9582 relative address. */
9c2799c2 9583 gas_assert (sz == 0);
e205caa7
L
9584 sz = imm_size (n1);
9585 i.op[n].disps->X_add_number -= sz;
252b5132 9586 }
29b0f896 9587 /* We should find the immediate. */
9c2799c2 9588 gas_assert (sz != 0);
29b0f896 9589 }
520dc8e8 9590
29b0f896 9591 p = frag_more (size);
d258b828 9592 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
d6ab8113 9593 if (GOT_symbol
2bbd9c25 9594 && GOT_symbol == i.op[n].disps->X_add_symbol
d6ab8113 9595 && (((reloc_type == BFD_RELOC_32
7b81dfbb
AJ
9596 || reloc_type == BFD_RELOC_X86_64_32S
9597 || (reloc_type == BFD_RELOC_64
9598 && object_64bit))
d6ab8113
JB
9599 && (i.op[n].disps->X_op == O_symbol
9600 || (i.op[n].disps->X_op == O_add
9601 && ((symbol_get_value_expression
9602 (i.op[n].disps->X_op_symbol)->X_op)
9603 == O_subtract))))
9604 || reloc_type == BFD_RELOC_32_PCREL))
2bbd9c25 9605 {
4fa24527 9606 if (!object_64bit)
7b81dfbb
AJ
9607 {
9608 reloc_type = BFD_RELOC_386_GOTPC;
e379e5f3 9609 i.has_gotpc_tls_reloc = TRUE;
d583596c
JB
9610 i.op[n].imms->X_add_number +=
9611 encoding_length (insn_start_frag, insn_start_off, p);
7b81dfbb
AJ
9612 }
9613 else if (reloc_type == BFD_RELOC_64)
9614 reloc_type = BFD_RELOC_X86_64_GOTPC64;
d6ab8113 9615 else
7b81dfbb
AJ
9616 /* Don't do the adjustment for x86-64, as there
9617 the pcrel addressing is relative to the _next_
9618 insn, and that is taken care of in other code. */
d6ab8113 9619 reloc_type = BFD_RELOC_X86_64_GOTPC32;
2bbd9c25 9620 }
e379e5f3
L
9621 else if (align_branch_power)
9622 {
9623 switch (reloc_type)
9624 {
9625 case BFD_RELOC_386_TLS_GD:
9626 case BFD_RELOC_386_TLS_LDM:
9627 case BFD_RELOC_386_TLS_IE:
9628 case BFD_RELOC_386_TLS_IE_32:
9629 case BFD_RELOC_386_TLS_GOTIE:
9630 case BFD_RELOC_386_TLS_GOTDESC:
9631 case BFD_RELOC_386_TLS_DESC_CALL:
9632 case BFD_RELOC_X86_64_TLSGD:
9633 case BFD_RELOC_X86_64_TLSLD:
9634 case BFD_RELOC_X86_64_GOTTPOFF:
9635 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9636 case BFD_RELOC_X86_64_TLSDESC_CALL:
9637 i.has_gotpc_tls_reloc = TRUE;
9638 default:
9639 break;
9640 }
9641 }
02a86693
L
9642 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9643 size, i.op[n].disps, pcrel,
9644 reloc_type);
9645 /* Check for "call/jmp *mem", "mov mem, %reg",
9646 "test %reg, mem" and "binop mem, %reg" where binop
9647 is one of adc, add, and, cmp, or, sbb, sub, xor
e60f4d3b
L
9648 instructions without data prefix. Always generate
9649 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9650 if (i.prefix[DATA_PREFIX] == 0
9651 && (generate_relax_relocations
9652 || (!object_64bit
9653 && i.rm.mode == 0
9654 && i.rm.regmem == 5))
0cb4071e
L
9655 && (i.rm.mode == 2
9656 || (i.rm.mode == 0 && i.rm.regmem == 5))
2ae4c703 9657 && !is_any_vex_encoding(&i.tm)
02a86693
L
9658 && ((i.operands == 1
9659 && i.tm.base_opcode == 0xff
9660 && (i.rm.reg == 2 || i.rm.reg == 4))
9661 || (i.operands == 2
9662 && (i.tm.base_opcode == 0x8b
9663 || i.tm.base_opcode == 0x85
2ae4c703 9664 || (i.tm.base_opcode & ~0x38) == 0x03))))
02a86693
L
9665 {
9666 if (object_64bit)
9667 {
9668 fixP->fx_tcbit = i.rex != 0;
9669 if (i.base_reg
e968fc9b 9670 && (i.base_reg->reg_num == RegIP))
02a86693
L
9671 fixP->fx_tcbit2 = 1;
9672 }
9673 else
9674 fixP->fx_tcbit2 = 1;
9675 }
29b0f896
AM
9676 }
9677 }
9678 }
9679}
252b5132 9680
29b0f896 9681static void
64e74474 9682output_imm (fragS *insn_start_frag, offsetT insn_start_off)
29b0f896
AM
9683{
9684 char *p;
9685 unsigned int n;
252b5132 9686
29b0f896
AM
9687 for (n = 0; n < i.operands; n++)
9688 {
43234a1e
L
9689 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9690 if (i.rounding && (int) n == i.rounding->operand)
9691 continue;
9692
40fb9820 9693 if (operand_type_check (i.types[n], imm))
29b0f896
AM
9694 {
9695 if (i.op[n].imms->X_op == O_constant)
9696 {
e205caa7 9697 int size = imm_size (n);
29b0f896 9698 offsetT val;
b4cac588 9699
29b0f896
AM
9700 val = offset_in_range (i.op[n].imms->X_add_number,
9701 size);
9702 p = frag_more (size);
9703 md_number_to_chars (p, val, size);
9704 }
9705 else
9706 {
9707 /* Not absolute_section.
9708 Need a 32-bit fixup (don't support 8bit
9709 non-absolute imms). Try to support other
9710 sizes ... */
f86103b7 9711 enum bfd_reloc_code_real reloc_type;
e205caa7
L
9712 int size = imm_size (n);
9713 int sign;
29b0f896 9714
40fb9820 9715 if (i.types[n].bitfield.imm32s
a7d61044 9716 && (i.suffix == QWORD_MNEM_SUFFIX
40fb9820 9717 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
29b0f896 9718 sign = 1;
e205caa7
L
9719 else
9720 sign = 0;
520dc8e8 9721
29b0f896 9722 p = frag_more (size);
d258b828 9723 reloc_type = reloc (size, 0, sign, i.reloc[n]);
f86103b7 9724
2bbd9c25
JJ
9725 /* This is tough to explain. We end up with this one if we
9726 * have operands that look like
9727 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9728 * obtain the absolute address of the GOT, and it is strongly
9729 * preferable from a performance point of view to avoid using
9730 * a runtime relocation for this. The actual sequence of
9731 * instructions often look something like:
9732 *
9733 * call .L66
9734 * .L66:
9735 * popl %ebx
9736 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9737 *
9738 * The call and pop essentially return the absolute address
9739 * of the label .L66 and store it in %ebx. The linker itself
9740 * will ultimately change the first operand of the addl so
9741 * that %ebx points to the GOT, but to keep things simple, the
9742 * .o file must have this operand set so that it generates not
9743 * the absolute address of .L66, but the absolute address of
9744 * itself. This allows the linker itself simply treat a GOTPC
9745 * relocation as asking for a pcrel offset to the GOT to be
9746 * added in, and the addend of the relocation is stored in the
9747 * operand field for the instruction itself.
9748 *
9749 * Our job here is to fix the operand so that it would add
9750 * the correct offset so that %ebx would point to itself. The
9751 * thing that is tricky is that .-.L66 will point to the
9752 * beginning of the instruction, so we need to further modify
9753 * the operand so that it will point to itself. There are
9754 * other cases where you have something like:
9755 *
9756 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9757 *
9758 * and here no correction would be required. Internally in
9759 * the assembler we treat operands of this form as not being
9760 * pcrel since the '.' is explicitly mentioned, and I wonder
9761 * whether it would simplify matters to do it this way. Who
9762 * knows. In earlier versions of the PIC patches, the
9763 * pcrel_adjust field was used to store the correction, but
9764 * since the expression is not pcrel, I felt it would be
9765 * confusing to do it this way. */
9766
d6ab8113 9767 if ((reloc_type == BFD_RELOC_32
7b81dfbb
AJ
9768 || reloc_type == BFD_RELOC_X86_64_32S
9769 || reloc_type == BFD_RELOC_64)
29b0f896
AM
9770 && GOT_symbol
9771 && GOT_symbol == i.op[n].imms->X_add_symbol
9772 && (i.op[n].imms->X_op == O_symbol
9773 || (i.op[n].imms->X_op == O_add
9774 && ((symbol_get_value_expression
9775 (i.op[n].imms->X_op_symbol)->X_op)
9776 == O_subtract))))
9777 {
4fa24527 9778 if (!object_64bit)
d6ab8113 9779 reloc_type = BFD_RELOC_386_GOTPC;
7b81dfbb 9780 else if (size == 4)
d6ab8113 9781 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7b81dfbb
AJ
9782 else if (size == 8)
9783 reloc_type = BFD_RELOC_X86_64_GOTPC64;
e379e5f3 9784 i.has_gotpc_tls_reloc = TRUE;
d583596c
JB
9785 i.op[n].imms->X_add_number +=
9786 encoding_length (insn_start_frag, insn_start_off, p);
29b0f896 9787 }
29b0f896
AM
9788 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9789 i.op[n].imms, 0, reloc_type);
9790 }
9791 }
9792 }
252b5132
RH
9793}
9794\f
d182319b
JB
9795/* x86_cons_fix_new is called via the expression parsing code when a
9796 reloc is needed. We use this hook to get the correct .got reloc. */
d182319b
JB
9797static int cons_sign = -1;
9798
9799void
e3bb37b5 9800x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
62ebcb5c 9801 expressionS *exp, bfd_reloc_code_real_type r)
d182319b 9802{
d258b828 9803 r = reloc (len, 0, cons_sign, r);
d182319b
JB
9804
9805#ifdef TE_PE
9806 if (exp->X_op == O_secrel)
9807 {
9808 exp->X_op = O_symbol;
9809 r = BFD_RELOC_32_SECREL;
9810 }
9811#endif
9812
9813 fix_new_exp (frag, off, len, exp, 0, r);
9814}
9815
357d1bd8
L
9816/* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9817 purpose of the `.dc.a' internal pseudo-op. */
9818
9819int
9820x86_address_bytes (void)
9821{
9822 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9823 return 4;
9824 return stdoutput->arch_info->bits_per_address / 8;
9825}
9826
d382c579
TG
9827#if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9828 || defined (LEX_AT)
d258b828 9829# define lex_got(reloc, adjust, types) NULL
718ddfc0 9830#else
f3c180ae
AM
9831/* Parse operands of the form
9832 <symbol>@GOTOFF+<nnn>
9833 and similar .plt or .got references.
9834
9835 If we find one, set up the correct relocation in RELOC and copy the
9836 input string, minus the `@GOTOFF' into a malloc'd buffer for
9837 parsing by the calling routine. Return this buffer, and if ADJUST
9838 is non-null set it to the length of the string we removed from the
9839 input line. Otherwise return NULL. */
9840static char *
91d6fa6a 9841lex_got (enum bfd_reloc_code_real *rel,
64e74474 9842 int *adjust,
d258b828 9843 i386_operand_type *types)
f3c180ae 9844{
7b81dfbb
AJ
9845 /* Some of the relocations depend on the size of what field is to
9846 be relocated. But in our callers i386_immediate and i386_displacement
9847 we don't yet know the operand size (this will be set by insn
9848 matching). Hence we record the word32 relocation here,
9849 and adjust the reloc according to the real size in reloc(). */
f3c180ae
AM
9850 static const struct {
9851 const char *str;
cff8d58a 9852 int len;
4fa24527 9853 const enum bfd_reloc_code_real rel[2];
40fb9820 9854 const i386_operand_type types64;
f3c180ae 9855 } gotrel[] = {
8ce3d284 9856#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
9857 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9858 BFD_RELOC_SIZE32 },
9859 OPERAND_TYPE_IMM32_64 },
8ce3d284 9860#endif
cff8d58a
L
9861 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9862 BFD_RELOC_X86_64_PLTOFF64 },
40fb9820 9863 OPERAND_TYPE_IMM64 },
cff8d58a
L
9864 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9865 BFD_RELOC_X86_64_PLT32 },
40fb9820 9866 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9867 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9868 BFD_RELOC_X86_64_GOTPLT64 },
40fb9820 9869 OPERAND_TYPE_IMM64_DISP64 },
cff8d58a
L
9870 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9871 BFD_RELOC_X86_64_GOTOFF64 },
40fb9820 9872 OPERAND_TYPE_IMM64_DISP64 },
cff8d58a
L
9873 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9874 BFD_RELOC_X86_64_GOTPCREL },
40fb9820 9875 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9876 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9877 BFD_RELOC_X86_64_TLSGD },
40fb9820 9878 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9879 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9880 _dummy_first_bfd_reloc_code_real },
40fb9820 9881 OPERAND_TYPE_NONE },
cff8d58a
L
9882 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9883 BFD_RELOC_X86_64_TLSLD },
40fb9820 9884 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9885 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9886 BFD_RELOC_X86_64_GOTTPOFF },
40fb9820 9887 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9888 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9889 BFD_RELOC_X86_64_TPOFF32 },
40fb9820 9890 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
cff8d58a
L
9891 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9892 _dummy_first_bfd_reloc_code_real },
40fb9820 9893 OPERAND_TYPE_NONE },
cff8d58a
L
9894 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9895 BFD_RELOC_X86_64_DTPOFF32 },
40fb9820 9896 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
cff8d58a
L
9897 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9898 _dummy_first_bfd_reloc_code_real },
40fb9820 9899 OPERAND_TYPE_NONE },
cff8d58a
L
9900 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9901 _dummy_first_bfd_reloc_code_real },
40fb9820 9902 OPERAND_TYPE_NONE },
cff8d58a
L
9903 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9904 BFD_RELOC_X86_64_GOT32 },
40fb9820 9905 OPERAND_TYPE_IMM32_32S_64_DISP32 },
cff8d58a
L
9906 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9907 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
40fb9820 9908 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9909 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9910 BFD_RELOC_X86_64_TLSDESC_CALL },
40fb9820 9911 OPERAND_TYPE_IMM32_32S_DISP32 },
f3c180ae
AM
9912 };
9913 char *cp;
9914 unsigned int j;
9915
d382c579 9916#if defined (OBJ_MAYBE_ELF)
718ddfc0
JB
9917 if (!IS_ELF)
9918 return NULL;
d382c579 9919#endif
718ddfc0 9920
f3c180ae 9921 for (cp = input_line_pointer; *cp != '@'; cp++)
67c11a9b 9922 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
f3c180ae
AM
9923 return NULL;
9924
47465058 9925 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
f3c180ae 9926 {
cff8d58a 9927 int len = gotrel[j].len;
28f81592 9928 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
f3c180ae 9929 {
4fa24527 9930 if (gotrel[j].rel[object_64bit] != 0)
f3c180ae 9931 {
28f81592
AM
9932 int first, second;
9933 char *tmpbuf, *past_reloc;
f3c180ae 9934
91d6fa6a 9935 *rel = gotrel[j].rel[object_64bit];
f3c180ae 9936
3956db08
JB
9937 if (types)
9938 {
9939 if (flag_code != CODE_64BIT)
40fb9820
L
9940 {
9941 types->bitfield.imm32 = 1;
9942 types->bitfield.disp32 = 1;
9943 }
3956db08
JB
9944 else
9945 *types = gotrel[j].types64;
9946 }
9947
8fd4256d 9948 if (j != 0 && GOT_symbol == NULL)
f3c180ae
AM
9949 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9950
28f81592 9951 /* The length of the first part of our input line. */
f3c180ae 9952 first = cp - input_line_pointer;
28f81592
AM
9953
9954 /* The second part goes from after the reloc token until
67c11a9b 9955 (and including) an end_of_line char or comma. */
28f81592 9956 past_reloc = cp + 1 + len;
67c11a9b
AM
9957 cp = past_reloc;
9958 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9959 ++cp;
9960 second = cp + 1 - past_reloc;
28f81592
AM
9961
9962 /* Allocate and copy string. The trailing NUL shouldn't
9963 be necessary, but be safe. */
add39d23 9964 tmpbuf = XNEWVEC (char, first + second + 2);
f3c180ae 9965 memcpy (tmpbuf, input_line_pointer, first);
0787a12d
AM
9966 if (second != 0 && *past_reloc != ' ')
9967 /* Replace the relocation token with ' ', so that
9968 errors like foo@GOTOFF1 will be detected. */
9969 tmpbuf[first++] = ' ';
af89796a
L
9970 else
9971 /* Increment length by 1 if the relocation token is
9972 removed. */
9973 len++;
9974 if (adjust)
9975 *adjust = len;
0787a12d
AM
9976 memcpy (tmpbuf + first, past_reloc, second);
9977 tmpbuf[first + second] = '\0';
f3c180ae
AM
9978 return tmpbuf;
9979 }
9980
4fa24527
JB
9981 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9982 gotrel[j].str, 1 << (5 + object_64bit));
f3c180ae
AM
9983 return NULL;
9984 }
9985 }
9986
9987 /* Might be a symbol version string. Don't as_bad here. */
9988 return NULL;
9989}
4e4f7c87 9990#endif
f3c180ae 9991
a988325c
NC
9992#ifdef TE_PE
9993#ifdef lex_got
9994#undef lex_got
9995#endif
9996/* Parse operands of the form
9997 <symbol>@SECREL32+<nnn>
9998
9999 If we find one, set up the correct relocation in RELOC and copy the
10000 input string, minus the `@SECREL32' into a malloc'd buffer for
10001 parsing by the calling routine. Return this buffer, and if ADJUST
10002 is non-null set it to the length of the string we removed from the
34bca508
L
10003 input line. Otherwise return NULL.
10004
a988325c
NC
10005 This function is copied from the ELF version above adjusted for PE targets. */
10006
10007static char *
10008lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10009 int *adjust ATTRIBUTE_UNUSED,
d258b828 10010 i386_operand_type *types)
a988325c
NC
10011{
10012 static const struct
10013 {
10014 const char *str;
10015 int len;
10016 const enum bfd_reloc_code_real rel[2];
10017 const i386_operand_type types64;
10018 }
10019 gotrel[] =
10020 {
10021 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10022 BFD_RELOC_32_SECREL },
10023 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10024 };
10025
10026 char *cp;
10027 unsigned j;
10028
10029 for (cp = input_line_pointer; *cp != '@'; cp++)
10030 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10031 return NULL;
10032
10033 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10034 {
10035 int len = gotrel[j].len;
10036
10037 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10038 {
10039 if (gotrel[j].rel[object_64bit] != 0)
10040 {
10041 int first, second;
10042 char *tmpbuf, *past_reloc;
10043
10044 *rel = gotrel[j].rel[object_64bit];
10045 if (adjust)
10046 *adjust = len;
10047
10048 if (types)
10049 {
10050 if (flag_code != CODE_64BIT)
10051 {
10052 types->bitfield.imm32 = 1;
10053 types->bitfield.disp32 = 1;
10054 }
10055 else
10056 *types = gotrel[j].types64;
10057 }
10058
10059 /* The length of the first part of our input line. */
10060 first = cp - input_line_pointer;
10061
10062 /* The second part goes from after the reloc token until
10063 (and including) an end_of_line char or comma. */
10064 past_reloc = cp + 1 + len;
10065 cp = past_reloc;
10066 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10067 ++cp;
10068 second = cp + 1 - past_reloc;
10069
10070 /* Allocate and copy string. The trailing NUL shouldn't
10071 be necessary, but be safe. */
add39d23 10072 tmpbuf = XNEWVEC (char, first + second + 2);
a988325c
NC
10073 memcpy (tmpbuf, input_line_pointer, first);
10074 if (second != 0 && *past_reloc != ' ')
10075 /* Replace the relocation token with ' ', so that
10076 errors like foo@SECLREL321 will be detected. */
10077 tmpbuf[first++] = ' ';
10078 memcpy (tmpbuf + first, past_reloc, second);
10079 tmpbuf[first + second] = '\0';
10080 return tmpbuf;
10081 }
10082
10083 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10084 gotrel[j].str, 1 << (5 + object_64bit));
10085 return NULL;
10086 }
10087 }
10088
10089 /* Might be a symbol version string. Don't as_bad here. */
10090 return NULL;
10091}
10092
10093#endif /* TE_PE */
10094
62ebcb5c 10095bfd_reloc_code_real_type
e3bb37b5 10096x86_cons (expressionS *exp, int size)
f3c180ae 10097{
62ebcb5c
AM
10098 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10099
ee86248c
JB
10100 intel_syntax = -intel_syntax;
10101
3c7b9c2c 10102 exp->X_md = 0;
4fa24527 10103 if (size == 4 || (object_64bit && size == 8))
f3c180ae
AM
10104 {
10105 /* Handle @GOTOFF and the like in an expression. */
10106 char *save;
10107 char *gotfree_input_line;
4a57f2cf 10108 int adjust = 0;
f3c180ae
AM
10109
10110 save = input_line_pointer;
d258b828 10111 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
f3c180ae
AM
10112 if (gotfree_input_line)
10113 input_line_pointer = gotfree_input_line;
10114
10115 expression (exp);
10116
10117 if (gotfree_input_line)
10118 {
10119 /* expression () has merrily parsed up to the end of line,
10120 or a comma - in the wrong buffer. Transfer how far
10121 input_line_pointer has moved to the right buffer. */
10122 input_line_pointer = (save
10123 + (input_line_pointer - gotfree_input_line)
10124 + adjust);
10125 free (gotfree_input_line);
3992d3b7
AM
10126 if (exp->X_op == O_constant
10127 || exp->X_op == O_absent
10128 || exp->X_op == O_illegal
0398aac5 10129 || exp->X_op == O_register
3992d3b7
AM
10130 || exp->X_op == O_big)
10131 {
10132 char c = *input_line_pointer;
10133 *input_line_pointer = 0;
10134 as_bad (_("missing or invalid expression `%s'"), save);
10135 *input_line_pointer = c;
10136 }
b9519cfe
L
10137 else if ((got_reloc == BFD_RELOC_386_PLT32
10138 || got_reloc == BFD_RELOC_X86_64_PLT32)
10139 && exp->X_op != O_symbol)
10140 {
10141 char c = *input_line_pointer;
10142 *input_line_pointer = 0;
10143 as_bad (_("invalid PLT expression `%s'"), save);
10144 *input_line_pointer = c;
10145 }
f3c180ae
AM
10146 }
10147 }
10148 else
10149 expression (exp);
ee86248c
JB
10150
10151 intel_syntax = -intel_syntax;
10152
10153 if (intel_syntax)
10154 i386_intel_simplify (exp);
62ebcb5c
AM
10155
10156 return got_reloc;
f3c180ae 10157}
f3c180ae 10158
9f32dd5b
L
10159static void
10160signed_cons (int size)
6482c264 10161{
d182319b
JB
10162 if (flag_code == CODE_64BIT)
10163 cons_sign = 1;
10164 cons (size);
10165 cons_sign = -1;
6482c264
NC
10166}
10167
d182319b 10168#ifdef TE_PE
6482c264 10169static void
7016a5d5 10170pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
6482c264
NC
10171{
10172 expressionS exp;
10173
10174 do
10175 {
10176 expression (&exp);
10177 if (exp.X_op == O_symbol)
10178 exp.X_op = O_secrel;
10179
10180 emit_expr (&exp, 4);
10181 }
10182 while (*input_line_pointer++ == ',');
10183
10184 input_line_pointer--;
10185 demand_empty_rest_of_line ();
10186}
6482c264
NC
10187#endif
10188
43234a1e
L
10189/* Handle Vector operations. */
10190
10191static char *
10192check_VecOperations (char *op_string, char *op_end)
10193{
10194 const reg_entry *mask;
10195 const char *saved;
10196 char *end_op;
10197
10198 while (*op_string
10199 && (op_end == NULL || op_string < op_end))
10200 {
10201 saved = op_string;
10202 if (*op_string == '{')
10203 {
10204 op_string++;
10205
10206 /* Check broadcasts. */
10207 if (strncmp (op_string, "1to", 3) == 0)
10208 {
10209 int bcst_type;
10210
10211 if (i.broadcast)
10212 goto duplicated_vec_op;
10213
10214 op_string += 3;
10215 if (*op_string == '8')
8e6e0792 10216 bcst_type = 8;
b28d1bda 10217 else if (*op_string == '4')
8e6e0792 10218 bcst_type = 4;
b28d1bda 10219 else if (*op_string == '2')
8e6e0792 10220 bcst_type = 2;
43234a1e
L
10221 else if (*op_string == '1'
10222 && *(op_string+1) == '6')
10223 {
8e6e0792 10224 bcst_type = 16;
43234a1e
L
10225 op_string++;
10226 }
10227 else
10228 {
10229 as_bad (_("Unsupported broadcast: `%s'"), saved);
10230 return NULL;
10231 }
10232 op_string++;
10233
10234 broadcast_op.type = bcst_type;
10235 broadcast_op.operand = this_operand;
1f75763a 10236 broadcast_op.bytes = 0;
43234a1e
L
10237 i.broadcast = &broadcast_op;
10238 }
10239 /* Check masking operation. */
10240 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10241 {
8a6fb3f9
JB
10242 if (mask == &bad_reg)
10243 return NULL;
10244
43234a1e 10245 /* k0 can't be used for write mask. */
f74a6307 10246 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
43234a1e 10247 {
6d2cd6b2
JB
10248 as_bad (_("`%s%s' can't be used for write mask"),
10249 register_prefix, mask->reg_name);
43234a1e
L
10250 return NULL;
10251 }
10252
10253 if (!i.mask)
10254 {
10255 mask_op.mask = mask;
10256 mask_op.zeroing = 0;
10257 mask_op.operand = this_operand;
10258 i.mask = &mask_op;
10259 }
10260 else
10261 {
10262 if (i.mask->mask)
10263 goto duplicated_vec_op;
10264
10265 i.mask->mask = mask;
10266
10267 /* Only "{z}" is allowed here. No need to check
10268 zeroing mask explicitly. */
10269 if (i.mask->operand != this_operand)
10270 {
10271 as_bad (_("invalid write mask `%s'"), saved);
10272 return NULL;
10273 }
10274 }
10275
10276 op_string = end_op;
10277 }
10278 /* Check zeroing-flag for masking operation. */
10279 else if (*op_string == 'z')
10280 {
10281 if (!i.mask)
10282 {
10283 mask_op.mask = NULL;
10284 mask_op.zeroing = 1;
10285 mask_op.operand = this_operand;
10286 i.mask = &mask_op;
10287 }
10288 else
10289 {
10290 if (i.mask->zeroing)
10291 {
10292 duplicated_vec_op:
10293 as_bad (_("duplicated `%s'"), saved);
10294 return NULL;
10295 }
10296
10297 i.mask->zeroing = 1;
10298
10299 /* Only "{%k}" is allowed here. No need to check mask
10300 register explicitly. */
10301 if (i.mask->operand != this_operand)
10302 {
10303 as_bad (_("invalid zeroing-masking `%s'"),
10304 saved);
10305 return NULL;
10306 }
10307 }
10308
10309 op_string++;
10310 }
10311 else
10312 goto unknown_vec_op;
10313
10314 if (*op_string != '}')
10315 {
10316 as_bad (_("missing `}' in `%s'"), saved);
10317 return NULL;
10318 }
10319 op_string++;
0ba3a731
L
10320
10321 /* Strip whitespace since the addition of pseudo prefixes
10322 changed how the scrubber treats '{'. */
10323 if (is_space_char (*op_string))
10324 ++op_string;
10325
43234a1e
L
10326 continue;
10327 }
10328 unknown_vec_op:
10329 /* We don't know this one. */
10330 as_bad (_("unknown vector operation: `%s'"), saved);
10331 return NULL;
10332 }
10333
6d2cd6b2
JB
10334 if (i.mask && i.mask->zeroing && !i.mask->mask)
10335 {
10336 as_bad (_("zeroing-masking only allowed with write mask"));
10337 return NULL;
10338 }
10339
43234a1e
L
10340 return op_string;
10341}
10342
252b5132 10343static int
70e41ade 10344i386_immediate (char *imm_start)
252b5132
RH
10345{
10346 char *save_input_line_pointer;
f3c180ae 10347 char *gotfree_input_line;
252b5132 10348 segT exp_seg = 0;
47926f60 10349 expressionS *exp;
40fb9820
L
10350 i386_operand_type types;
10351
0dfbf9d7 10352 operand_type_set (&types, ~0);
252b5132
RH
10353
10354 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10355 {
31b2323c
L
10356 as_bad (_("at most %d immediate operands are allowed"),
10357 MAX_IMMEDIATE_OPERANDS);
252b5132
RH
10358 return 0;
10359 }
10360
10361 exp = &im_expressions[i.imm_operands++];
520dc8e8 10362 i.op[this_operand].imms = exp;
252b5132
RH
10363
10364 if (is_space_char (*imm_start))
10365 ++imm_start;
10366
10367 save_input_line_pointer = input_line_pointer;
10368 input_line_pointer = imm_start;
10369
d258b828 10370 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
f3c180ae
AM
10371 if (gotfree_input_line)
10372 input_line_pointer = gotfree_input_line;
252b5132
RH
10373
10374 exp_seg = expression (exp);
10375
83183c0c 10376 SKIP_WHITESPACE ();
43234a1e
L
10377
10378 /* Handle vector operations. */
10379 if (*input_line_pointer == '{')
10380 {
10381 input_line_pointer = check_VecOperations (input_line_pointer,
10382 NULL);
10383 if (input_line_pointer == NULL)
10384 return 0;
10385 }
10386
252b5132 10387 if (*input_line_pointer)
f3c180ae 10388 as_bad (_("junk `%s' after expression"), input_line_pointer);
252b5132
RH
10389
10390 input_line_pointer = save_input_line_pointer;
f3c180ae 10391 if (gotfree_input_line)
ee86248c
JB
10392 {
10393 free (gotfree_input_line);
10394
10395 if (exp->X_op == O_constant || exp->X_op == O_register)
10396 exp->X_op = O_illegal;
10397 }
10398
10399 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10400}
252b5132 10401
ee86248c
JB
10402static int
10403i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10404 i386_operand_type types, const char *imm_start)
10405{
10406 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
252b5132 10407 {
313c53d1
L
10408 if (imm_start)
10409 as_bad (_("missing or invalid immediate expression `%s'"),
10410 imm_start);
3992d3b7 10411 return 0;
252b5132 10412 }
3e73aa7c 10413 else if (exp->X_op == O_constant)
252b5132 10414 {
47926f60 10415 /* Size it properly later. */
40fb9820 10416 i.types[this_operand].bitfield.imm64 = 1;
13f864ae
L
10417 /* If not 64bit, sign extend val. */
10418 if (flag_code != CODE_64BIT
4eed87de
AM
10419 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10420 exp->X_add_number
10421 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
252b5132 10422 }
4c63da97 10423#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
f86103b7 10424 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
31312f95 10425 && exp_seg != absolute_section
47926f60 10426 && exp_seg != text_section
24eab124
AM
10427 && exp_seg != data_section
10428 && exp_seg != bss_section
10429 && exp_seg != undefined_section
f86103b7 10430 && !bfd_is_com_section (exp_seg))
252b5132 10431 {
d0b47220 10432 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
252b5132
RH
10433 return 0;
10434 }
10435#endif
a841bdf5 10436 else if (!intel_syntax && exp_seg == reg_section)
bb8f5920 10437 {
313c53d1
L
10438 if (imm_start)
10439 as_bad (_("illegal immediate register operand %s"), imm_start);
bb8f5920
L
10440 return 0;
10441 }
252b5132
RH
10442 else
10443 {
10444 /* This is an address. The size of the address will be
24eab124 10445 determined later, depending on destination register,
3e73aa7c 10446 suffix, or the default for the section. */
40fb9820
L
10447 i.types[this_operand].bitfield.imm8 = 1;
10448 i.types[this_operand].bitfield.imm16 = 1;
10449 i.types[this_operand].bitfield.imm32 = 1;
10450 i.types[this_operand].bitfield.imm32s = 1;
10451 i.types[this_operand].bitfield.imm64 = 1;
c6fb90c8
L
10452 i.types[this_operand] = operand_type_and (i.types[this_operand],
10453 types);
252b5132
RH
10454 }
10455
10456 return 1;
10457}
10458
551c1ca1 10459static char *
e3bb37b5 10460i386_scale (char *scale)
252b5132 10461{
551c1ca1
AM
10462 offsetT val;
10463 char *save = input_line_pointer;
252b5132 10464
551c1ca1
AM
10465 input_line_pointer = scale;
10466 val = get_absolute_expression ();
10467
10468 switch (val)
252b5132 10469 {
551c1ca1 10470 case 1:
252b5132
RH
10471 i.log2_scale_factor = 0;
10472 break;
551c1ca1 10473 case 2:
252b5132
RH
10474 i.log2_scale_factor = 1;
10475 break;
551c1ca1 10476 case 4:
252b5132
RH
10477 i.log2_scale_factor = 2;
10478 break;
551c1ca1 10479 case 8:
252b5132
RH
10480 i.log2_scale_factor = 3;
10481 break;
10482 default:
a724f0f4
JB
10483 {
10484 char sep = *input_line_pointer;
10485
10486 *input_line_pointer = '\0';
10487 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10488 scale);
10489 *input_line_pointer = sep;
10490 input_line_pointer = save;
10491 return NULL;
10492 }
252b5132 10493 }
29b0f896 10494 if (i.log2_scale_factor != 0 && i.index_reg == 0)
252b5132
RH
10495 {
10496 as_warn (_("scale factor of %d without an index register"),
24eab124 10497 1 << i.log2_scale_factor);
252b5132 10498 i.log2_scale_factor = 0;
252b5132 10499 }
551c1ca1
AM
10500 scale = input_line_pointer;
10501 input_line_pointer = save;
10502 return scale;
252b5132
RH
10503}
10504
252b5132 10505static int
e3bb37b5 10506i386_displacement (char *disp_start, char *disp_end)
252b5132 10507{
29b0f896 10508 expressionS *exp;
252b5132
RH
10509 segT exp_seg = 0;
10510 char *save_input_line_pointer;
f3c180ae 10511 char *gotfree_input_line;
40fb9820
L
10512 int override;
10513 i386_operand_type bigdisp, types = anydisp;
3992d3b7 10514 int ret;
252b5132 10515
31b2323c
L
10516 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10517 {
10518 as_bad (_("at most %d displacement operands are allowed"),
10519 MAX_MEMORY_OPERANDS);
10520 return 0;
10521 }
10522
0dfbf9d7 10523 operand_type_set (&bigdisp, 0);
6f2f06be 10524 if (i.jumpabsolute
48bcea9f 10525 || i.types[this_operand].bitfield.baseindex
0cfa3eb3
JB
10526 || (current_templates->start->opcode_modifier.jump != JUMP
10527 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
e05278af 10528 {
48bcea9f 10529 i386_addressing_mode ();
e05278af 10530 override = (i.prefix[ADDR_PREFIX] != 0);
40fb9820
L
10531 if (flag_code == CODE_64BIT)
10532 {
10533 if (!override)
10534 {
10535 bigdisp.bitfield.disp32s = 1;
10536 bigdisp.bitfield.disp64 = 1;
10537 }
48bcea9f
JB
10538 else
10539 bigdisp.bitfield.disp32 = 1;
40fb9820
L
10540 }
10541 else if ((flag_code == CODE_16BIT) ^ override)
40fb9820 10542 bigdisp.bitfield.disp16 = 1;
48bcea9f
JB
10543 else
10544 bigdisp.bitfield.disp32 = 1;
e05278af
JB
10545 }
10546 else
10547 {
376cd056
JB
10548 /* For PC-relative branches, the width of the displacement may be
10549 dependent upon data size, but is never dependent upon address size.
10550 Also make sure to not unintentionally match against a non-PC-relative
10551 branch template. */
10552 static templates aux_templates;
10553 const insn_template *t = current_templates->start;
10554 bfd_boolean has_intel64 = FALSE;
10555
10556 aux_templates.start = t;
10557 while (++t < current_templates->end)
10558 {
10559 if (t->opcode_modifier.jump
10560 != current_templates->start->opcode_modifier.jump)
10561 break;
4b5aaf5f 10562 if ((t->opcode_modifier.isa64 >= INTEL64))
376cd056
JB
10563 has_intel64 = TRUE;
10564 }
10565 if (t < current_templates->end)
10566 {
10567 aux_templates.end = t;
10568 current_templates = &aux_templates;
10569 }
10570
e05278af 10571 override = (i.prefix[DATA_PREFIX] != 0);
40fb9820
L
10572 if (flag_code == CODE_64BIT)
10573 {
376cd056
JB
10574 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10575 && (!intel64 || !has_intel64))
40fb9820
L
10576 bigdisp.bitfield.disp16 = 1;
10577 else
48bcea9f 10578 bigdisp.bitfield.disp32s = 1;
40fb9820
L
10579 }
10580 else
e05278af
JB
10581 {
10582 if (!override)
10583 override = (i.suffix == (flag_code != CODE_16BIT
10584 ? WORD_MNEM_SUFFIX
10585 : LONG_MNEM_SUFFIX));
40fb9820
L
10586 bigdisp.bitfield.disp32 = 1;
10587 if ((flag_code == CODE_16BIT) ^ override)
10588 {
10589 bigdisp.bitfield.disp32 = 0;
10590 bigdisp.bitfield.disp16 = 1;
10591 }
e05278af 10592 }
e05278af 10593 }
c6fb90c8
L
10594 i.types[this_operand] = operand_type_or (i.types[this_operand],
10595 bigdisp);
252b5132
RH
10596
10597 exp = &disp_expressions[i.disp_operands];
520dc8e8 10598 i.op[this_operand].disps = exp;
252b5132
RH
10599 i.disp_operands++;
10600 save_input_line_pointer = input_line_pointer;
10601 input_line_pointer = disp_start;
10602 END_STRING_AND_SAVE (disp_end);
10603
10604#ifndef GCC_ASM_O_HACK
10605#define GCC_ASM_O_HACK 0
10606#endif
10607#if GCC_ASM_O_HACK
10608 END_STRING_AND_SAVE (disp_end + 1);
40fb9820 10609 if (i.types[this_operand].bitfield.baseIndex
24eab124 10610 && displacement_string_end[-1] == '+')
252b5132
RH
10611 {
10612 /* This hack is to avoid a warning when using the "o"
24eab124
AM
10613 constraint within gcc asm statements.
10614 For instance:
10615
10616 #define _set_tssldt_desc(n,addr,limit,type) \
10617 __asm__ __volatile__ ( \
10618 "movw %w2,%0\n\t" \
10619 "movw %w1,2+%0\n\t" \
10620 "rorl $16,%1\n\t" \
10621 "movb %b1,4+%0\n\t" \
10622 "movb %4,5+%0\n\t" \
10623 "movb $0,6+%0\n\t" \
10624 "movb %h1,7+%0\n\t" \
10625 "rorl $16,%1" \
10626 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10627
10628 This works great except that the output assembler ends
10629 up looking a bit weird if it turns out that there is
10630 no offset. You end up producing code that looks like:
10631
10632 #APP
10633 movw $235,(%eax)
10634 movw %dx,2+(%eax)
10635 rorl $16,%edx
10636 movb %dl,4+(%eax)
10637 movb $137,5+(%eax)
10638 movb $0,6+(%eax)
10639 movb %dh,7+(%eax)
10640 rorl $16,%edx
10641 #NO_APP
10642
47926f60 10643 So here we provide the missing zero. */
24eab124
AM
10644
10645 *displacement_string_end = '0';
252b5132
RH
10646 }
10647#endif
d258b828 10648 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
f3c180ae
AM
10649 if (gotfree_input_line)
10650 input_line_pointer = gotfree_input_line;
252b5132 10651
24eab124 10652 exp_seg = expression (exp);
252b5132 10653
636c26b0
AM
10654 SKIP_WHITESPACE ();
10655 if (*input_line_pointer)
10656 as_bad (_("junk `%s' after expression"), input_line_pointer);
10657#if GCC_ASM_O_HACK
10658 RESTORE_END_STRING (disp_end + 1);
10659#endif
636c26b0 10660 input_line_pointer = save_input_line_pointer;
636c26b0 10661 if (gotfree_input_line)
ee86248c
JB
10662 {
10663 free (gotfree_input_line);
10664
10665 if (exp->X_op == O_constant || exp->X_op == O_register)
10666 exp->X_op = O_illegal;
10667 }
10668
10669 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10670
10671 RESTORE_END_STRING (disp_end);
10672
10673 return ret;
10674}
10675
10676static int
10677i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10678 i386_operand_type types, const char *disp_start)
10679{
10680 i386_operand_type bigdisp;
10681 int ret = 1;
636c26b0 10682
24eab124
AM
10683 /* We do this to make sure that the section symbol is in
10684 the symbol table. We will ultimately change the relocation
47926f60 10685 to be relative to the beginning of the section. */
1ae12ab7 10686 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
d6ab8113
JB
10687 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10688 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
24eab124 10689 {
636c26b0 10690 if (exp->X_op != O_symbol)
3992d3b7 10691 goto inv_disp;
636c26b0 10692
e5cb08ac 10693 if (S_IS_LOCAL (exp->X_add_symbol)
c64efb4b
L
10694 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10695 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
24eab124 10696 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
24eab124
AM
10697 exp->X_op = O_subtract;
10698 exp->X_op_symbol = GOT_symbol;
1ae12ab7 10699 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
29b0f896 10700 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
d6ab8113
JB
10701 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10702 i.reloc[this_operand] = BFD_RELOC_64;
23df1078 10703 else
29b0f896 10704 i.reloc[this_operand] = BFD_RELOC_32;
24eab124 10705 }
252b5132 10706
3992d3b7
AM
10707 else if (exp->X_op == O_absent
10708 || exp->X_op == O_illegal
ee86248c 10709 || exp->X_op == O_big)
2daf4fd8 10710 {
3992d3b7
AM
10711 inv_disp:
10712 as_bad (_("missing or invalid displacement expression `%s'"),
2daf4fd8 10713 disp_start);
3992d3b7 10714 ret = 0;
2daf4fd8
AM
10715 }
10716
0e1147d9
L
10717 else if (flag_code == CODE_64BIT
10718 && !i.prefix[ADDR_PREFIX]
10719 && exp->X_op == O_constant)
10720 {
10721 /* Since displacement is signed extended to 64bit, don't allow
10722 disp32 and turn off disp32s if they are out of range. */
10723 i.types[this_operand].bitfield.disp32 = 0;
10724 if (!fits_in_signed_long (exp->X_add_number))
10725 {
10726 i.types[this_operand].bitfield.disp32s = 0;
10727 if (i.types[this_operand].bitfield.baseindex)
10728 {
10729 as_bad (_("0x%lx out range of signed 32bit displacement"),
10730 (long) exp->X_add_number);
10731 ret = 0;
10732 }
10733 }
10734 }
10735
4c63da97 10736#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
3992d3b7
AM
10737 else if (exp->X_op != O_constant
10738 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10739 && exp_seg != absolute_section
10740 && exp_seg != text_section
10741 && exp_seg != data_section
10742 && exp_seg != bss_section
10743 && exp_seg != undefined_section
10744 && !bfd_is_com_section (exp_seg))
24eab124 10745 {
d0b47220 10746 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
3992d3b7 10747 ret = 0;
24eab124 10748 }
252b5132 10749#endif
3956db08 10750
48bcea9f
JB
10751 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10752 /* Constants get taken care of by optimize_disp(). */
10753 && exp->X_op != O_constant)
10754 i.types[this_operand].bitfield.disp8 = 1;
10755
40fb9820
L
10756 /* Check if this is a displacement only operand. */
10757 bigdisp = i.types[this_operand];
10758 bigdisp.bitfield.disp8 = 0;
10759 bigdisp.bitfield.disp16 = 0;
10760 bigdisp.bitfield.disp32 = 0;
10761 bigdisp.bitfield.disp32s = 0;
10762 bigdisp.bitfield.disp64 = 0;
0dfbf9d7 10763 if (operand_type_all_zero (&bigdisp))
c6fb90c8
L
10764 i.types[this_operand] = operand_type_and (i.types[this_operand],
10765 types);
3956db08 10766
3992d3b7 10767 return ret;
252b5132
RH
10768}
10769
2abc2bec
JB
10770/* Return the active addressing mode, taking address override and
10771 registers forming the address into consideration. Update the
10772 address override prefix if necessary. */
47926f60 10773
2abc2bec
JB
10774static enum flag_code
10775i386_addressing_mode (void)
252b5132 10776{
be05d201
L
10777 enum flag_code addr_mode;
10778
10779 if (i.prefix[ADDR_PREFIX])
10780 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
a23b33b3
JB
10781 else if (flag_code == CODE_16BIT
10782 && current_templates->start->cpu_flags.bitfield.cpumpx
10783 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10784 from md_assemble() by "is not a valid base/index expression"
10785 when there is a base and/or index. */
10786 && !i.types[this_operand].bitfield.baseindex)
10787 {
10788 /* MPX insn memory operands with neither base nor index must be forced
10789 to use 32-bit addressing in 16-bit mode. */
10790 addr_mode = CODE_32BIT;
10791 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10792 ++i.prefixes;
10793 gas_assert (!i.types[this_operand].bitfield.disp16);
10794 gas_assert (!i.types[this_operand].bitfield.disp32);
10795 }
be05d201
L
10796 else
10797 {
10798 addr_mode = flag_code;
10799
24eab124 10800#if INFER_ADDR_PREFIX
be05d201
L
10801 if (i.mem_operands == 0)
10802 {
10803 /* Infer address prefix from the first memory operand. */
10804 const reg_entry *addr_reg = i.base_reg;
10805
10806 if (addr_reg == NULL)
10807 addr_reg = i.index_reg;
eecb386c 10808
be05d201
L
10809 if (addr_reg)
10810 {
e968fc9b 10811 if (addr_reg->reg_type.bitfield.dword)
be05d201
L
10812 addr_mode = CODE_32BIT;
10813 else if (flag_code != CODE_64BIT
dc821c5f 10814 && addr_reg->reg_type.bitfield.word)
be05d201
L
10815 addr_mode = CODE_16BIT;
10816
10817 if (addr_mode != flag_code)
10818 {
10819 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10820 i.prefixes += 1;
10821 /* Change the size of any displacement too. At most one
10822 of Disp16 or Disp32 is set.
10823 FIXME. There doesn't seem to be any real need for
10824 separate Disp16 and Disp32 flags. The same goes for
10825 Imm16 and Imm32. Removing them would probably clean
10826 up the code quite a lot. */
10827 if (flag_code != CODE_64BIT
10828 && (i.types[this_operand].bitfield.disp16
10829 || i.types[this_operand].bitfield.disp32))
10830 i.types[this_operand]
10831 = operand_type_xor (i.types[this_operand], disp16_32);
10832 }
10833 }
10834 }
24eab124 10835#endif
be05d201
L
10836 }
10837
2abc2bec
JB
10838 return addr_mode;
10839}
10840
10841/* Make sure the memory operand we've been dealt is valid.
10842 Return 1 on success, 0 on a failure. */
10843
10844static int
10845i386_index_check (const char *operand_string)
10846{
10847 const char *kind = "base/index";
10848 enum flag_code addr_mode = i386_addressing_mode ();
10849
fc0763e6 10850 if (current_templates->start->opcode_modifier.isstring
c3949f43 10851 && !current_templates->start->cpu_flags.bitfield.cpupadlock
fc0763e6
JB
10852 && (current_templates->end[-1].opcode_modifier.isstring
10853 || i.mem_operands))
10854 {
10855 /* Memory operands of string insns are special in that they only allow
10856 a single register (rDI, rSI, or rBX) as their memory address. */
be05d201
L
10857 const reg_entry *expected_reg;
10858 static const char *di_si[][2] =
10859 {
10860 { "esi", "edi" },
10861 { "si", "di" },
10862 { "rsi", "rdi" }
10863 };
10864 static const char *bx[] = { "ebx", "bx", "rbx" };
fc0763e6
JB
10865
10866 kind = "string address";
10867
8325cc63 10868 if (current_templates->start->opcode_modifier.repprefixok)
fc0763e6 10869 {
51c8edf6
JB
10870 int es_op = current_templates->end[-1].opcode_modifier.isstring
10871 - IS_STRING_ES_OP0;
10872 int op = 0;
fc0763e6 10873
51c8edf6 10874 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
fc0763e6
JB
10875 || ((!i.mem_operands != !intel_syntax)
10876 && current_templates->end[-1].operand_types[1]
10877 .bitfield.baseindex))
51c8edf6
JB
10878 op = 1;
10879 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
fc0763e6
JB
10880 }
10881 else
be05d201 10882 expected_reg = hash_find (reg_hash, bx[addr_mode]);
fc0763e6 10883
be05d201
L
10884 if (i.base_reg != expected_reg
10885 || i.index_reg
fc0763e6 10886 || operand_type_check (i.types[this_operand], disp))
fc0763e6 10887 {
be05d201
L
10888 /* The second memory operand must have the same size as
10889 the first one. */
10890 if (i.mem_operands
10891 && i.base_reg
10892 && !((addr_mode == CODE_64BIT
dc821c5f 10893 && i.base_reg->reg_type.bitfield.qword)
be05d201 10894 || (addr_mode == CODE_32BIT
dc821c5f
JB
10895 ? i.base_reg->reg_type.bitfield.dword
10896 : i.base_reg->reg_type.bitfield.word)))
be05d201
L
10897 goto bad_address;
10898
fc0763e6
JB
10899 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10900 operand_string,
10901 intel_syntax ? '[' : '(',
10902 register_prefix,
be05d201 10903 expected_reg->reg_name,
fc0763e6 10904 intel_syntax ? ']' : ')');
be05d201 10905 return 1;
fc0763e6 10906 }
be05d201
L
10907 else
10908 return 1;
10909
dc1e8a47 10910 bad_address:
be05d201
L
10911 as_bad (_("`%s' is not a valid %s expression"),
10912 operand_string, kind);
10913 return 0;
3e73aa7c
JH
10914 }
10915 else
10916 {
be05d201
L
10917 if (addr_mode != CODE_16BIT)
10918 {
10919 /* 32-bit/64-bit checks. */
10920 if ((i.base_reg
e968fc9b
JB
10921 && ((addr_mode == CODE_64BIT
10922 ? !i.base_reg->reg_type.bitfield.qword
10923 : !i.base_reg->reg_type.bitfield.dword)
10924 || (i.index_reg && i.base_reg->reg_num == RegIP)
10925 || i.base_reg->reg_num == RegIZ))
be05d201 10926 || (i.index_reg
1b54b8d7
JB
10927 && !i.index_reg->reg_type.bitfield.xmmword
10928 && !i.index_reg->reg_type.bitfield.ymmword
10929 && !i.index_reg->reg_type.bitfield.zmmword
be05d201 10930 && ((addr_mode == CODE_64BIT
e968fc9b
JB
10931 ? !i.index_reg->reg_type.bitfield.qword
10932 : !i.index_reg->reg_type.bitfield.dword)
be05d201
L
10933 || !i.index_reg->reg_type.bitfield.baseindex)))
10934 goto bad_address;
8178be5b
JB
10935
10936 /* bndmk, bndldx, and bndstx have special restrictions. */
10937 if (current_templates->start->base_opcode == 0xf30f1b
10938 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10939 {
10940 /* They cannot use RIP-relative addressing. */
e968fc9b 10941 if (i.base_reg && i.base_reg->reg_num == RegIP)
8178be5b
JB
10942 {
10943 as_bad (_("`%s' cannot be used here"), operand_string);
10944 return 0;
10945 }
10946
10947 /* bndldx and bndstx ignore their scale factor. */
10948 if (current_templates->start->base_opcode != 0xf30f1b
10949 && i.log2_scale_factor)
10950 as_warn (_("register scaling is being ignored here"));
10951 }
be05d201
L
10952 }
10953 else
3e73aa7c 10954 {
be05d201 10955 /* 16-bit checks. */
3e73aa7c 10956 if ((i.base_reg
dc821c5f 10957 && (!i.base_reg->reg_type.bitfield.word
40fb9820 10958 || !i.base_reg->reg_type.bitfield.baseindex))
3e73aa7c 10959 || (i.index_reg
dc821c5f 10960 && (!i.index_reg->reg_type.bitfield.word
40fb9820 10961 || !i.index_reg->reg_type.bitfield.baseindex
29b0f896
AM
10962 || !(i.base_reg
10963 && i.base_reg->reg_num < 6
10964 && i.index_reg->reg_num >= 6
10965 && i.log2_scale_factor == 0))))
be05d201 10966 goto bad_address;
3e73aa7c
JH
10967 }
10968 }
be05d201 10969 return 1;
24eab124 10970}
252b5132 10971
43234a1e
L
10972/* Handle vector immediates. */
10973
10974static int
10975RC_SAE_immediate (const char *imm_start)
10976{
10977 unsigned int match_found, j;
10978 const char *pstr = imm_start;
10979 expressionS *exp;
10980
10981 if (*pstr != '{')
10982 return 0;
10983
10984 pstr++;
10985 match_found = 0;
10986 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10987 {
10988 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10989 {
10990 if (!i.rounding)
10991 {
10992 rc_op.type = RC_NamesTable[j].type;
10993 rc_op.operand = this_operand;
10994 i.rounding = &rc_op;
10995 }
10996 else
10997 {
10998 as_bad (_("duplicated `%s'"), imm_start);
10999 return 0;
11000 }
11001 pstr += RC_NamesTable[j].len;
11002 match_found = 1;
11003 break;
11004 }
11005 }
11006 if (!match_found)
11007 return 0;
11008
11009 if (*pstr++ != '}')
11010 {
11011 as_bad (_("Missing '}': '%s'"), imm_start);
11012 return 0;
11013 }
11014 /* RC/SAE immediate string should contain nothing more. */;
11015 if (*pstr != 0)
11016 {
11017 as_bad (_("Junk after '}': '%s'"), imm_start);
11018 return 0;
11019 }
11020
11021 exp = &im_expressions[i.imm_operands++];
11022 i.op[this_operand].imms = exp;
11023
11024 exp->X_op = O_constant;
11025 exp->X_add_number = 0;
11026 exp->X_add_symbol = (symbolS *) 0;
11027 exp->X_op_symbol = (symbolS *) 0;
11028
11029 i.types[this_operand].bitfield.imm8 = 1;
11030 return 1;
11031}
11032
8325cc63
JB
11033/* Only string instructions can have a second memory operand, so
11034 reduce current_templates to just those if it contains any. */
11035static int
11036maybe_adjust_templates (void)
11037{
11038 const insn_template *t;
11039
11040 gas_assert (i.mem_operands == 1);
11041
11042 for (t = current_templates->start; t < current_templates->end; ++t)
11043 if (t->opcode_modifier.isstring)
11044 break;
11045
11046 if (t < current_templates->end)
11047 {
11048 static templates aux_templates;
11049 bfd_boolean recheck;
11050
11051 aux_templates.start = t;
11052 for (; t < current_templates->end; ++t)
11053 if (!t->opcode_modifier.isstring)
11054 break;
11055 aux_templates.end = t;
11056
11057 /* Determine whether to re-check the first memory operand. */
11058 recheck = (aux_templates.start != current_templates->start
11059 || t != current_templates->end);
11060
11061 current_templates = &aux_templates;
11062
11063 if (recheck)
11064 {
11065 i.mem_operands = 0;
11066 if (i.memop1_string != NULL
11067 && i386_index_check (i.memop1_string) == 0)
11068 return 0;
11069 i.mem_operands = 1;
11070 }
11071 }
11072
11073 return 1;
11074}
11075
fc0763e6 11076/* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
47926f60 11077 on error. */
252b5132 11078
252b5132 11079static int
a7619375 11080i386_att_operand (char *operand_string)
252b5132 11081{
af6bdddf
AM
11082 const reg_entry *r;
11083 char *end_op;
24eab124 11084 char *op_string = operand_string;
252b5132 11085
24eab124 11086 if (is_space_char (*op_string))
252b5132
RH
11087 ++op_string;
11088
24eab124 11089 /* We check for an absolute prefix (differentiating,
47926f60 11090 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
24eab124
AM
11091 if (*op_string == ABSOLUTE_PREFIX)
11092 {
11093 ++op_string;
11094 if (is_space_char (*op_string))
11095 ++op_string;
6f2f06be 11096 i.jumpabsolute = TRUE;
24eab124 11097 }
252b5132 11098
47926f60 11099 /* Check if operand is a register. */
4d1bb795 11100 if ((r = parse_register (op_string, &end_op)) != NULL)
24eab124 11101 {
40fb9820
L
11102 i386_operand_type temp;
11103
8a6fb3f9
JB
11104 if (r == &bad_reg)
11105 return 0;
11106
24eab124
AM
11107 /* Check for a segment override by searching for ':' after a
11108 segment register. */
11109 op_string = end_op;
11110 if (is_space_char (*op_string))
11111 ++op_string;
00cee14f 11112 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
24eab124
AM
11113 {
11114 switch (r->reg_num)
11115 {
11116 case 0:
11117 i.seg[i.mem_operands] = &es;
11118 break;
11119 case 1:
11120 i.seg[i.mem_operands] = &cs;
11121 break;
11122 case 2:
11123 i.seg[i.mem_operands] = &ss;
11124 break;
11125 case 3:
11126 i.seg[i.mem_operands] = &ds;
11127 break;
11128 case 4:
11129 i.seg[i.mem_operands] = &fs;
11130 break;
11131 case 5:
11132 i.seg[i.mem_operands] = &gs;
11133 break;
11134 }
252b5132 11135
24eab124 11136 /* Skip the ':' and whitespace. */
252b5132
RH
11137 ++op_string;
11138 if (is_space_char (*op_string))
24eab124 11139 ++op_string;
252b5132 11140
24eab124
AM
11141 if (!is_digit_char (*op_string)
11142 && !is_identifier_char (*op_string)
11143 && *op_string != '('
11144 && *op_string != ABSOLUTE_PREFIX)
11145 {
11146 as_bad (_("bad memory operand `%s'"), op_string);
11147 return 0;
11148 }
47926f60 11149 /* Handle case of %es:*foo. */
24eab124
AM
11150 if (*op_string == ABSOLUTE_PREFIX)
11151 {
11152 ++op_string;
11153 if (is_space_char (*op_string))
11154 ++op_string;
6f2f06be 11155 i.jumpabsolute = TRUE;
24eab124
AM
11156 }
11157 goto do_memory_reference;
11158 }
43234a1e
L
11159
11160 /* Handle vector operations. */
11161 if (*op_string == '{')
11162 {
11163 op_string = check_VecOperations (op_string, NULL);
11164 if (op_string == NULL)
11165 return 0;
11166 }
11167
24eab124
AM
11168 if (*op_string)
11169 {
d0b47220 11170 as_bad (_("junk `%s' after register"), op_string);
24eab124
AM
11171 return 0;
11172 }
40fb9820
L
11173 temp = r->reg_type;
11174 temp.bitfield.baseindex = 0;
c6fb90c8
L
11175 i.types[this_operand] = operand_type_or (i.types[this_operand],
11176 temp);
7d5e4556 11177 i.types[this_operand].bitfield.unspecified = 0;
520dc8e8 11178 i.op[this_operand].regs = r;
24eab124
AM
11179 i.reg_operands++;
11180 }
af6bdddf
AM
11181 else if (*op_string == REGISTER_PREFIX)
11182 {
11183 as_bad (_("bad register name `%s'"), op_string);
11184 return 0;
11185 }
24eab124 11186 else if (*op_string == IMMEDIATE_PREFIX)
ce8a8b2f 11187 {
24eab124 11188 ++op_string;
6f2f06be 11189 if (i.jumpabsolute)
24eab124 11190 {
d0b47220 11191 as_bad (_("immediate operand illegal with absolute jump"));
24eab124
AM
11192 return 0;
11193 }
11194 if (!i386_immediate (op_string))
11195 return 0;
11196 }
43234a1e
L
11197 else if (RC_SAE_immediate (operand_string))
11198 {
11199 /* If it is a RC or SAE immediate, do nothing. */
11200 ;
11201 }
24eab124
AM
11202 else if (is_digit_char (*op_string)
11203 || is_identifier_char (*op_string)
d02603dc 11204 || *op_string == '"'
e5cb08ac 11205 || *op_string == '(')
24eab124 11206 {
47926f60 11207 /* This is a memory reference of some sort. */
af6bdddf 11208 char *base_string;
252b5132 11209
47926f60 11210 /* Start and end of displacement string expression (if found). */
eecb386c
AM
11211 char *displacement_string_start;
11212 char *displacement_string_end;
43234a1e 11213 char *vop_start;
252b5132 11214
24eab124 11215 do_memory_reference:
8325cc63
JB
11216 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11217 return 0;
24eab124 11218 if ((i.mem_operands == 1
40fb9820 11219 && !current_templates->start->opcode_modifier.isstring)
24eab124
AM
11220 || i.mem_operands == 2)
11221 {
11222 as_bad (_("too many memory references for `%s'"),
11223 current_templates->start->name);
11224 return 0;
11225 }
252b5132 11226
24eab124
AM
11227 /* Check for base index form. We detect the base index form by
11228 looking for an ')' at the end of the operand, searching
11229 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11230 after the '('. */
af6bdddf 11231 base_string = op_string + strlen (op_string);
c3332e24 11232
43234a1e
L
11233 /* Handle vector operations. */
11234 vop_start = strchr (op_string, '{');
11235 if (vop_start && vop_start < base_string)
11236 {
11237 if (check_VecOperations (vop_start, base_string) == NULL)
11238 return 0;
11239 base_string = vop_start;
11240 }
11241
af6bdddf
AM
11242 --base_string;
11243 if (is_space_char (*base_string))
11244 --base_string;
252b5132 11245
47926f60 11246 /* If we only have a displacement, set-up for it to be parsed later. */
af6bdddf
AM
11247 displacement_string_start = op_string;
11248 displacement_string_end = base_string + 1;
252b5132 11249
24eab124
AM
11250 if (*base_string == ')')
11251 {
af6bdddf 11252 char *temp_string;
24eab124
AM
11253 unsigned int parens_balanced = 1;
11254 /* We've already checked that the number of left & right ()'s are
47926f60 11255 equal, so this loop will not be infinite. */
24eab124
AM
11256 do
11257 {
11258 base_string--;
11259 if (*base_string == ')')
11260 parens_balanced++;
11261 if (*base_string == '(')
11262 parens_balanced--;
11263 }
11264 while (parens_balanced);
c3332e24 11265
af6bdddf 11266 temp_string = base_string;
c3332e24 11267
24eab124 11268 /* Skip past '(' and whitespace. */
252b5132
RH
11269 ++base_string;
11270 if (is_space_char (*base_string))
24eab124 11271 ++base_string;
252b5132 11272
af6bdddf 11273 if (*base_string == ','
4eed87de
AM
11274 || ((i.base_reg = parse_register (base_string, &end_op))
11275 != NULL))
252b5132 11276 {
af6bdddf 11277 displacement_string_end = temp_string;
252b5132 11278
40fb9820 11279 i.types[this_operand].bitfield.baseindex = 1;
252b5132 11280
af6bdddf 11281 if (i.base_reg)
24eab124 11282 {
8a6fb3f9
JB
11283 if (i.base_reg == &bad_reg)
11284 return 0;
24eab124
AM
11285 base_string = end_op;
11286 if (is_space_char (*base_string))
11287 ++base_string;
af6bdddf
AM
11288 }
11289
11290 /* There may be an index reg or scale factor here. */
11291 if (*base_string == ',')
11292 {
11293 ++base_string;
11294 if (is_space_char (*base_string))
11295 ++base_string;
11296
4eed87de
AM
11297 if ((i.index_reg = parse_register (base_string, &end_op))
11298 != NULL)
24eab124 11299 {
8a6fb3f9
JB
11300 if (i.index_reg == &bad_reg)
11301 return 0;
af6bdddf 11302 base_string = end_op;
24eab124
AM
11303 if (is_space_char (*base_string))
11304 ++base_string;
af6bdddf
AM
11305 if (*base_string == ',')
11306 {
11307 ++base_string;
11308 if (is_space_char (*base_string))
11309 ++base_string;
11310 }
e5cb08ac 11311 else if (*base_string != ')')
af6bdddf 11312 {
4eed87de
AM
11313 as_bad (_("expecting `,' or `)' "
11314 "after index register in `%s'"),
af6bdddf
AM
11315 operand_string);
11316 return 0;
11317 }
24eab124 11318 }
af6bdddf 11319 else if (*base_string == REGISTER_PREFIX)
24eab124 11320 {
f76bf5e0
L
11321 end_op = strchr (base_string, ',');
11322 if (end_op)
11323 *end_op = '\0';
af6bdddf 11324 as_bad (_("bad register name `%s'"), base_string);
24eab124
AM
11325 return 0;
11326 }
252b5132 11327
47926f60 11328 /* Check for scale factor. */
551c1ca1 11329 if (*base_string != ')')
af6bdddf 11330 {
551c1ca1
AM
11331 char *end_scale = i386_scale (base_string);
11332
11333 if (!end_scale)
af6bdddf 11334 return 0;
24eab124 11335
551c1ca1 11336 base_string = end_scale;
af6bdddf
AM
11337 if (is_space_char (*base_string))
11338 ++base_string;
11339 if (*base_string != ')')
11340 {
4eed87de
AM
11341 as_bad (_("expecting `)' "
11342 "after scale factor in `%s'"),
af6bdddf
AM
11343 operand_string);
11344 return 0;
11345 }
11346 }
11347 else if (!i.index_reg)
24eab124 11348 {
4eed87de
AM
11349 as_bad (_("expecting index register or scale factor "
11350 "after `,'; got '%c'"),
af6bdddf 11351 *base_string);
24eab124
AM
11352 return 0;
11353 }
11354 }
af6bdddf 11355 else if (*base_string != ')')
24eab124 11356 {
4eed87de
AM
11357 as_bad (_("expecting `,' or `)' "
11358 "after base register in `%s'"),
af6bdddf 11359 operand_string);
24eab124
AM
11360 return 0;
11361 }
c3332e24 11362 }
af6bdddf 11363 else if (*base_string == REGISTER_PREFIX)
c3332e24 11364 {
f76bf5e0
L
11365 end_op = strchr (base_string, ',');
11366 if (end_op)
11367 *end_op = '\0';
af6bdddf 11368 as_bad (_("bad register name `%s'"), base_string);
24eab124 11369 return 0;
c3332e24 11370 }
24eab124
AM
11371 }
11372
11373 /* If there's an expression beginning the operand, parse it,
11374 assuming displacement_string_start and
11375 displacement_string_end are meaningful. */
11376 if (displacement_string_start != displacement_string_end)
11377 {
11378 if (!i386_displacement (displacement_string_start,
11379 displacement_string_end))
11380 return 0;
11381 }
11382
11383 /* Special case for (%dx) while doing input/output op. */
11384 if (i.base_reg
75e5731b
JB
11385 && i.base_reg->reg_type.bitfield.instance == RegD
11386 && i.base_reg->reg_type.bitfield.word
24eab124
AM
11387 && i.index_reg == 0
11388 && i.log2_scale_factor == 0
11389 && i.seg[i.mem_operands] == 0
40fb9820 11390 && !operand_type_check (i.types[this_operand], disp))
24eab124 11391 {
2fb5be8d 11392 i.types[this_operand] = i.base_reg->reg_type;
24eab124
AM
11393 return 1;
11394 }
11395
eecb386c
AM
11396 if (i386_index_check (operand_string) == 0)
11397 return 0;
c48dadc9 11398 i.flags[this_operand] |= Operand_Mem;
8325cc63
JB
11399 if (i.mem_operands == 0)
11400 i.memop1_string = xstrdup (operand_string);
24eab124
AM
11401 i.mem_operands++;
11402 }
11403 else
ce8a8b2f
AM
11404 {
11405 /* It's not a memory operand; argh! */
24eab124
AM
11406 as_bad (_("invalid char %s beginning operand %d `%s'"),
11407 output_invalid (*op_string),
11408 this_operand + 1,
11409 op_string);
11410 return 0;
11411 }
47926f60 11412 return 1; /* Normal return. */
252b5132
RH
11413}
11414\f
fa94de6b
RM
11415/* Calculate the maximum variable size (i.e., excluding fr_fix)
11416 that an rs_machine_dependent frag may reach. */
11417
11418unsigned int
11419i386_frag_max_var (fragS *frag)
11420{
11421 /* The only relaxable frags are for jumps.
11422 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11423 gas_assert (frag->fr_type == rs_machine_dependent);
11424 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11425}
11426
b084df0b
L
11427#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11428static int
8dcea932 11429elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
b084df0b
L
11430{
11431 /* STT_GNU_IFUNC symbol must go through PLT. */
11432 if ((symbol_get_bfdsym (fr_symbol)->flags
11433 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11434 return 0;
11435
11436 if (!S_IS_EXTERNAL (fr_symbol))
11437 /* Symbol may be weak or local. */
11438 return !S_IS_WEAK (fr_symbol);
11439
8dcea932
L
11440 /* Global symbols with non-default visibility can't be preempted. */
11441 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11442 return 1;
11443
11444 if (fr_var != NO_RELOC)
11445 switch ((enum bfd_reloc_code_real) fr_var)
11446 {
11447 case BFD_RELOC_386_PLT32:
11448 case BFD_RELOC_X86_64_PLT32:
33eaf5de 11449 /* Symbol with PLT relocation may be preempted. */
8dcea932
L
11450 return 0;
11451 default:
11452 abort ();
11453 }
11454
b084df0b
L
11455 /* Global symbols with default visibility in a shared library may be
11456 preempted by another definition. */
8dcea932 11457 return !shared;
b084df0b
L
11458}
11459#endif
11460
79d72f45
HL
11461/* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11462 Note also work for Skylake and Cascadelake.
11463---------------------------------------------------------------------
11464| JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11465| ------ | ----------- | ------- | -------- |
11466| Jo | N | N | Y |
11467| Jno | N | N | Y |
11468| Jc/Jb | Y | N | Y |
11469| Jae/Jnb | Y | N | Y |
11470| Je/Jz | Y | Y | Y |
11471| Jne/Jnz | Y | Y | Y |
11472| Jna/Jbe | Y | N | Y |
11473| Ja/Jnbe | Y | N | Y |
11474| Js | N | N | Y |
11475| Jns | N | N | Y |
11476| Jp/Jpe | N | N | Y |
11477| Jnp/Jpo | N | N | Y |
11478| Jl/Jnge | Y | Y | Y |
11479| Jge/Jnl | Y | Y | Y |
11480| Jle/Jng | Y | Y | Y |
11481| Jg/Jnle | Y | Y | Y |
11482--------------------------------------------------------------------- */
11483static int
11484i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11485{
11486 if (mf_cmp == mf_cmp_alu_cmp)
11487 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11488 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11489 if (mf_cmp == mf_cmp_incdec)
11490 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11491 || mf_jcc == mf_jcc_jle);
11492 if (mf_cmp == mf_cmp_test_and)
11493 return 1;
11494 return 0;
11495}
11496
e379e5f3
L
11497/* Return the next non-empty frag. */
11498
11499static fragS *
11500i386_next_non_empty_frag (fragS *fragP)
11501{
11502 /* There may be a frag with a ".fill 0" when there is no room in
11503 the current frag for frag_grow in output_insn. */
11504 for (fragP = fragP->fr_next;
11505 (fragP != NULL
11506 && fragP->fr_type == rs_fill
11507 && fragP->fr_fix == 0);
11508 fragP = fragP->fr_next)
11509 ;
11510 return fragP;
11511}
11512
11513/* Return the next jcc frag after BRANCH_PADDING. */
11514
11515static fragS *
79d72f45 11516i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
e379e5f3 11517{
79d72f45
HL
11518 fragS *branch_fragP;
11519 if (!pad_fragP)
e379e5f3
L
11520 return NULL;
11521
79d72f45
HL
11522 if (pad_fragP->fr_type == rs_machine_dependent
11523 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
e379e5f3
L
11524 == BRANCH_PADDING))
11525 {
79d72f45
HL
11526 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11527 if (branch_fragP->fr_type != rs_machine_dependent)
e379e5f3 11528 return NULL;
79d72f45
HL
11529 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11530 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11531 pad_fragP->tc_frag_data.mf_type))
11532 return branch_fragP;
e379e5f3
L
11533 }
11534
11535 return NULL;
11536}
11537
11538/* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11539
11540static void
11541i386_classify_machine_dependent_frag (fragS *fragP)
11542{
11543 fragS *cmp_fragP;
11544 fragS *pad_fragP;
11545 fragS *branch_fragP;
11546 fragS *next_fragP;
11547 unsigned int max_prefix_length;
11548
11549 if (fragP->tc_frag_data.classified)
11550 return;
11551
11552 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11553 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11554 for (next_fragP = fragP;
11555 next_fragP != NULL;
11556 next_fragP = next_fragP->fr_next)
11557 {
11558 next_fragP->tc_frag_data.classified = 1;
11559 if (next_fragP->fr_type == rs_machine_dependent)
11560 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11561 {
11562 case BRANCH_PADDING:
11563 /* The BRANCH_PADDING frag must be followed by a branch
11564 frag. */
11565 branch_fragP = i386_next_non_empty_frag (next_fragP);
11566 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11567 break;
11568 case FUSED_JCC_PADDING:
11569 /* Check if this is a fused jcc:
11570 FUSED_JCC_PADDING
11571 CMP like instruction
11572 BRANCH_PADDING
11573 COND_JUMP
11574 */
11575 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11576 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
79d72f45 11577 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
e379e5f3
L
11578 if (branch_fragP)
11579 {
11580 /* The BRANCH_PADDING frag is merged with the
11581 FUSED_JCC_PADDING frag. */
11582 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11583 /* CMP like instruction size. */
11584 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11585 frag_wane (pad_fragP);
11586 /* Skip to branch_fragP. */
11587 next_fragP = branch_fragP;
11588 }
11589 else if (next_fragP->tc_frag_data.max_prefix_length)
11590 {
11591 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11592 a fused jcc. */
11593 next_fragP->fr_subtype
11594 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11595 next_fragP->tc_frag_data.max_bytes
11596 = next_fragP->tc_frag_data.max_prefix_length;
11597 /* This will be updated in the BRANCH_PREFIX scan. */
11598 next_fragP->tc_frag_data.max_prefix_length = 0;
11599 }
11600 else
11601 frag_wane (next_fragP);
11602 break;
11603 }
11604 }
11605
11606 /* Stop if there is no BRANCH_PREFIX. */
11607 if (!align_branch_prefix_size)
11608 return;
11609
11610 /* Scan for BRANCH_PREFIX. */
11611 for (; fragP != NULL; fragP = fragP->fr_next)
11612 {
11613 if (fragP->fr_type != rs_machine_dependent
11614 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11615 != BRANCH_PREFIX))
11616 continue;
11617
11618 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11619 COND_JUMP_PREFIX. */
11620 max_prefix_length = 0;
11621 for (next_fragP = fragP;
11622 next_fragP != NULL;
11623 next_fragP = next_fragP->fr_next)
11624 {
11625 if (next_fragP->fr_type == rs_fill)
11626 /* Skip rs_fill frags. */
11627 continue;
11628 else if (next_fragP->fr_type != rs_machine_dependent)
11629 /* Stop for all other frags. */
11630 break;
11631
11632 /* rs_machine_dependent frags. */
11633 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11634 == BRANCH_PREFIX)
11635 {
11636 /* Count BRANCH_PREFIX frags. */
11637 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11638 {
11639 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11640 frag_wane (next_fragP);
11641 }
11642 else
11643 max_prefix_length
11644 += next_fragP->tc_frag_data.max_bytes;
11645 }
11646 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11647 == BRANCH_PADDING)
11648 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11649 == FUSED_JCC_PADDING))
11650 {
11651 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11652 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11653 break;
11654 }
11655 else
11656 /* Stop for other rs_machine_dependent frags. */
11657 break;
11658 }
11659
11660 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11661
11662 /* Skip to the next frag. */
11663 fragP = next_fragP;
11664 }
11665}
11666
11667/* Compute padding size for
11668
11669 FUSED_JCC_PADDING
11670 CMP like instruction
11671 BRANCH_PADDING
11672 COND_JUMP/UNCOND_JUMP
11673
11674 or
11675
11676 BRANCH_PADDING
11677 COND_JUMP/UNCOND_JUMP
11678 */
11679
11680static int
11681i386_branch_padding_size (fragS *fragP, offsetT address)
11682{
11683 unsigned int offset, size, padding_size;
11684 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11685
11686 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11687 if (!address)
11688 address = fragP->fr_address;
11689 address += fragP->fr_fix;
11690
11691 /* CMP like instrunction size. */
11692 size = fragP->tc_frag_data.cmp_size;
11693
11694 /* The base size of the branch frag. */
11695 size += branch_fragP->fr_fix;
11696
11697 /* Add opcode and displacement bytes for the rs_machine_dependent
11698 branch frag. */
11699 if (branch_fragP->fr_type == rs_machine_dependent)
11700 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11701
11702 /* Check if branch is within boundary and doesn't end at the last
11703 byte. */
11704 offset = address & ((1U << align_branch_power) - 1);
11705 if ((offset + size) >= (1U << align_branch_power))
11706 /* Padding needed to avoid crossing boundary. */
11707 padding_size = (1U << align_branch_power) - offset;
11708 else
11709 /* No padding needed. */
11710 padding_size = 0;
11711
11712 /* The return value may be saved in tc_frag_data.length which is
11713 unsigned byte. */
11714 if (!fits_in_unsigned_byte (padding_size))
11715 abort ();
11716
11717 return padding_size;
11718}
11719
11720/* i386_generic_table_relax_frag()
11721
11722 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11723 grow/shrink padding to align branch frags. Hand others to
11724 relax_frag(). */
11725
11726long
11727i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11728{
11729 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11730 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11731 {
11732 long padding_size = i386_branch_padding_size (fragP, 0);
11733 long grow = padding_size - fragP->tc_frag_data.length;
11734
11735 /* When the BRANCH_PREFIX frag is used, the computed address
11736 must match the actual address and there should be no padding. */
11737 if (fragP->tc_frag_data.padding_address
11738 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11739 || padding_size))
11740 abort ();
11741
11742 /* Update the padding size. */
11743 if (grow)
11744 fragP->tc_frag_data.length = padding_size;
11745
11746 return grow;
11747 }
11748 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11749 {
11750 fragS *padding_fragP, *next_fragP;
11751 long padding_size, left_size, last_size;
11752
11753 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11754 if (!padding_fragP)
11755 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11756 return (fragP->tc_frag_data.length
11757 - fragP->tc_frag_data.last_length);
11758
11759 /* Compute the relative address of the padding frag in the very
11760 first time where the BRANCH_PREFIX frag sizes are zero. */
11761 if (!fragP->tc_frag_data.padding_address)
11762 fragP->tc_frag_data.padding_address
11763 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11764
11765 /* First update the last length from the previous interation. */
11766 left_size = fragP->tc_frag_data.prefix_length;
11767 for (next_fragP = fragP;
11768 next_fragP != padding_fragP;
11769 next_fragP = next_fragP->fr_next)
11770 if (next_fragP->fr_type == rs_machine_dependent
11771 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11772 == BRANCH_PREFIX))
11773 {
11774 if (left_size)
11775 {
11776 int max = next_fragP->tc_frag_data.max_bytes;
11777 if (max)
11778 {
11779 int size;
11780 if (max > left_size)
11781 size = left_size;
11782 else
11783 size = max;
11784 left_size -= size;
11785 next_fragP->tc_frag_data.last_length = size;
11786 }
11787 }
11788 else
11789 next_fragP->tc_frag_data.last_length = 0;
11790 }
11791
11792 /* Check the padding size for the padding frag. */
11793 padding_size = i386_branch_padding_size
11794 (padding_fragP, (fragP->fr_address
11795 + fragP->tc_frag_data.padding_address));
11796
11797 last_size = fragP->tc_frag_data.prefix_length;
11798 /* Check if there is change from the last interation. */
11799 if (padding_size == last_size)
11800 {
11801 /* Update the expected address of the padding frag. */
11802 padding_fragP->tc_frag_data.padding_address
11803 = (fragP->fr_address + padding_size
11804 + fragP->tc_frag_data.padding_address);
11805 return 0;
11806 }
11807
11808 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11809 {
11810 /* No padding if there is no sufficient room. Clear the
11811 expected address of the padding frag. */
11812 padding_fragP->tc_frag_data.padding_address = 0;
11813 padding_size = 0;
11814 }
11815 else
11816 /* Store the expected address of the padding frag. */
11817 padding_fragP->tc_frag_data.padding_address
11818 = (fragP->fr_address + padding_size
11819 + fragP->tc_frag_data.padding_address);
11820
11821 fragP->tc_frag_data.prefix_length = padding_size;
11822
11823 /* Update the length for the current interation. */
11824 left_size = padding_size;
11825 for (next_fragP = fragP;
11826 next_fragP != padding_fragP;
11827 next_fragP = next_fragP->fr_next)
11828 if (next_fragP->fr_type == rs_machine_dependent
11829 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11830 == BRANCH_PREFIX))
11831 {
11832 if (left_size)
11833 {
11834 int max = next_fragP->tc_frag_data.max_bytes;
11835 if (max)
11836 {
11837 int size;
11838 if (max > left_size)
11839 size = left_size;
11840 else
11841 size = max;
11842 left_size -= size;
11843 next_fragP->tc_frag_data.length = size;
11844 }
11845 }
11846 else
11847 next_fragP->tc_frag_data.length = 0;
11848 }
11849
11850 return (fragP->tc_frag_data.length
11851 - fragP->tc_frag_data.last_length);
11852 }
11853 return relax_frag (segment, fragP, stretch);
11854}
11855
ee7fcc42
AM
11856/* md_estimate_size_before_relax()
11857
11858 Called just before relax() for rs_machine_dependent frags. The x86
11859 assembler uses these frags to handle variable size jump
11860 instructions.
11861
11862 Any symbol that is now undefined will not become defined.
11863 Return the correct fr_subtype in the frag.
11864 Return the initial "guess for variable size of frag" to caller.
11865 The guess is actually the growth beyond the fixed part. Whatever
11866 we do to grow the fixed or variable part contributes to our
11867 returned value. */
11868
252b5132 11869int
7016a5d5 11870md_estimate_size_before_relax (fragS *fragP, segT segment)
252b5132 11871{
e379e5f3
L
11872 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11873 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11874 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11875 {
11876 i386_classify_machine_dependent_frag (fragP);
11877 return fragP->tc_frag_data.length;
11878 }
11879
252b5132 11880 /* We've already got fragP->fr_subtype right; all we have to do is
b98ef147
AM
11881 check for un-relaxable symbols. On an ELF system, we can't relax
11882 an externally visible symbol, because it may be overridden by a
11883 shared library. */
11884 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
6d249963 11885#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 11886 || (IS_ELF
8dcea932
L
11887 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11888 fragP->fr_var))
fbeb56a4
DK
11889#endif
11890#if defined (OBJ_COFF) && defined (TE_PE)
7ab9ffdd 11891 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
fbeb56a4 11892 && S_IS_WEAK (fragP->fr_symbol))
b98ef147
AM
11893#endif
11894 )
252b5132 11895 {
b98ef147
AM
11896 /* Symbol is undefined in this segment, or we need to keep a
11897 reloc so that weak symbols can be overridden. */
11898 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
f86103b7 11899 enum bfd_reloc_code_real reloc_type;
ee7fcc42
AM
11900 unsigned char *opcode;
11901 int old_fr_fix;
f6af82bd 11902
ee7fcc42 11903 if (fragP->fr_var != NO_RELOC)
1e9cc1c2 11904 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
b98ef147 11905 else if (size == 2)
f6af82bd 11906 reloc_type = BFD_RELOC_16_PCREL;
bd7ab16b
L
11907#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11908 else if (need_plt32_p (fragP->fr_symbol))
11909 reloc_type = BFD_RELOC_X86_64_PLT32;
11910#endif
f6af82bd
AM
11911 else
11912 reloc_type = BFD_RELOC_32_PCREL;
252b5132 11913
ee7fcc42
AM
11914 old_fr_fix = fragP->fr_fix;
11915 opcode = (unsigned char *) fragP->fr_opcode;
11916
fddf5b5b 11917 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
252b5132 11918 {
fddf5b5b
AM
11919 case UNCOND_JUMP:
11920 /* Make jmp (0xeb) a (d)word displacement jump. */
47926f60 11921 opcode[0] = 0xe9;
252b5132 11922 fragP->fr_fix += size;
062cd5e7
AS
11923 fix_new (fragP, old_fr_fix, size,
11924 fragP->fr_symbol,
11925 fragP->fr_offset, 1,
11926 reloc_type);
252b5132
RH
11927 break;
11928
fddf5b5b 11929 case COND_JUMP86:
412167cb
AM
11930 if (size == 2
11931 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
fddf5b5b
AM
11932 {
11933 /* Negate the condition, and branch past an
11934 unconditional jump. */
11935 opcode[0] ^= 1;
11936 opcode[1] = 3;
11937 /* Insert an unconditional jump. */
11938 opcode[2] = 0xe9;
11939 /* We added two extra opcode bytes, and have a two byte
11940 offset. */
11941 fragP->fr_fix += 2 + 2;
062cd5e7
AS
11942 fix_new (fragP, old_fr_fix + 2, 2,
11943 fragP->fr_symbol,
11944 fragP->fr_offset, 1,
11945 reloc_type);
fddf5b5b
AM
11946 break;
11947 }
11948 /* Fall through. */
11949
11950 case COND_JUMP:
412167cb
AM
11951 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11952 {
3e02c1cc
AM
11953 fixS *fixP;
11954
412167cb 11955 fragP->fr_fix += 1;
3e02c1cc
AM
11956 fixP = fix_new (fragP, old_fr_fix, 1,
11957 fragP->fr_symbol,
11958 fragP->fr_offset, 1,
11959 BFD_RELOC_8_PCREL);
11960 fixP->fx_signed = 1;
412167cb
AM
11961 break;
11962 }
93c2a809 11963
24eab124 11964 /* This changes the byte-displacement jump 0x7N
fddf5b5b 11965 to the (d)word-displacement jump 0x0f,0x8N. */
252b5132 11966 opcode[1] = opcode[0] + 0x10;
f6af82bd 11967 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
47926f60
KH
11968 /* We've added an opcode byte. */
11969 fragP->fr_fix += 1 + size;
062cd5e7
AS
11970 fix_new (fragP, old_fr_fix + 1, size,
11971 fragP->fr_symbol,
11972 fragP->fr_offset, 1,
11973 reloc_type);
252b5132 11974 break;
fddf5b5b
AM
11975
11976 default:
11977 BAD_CASE (fragP->fr_subtype);
11978 break;
252b5132
RH
11979 }
11980 frag_wane (fragP);
ee7fcc42 11981 return fragP->fr_fix - old_fr_fix;
252b5132 11982 }
93c2a809 11983
93c2a809
AM
11984 /* Guess size depending on current relax state. Initially the relax
11985 state will correspond to a short jump and we return 1, because
11986 the variable part of the frag (the branch offset) is one byte
11987 long. However, we can relax a section more than once and in that
11988 case we must either set fr_subtype back to the unrelaxed state,
11989 or return the value for the appropriate branch. */
11990 return md_relax_table[fragP->fr_subtype].rlx_length;
ee7fcc42
AM
11991}
11992
47926f60
KH
11993/* Called after relax() is finished.
11994
11995 In: Address of frag.
11996 fr_type == rs_machine_dependent.
11997 fr_subtype is what the address relaxed to.
11998
11999 Out: Any fixSs and constants are set up.
12000 Caller will turn frag into a ".space 0". */
12001
252b5132 12002void
7016a5d5
TG
12003md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12004 fragS *fragP)
252b5132 12005{
29b0f896 12006 unsigned char *opcode;
252b5132 12007 unsigned char *where_to_put_displacement = NULL;
847f7ad4
AM
12008 offsetT target_address;
12009 offsetT opcode_address;
252b5132 12010 unsigned int extension = 0;
847f7ad4 12011 offsetT displacement_from_opcode_start;
252b5132 12012
e379e5f3
L
12013 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12014 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12015 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12016 {
12017 /* Generate nop padding. */
12018 unsigned int size = fragP->tc_frag_data.length;
12019 if (size)
12020 {
12021 if (size > fragP->tc_frag_data.max_bytes)
12022 abort ();
12023
12024 if (flag_debug)
12025 {
12026 const char *msg;
12027 const char *branch = "branch";
12028 const char *prefix = "";
12029 fragS *padding_fragP;
12030 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12031 == BRANCH_PREFIX)
12032 {
12033 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12034 switch (fragP->tc_frag_data.default_prefix)
12035 {
12036 default:
12037 abort ();
12038 break;
12039 case CS_PREFIX_OPCODE:
12040 prefix = " cs";
12041 break;
12042 case DS_PREFIX_OPCODE:
12043 prefix = " ds";
12044 break;
12045 case ES_PREFIX_OPCODE:
12046 prefix = " es";
12047 break;
12048 case FS_PREFIX_OPCODE:
12049 prefix = " fs";
12050 break;
12051 case GS_PREFIX_OPCODE:
12052 prefix = " gs";
12053 break;
12054 case SS_PREFIX_OPCODE:
12055 prefix = " ss";
12056 break;
12057 }
12058 if (padding_fragP)
12059 msg = _("%s:%u: add %d%s at 0x%llx to align "
12060 "%s within %d-byte boundary\n");
12061 else
12062 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12063 "align %s within %d-byte boundary\n");
12064 }
12065 else
12066 {
12067 padding_fragP = fragP;
12068 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12069 "%s within %d-byte boundary\n");
12070 }
12071
12072 if (padding_fragP)
12073 switch (padding_fragP->tc_frag_data.branch_type)
12074 {
12075 case align_branch_jcc:
12076 branch = "jcc";
12077 break;
12078 case align_branch_fused:
12079 branch = "fused jcc";
12080 break;
12081 case align_branch_jmp:
12082 branch = "jmp";
12083 break;
12084 case align_branch_call:
12085 branch = "call";
12086 break;
12087 case align_branch_indirect:
12088 branch = "indiret branch";
12089 break;
12090 case align_branch_ret:
12091 branch = "ret";
12092 break;
12093 default:
12094 break;
12095 }
12096
12097 fprintf (stdout, msg,
12098 fragP->fr_file, fragP->fr_line, size, prefix,
12099 (long long) fragP->fr_address, branch,
12100 1 << align_branch_power);
12101 }
12102 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12103 memset (fragP->fr_opcode,
12104 fragP->tc_frag_data.default_prefix, size);
12105 else
12106 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12107 size, 0);
12108 fragP->fr_fix += size;
12109 }
12110 return;
12111 }
12112
252b5132
RH
12113 opcode = (unsigned char *) fragP->fr_opcode;
12114
47926f60 12115 /* Address we want to reach in file space. */
252b5132 12116 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
252b5132 12117
47926f60 12118 /* Address opcode resides at in file space. */
252b5132
RH
12119 opcode_address = fragP->fr_address + fragP->fr_fix;
12120
47926f60 12121 /* Displacement from opcode start to fill into instruction. */
252b5132
RH
12122 displacement_from_opcode_start = target_address - opcode_address;
12123
fddf5b5b 12124 if ((fragP->fr_subtype & BIG) == 0)
252b5132 12125 {
47926f60
KH
12126 /* Don't have to change opcode. */
12127 extension = 1; /* 1 opcode + 1 displacement */
252b5132 12128 where_to_put_displacement = &opcode[1];
fddf5b5b
AM
12129 }
12130 else
12131 {
12132 if (no_cond_jump_promotion
12133 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
4eed87de
AM
12134 as_warn_where (fragP->fr_file, fragP->fr_line,
12135 _("long jump required"));
252b5132 12136
fddf5b5b
AM
12137 switch (fragP->fr_subtype)
12138 {
12139 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12140 extension = 4; /* 1 opcode + 4 displacement */
12141 opcode[0] = 0xe9;
12142 where_to_put_displacement = &opcode[1];
12143 break;
252b5132 12144
fddf5b5b
AM
12145 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12146 extension = 2; /* 1 opcode + 2 displacement */
12147 opcode[0] = 0xe9;
12148 where_to_put_displacement = &opcode[1];
12149 break;
252b5132 12150
fddf5b5b
AM
12151 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12152 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12153 extension = 5; /* 2 opcode + 4 displacement */
12154 opcode[1] = opcode[0] + 0x10;
12155 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12156 where_to_put_displacement = &opcode[2];
12157 break;
252b5132 12158
fddf5b5b
AM
12159 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12160 extension = 3; /* 2 opcode + 2 displacement */
12161 opcode[1] = opcode[0] + 0x10;
12162 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12163 where_to_put_displacement = &opcode[2];
12164 break;
252b5132 12165
fddf5b5b
AM
12166 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12167 extension = 4;
12168 opcode[0] ^= 1;
12169 opcode[1] = 3;
12170 opcode[2] = 0xe9;
12171 where_to_put_displacement = &opcode[3];
12172 break;
12173
12174 default:
12175 BAD_CASE (fragP->fr_subtype);
12176 break;
12177 }
252b5132 12178 }
fddf5b5b 12179
7b81dfbb
AJ
12180 /* If size if less then four we are sure that the operand fits,
12181 but if it's 4, then it could be that the displacement is larger
12182 then -/+ 2GB. */
12183 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12184 && object_64bit
12185 && ((addressT) (displacement_from_opcode_start - extension
4eed87de
AM
12186 + ((addressT) 1 << 31))
12187 > (((addressT) 2 << 31) - 1)))
7b81dfbb
AJ
12188 {
12189 as_bad_where (fragP->fr_file, fragP->fr_line,
12190 _("jump target out of range"));
12191 /* Make us emit 0. */
12192 displacement_from_opcode_start = extension;
12193 }
47926f60 12194 /* Now put displacement after opcode. */
252b5132
RH
12195 md_number_to_chars ((char *) where_to_put_displacement,
12196 (valueT) (displacement_from_opcode_start - extension),
fddf5b5b 12197 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
252b5132
RH
12198 fragP->fr_fix += extension;
12199}
12200\f
7016a5d5 12201/* Apply a fixup (fixP) to segment data, once it has been determined
252b5132
RH
12202 by our caller that we have all the info we need to fix it up.
12203
7016a5d5
TG
12204 Parameter valP is the pointer to the value of the bits.
12205
252b5132
RH
12206 On the 386, immediates, displacements, and data pointers are all in
12207 the same (little-endian) format, so we don't need to care about which
12208 we are handling. */
12209
94f592af 12210void
7016a5d5 12211md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
252b5132 12212{
94f592af 12213 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
c6682705 12214 valueT value = *valP;
252b5132 12215
f86103b7 12216#if !defined (TE_Mach)
93382f6d
AM
12217 if (fixP->fx_pcrel)
12218 {
12219 switch (fixP->fx_r_type)
12220 {
5865bb77
ILT
12221 default:
12222 break;
12223
d6ab8113
JB
12224 case BFD_RELOC_64:
12225 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12226 break;
93382f6d 12227 case BFD_RELOC_32:
ae8887b5 12228 case BFD_RELOC_X86_64_32S:
93382f6d
AM
12229 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12230 break;
12231 case BFD_RELOC_16:
12232 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12233 break;
12234 case BFD_RELOC_8:
12235 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12236 break;
12237 }
12238 }
252b5132 12239
a161fe53 12240 if (fixP->fx_addsy != NULL
31312f95 12241 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
d6ab8113 12242 || fixP->fx_r_type == BFD_RELOC_64_PCREL
31312f95 12243 || fixP->fx_r_type == BFD_RELOC_16_PCREL
d258b828 12244 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
31312f95 12245 && !use_rela_relocations)
252b5132 12246 {
31312f95
AM
12247 /* This is a hack. There should be a better way to handle this.
12248 This covers for the fact that bfd_install_relocation will
12249 subtract the current location (for partial_inplace, PC relative
12250 relocations); see more below. */
252b5132 12251#ifndef OBJ_AOUT
718ddfc0 12252 if (IS_ELF
252b5132
RH
12253#ifdef TE_PE
12254 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12255#endif
12256 )
12257 value += fixP->fx_where + fixP->fx_frag->fr_address;
12258#endif
12259#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12260 if (IS_ELF)
252b5132 12261 {
6539b54b 12262 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
2f66722d 12263
6539b54b 12264 if ((sym_seg == seg
2f66722d 12265 || (symbol_section_p (fixP->fx_addsy)
6539b54b 12266 && sym_seg != absolute_section))
af65af87 12267 && !generic_force_reloc (fixP))
2f66722d
AM
12268 {
12269 /* Yes, we add the values in twice. This is because
6539b54b
AM
12270 bfd_install_relocation subtracts them out again. I think
12271 bfd_install_relocation is broken, but I don't dare change
2f66722d
AM
12272 it. FIXME. */
12273 value += fixP->fx_where + fixP->fx_frag->fr_address;
12274 }
252b5132
RH
12275 }
12276#endif
12277#if defined (OBJ_COFF) && defined (TE_PE)
977cdf5a
NC
12278 /* For some reason, the PE format does not store a
12279 section address offset for a PC relative symbol. */
12280 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
7be1c489 12281 || S_IS_WEAK (fixP->fx_addsy))
252b5132
RH
12282 value += md_pcrel_from (fixP);
12283#endif
12284 }
fbeb56a4 12285#if defined (OBJ_COFF) && defined (TE_PE)
f01c1a09
NC
12286 if (fixP->fx_addsy != NULL
12287 && S_IS_WEAK (fixP->fx_addsy)
12288 /* PR 16858: Do not modify weak function references. */
12289 && ! fixP->fx_pcrel)
fbeb56a4 12290 {
296a8689
NC
12291#if !defined (TE_PEP)
12292 /* For x86 PE weak function symbols are neither PC-relative
12293 nor do they set S_IS_FUNCTION. So the only reliable way
12294 to detect them is to check the flags of their containing
12295 section. */
12296 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12297 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12298 ;
12299 else
12300#endif
fbeb56a4
DK
12301 value -= S_GET_VALUE (fixP->fx_addsy);
12302 }
12303#endif
252b5132
RH
12304
12305 /* Fix a few things - the dynamic linker expects certain values here,
0234cb7c 12306 and we must not disappoint it. */
252b5132 12307#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12308 if (IS_ELF && fixP->fx_addsy)
47926f60
KH
12309 switch (fixP->fx_r_type)
12310 {
12311 case BFD_RELOC_386_PLT32:
3e73aa7c 12312 case BFD_RELOC_X86_64_PLT32:
b9519cfe
L
12313 /* Make the jump instruction point to the address of the operand.
12314 At runtime we merely add the offset to the actual PLT entry.
12315 NB: Subtract the offset size only for jump instructions. */
12316 if (fixP->fx_pcrel)
12317 value = -4;
47926f60 12318 break;
31312f95 12319
13ae64f3
JJ
12320 case BFD_RELOC_386_TLS_GD:
12321 case BFD_RELOC_386_TLS_LDM:
13ae64f3 12322 case BFD_RELOC_386_TLS_IE_32:
37e55690
JJ
12323 case BFD_RELOC_386_TLS_IE:
12324 case BFD_RELOC_386_TLS_GOTIE:
67a4f2b7 12325 case BFD_RELOC_386_TLS_GOTDESC:
bffbf940
JJ
12326 case BFD_RELOC_X86_64_TLSGD:
12327 case BFD_RELOC_X86_64_TLSLD:
12328 case BFD_RELOC_X86_64_GOTTPOFF:
67a4f2b7 12329 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
00f7efb6
JJ
12330 value = 0; /* Fully resolved at runtime. No addend. */
12331 /* Fallthrough */
12332 case BFD_RELOC_386_TLS_LE:
12333 case BFD_RELOC_386_TLS_LDO_32:
12334 case BFD_RELOC_386_TLS_LE_32:
12335 case BFD_RELOC_X86_64_DTPOFF32:
d6ab8113 12336 case BFD_RELOC_X86_64_DTPOFF64:
00f7efb6 12337 case BFD_RELOC_X86_64_TPOFF32:
d6ab8113 12338 case BFD_RELOC_X86_64_TPOFF64:
00f7efb6
JJ
12339 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12340 break;
12341
67a4f2b7
AO
12342 case BFD_RELOC_386_TLS_DESC_CALL:
12343 case BFD_RELOC_X86_64_TLSDESC_CALL:
12344 value = 0; /* Fully resolved at runtime. No addend. */
12345 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12346 fixP->fx_done = 0;
12347 return;
12348
47926f60
KH
12349 case BFD_RELOC_VTABLE_INHERIT:
12350 case BFD_RELOC_VTABLE_ENTRY:
12351 fixP->fx_done = 0;
94f592af 12352 return;
47926f60
KH
12353
12354 default:
12355 break;
12356 }
12357#endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
c6682705 12358 *valP = value;
f86103b7 12359#endif /* !defined (TE_Mach) */
3e73aa7c 12360
3e73aa7c 12361 /* Are we finished with this relocation now? */
c6682705 12362 if (fixP->fx_addsy == NULL)
3e73aa7c 12363 fixP->fx_done = 1;
fbeb56a4
DK
12364#if defined (OBJ_COFF) && defined (TE_PE)
12365 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12366 {
12367 fixP->fx_done = 0;
12368 /* Remember value for tc_gen_reloc. */
12369 fixP->fx_addnumber = value;
12370 /* Clear out the frag for now. */
12371 value = 0;
12372 }
12373#endif
3e73aa7c
JH
12374 else if (use_rela_relocations)
12375 {
12376 fixP->fx_no_overflow = 1;
062cd5e7
AS
12377 /* Remember value for tc_gen_reloc. */
12378 fixP->fx_addnumber = value;
3e73aa7c
JH
12379 value = 0;
12380 }
f86103b7 12381
94f592af 12382 md_number_to_chars (p, value, fixP->fx_size);
252b5132 12383}
252b5132 12384\f
6d4af3c2 12385const char *
499ac353 12386md_atof (int type, char *litP, int *sizeP)
252b5132 12387{
499ac353
NC
12388 /* This outputs the LITTLENUMs in REVERSE order;
12389 in accord with the bigendian 386. */
12390 return ieee_md_atof (type, litP, sizeP, FALSE);
252b5132
RH
12391}
12392\f
2d545b82 12393static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
252b5132 12394
252b5132 12395static char *
e3bb37b5 12396output_invalid (int c)
252b5132 12397{
3882b010 12398 if (ISPRINT (c))
f9f21a03
L
12399 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12400 "'%c'", c);
252b5132 12401 else
f9f21a03 12402 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
2d545b82 12403 "(0x%x)", (unsigned char) c);
252b5132
RH
12404 return output_invalid_buf;
12405}
12406
8a6fb3f9
JB
12407/* Verify that @r can be used in the current context. */
12408
12409static bfd_boolean check_register (const reg_entry *r)
12410{
12411 if (allow_pseudo_reg)
12412 return TRUE;
12413
12414 if (operand_type_all_zero (&r->reg_type))
12415 return FALSE;
12416
12417 if ((r->reg_type.bitfield.dword
12418 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12419 || r->reg_type.bitfield.class == RegCR
22e00a3f 12420 || r->reg_type.bitfield.class == RegDR)
8a6fb3f9
JB
12421 && !cpu_arch_flags.bitfield.cpui386)
12422 return FALSE;
12423
22e00a3f
JB
12424 if (r->reg_type.bitfield.class == RegTR
12425 && (flag_code == CODE_64BIT
12426 || !cpu_arch_flags.bitfield.cpui386
12427 || cpu_arch_isa_flags.bitfield.cpui586
12428 || cpu_arch_isa_flags.bitfield.cpui686))
12429 return FALSE;
12430
8a6fb3f9
JB
12431 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12432 return FALSE;
12433
12434 if (!cpu_arch_flags.bitfield.cpuavx512f)
12435 {
12436 if (r->reg_type.bitfield.zmmword
12437 || r->reg_type.bitfield.class == RegMask)
12438 return FALSE;
12439
12440 if (!cpu_arch_flags.bitfield.cpuavx)
12441 {
12442 if (r->reg_type.bitfield.ymmword)
12443 return FALSE;
12444
12445 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12446 return FALSE;
12447 }
12448 }
12449
12450 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12451 return FALSE;
12452
12453 /* Don't allow fake index register unless allow_index_reg isn't 0. */
12454 if (!allow_index_reg && r->reg_num == RegIZ)
12455 return FALSE;
12456
12457 /* Upper 16 vector registers are only available with VREX in 64bit
12458 mode, and require EVEX encoding. */
12459 if (r->reg_flags & RegVRex)
12460 {
12461 if (!cpu_arch_flags.bitfield.cpuavx512f
12462 || flag_code != CODE_64BIT)
12463 return FALSE;
12464
da4977e0
JB
12465 if (i.vec_encoding == vex_encoding_default)
12466 i.vec_encoding = vex_encoding_evex;
12467 else if (i.vec_encoding != vex_encoding_evex)
12468 i.vec_encoding = vex_encoding_error;
8a6fb3f9
JB
12469 }
12470
12471 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12472 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12473 && flag_code != CODE_64BIT)
12474 return FALSE;
12475
12476 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12477 && !intel_syntax)
12478 return FALSE;
12479
12480 return TRUE;
12481}
12482
af6bdddf 12483/* REG_STRING starts *before* REGISTER_PREFIX. */
252b5132
RH
12484
12485static const reg_entry *
4d1bb795 12486parse_real_register (char *reg_string, char **end_op)
252b5132 12487{
af6bdddf
AM
12488 char *s = reg_string;
12489 char *p;
252b5132
RH
12490 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12491 const reg_entry *r;
12492
12493 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12494 if (*s == REGISTER_PREFIX)
12495 ++s;
12496
12497 if (is_space_char (*s))
12498 ++s;
12499
12500 p = reg_name_given;
af6bdddf 12501 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
252b5132
RH
12502 {
12503 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
af6bdddf
AM
12504 return (const reg_entry *) NULL;
12505 s++;
252b5132
RH
12506 }
12507
6588847e
DN
12508 /* For naked regs, make sure that we are not dealing with an identifier.
12509 This prevents confusing an identifier like `eax_var' with register
12510 `eax'. */
12511 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12512 return (const reg_entry *) NULL;
12513
af6bdddf 12514 *end_op = s;
252b5132
RH
12515
12516 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
12517
5f47d35b 12518 /* Handle floating point regs, allowing spaces in the (i) part. */
47926f60 12519 if (r == i386_regtab /* %st is first entry of table */)
5f47d35b 12520 {
0e0eea78
JB
12521 if (!cpu_arch_flags.bitfield.cpu8087
12522 && !cpu_arch_flags.bitfield.cpu287
af32b722
JB
12523 && !cpu_arch_flags.bitfield.cpu387
12524 && !allow_pseudo_reg)
0e0eea78
JB
12525 return (const reg_entry *) NULL;
12526
5f47d35b
AM
12527 if (is_space_char (*s))
12528 ++s;
12529 if (*s == '(')
12530 {
af6bdddf 12531 ++s;
5f47d35b
AM
12532 if (is_space_char (*s))
12533 ++s;
12534 if (*s >= '0' && *s <= '7')
12535 {
db557034 12536 int fpr = *s - '0';
af6bdddf 12537 ++s;
5f47d35b
AM
12538 if (is_space_char (*s))
12539 ++s;
12540 if (*s == ')')
12541 {
12542 *end_op = s + 1;
1e9cc1c2 12543 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
db557034
AM
12544 know (r);
12545 return r + fpr;
5f47d35b 12546 }
5f47d35b 12547 }
47926f60 12548 /* We have "%st(" then garbage. */
5f47d35b
AM
12549 return (const reg_entry *) NULL;
12550 }
12551 }
12552
8a6fb3f9 12553 return r && check_register (r) ? r : NULL;
252b5132 12554}
4d1bb795
JB
12555
12556/* REG_STRING starts *before* REGISTER_PREFIX. */
12557
12558static const reg_entry *
12559parse_register (char *reg_string, char **end_op)
12560{
12561 const reg_entry *r;
12562
12563 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12564 r = parse_real_register (reg_string, end_op);
12565 else
12566 r = NULL;
12567 if (!r)
12568 {
12569 char *save = input_line_pointer;
12570 char c;
12571 symbolS *symbolP;
12572
12573 input_line_pointer = reg_string;
d02603dc 12574 c = get_symbol_name (&reg_string);
4d1bb795
JB
12575 symbolP = symbol_find (reg_string);
12576 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12577 {
12578 const expressionS *e = symbol_get_value_expression (symbolP);
12579
0398aac5 12580 know (e->X_op == O_register);
4eed87de 12581 know (e->X_add_number >= 0
c3fe08fa 12582 && (valueT) e->X_add_number < i386_regtab_size);
4d1bb795 12583 r = i386_regtab + e->X_add_number;
8a6fb3f9
JB
12584 if (!check_register (r))
12585 {
12586 as_bad (_("register '%s%s' cannot be used here"),
12587 register_prefix, r->reg_name);
12588 r = &bad_reg;
12589 }
4d1bb795
JB
12590 *end_op = input_line_pointer;
12591 }
12592 *input_line_pointer = c;
12593 input_line_pointer = save;
12594 }
12595 return r;
12596}
12597
12598int
12599i386_parse_name (char *name, expressionS *e, char *nextcharP)
12600{
12601 const reg_entry *r;
12602 char *end = input_line_pointer;
12603
12604 *end = *nextcharP;
12605 r = parse_register (name, &input_line_pointer);
12606 if (r && end <= input_line_pointer)
12607 {
12608 *nextcharP = *input_line_pointer;
12609 *input_line_pointer = 0;
8a6fb3f9
JB
12610 if (r != &bad_reg)
12611 {
12612 e->X_op = O_register;
12613 e->X_add_number = r - i386_regtab;
12614 }
12615 else
12616 e->X_op = O_illegal;
4d1bb795
JB
12617 return 1;
12618 }
12619 input_line_pointer = end;
12620 *end = 0;
ee86248c 12621 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
4d1bb795
JB
12622}
12623
12624void
12625md_operand (expressionS *e)
12626{
ee86248c
JB
12627 char *end;
12628 const reg_entry *r;
4d1bb795 12629
ee86248c
JB
12630 switch (*input_line_pointer)
12631 {
12632 case REGISTER_PREFIX:
12633 r = parse_real_register (input_line_pointer, &end);
4d1bb795
JB
12634 if (r)
12635 {
12636 e->X_op = O_register;
12637 e->X_add_number = r - i386_regtab;
12638 input_line_pointer = end;
12639 }
ee86248c
JB
12640 break;
12641
12642 case '[':
9c2799c2 12643 gas_assert (intel_syntax);
ee86248c
JB
12644 end = input_line_pointer++;
12645 expression (e);
12646 if (*input_line_pointer == ']')
12647 {
12648 ++input_line_pointer;
12649 e->X_op_symbol = make_expr_symbol (e);
12650 e->X_add_symbol = NULL;
12651 e->X_add_number = 0;
12652 e->X_op = O_index;
12653 }
12654 else
12655 {
12656 e->X_op = O_absent;
12657 input_line_pointer = end;
12658 }
12659 break;
4d1bb795
JB
12660 }
12661}
12662
252b5132 12663\f
4cc782b5 12664#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
b6f8c7c4 12665const char *md_shortopts = "kVQ:sqnO::";
252b5132 12666#else
b6f8c7c4 12667const char *md_shortopts = "qnO::";
252b5132 12668#endif
6e0b89ee 12669
3e73aa7c 12670#define OPTION_32 (OPTION_MD_BASE + 0)
b3b91714
AM
12671#define OPTION_64 (OPTION_MD_BASE + 1)
12672#define OPTION_DIVIDE (OPTION_MD_BASE + 2)
9103f4f4
L
12673#define OPTION_MARCH (OPTION_MD_BASE + 3)
12674#define OPTION_MTUNE (OPTION_MD_BASE + 4)
1efbbeb4
L
12675#define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12676#define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12677#define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12678#define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
bd5dea88 12679#define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
c0f3af97 12680#define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
daf50ae7 12681#define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
7bab8ab5
JB
12682#define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12683#define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12684#define OPTION_X32 (OPTION_MD_BASE + 14)
7e8b059b 12685#define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
43234a1e
L
12686#define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12687#define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
167ad85b 12688#define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
d1982f93 12689#define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
d3d3c6db 12690#define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
8dcea932 12691#define OPTION_MSHARED (OPTION_MD_BASE + 21)
5db04b09
L
12692#define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12693#define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
e4e00185 12694#define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
b4a3a7b4 12695#define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
03751133 12696#define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
e379e5f3
L
12697#define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12698#define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12699#define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
76cf450b 12700#define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
ae531041
L
12701#define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12702#define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12703#define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
b3b91714 12704
99ad8390
NC
12705struct option md_longopts[] =
12706{
3e73aa7c 12707 {"32", no_argument, NULL, OPTION_32},
321098a5 12708#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
d382c579 12709 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
3e73aa7c 12710 {"64", no_argument, NULL, OPTION_64},
351f65ca
L
12711#endif
12712#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
570561f7 12713 {"x32", no_argument, NULL, OPTION_X32},
8dcea932 12714 {"mshared", no_argument, NULL, OPTION_MSHARED},
b4a3a7b4 12715 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
6e0b89ee 12716#endif
b3b91714 12717 {"divide", no_argument, NULL, OPTION_DIVIDE},
9103f4f4
L
12718 {"march", required_argument, NULL, OPTION_MARCH},
12719 {"mtune", required_argument, NULL, OPTION_MTUNE},
1efbbeb4
L
12720 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12721 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12722 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12723 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
c0f3af97 12724 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
daf50ae7 12725 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
7bab8ab5 12726 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
539f890d 12727 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
03751133 12728 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
7e8b059b 12729 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
43234a1e
L
12730 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12731 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
167ad85b
TG
12732# if defined (TE_PE) || defined (TE_PEP)
12733 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12734#endif
d1982f93 12735 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
e4e00185 12736 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
0cb4071e 12737 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
d3d3c6db 12738 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
e379e5f3
L
12739 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12740 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12741 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
76cf450b 12742 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
ae531041
L
12743 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12744 {"mlfence-before-indirect-branch", required_argument, NULL,
12745 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12746 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
5db04b09
L
12747 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12748 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
252b5132
RH
12749 {NULL, no_argument, NULL, 0}
12750};
12751size_t md_longopts_size = sizeof (md_longopts);
12752
12753int
17b9d67d 12754md_parse_option (int c, const char *arg)
252b5132 12755{
91d6fa6a 12756 unsigned int j;
e379e5f3 12757 char *arch, *next, *saved, *type;
9103f4f4 12758
252b5132
RH
12759 switch (c)
12760 {
12b55ccc
L
12761 case 'n':
12762 optimize_align_code = 0;
12763 break;
12764
a38cf1db
AM
12765 case 'q':
12766 quiet_warnings = 1;
252b5132
RH
12767 break;
12768
12769#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
a38cf1db
AM
12770 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12771 should be emitted or not. FIXME: Not implemented. */
12772 case 'Q':
d4693039
JB
12773 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12774 return 0;
252b5132
RH
12775 break;
12776
12777 /* -V: SVR4 argument to print version ID. */
12778 case 'V':
12779 print_version_id ();
12780 break;
12781
a38cf1db
AM
12782 /* -k: Ignore for FreeBSD compatibility. */
12783 case 'k':
252b5132 12784 break;
4cc782b5
ILT
12785
12786 case 's':
12787 /* -s: On i386 Solaris, this tells the native assembler to use
29b0f896 12788 .stab instead of .stab.excl. We always use .stab anyhow. */
4cc782b5 12789 break;
8dcea932
L
12790
12791 case OPTION_MSHARED:
12792 shared = 1;
12793 break;
b4a3a7b4
L
12794
12795 case OPTION_X86_USED_NOTE:
12796 if (strcasecmp (arg, "yes") == 0)
12797 x86_used_note = 1;
12798 else if (strcasecmp (arg, "no") == 0)
12799 x86_used_note = 0;
12800 else
12801 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12802 break;
12803
12804
99ad8390 12805#endif
321098a5 12806#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
d382c579 12807 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
3e73aa7c
JH
12808 case OPTION_64:
12809 {
12810 const char **list, **l;
12811
3e73aa7c
JH
12812 list = bfd_target_list ();
12813 for (l = list; *l != NULL; l++)
8620418b 12814 if (CONST_STRNEQ (*l, "elf64-x86-64")
99ad8390
NC
12815 || strcmp (*l, "coff-x86-64") == 0
12816 || strcmp (*l, "pe-x86-64") == 0
d382c579
TG
12817 || strcmp (*l, "pei-x86-64") == 0
12818 || strcmp (*l, "mach-o-x86-64") == 0)
6e0b89ee
AM
12819 {
12820 default_arch = "x86_64";
12821 break;
12822 }
3e73aa7c 12823 if (*l == NULL)
2b5d6a91 12824 as_fatal (_("no compiled in support for x86_64"));
3e73aa7c
JH
12825 free (list);
12826 }
12827 break;
12828#endif
252b5132 12829
351f65ca 12830#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
570561f7 12831 case OPTION_X32:
351f65ca
L
12832 if (IS_ELF)
12833 {
12834 const char **list, **l;
12835
12836 list = bfd_target_list ();
12837 for (l = list; *l != NULL; l++)
12838 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12839 {
12840 default_arch = "x86_64:32";
12841 break;
12842 }
12843 if (*l == NULL)
2b5d6a91 12844 as_fatal (_("no compiled in support for 32bit x86_64"));
351f65ca
L
12845 free (list);
12846 }
12847 else
12848 as_fatal (_("32bit x86_64 is only supported for ELF"));
12849 break;
12850#endif
12851
6e0b89ee
AM
12852 case OPTION_32:
12853 default_arch = "i386";
12854 break;
12855
b3b91714
AM
12856 case OPTION_DIVIDE:
12857#ifdef SVR4_COMMENT_CHARS
12858 {
12859 char *n, *t;
12860 const char *s;
12861
add39d23 12862 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
b3b91714
AM
12863 t = n;
12864 for (s = i386_comment_chars; *s != '\0'; s++)
12865 if (*s != '/')
12866 *t++ = *s;
12867 *t = '\0';
12868 i386_comment_chars = n;
12869 }
12870#endif
12871 break;
12872
9103f4f4 12873 case OPTION_MARCH:
293f5f65
L
12874 saved = xstrdup (arg);
12875 arch = saved;
12876 /* Allow -march=+nosse. */
12877 if (*arch == '+')
12878 arch++;
6305a203 12879 do
9103f4f4 12880 {
6305a203 12881 if (*arch == '.')
2b5d6a91 12882 as_fatal (_("invalid -march= option: `%s'"), arg);
6305a203
L
12883 next = strchr (arch, '+');
12884 if (next)
12885 *next++ = '\0';
91d6fa6a 12886 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9103f4f4 12887 {
91d6fa6a 12888 if (strcmp (arch, cpu_arch [j].name) == 0)
ccc9c027 12889 {
6305a203 12890 /* Processor. */
1ded5609
JB
12891 if (! cpu_arch[j].flags.bitfield.cpui386)
12892 continue;
12893
91d6fa6a 12894 cpu_arch_name = cpu_arch[j].name;
6305a203 12895 cpu_sub_arch_name = NULL;
91d6fa6a
NC
12896 cpu_arch_flags = cpu_arch[j].flags;
12897 cpu_arch_isa = cpu_arch[j].type;
12898 cpu_arch_isa_flags = cpu_arch[j].flags;
6305a203
L
12899 if (!cpu_arch_tune_set)
12900 {
12901 cpu_arch_tune = cpu_arch_isa;
12902 cpu_arch_tune_flags = cpu_arch_isa_flags;
12903 }
12904 break;
12905 }
91d6fa6a
NC
12906 else if (*cpu_arch [j].name == '.'
12907 && strcmp (arch, cpu_arch [j].name + 1) == 0)
6305a203 12908 {
33eaf5de 12909 /* ISA extension. */
6305a203 12910 i386_cpu_flags flags;
309d3373 12911
293f5f65
L
12912 flags = cpu_flags_or (cpu_arch_flags,
12913 cpu_arch[j].flags);
81486035 12914
5b64d091 12915 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
6305a203
L
12916 {
12917 if (cpu_sub_arch_name)
12918 {
12919 char *name = cpu_sub_arch_name;
12920 cpu_sub_arch_name = concat (name,
91d6fa6a 12921 cpu_arch[j].name,
1bf57e9f 12922 (const char *) NULL);
6305a203
L
12923 free (name);
12924 }
12925 else
91d6fa6a 12926 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
6305a203 12927 cpu_arch_flags = flags;
a586129e 12928 cpu_arch_isa_flags = flags;
6305a203 12929 }
0089dace
L
12930 else
12931 cpu_arch_isa_flags
12932 = cpu_flags_or (cpu_arch_isa_flags,
12933 cpu_arch[j].flags);
6305a203 12934 break;
ccc9c027 12935 }
9103f4f4 12936 }
6305a203 12937
293f5f65
L
12938 if (j >= ARRAY_SIZE (cpu_arch))
12939 {
33eaf5de 12940 /* Disable an ISA extension. */
293f5f65
L
12941 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12942 if (strcmp (arch, cpu_noarch [j].name) == 0)
12943 {
12944 i386_cpu_flags flags;
12945
12946 flags = cpu_flags_and_not (cpu_arch_flags,
12947 cpu_noarch[j].flags);
12948 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12949 {
12950 if (cpu_sub_arch_name)
12951 {
12952 char *name = cpu_sub_arch_name;
12953 cpu_sub_arch_name = concat (arch,
12954 (const char *) NULL);
12955 free (name);
12956 }
12957 else
12958 cpu_sub_arch_name = xstrdup (arch);
12959 cpu_arch_flags = flags;
12960 cpu_arch_isa_flags = flags;
12961 }
12962 break;
12963 }
12964
12965 if (j >= ARRAY_SIZE (cpu_noarch))
12966 j = ARRAY_SIZE (cpu_arch);
12967 }
12968
91d6fa6a 12969 if (j >= ARRAY_SIZE (cpu_arch))
2b5d6a91 12970 as_fatal (_("invalid -march= option: `%s'"), arg);
6305a203
L
12971
12972 arch = next;
9103f4f4 12973 }
293f5f65
L
12974 while (next != NULL);
12975 free (saved);
9103f4f4
L
12976 break;
12977
12978 case OPTION_MTUNE:
12979 if (*arg == '.')
2b5d6a91 12980 as_fatal (_("invalid -mtune= option: `%s'"), arg);
91d6fa6a 12981 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9103f4f4 12982 {
91d6fa6a 12983 if (strcmp (arg, cpu_arch [j].name) == 0)
9103f4f4 12984 {
ccc9c027 12985 cpu_arch_tune_set = 1;
91d6fa6a
NC
12986 cpu_arch_tune = cpu_arch [j].type;
12987 cpu_arch_tune_flags = cpu_arch[j].flags;
9103f4f4
L
12988 break;
12989 }
12990 }
91d6fa6a 12991 if (j >= ARRAY_SIZE (cpu_arch))
2b5d6a91 12992 as_fatal (_("invalid -mtune= option: `%s'"), arg);
9103f4f4
L
12993 break;
12994
1efbbeb4
L
12995 case OPTION_MMNEMONIC:
12996 if (strcasecmp (arg, "att") == 0)
12997 intel_mnemonic = 0;
12998 else if (strcasecmp (arg, "intel") == 0)
12999 intel_mnemonic = 1;
13000 else
2b5d6a91 13001 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
1efbbeb4
L
13002 break;
13003
13004 case OPTION_MSYNTAX:
13005 if (strcasecmp (arg, "att") == 0)
13006 intel_syntax = 0;
13007 else if (strcasecmp (arg, "intel") == 0)
13008 intel_syntax = 1;
13009 else
2b5d6a91 13010 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
1efbbeb4
L
13011 break;
13012
13013 case OPTION_MINDEX_REG:
13014 allow_index_reg = 1;
13015 break;
13016
13017 case OPTION_MNAKED_REG:
13018 allow_naked_reg = 1;
13019 break;
13020
c0f3af97
L
13021 case OPTION_MSSE2AVX:
13022 sse2avx = 1;
13023 break;
13024
daf50ae7
L
13025 case OPTION_MSSE_CHECK:
13026 if (strcasecmp (arg, "error") == 0)
7bab8ab5 13027 sse_check = check_error;
daf50ae7 13028 else if (strcasecmp (arg, "warning") == 0)
7bab8ab5 13029 sse_check = check_warning;
daf50ae7 13030 else if (strcasecmp (arg, "none") == 0)
7bab8ab5 13031 sse_check = check_none;
daf50ae7 13032 else
2b5d6a91 13033 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
daf50ae7
L
13034 break;
13035
7bab8ab5
JB
13036 case OPTION_MOPERAND_CHECK:
13037 if (strcasecmp (arg, "error") == 0)
13038 operand_check = check_error;
13039 else if (strcasecmp (arg, "warning") == 0)
13040 operand_check = check_warning;
13041 else if (strcasecmp (arg, "none") == 0)
13042 operand_check = check_none;
13043 else
13044 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13045 break;
13046
539f890d
L
13047 case OPTION_MAVXSCALAR:
13048 if (strcasecmp (arg, "128") == 0)
13049 avxscalar = vex128;
13050 else if (strcasecmp (arg, "256") == 0)
13051 avxscalar = vex256;
13052 else
2b5d6a91 13053 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
539f890d
L
13054 break;
13055
03751133
L
13056 case OPTION_MVEXWIG:
13057 if (strcmp (arg, "0") == 0)
40c9c8de 13058 vexwig = vexw0;
03751133 13059 else if (strcmp (arg, "1") == 0)
40c9c8de 13060 vexwig = vexw1;
03751133
L
13061 else
13062 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13063 break;
13064
7e8b059b
L
13065 case OPTION_MADD_BND_PREFIX:
13066 add_bnd_prefix = 1;
13067 break;
13068
43234a1e
L
13069 case OPTION_MEVEXLIG:
13070 if (strcmp (arg, "128") == 0)
13071 evexlig = evexl128;
13072 else if (strcmp (arg, "256") == 0)
13073 evexlig = evexl256;
13074 else if (strcmp (arg, "512") == 0)
13075 evexlig = evexl512;
13076 else
13077 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13078 break;
13079
d3d3c6db
IT
13080 case OPTION_MEVEXRCIG:
13081 if (strcmp (arg, "rne") == 0)
13082 evexrcig = rne;
13083 else if (strcmp (arg, "rd") == 0)
13084 evexrcig = rd;
13085 else if (strcmp (arg, "ru") == 0)
13086 evexrcig = ru;
13087 else if (strcmp (arg, "rz") == 0)
13088 evexrcig = rz;
13089 else
13090 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13091 break;
13092
43234a1e
L
13093 case OPTION_MEVEXWIG:
13094 if (strcmp (arg, "0") == 0)
13095 evexwig = evexw0;
13096 else if (strcmp (arg, "1") == 0)
13097 evexwig = evexw1;
13098 else
13099 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13100 break;
13101
167ad85b
TG
13102# if defined (TE_PE) || defined (TE_PEP)
13103 case OPTION_MBIG_OBJ:
13104 use_big_obj = 1;
13105 break;
13106#endif
13107
d1982f93 13108 case OPTION_MOMIT_LOCK_PREFIX:
d022bddd
IT
13109 if (strcasecmp (arg, "yes") == 0)
13110 omit_lock_prefix = 1;
13111 else if (strcasecmp (arg, "no") == 0)
13112 omit_lock_prefix = 0;
13113 else
13114 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13115 break;
13116
e4e00185
AS
13117 case OPTION_MFENCE_AS_LOCK_ADD:
13118 if (strcasecmp (arg, "yes") == 0)
13119 avoid_fence = 1;
13120 else if (strcasecmp (arg, "no") == 0)
13121 avoid_fence = 0;
13122 else
13123 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13124 break;
13125
ae531041
L
13126 case OPTION_MLFENCE_AFTER_LOAD:
13127 if (strcasecmp (arg, "yes") == 0)
13128 lfence_after_load = 1;
13129 else if (strcasecmp (arg, "no") == 0)
13130 lfence_after_load = 0;
13131 else
13132 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13133 break;
13134
13135 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13136 if (strcasecmp (arg, "all") == 0)
a09f656b 13137 {
13138 lfence_before_indirect_branch = lfence_branch_all;
13139 if (lfence_before_ret == lfence_before_ret_none)
13140 lfence_before_ret = lfence_before_ret_shl;
13141 }
ae531041
L
13142 else if (strcasecmp (arg, "memory") == 0)
13143 lfence_before_indirect_branch = lfence_branch_memory;
13144 else if (strcasecmp (arg, "register") == 0)
13145 lfence_before_indirect_branch = lfence_branch_register;
13146 else if (strcasecmp (arg, "none") == 0)
13147 lfence_before_indirect_branch = lfence_branch_none;
13148 else
13149 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13150 arg);
13151 break;
13152
13153 case OPTION_MLFENCE_BEFORE_RET:
13154 if (strcasecmp (arg, "or") == 0)
13155 lfence_before_ret = lfence_before_ret_or;
13156 else if (strcasecmp (arg, "not") == 0)
13157 lfence_before_ret = lfence_before_ret_not;
a09f656b 13158 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13159 lfence_before_ret = lfence_before_ret_shl;
ae531041
L
13160 else if (strcasecmp (arg, "none") == 0)
13161 lfence_before_ret = lfence_before_ret_none;
13162 else
13163 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13164 arg);
13165 break;
13166
0cb4071e
L
13167 case OPTION_MRELAX_RELOCATIONS:
13168 if (strcasecmp (arg, "yes") == 0)
13169 generate_relax_relocations = 1;
13170 else if (strcasecmp (arg, "no") == 0)
13171 generate_relax_relocations = 0;
13172 else
13173 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13174 break;
13175
e379e5f3
L
13176 case OPTION_MALIGN_BRANCH_BOUNDARY:
13177 {
13178 char *end;
13179 long int align = strtoul (arg, &end, 0);
13180 if (*end == '\0')
13181 {
13182 if (align == 0)
13183 {
13184 align_branch_power = 0;
13185 break;
13186 }
13187 else if (align >= 16)
13188 {
13189 int align_power;
13190 for (align_power = 0;
13191 (align & 1) == 0;
13192 align >>= 1, align_power++)
13193 continue;
13194 /* Limit alignment power to 31. */
13195 if (align == 1 && align_power < 32)
13196 {
13197 align_branch_power = align_power;
13198 break;
13199 }
13200 }
13201 }
13202 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13203 }
13204 break;
13205
13206 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13207 {
13208 char *end;
13209 int align = strtoul (arg, &end, 0);
13210 /* Some processors only support 5 prefixes. */
13211 if (*end == '\0' && align >= 0 && align < 6)
13212 {
13213 align_branch_prefix_size = align;
13214 break;
13215 }
13216 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13217 arg);
13218 }
13219 break;
13220
13221 case OPTION_MALIGN_BRANCH:
13222 align_branch = 0;
13223 saved = xstrdup (arg);
13224 type = saved;
13225 do
13226 {
13227 next = strchr (type, '+');
13228 if (next)
13229 *next++ = '\0';
13230 if (strcasecmp (type, "jcc") == 0)
13231 align_branch |= align_branch_jcc_bit;
13232 else if (strcasecmp (type, "fused") == 0)
13233 align_branch |= align_branch_fused_bit;
13234 else if (strcasecmp (type, "jmp") == 0)
13235 align_branch |= align_branch_jmp_bit;
13236 else if (strcasecmp (type, "call") == 0)
13237 align_branch |= align_branch_call_bit;
13238 else if (strcasecmp (type, "ret") == 0)
13239 align_branch |= align_branch_ret_bit;
13240 else if (strcasecmp (type, "indirect") == 0)
13241 align_branch |= align_branch_indirect_bit;
13242 else
13243 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13244 type = next;
13245 }
13246 while (next != NULL);
13247 free (saved);
13248 break;
13249
76cf450b
L
13250 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13251 align_branch_power = 5;
13252 align_branch_prefix_size = 5;
13253 align_branch = (align_branch_jcc_bit
13254 | align_branch_fused_bit
13255 | align_branch_jmp_bit);
13256 break;
13257
5db04b09 13258 case OPTION_MAMD64:
4b5aaf5f 13259 isa64 = amd64;
5db04b09
L
13260 break;
13261
13262 case OPTION_MINTEL64:
4b5aaf5f 13263 isa64 = intel64;
5db04b09
L
13264 break;
13265
b6f8c7c4
L
13266 case 'O':
13267 if (arg == NULL)
13268 {
13269 optimize = 1;
13270 /* Turn off -Os. */
13271 optimize_for_space = 0;
13272 }
13273 else if (*arg == 's')
13274 {
13275 optimize_for_space = 1;
13276 /* Turn on all encoding optimizations. */
41fd2579 13277 optimize = INT_MAX;
b6f8c7c4
L
13278 }
13279 else
13280 {
13281 optimize = atoi (arg);
13282 /* Turn off -Os. */
13283 optimize_for_space = 0;
13284 }
13285 break;
13286
252b5132
RH
13287 default:
13288 return 0;
13289 }
13290 return 1;
13291}
13292
8a2c8fef
L
13293#define MESSAGE_TEMPLATE \
13294" "
13295
293f5f65
L
13296static char *
13297output_message (FILE *stream, char *p, char *message, char *start,
13298 int *left_p, const char *name, int len)
13299{
13300 int size = sizeof (MESSAGE_TEMPLATE);
13301 int left = *left_p;
13302
13303 /* Reserve 2 spaces for ", " or ",\0" */
13304 left -= len + 2;
13305
13306 /* Check if there is any room. */
13307 if (left >= 0)
13308 {
13309 if (p != start)
13310 {
13311 *p++ = ',';
13312 *p++ = ' ';
13313 }
13314 p = mempcpy (p, name, len);
13315 }
13316 else
13317 {
13318 /* Output the current message now and start a new one. */
13319 *p++ = ',';
13320 *p = '\0';
13321 fprintf (stream, "%s\n", message);
13322 p = start;
13323 left = size - (start - message) - len - 2;
13324
13325 gas_assert (left >= 0);
13326
13327 p = mempcpy (p, name, len);
13328 }
13329
13330 *left_p = left;
13331 return p;
13332}
13333
8a2c8fef 13334static void
1ded5609 13335show_arch (FILE *stream, int ext, int check)
8a2c8fef
L
13336{
13337 static char message[] = MESSAGE_TEMPLATE;
13338 char *start = message + 27;
13339 char *p;
13340 int size = sizeof (MESSAGE_TEMPLATE);
13341 int left;
13342 const char *name;
13343 int len;
13344 unsigned int j;
13345
13346 p = start;
13347 left = size - (start - message);
13348 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13349 {
13350 /* Should it be skipped? */
13351 if (cpu_arch [j].skip)
13352 continue;
13353
13354 name = cpu_arch [j].name;
13355 len = cpu_arch [j].len;
13356 if (*name == '.')
13357 {
13358 /* It is an extension. Skip if we aren't asked to show it. */
13359 if (ext)
13360 {
13361 name++;
13362 len--;
13363 }
13364 else
13365 continue;
13366 }
13367 else if (ext)
13368 {
13369 /* It is an processor. Skip if we show only extension. */
13370 continue;
13371 }
1ded5609
JB
13372 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13373 {
13374 /* It is an impossible processor - skip. */
13375 continue;
13376 }
8a2c8fef 13377
293f5f65 13378 p = output_message (stream, p, message, start, &left, name, len);
8a2c8fef
L
13379 }
13380
293f5f65
L
13381 /* Display disabled extensions. */
13382 if (ext)
13383 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13384 {
13385 name = cpu_noarch [j].name;
13386 len = cpu_noarch [j].len;
13387 p = output_message (stream, p, message, start, &left, name,
13388 len);
13389 }
13390
8a2c8fef
L
13391 *p = '\0';
13392 fprintf (stream, "%s\n", message);
13393}
13394
252b5132 13395void
8a2c8fef 13396md_show_usage (FILE *stream)
252b5132 13397{
4cc782b5
ILT
13398#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13399 fprintf (stream, _("\
d4693039 13400 -Qy, -Qn ignored\n\
a38cf1db 13401 -V print assembler version number\n\
b3b91714
AM
13402 -k ignored\n"));
13403#endif
13404 fprintf (stream, _("\
12b55ccc 13405 -n Do not optimize code alignment\n\
b3b91714
AM
13406 -q quieten some warnings\n"));
13407#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13408 fprintf (stream, _("\
a38cf1db 13409 -s ignored\n"));
b3b91714 13410#endif
d7f449c0
L
13411#if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13412 || defined (TE_PE) || defined (TE_PEP))
751d281c 13413 fprintf (stream, _("\
570561f7 13414 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
751d281c 13415#endif
b3b91714
AM
13416#ifdef SVR4_COMMENT_CHARS
13417 fprintf (stream, _("\
13418 --divide do not treat `/' as a comment character\n"));
a38cf1db
AM
13419#else
13420 fprintf (stream, _("\
b3b91714 13421 --divide ignored\n"));
4cc782b5 13422#endif
9103f4f4 13423 fprintf (stream, _("\
6305a203 13424 -march=CPU[,+EXTENSION...]\n\
8a2c8fef 13425 generate code for CPU and EXTENSION, CPU is one of:\n"));
1ded5609 13426 show_arch (stream, 0, 1);
8a2c8fef
L
13427 fprintf (stream, _("\
13428 EXTENSION is combination of:\n"));
1ded5609 13429 show_arch (stream, 1, 0);
6305a203 13430 fprintf (stream, _("\
8a2c8fef 13431 -mtune=CPU optimize for CPU, CPU is one of:\n"));
1ded5609 13432 show_arch (stream, 0, 0);
ba104c83 13433 fprintf (stream, _("\
c0f3af97
L
13434 -msse2avx encode SSE instructions with VEX prefix\n"));
13435 fprintf (stream, _("\
7c5c05ef 13436 -msse-check=[none|error|warning] (default: warning)\n\
daf50ae7
L
13437 check SSE instructions\n"));
13438 fprintf (stream, _("\
7c5c05ef 13439 -moperand-check=[none|error|warning] (default: warning)\n\
7bab8ab5
JB
13440 check operand combinations for validity\n"));
13441 fprintf (stream, _("\
7c5c05ef
L
13442 -mavxscalar=[128|256] (default: 128)\n\
13443 encode scalar AVX instructions with specific vector\n\
539f890d
L
13444 length\n"));
13445 fprintf (stream, _("\
03751133
L
13446 -mvexwig=[0|1] (default: 0)\n\
13447 encode VEX instructions with specific VEX.W value\n\
13448 for VEX.W bit ignored instructions\n"));
13449 fprintf (stream, _("\
7c5c05ef
L
13450 -mevexlig=[128|256|512] (default: 128)\n\
13451 encode scalar EVEX instructions with specific vector\n\
43234a1e
L
13452 length\n"));
13453 fprintf (stream, _("\
7c5c05ef
L
13454 -mevexwig=[0|1] (default: 0)\n\
13455 encode EVEX instructions with specific EVEX.W value\n\
43234a1e
L
13456 for EVEX.W bit ignored instructions\n"));
13457 fprintf (stream, _("\
7c5c05ef 13458 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
d3d3c6db
IT
13459 encode EVEX instructions with specific EVEX.RC value\n\
13460 for SAE-only ignored instructions\n"));
13461 fprintf (stream, _("\
7c5c05ef
L
13462 -mmnemonic=[att|intel] "));
13463 if (SYSV386_COMPAT)
13464 fprintf (stream, _("(default: att)\n"));
13465 else
13466 fprintf (stream, _("(default: intel)\n"));
13467 fprintf (stream, _("\
13468 use AT&T/Intel mnemonic\n"));
ba104c83 13469 fprintf (stream, _("\
7c5c05ef
L
13470 -msyntax=[att|intel] (default: att)\n\
13471 use AT&T/Intel syntax\n"));
ba104c83
L
13472 fprintf (stream, _("\
13473 -mindex-reg support pseudo index registers\n"));
13474 fprintf (stream, _("\
13475 -mnaked-reg don't require `%%' prefix for registers\n"));
13476 fprintf (stream, _("\
7e8b059b 13477 -madd-bnd-prefix add BND prefix for all valid branches\n"));
b4a3a7b4 13478#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8dcea932
L
13479 fprintf (stream, _("\
13480 -mshared disable branch optimization for shared code\n"));
b4a3a7b4
L
13481 fprintf (stream, _("\
13482 -mx86-used-note=[no|yes] "));
13483 if (DEFAULT_X86_USED_NOTE)
13484 fprintf (stream, _("(default: yes)\n"));
13485 else
13486 fprintf (stream, _("(default: no)\n"));
13487 fprintf (stream, _("\
13488 generate x86 used ISA and feature properties\n"));
13489#endif
13490#if defined (TE_PE) || defined (TE_PEP)
167ad85b
TG
13491 fprintf (stream, _("\
13492 -mbig-obj generate big object files\n"));
13493#endif
d022bddd 13494 fprintf (stream, _("\
7c5c05ef 13495 -momit-lock-prefix=[no|yes] (default: no)\n\
d022bddd 13496 strip all lock prefixes\n"));
5db04b09 13497 fprintf (stream, _("\
7c5c05ef 13498 -mfence-as-lock-add=[no|yes] (default: no)\n\
e4e00185
AS
13499 encode lfence, mfence and sfence as\n\
13500 lock addl $0x0, (%%{re}sp)\n"));
13501 fprintf (stream, _("\
7c5c05ef
L
13502 -mrelax-relocations=[no|yes] "));
13503 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13504 fprintf (stream, _("(default: yes)\n"));
13505 else
13506 fprintf (stream, _("(default: no)\n"));
13507 fprintf (stream, _("\
0cb4071e
L
13508 generate relax relocations\n"));
13509 fprintf (stream, _("\
e379e5f3
L
13510 -malign-branch-boundary=NUM (default: 0)\n\
13511 align branches within NUM byte boundary\n"));
13512 fprintf (stream, _("\
13513 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13514 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13515 indirect\n\
13516 specify types of branches to align\n"));
13517 fprintf (stream, _("\
13518 -malign-branch-prefix-size=NUM (default: 5)\n\
13519 align branches with NUM prefixes per instruction\n"));
13520 fprintf (stream, _("\
76cf450b
L
13521 -mbranches-within-32B-boundaries\n\
13522 align branches within 32 byte boundary\n"));
13523 fprintf (stream, _("\
ae531041
L
13524 -mlfence-after-load=[no|yes] (default: no)\n\
13525 generate lfence after load\n"));
13526 fprintf (stream, _("\
13527 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13528 generate lfence before indirect near branch\n"));
13529 fprintf (stream, _("\
a09f656b 13530 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
ae531041
L
13531 generate lfence before ret\n"));
13532 fprintf (stream, _("\
7c5c05ef 13533 -mamd64 accept only AMD64 ISA [default]\n"));
5db04b09
L
13534 fprintf (stream, _("\
13535 -mintel64 accept only Intel64 ISA\n"));
252b5132
RH
13536}
13537
3e73aa7c 13538#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
321098a5 13539 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
e57f8c65 13540 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
252b5132
RH
13541
13542/* Pick the target format to use. */
13543
47926f60 13544const char *
e3bb37b5 13545i386_target_format (void)
252b5132 13546{
351f65ca
L
13547 if (!strncmp (default_arch, "x86_64", 6))
13548 {
13549 update_code_flag (CODE_64BIT, 1);
13550 if (default_arch[6] == '\0')
7f56bc95 13551 x86_elf_abi = X86_64_ABI;
351f65ca 13552 else
7f56bc95 13553 x86_elf_abi = X86_64_X32_ABI;
351f65ca 13554 }
3e73aa7c 13555 else if (!strcmp (default_arch, "i386"))
78f12dd3 13556 update_code_flag (CODE_32BIT, 1);
5197d474
L
13557 else if (!strcmp (default_arch, "iamcu"))
13558 {
13559 update_code_flag (CODE_32BIT, 1);
13560 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13561 {
13562 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13563 cpu_arch_name = "iamcu";
13564 cpu_sub_arch_name = NULL;
13565 cpu_arch_flags = iamcu_flags;
13566 cpu_arch_isa = PROCESSOR_IAMCU;
13567 cpu_arch_isa_flags = iamcu_flags;
13568 if (!cpu_arch_tune_set)
13569 {
13570 cpu_arch_tune = cpu_arch_isa;
13571 cpu_arch_tune_flags = cpu_arch_isa_flags;
13572 }
13573 }
8d471ec1 13574 else if (cpu_arch_isa != PROCESSOR_IAMCU)
5197d474
L
13575 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13576 cpu_arch_name);
13577 }
3e73aa7c 13578 else
2b5d6a91 13579 as_fatal (_("unknown architecture"));
89507696
JB
13580
13581 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13582 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13583 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13584 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13585
252b5132
RH
13586 switch (OUTPUT_FLAVOR)
13587 {
9384f2ff 13588#if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
4c63da97 13589 case bfd_target_aout_flavour:
47926f60 13590 return AOUT_TARGET_FORMAT;
4c63da97 13591#endif
9384f2ff
AM
13592#if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13593# if defined (TE_PE) || defined (TE_PEP)
13594 case bfd_target_coff_flavour:
167ad85b
TG
13595 if (flag_code == CODE_64BIT)
13596 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13597 else
251dae91 13598 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
9384f2ff 13599# elif defined (TE_GO32)
0561d57c
JK
13600 case bfd_target_coff_flavour:
13601 return "coff-go32";
9384f2ff 13602# else
252b5132
RH
13603 case bfd_target_coff_flavour:
13604 return "coff-i386";
9384f2ff 13605# endif
4c63da97 13606#endif
3e73aa7c 13607#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
252b5132 13608 case bfd_target_elf_flavour:
3e73aa7c 13609 {
351f65ca
L
13610 const char *format;
13611
13612 switch (x86_elf_abi)
4fa24527 13613 {
351f65ca
L
13614 default:
13615 format = ELF_TARGET_FORMAT;
e379e5f3
L
13616#ifndef TE_SOLARIS
13617 tls_get_addr = "___tls_get_addr";
13618#endif
351f65ca 13619 break;
7f56bc95 13620 case X86_64_ABI:
351f65ca 13621 use_rela_relocations = 1;
4fa24527 13622 object_64bit = 1;
e379e5f3
L
13623#ifndef TE_SOLARIS
13624 tls_get_addr = "__tls_get_addr";
13625#endif
351f65ca
L
13626 format = ELF_TARGET_FORMAT64;
13627 break;
7f56bc95 13628 case X86_64_X32_ABI:
4fa24527 13629 use_rela_relocations = 1;
351f65ca 13630 object_64bit = 1;
e379e5f3
L
13631#ifndef TE_SOLARIS
13632 tls_get_addr = "__tls_get_addr";
13633#endif
862be3fb 13634 disallow_64bit_reloc = 1;
351f65ca
L
13635 format = ELF_TARGET_FORMAT32;
13636 break;
4fa24527 13637 }
3632d14b 13638 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4 13639 {
7f56bc95 13640 if (x86_elf_abi != X86_64_ABI)
8a9036a4
L
13641 as_fatal (_("Intel L1OM is 64bit only"));
13642 return ELF_TARGET_L1OM_FORMAT;
13643 }
b49f93f6 13644 else if (cpu_arch_isa == PROCESSOR_K1OM)
7a9068fe
L
13645 {
13646 if (x86_elf_abi != X86_64_ABI)
13647 as_fatal (_("Intel K1OM is 64bit only"));
13648 return ELF_TARGET_K1OM_FORMAT;
13649 }
81486035
L
13650 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13651 {
13652 if (x86_elf_abi != I386_ABI)
13653 as_fatal (_("Intel MCU is 32bit only"));
13654 return ELF_TARGET_IAMCU_FORMAT;
13655 }
8a9036a4 13656 else
351f65ca 13657 return format;
3e73aa7c 13658 }
e57f8c65
TG
13659#endif
13660#if defined (OBJ_MACH_O)
13661 case bfd_target_mach_o_flavour:
d382c579
TG
13662 if (flag_code == CODE_64BIT)
13663 {
13664 use_rela_relocations = 1;
13665 object_64bit = 1;
13666 return "mach-o-x86-64";
13667 }
13668 else
13669 return "mach-o-i386";
4c63da97 13670#endif
252b5132
RH
13671 default:
13672 abort ();
13673 return NULL;
13674 }
13675}
13676
47926f60 13677#endif /* OBJ_MAYBE_ more than one */
252b5132 13678\f
252b5132 13679symbolS *
7016a5d5 13680md_undefined_symbol (char *name)
252b5132 13681{
18dc2407
ILT
13682 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13683 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13684 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13685 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
24eab124
AM
13686 {
13687 if (!GOT_symbol)
13688 {
13689 if (symbol_find (name))
13690 as_bad (_("GOT already in symbol table"));
13691 GOT_symbol = symbol_new (name, undefined_section,
13692 (valueT) 0, &zero_address_frag);
13693 };
13694 return GOT_symbol;
13695 }
252b5132
RH
13696 return 0;
13697}
13698
13699/* Round up a section size to the appropriate boundary. */
47926f60 13700
252b5132 13701valueT
7016a5d5 13702md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
252b5132 13703{
4c63da97
AM
13704#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13705 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13706 {
13707 /* For a.out, force the section size to be aligned. If we don't do
13708 this, BFD will align it for us, but it will not write out the
13709 final bytes of the section. This may be a bug in BFD, but it is
13710 easier to fix it here since that is how the other a.out targets
13711 work. */
13712 int align;
13713
fd361982 13714 align = bfd_section_alignment (segment);
8d3842cd 13715 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
4c63da97 13716 }
252b5132
RH
13717#endif
13718
13719 return size;
13720}
13721
13722/* On the i386, PC-relative offsets are relative to the start of the
13723 next instruction. That is, the address of the offset, plus its
13724 size, since the offset is always the last part of the insn. */
13725
13726long
e3bb37b5 13727md_pcrel_from (fixS *fixP)
252b5132
RH
13728{
13729 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13730}
13731
13732#ifndef I386COFF
13733
13734static void
e3bb37b5 13735s_bss (int ignore ATTRIBUTE_UNUSED)
252b5132 13736{
29b0f896 13737 int temp;
252b5132 13738
8a75718c
JB
13739#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13740 if (IS_ELF)
13741 obj_elf_section_change_hook ();
13742#endif
252b5132
RH
13743 temp = get_absolute_expression ();
13744 subseg_set (bss_section, (subsegT) temp);
13745 demand_empty_rest_of_line ();
13746}
13747
13748#endif
13749
e379e5f3
L
13750/* Remember constant directive. */
13751
13752void
13753i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13754{
13755 if (last_insn.kind != last_insn_directive
13756 && (bfd_section_flags (now_seg) & SEC_CODE))
13757 {
13758 last_insn.seg = now_seg;
13759 last_insn.kind = last_insn_directive;
13760 last_insn.name = "constant directive";
13761 last_insn.file = as_where (&last_insn.line);
ae531041
L
13762 if (lfence_before_ret != lfence_before_ret_none)
13763 {
13764 if (lfence_before_indirect_branch != lfence_branch_none)
13765 as_warn (_("constant directive skips -mlfence-before-ret "
13766 "and -mlfence-before-indirect-branch"));
13767 else
13768 as_warn (_("constant directive skips -mlfence-before-ret"));
13769 }
13770 else if (lfence_before_indirect_branch != lfence_branch_none)
13771 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
e379e5f3
L
13772 }
13773}
13774
252b5132 13775void
e3bb37b5 13776i386_validate_fix (fixS *fixp)
252b5132 13777{
02a86693 13778 if (fixp->fx_subsy)
252b5132 13779 {
02a86693 13780 if (fixp->fx_subsy == GOT_symbol)
23df1078 13781 {
02a86693
L
13782 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13783 {
13784 if (!object_64bit)
13785 abort ();
13786#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13787 if (fixp->fx_tcbit2)
56ceb5b5
L
13788 fixp->fx_r_type = (fixp->fx_tcbit
13789 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13790 : BFD_RELOC_X86_64_GOTPCRELX);
02a86693
L
13791 else
13792#endif
13793 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13794 }
d6ab8113 13795 else
02a86693
L
13796 {
13797 if (!object_64bit)
13798 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13799 else
13800 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13801 }
13802 fixp->fx_subsy = 0;
23df1078 13803 }
252b5132 13804 }
02a86693
L
13805#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13806 else if (!object_64bit)
13807 {
13808 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13809 && fixp->fx_tcbit2)
13810 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13811 }
13812#endif
252b5132
RH
13813}
13814
252b5132 13815arelent *
7016a5d5 13816tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
252b5132
RH
13817{
13818 arelent *rel;
13819 bfd_reloc_code_real_type code;
13820
13821 switch (fixp->fx_r_type)
13822 {
8ce3d284 13823#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
13824 case BFD_RELOC_SIZE32:
13825 case BFD_RELOC_SIZE64:
13826 if (S_IS_DEFINED (fixp->fx_addsy)
13827 && !S_IS_EXTERNAL (fixp->fx_addsy))
13828 {
13829 /* Resolve size relocation against local symbol to size of
13830 the symbol plus addend. */
13831 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13832 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13833 && !fits_in_unsigned_long (value))
13834 as_bad_where (fixp->fx_file, fixp->fx_line,
13835 _("symbol size computation overflow"));
13836 fixp->fx_addsy = NULL;
13837 fixp->fx_subsy = NULL;
13838 md_apply_fix (fixp, (valueT *) &value, NULL);
13839 return NULL;
13840 }
8ce3d284 13841#endif
1a0670f3 13842 /* Fall through. */
8fd4256d 13843
3e73aa7c
JH
13844 case BFD_RELOC_X86_64_PLT32:
13845 case BFD_RELOC_X86_64_GOT32:
13846 case BFD_RELOC_X86_64_GOTPCREL:
56ceb5b5
L
13847 case BFD_RELOC_X86_64_GOTPCRELX:
13848 case BFD_RELOC_X86_64_REX_GOTPCRELX:
252b5132
RH
13849 case BFD_RELOC_386_PLT32:
13850 case BFD_RELOC_386_GOT32:
02a86693 13851 case BFD_RELOC_386_GOT32X:
252b5132
RH
13852 case BFD_RELOC_386_GOTOFF:
13853 case BFD_RELOC_386_GOTPC:
13ae64f3
JJ
13854 case BFD_RELOC_386_TLS_GD:
13855 case BFD_RELOC_386_TLS_LDM:
13856 case BFD_RELOC_386_TLS_LDO_32:
13857 case BFD_RELOC_386_TLS_IE_32:
37e55690
JJ
13858 case BFD_RELOC_386_TLS_IE:
13859 case BFD_RELOC_386_TLS_GOTIE:
13ae64f3
JJ
13860 case BFD_RELOC_386_TLS_LE_32:
13861 case BFD_RELOC_386_TLS_LE:
67a4f2b7
AO
13862 case BFD_RELOC_386_TLS_GOTDESC:
13863 case BFD_RELOC_386_TLS_DESC_CALL:
bffbf940
JJ
13864 case BFD_RELOC_X86_64_TLSGD:
13865 case BFD_RELOC_X86_64_TLSLD:
13866 case BFD_RELOC_X86_64_DTPOFF32:
d6ab8113 13867 case BFD_RELOC_X86_64_DTPOFF64:
bffbf940
JJ
13868 case BFD_RELOC_X86_64_GOTTPOFF:
13869 case BFD_RELOC_X86_64_TPOFF32:
d6ab8113
JB
13870 case BFD_RELOC_X86_64_TPOFF64:
13871 case BFD_RELOC_X86_64_GOTOFF64:
13872 case BFD_RELOC_X86_64_GOTPC32:
7b81dfbb
AJ
13873 case BFD_RELOC_X86_64_GOT64:
13874 case BFD_RELOC_X86_64_GOTPCREL64:
13875 case BFD_RELOC_X86_64_GOTPC64:
13876 case BFD_RELOC_X86_64_GOTPLT64:
13877 case BFD_RELOC_X86_64_PLTOFF64:
67a4f2b7
AO
13878 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13879 case BFD_RELOC_X86_64_TLSDESC_CALL:
252b5132
RH
13880 case BFD_RELOC_RVA:
13881 case BFD_RELOC_VTABLE_ENTRY:
13882 case BFD_RELOC_VTABLE_INHERIT:
6482c264
NC
13883#ifdef TE_PE
13884 case BFD_RELOC_32_SECREL:
13885#endif
252b5132
RH
13886 code = fixp->fx_r_type;
13887 break;
dbbaec26
L
13888 case BFD_RELOC_X86_64_32S:
13889 if (!fixp->fx_pcrel)
13890 {
13891 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13892 code = fixp->fx_r_type;
13893 break;
13894 }
1a0670f3 13895 /* Fall through. */
252b5132 13896 default:
93382f6d 13897 if (fixp->fx_pcrel)
252b5132 13898 {
93382f6d
AM
13899 switch (fixp->fx_size)
13900 {
13901 default:
b091f402
AM
13902 as_bad_where (fixp->fx_file, fixp->fx_line,
13903 _("can not do %d byte pc-relative relocation"),
13904 fixp->fx_size);
93382f6d
AM
13905 code = BFD_RELOC_32_PCREL;
13906 break;
13907 case 1: code = BFD_RELOC_8_PCREL; break;
13908 case 2: code = BFD_RELOC_16_PCREL; break;
d258b828 13909 case 4: code = BFD_RELOC_32_PCREL; break;
d6ab8113
JB
13910#ifdef BFD64
13911 case 8: code = BFD_RELOC_64_PCREL; break;
13912#endif
93382f6d
AM
13913 }
13914 }
13915 else
13916 {
13917 switch (fixp->fx_size)
13918 {
13919 default:
b091f402
AM
13920 as_bad_where (fixp->fx_file, fixp->fx_line,
13921 _("can not do %d byte relocation"),
13922 fixp->fx_size);
93382f6d
AM
13923 code = BFD_RELOC_32;
13924 break;
13925 case 1: code = BFD_RELOC_8; break;
13926 case 2: code = BFD_RELOC_16; break;
13927 case 4: code = BFD_RELOC_32; break;
937149dd 13928#ifdef BFD64
3e73aa7c 13929 case 8: code = BFD_RELOC_64; break;
937149dd 13930#endif
93382f6d 13931 }
252b5132
RH
13932 }
13933 break;
13934 }
252b5132 13935
d182319b
JB
13936 if ((code == BFD_RELOC_32
13937 || code == BFD_RELOC_32_PCREL
13938 || code == BFD_RELOC_X86_64_32S)
252b5132
RH
13939 && GOT_symbol
13940 && fixp->fx_addsy == GOT_symbol)
3e73aa7c 13941 {
4fa24527 13942 if (!object_64bit)
d6ab8113
JB
13943 code = BFD_RELOC_386_GOTPC;
13944 else
13945 code = BFD_RELOC_X86_64_GOTPC32;
3e73aa7c 13946 }
7b81dfbb
AJ
13947 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13948 && GOT_symbol
13949 && fixp->fx_addsy == GOT_symbol)
13950 {
13951 code = BFD_RELOC_X86_64_GOTPC64;
13952 }
252b5132 13953
add39d23
TS
13954 rel = XNEW (arelent);
13955 rel->sym_ptr_ptr = XNEW (asymbol *);
49309057 13956 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
252b5132
RH
13957
13958 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
c87db184 13959
3e73aa7c
JH
13960 if (!use_rela_relocations)
13961 {
13962 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13963 vtable entry to be used in the relocation's section offset. */
13964 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13965 rel->address = fixp->fx_offset;
fbeb56a4
DK
13966#if defined (OBJ_COFF) && defined (TE_PE)
13967 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13968 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13969 else
13970#endif
c6682705 13971 rel->addend = 0;
3e73aa7c
JH
13972 }
13973 /* Use the rela in 64bit mode. */
252b5132 13974 else
3e73aa7c 13975 {
862be3fb
L
13976 if (disallow_64bit_reloc)
13977 switch (code)
13978 {
862be3fb
L
13979 case BFD_RELOC_X86_64_DTPOFF64:
13980 case BFD_RELOC_X86_64_TPOFF64:
13981 case BFD_RELOC_64_PCREL:
13982 case BFD_RELOC_X86_64_GOTOFF64:
13983 case BFD_RELOC_X86_64_GOT64:
13984 case BFD_RELOC_X86_64_GOTPCREL64:
13985 case BFD_RELOC_X86_64_GOTPC64:
13986 case BFD_RELOC_X86_64_GOTPLT64:
13987 case BFD_RELOC_X86_64_PLTOFF64:
13988 as_bad_where (fixp->fx_file, fixp->fx_line,
13989 _("cannot represent relocation type %s in x32 mode"),
13990 bfd_get_reloc_code_name (code));
13991 break;
13992 default:
13993 break;
13994 }
13995
062cd5e7
AS
13996 if (!fixp->fx_pcrel)
13997 rel->addend = fixp->fx_offset;
13998 else
13999 switch (code)
14000 {
14001 case BFD_RELOC_X86_64_PLT32:
14002 case BFD_RELOC_X86_64_GOT32:
14003 case BFD_RELOC_X86_64_GOTPCREL:
56ceb5b5
L
14004 case BFD_RELOC_X86_64_GOTPCRELX:
14005 case BFD_RELOC_X86_64_REX_GOTPCRELX:
bffbf940
JJ
14006 case BFD_RELOC_X86_64_TLSGD:
14007 case BFD_RELOC_X86_64_TLSLD:
14008 case BFD_RELOC_X86_64_GOTTPOFF:
67a4f2b7
AO
14009 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14010 case BFD_RELOC_X86_64_TLSDESC_CALL:
062cd5e7
AS
14011 rel->addend = fixp->fx_offset - fixp->fx_size;
14012 break;
14013 default:
14014 rel->addend = (section->vma
14015 - fixp->fx_size
14016 + fixp->fx_addnumber
14017 + md_pcrel_from (fixp));
14018 break;
14019 }
3e73aa7c
JH
14020 }
14021
252b5132
RH
14022 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14023 if (rel->howto == NULL)
14024 {
14025 as_bad_where (fixp->fx_file, fixp->fx_line,
d0b47220 14026 _("cannot represent relocation type %s"),
252b5132
RH
14027 bfd_get_reloc_code_name (code));
14028 /* Set howto to a garbage value so that we can keep going. */
14029 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
9c2799c2 14030 gas_assert (rel->howto != NULL);
252b5132
RH
14031 }
14032
14033 return rel;
14034}
14035
ee86248c 14036#include "tc-i386-intel.c"
54cfded0 14037
a60de03c
JB
14038void
14039tc_x86_parse_to_dw2regnum (expressionS *exp)
54cfded0 14040{
a60de03c
JB
14041 int saved_naked_reg;
14042 char saved_register_dot;
54cfded0 14043
a60de03c
JB
14044 saved_naked_reg = allow_naked_reg;
14045 allow_naked_reg = 1;
14046 saved_register_dot = register_chars['.'];
14047 register_chars['.'] = '.';
14048 allow_pseudo_reg = 1;
14049 expression_and_evaluate (exp);
14050 allow_pseudo_reg = 0;
14051 register_chars['.'] = saved_register_dot;
14052 allow_naked_reg = saved_naked_reg;
14053
e96d56a1 14054 if (exp->X_op == O_register && exp->X_add_number >= 0)
54cfded0 14055 {
a60de03c
JB
14056 if ((addressT) exp->X_add_number < i386_regtab_size)
14057 {
14058 exp->X_op = O_constant;
14059 exp->X_add_number = i386_regtab[exp->X_add_number]
14060 .dw2_regnum[flag_code >> 1];
14061 }
14062 else
14063 exp->X_op = O_illegal;
54cfded0 14064 }
54cfded0
AM
14065}
14066
14067void
14068tc_x86_frame_initial_instructions (void)
14069{
a60de03c
JB
14070 static unsigned int sp_regno[2];
14071
14072 if (!sp_regno[flag_code >> 1])
14073 {
14074 char *saved_input = input_line_pointer;
14075 char sp[][4] = {"esp", "rsp"};
14076 expressionS exp;
a4447b93 14077
a60de03c
JB
14078 input_line_pointer = sp[flag_code >> 1];
14079 tc_x86_parse_to_dw2regnum (&exp);
9c2799c2 14080 gas_assert (exp.X_op == O_constant);
a60de03c
JB
14081 sp_regno[flag_code >> 1] = exp.X_add_number;
14082 input_line_pointer = saved_input;
14083 }
a4447b93 14084
61ff971f
L
14085 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14086 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
54cfded0 14087}
d2b2c203 14088
d7921315
L
14089int
14090x86_dwarf2_addr_size (void)
14091{
14092#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14093 if (x86_elf_abi == X86_64_X32_ABI)
14094 return 4;
14095#endif
14096 return bfd_arch_bits_per_address (stdoutput) / 8;
14097}
14098
d2b2c203
DJ
14099int
14100i386_elf_section_type (const char *str, size_t len)
14101{
14102 if (flag_code == CODE_64BIT
14103 && len == sizeof ("unwind") - 1
14104 && strncmp (str, "unwind", 6) == 0)
14105 return SHT_X86_64_UNWIND;
14106
14107 return -1;
14108}
bb41ade5 14109
ad5fec3b
EB
14110#ifdef TE_SOLARIS
14111void
14112i386_solaris_fix_up_eh_frame (segT sec)
14113{
14114 if (flag_code == CODE_64BIT)
14115 elf_section_type (sec) = SHT_X86_64_UNWIND;
14116}
14117#endif
14118
bb41ade5
AM
14119#ifdef TE_PE
14120void
14121tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14122{
91d6fa6a 14123 expressionS exp;
bb41ade5 14124
91d6fa6a
NC
14125 exp.X_op = O_secrel;
14126 exp.X_add_symbol = symbol;
14127 exp.X_add_number = 0;
14128 emit_expr (&exp, size);
bb41ade5
AM
14129}
14130#endif
3b22753a
L
14131
14132#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14133/* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14134
01e1a5bc 14135bfd_vma
6d4af3c2 14136x86_64_section_letter (int letter, const char **ptr_msg)
3b22753a
L
14137{
14138 if (flag_code == CODE_64BIT)
14139 {
14140 if (letter == 'l')
14141 return SHF_X86_64_LARGE;
14142
8f3bae45 14143 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
64e74474 14144 }
3b22753a 14145 else
8f3bae45 14146 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
3b22753a
L
14147 return -1;
14148}
14149
01e1a5bc 14150bfd_vma
3b22753a
L
14151x86_64_section_word (char *str, size_t len)
14152{
8620418b 14153 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
3b22753a
L
14154 return SHF_X86_64_LARGE;
14155
14156 return -1;
14157}
14158
14159static void
14160handle_large_common (int small ATTRIBUTE_UNUSED)
14161{
14162 if (flag_code != CODE_64BIT)
14163 {
14164 s_comm_internal (0, elf_common_parse);
14165 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14166 }
14167 else
14168 {
14169 static segT lbss_section;
14170 asection *saved_com_section_ptr = elf_com_section_ptr;
14171 asection *saved_bss_section = bss_section;
14172
14173 if (lbss_section == NULL)
14174 {
14175 flagword applicable;
14176 segT seg = now_seg;
14177 subsegT subseg = now_subseg;
14178
14179 /* The .lbss section is for local .largecomm symbols. */
14180 lbss_section = subseg_new (".lbss", 0);
14181 applicable = bfd_applicable_section_flags (stdoutput);
fd361982 14182 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
3b22753a
L
14183 seg_info (lbss_section)->bss = 1;
14184
14185 subseg_set (seg, subseg);
14186 }
14187
14188 elf_com_section_ptr = &_bfd_elf_large_com_section;
14189 bss_section = lbss_section;
14190
14191 s_comm_internal (0, elf_common_parse);
14192
14193 elf_com_section_ptr = saved_com_section_ptr;
14194 bss_section = saved_bss_section;
14195 }
14196}
14197#endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 3.209357 seconds and 4 git commands to generate.