1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64    WAIT_PREFIX must be the first prefix since FWAIT really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
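/* An illustrative sketch, not part of the assembler itself: how a raw
   prefix byte could map to one of the slots above.  The helper name and
   the switch are hypothetical; the real prefix bookkeeping happens
   elsewhere in this file.  Emission walks the slots from 0 upwards, so
   FWAIT always comes out first.  */
#if 0
static int
example_prefix_slot (unsigned char byte)
{
  switch (byte)
    {
    case 0x9b: return WAIT_PREFIX;	/* fwait */
    case 0x66: return DATA_PREFIX;	/* operand size override */
    case 0x67: return ADDR_PREFIX;	/* address size override */
    case 0xf0: return LOCK_PREFIX;	/* lock */
    case 0xf2:
    case 0xf3: return REP_PREFIX;	/* repne/rep, also HLE/BND */
    default:   return SEG_PREFIX;	/* 0x26/0x2e/0x36/0x3e/0x64/0x65 */
    }
}
#endif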
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax.  Use a non-ASCII letter since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
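/* For illustration: the three fields pack into the final ModRM byte with
   mode in bits 7-6, reg in bits 5-3 and regmem in bits 2-0, so e.g.
   mode 3, reg 2, regmem 1 encodes as 0xd1.  A hypothetical packer:  */
#if 0
static unsigned char
example_pack_modrm (modrm_byte m)
{
  return (m.mode << 6) | (m.reg << 3) | m.regmem;
}
#endif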
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
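/* The SIB byte packs analogously: scale (as log2 of the factor) in bits
   7-6, index in bits 5-3 and base in bits 2-0.  */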
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* parse_register() returns this when a register alias cannot be used. */
214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
217 /* This struct describes rounding control and SAE in the instruction. */
218 struct RC_Operation
219 {
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229 };
230
231 static struct RC_Operation rc_op;
232
233 /* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235    whether a merging or a zeroing mask is used.  */
236 struct Mask_Operation
237 {
238 const reg_entry *mask;
239 unsigned int zeroing;
240 /* The operand where this operation is associated. */
241 int operand;
242 };
243
244 static struct Mask_Operation mask_op;
245
246 /* The struct describes broadcasting, applied to OPERAND.  The
247    broadcast factor is encoded in TYPE below.  */
248 struct Broadcast_Operation
249 {
250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
255
256 /* Number of bytes to broadcast. */
257 int bytes;
258 };
259
260 static struct Broadcast_Operation broadcast_op;
261
262 /* VEX prefix. */
263 typedef struct
264 {
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270 } vex_prefix;
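/* For reference: a 2-byte VEX prefix starts with 0xc5, a 3-byte VEX with
   0xc4 and the 4-byte EVEX prefix with 0x62; LENGTH records which form
   was built.  */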
271
272 /* 'md_assemble ()' gathers together information and puts it into an
273 i386_insn. */
274
275 union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
282 enum i386_error
283 {
284 operand_size_mismatch,
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
292 unsupported,
293 invalid_vsib_address,
294 invalid_vector_register_set,
295 unsupported_vector_index_register,
296 unsupported_broadcast,
297 broadcast_needed,
298 unsupported_masking,
299 mask_not_on_destination,
300 no_default_mask,
301 unsupported_rc_sae,
302 rc_sae_operand_not_last_imm,
303 invalid_register_operand,
304 };
305
306 struct _i386_insn
307 {
308   /* TM holds the template for the insn we're currently assembling.  */
309 insn_template tm;
310
311 /* SUFFIX holds the instruction size suffix for byte, word, dword
312 or qword, if given. */
313 char suffix;
314
315 /* OPERANDS gives the number of given operands. */
316 unsigned int operands;
317
318 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
319 of given register, displacement, memory operands and immediate
320 operands. */
321 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
322
323 /* TYPES [i] is the type (see above #defines) which tells us how to
324 use OP[i] for the corresponding operand. */
325 i386_operand_type types[MAX_OPERANDS];
326
327 /* Displacement expression, immediate expression, or register for each
328 operand. */
329 union i386_op op[MAX_OPERANDS];
330
331 /* Flags for operands. */
332 unsigned int flags[MAX_OPERANDS];
333 #define Operand_PCrel 1
334 #define Operand_Mem 2
335
336 /* Relocation type for operand */
337 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
338
339 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
340 the base index byte below. */
341 const reg_entry *base_reg;
342 const reg_entry *index_reg;
343 unsigned int log2_scale_factor;
344
345 /* SEG gives the seg_entries of this insn. They are zero unless
346 explicit segment overrides are given. */
347 const seg_entry *seg[2];
348
349 /* Copied first memory operand string, for re-checking. */
350 char *memop1_string;
351
352 /* PREFIX holds all the given prefix opcodes (usually null).
353 PREFIXES is the number of prefix opcodes. */
354 unsigned int prefixes;
355 unsigned char prefix[MAX_PREFIXES];
356
357 /* Register is in low 3 bits of opcode. */
358 bfd_boolean short_form;
359
360 /* The operand to a branch insn indicates an absolute branch. */
361 bfd_boolean jumpabsolute;
362
363 /* Has MMX register operands. */
364 bfd_boolean has_regmmx;
365
366 /* Has XMM register operands. */
367 bfd_boolean has_regxmm;
368
369 /* Has YMM register operands. */
370 bfd_boolean has_regymm;
371
372 /* Has ZMM register operands. */
373 bfd_boolean has_regzmm;
374
375 /* Has GOTPC or TLS relocation. */
376 bfd_boolean has_gotpc_tls_reloc;
377
378 /* RM and SIB are the modrm byte and the sib byte where the
379 addressing modes of this insn are encoded. */
380 modrm_byte rm;
381 rex_byte rex;
382 rex_byte vrex;
383 sib_byte sib;
384 vex_prefix vex;
385
386 /* Masking attributes. */
387 struct Mask_Operation *mask;
388
389 /* Rounding control and SAE attributes. */
390 struct RC_Operation *rounding;
391
392 /* Broadcasting attributes. */
393 struct Broadcast_Operation *broadcast;
394
395 /* Compressed disp8*N attribute. */
396 unsigned int memshift;
397
398 /* Prefer load or store in encoding. */
399 enum
400 {
401 dir_encoding_default = 0,
402 dir_encoding_load,
403 dir_encoding_store,
404 dir_encoding_swap
405 } dir_encoding;
406
407 /* Prefer 8bit or 32bit displacement in encoding. */
408 enum
409 {
410 disp_encoding_default = 0,
411 disp_encoding_8bit,
412 disp_encoding_32bit
413 } disp_encoding;
414
415 /* Prefer the REX byte in encoding. */
416 bfd_boolean rex_encoding;
417
418 /* Disable instruction size optimization. */
419 bfd_boolean no_optimize;
420
421 /* How to encode vector instructions. */
422 enum
423 {
424 vex_encoding_default = 0,
425 vex_encoding_vex,
426 vex_encoding_vex3,
427 vex_encoding_evex,
428 vex_encoding_error
429 } vec_encoding;
430
431 /* REP prefix. */
432 const char *rep_prefix;
433
434 /* HLE prefix. */
435 const char *hle_prefix;
436
437 /* Have BND prefix. */
438 const char *bnd_prefix;
439
440 /* Have NOTRACK prefix. */
441 const char *notrack_prefix;
442
443 /* Error message. */
444 enum i386_error error;
445 };
446
447 typedef struct _i386_insn i386_insn;
448
449 /* Link an RC type with the corresponding string that is looked for
450    in the assembly source.  */
451 struct RC_name
452 {
453 enum rc_type type;
454 const char *name;
455 unsigned int len;
456 };
457
458 static const struct RC_name RC_NamesTable[] =
459 {
460 { rne, STRING_COMMA_LEN ("rn-sae") },
461 { rd, STRING_COMMA_LEN ("rd-sae") },
462 { ru, STRING_COMMA_LEN ("ru-sae") },
463 { rz, STRING_COMMA_LEN ("rz-sae") },
464 { saeonly, STRING_COMMA_LEN ("sae") },
465 };
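/* So an operand decoration such as "{rn-sae}" in the source, e.g.

	vaddss {rn-sae}, %xmm4, %xmm5, %xmm6

   is matched against this table and recorded as type rne in rc_op.  */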
466
467 /* List of chars besides those in app.c:symbol_chars that can start an
468 operand. Used to prevent the scrubber eating vital white-space. */
469 const char extra_symbol_chars[] = "*%-([{}"
470 #ifdef LEX_AT
471 "@"
472 #endif
473 #ifdef LEX_QM
474 "?"
475 #endif
476 ;
477
478 #if (defined (TE_I386AIX) \
479 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
480 && !defined (TE_GNU) \
481 && !defined (TE_LINUX) \
482 && !defined (TE_NACL) \
483 && !defined (TE_FreeBSD) \
484 && !defined (TE_DragonFly) \
485 && !defined (TE_NetBSD)))
486 /* This array holds the chars that always start a comment. If the
487 pre-processor is disabled, these aren't very useful. The option
488 --divide will remove '/' from this list. */
489 const char *i386_comment_chars = "#/";
490 #define SVR4_COMMENT_CHARS 1
491 #define PREFIX_SEPARATOR '\\'
492
493 #else
494 const char *i386_comment_chars = "#";
495 #define PREFIX_SEPARATOR '/'
496 #endif
497
498 /* This array holds the chars that only start a comment at the beginning of
499 a line. If the line seems to have the form '# 123 filename'
500 .line and .file directives will appear in the pre-processed output.
501 Note that input_file.c hand checks for '#' at the beginning of the
502 first line of the input file. This is because the compiler outputs
503 #NO_APP at the beginning of its output.
504 Also note that comments started like this one will always work if
505 '/' isn't otherwise defined. */
506 const char line_comment_chars[] = "#/";
507
508 const char line_separator_chars[] = ";";
509
510 /* Chars that can be used to separate mant from exp in floating point
511 nums. */
512 const char EXP_CHARS[] = "eE";
513
514 /* Chars that mean this number is a floating point constant
515 As in 0f12.456
516 or 0d1.2345e12. */
517 const char FLT_CHARS[] = "fFdDxX";
518
519 /* Tables for lexical analysis. */
520 static char mnemonic_chars[256];
521 static char register_chars[256];
522 static char operand_chars[256];
523 static char identifier_chars[256];
524 static char digit_chars[256];
525
526 /* Lexical macros. */
527 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
528 #define is_operand_char(x) (operand_chars[(unsigned char) x])
529 #define is_register_char(x) (register_chars[(unsigned char) x])
530 #define is_space_char(x) ((x) == ' ')
531 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
532 #define is_digit_char(x) (digit_chars[(unsigned char) x])
533
534 /* All non-digit non-letter characters that may occur in an operand. */
535 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
536
537 /* md_assemble() always leaves the strings it's passed unaltered. To
538 effect this we maintain a stack of saved characters that we've smashed
539 with '\0's (indicating end of strings for various sub-fields of the
540 assembler instruction). */
541 static char save_stack[32];
542 static char *save_stack_p;
543 #define END_STRING_AND_SAVE(s) \
544 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
545 #define RESTORE_END_STRING(s) \
546 do { *(s) = *--save_stack_p; } while (0)
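/* A sketch of the intended pairing (operand_string and process_field are
   hypothetical names): temporarily NUL-terminate a sub-field, parse it,
   then put the smashed character back.  Saves nest on save_stack, so
   restores must happen in reverse order.  */
#if 0
  char *comma = strchr (operand_string, ',');
  END_STRING_AND_SAVE (comma);
  process_field (operand_string);
  RESTORE_END_STRING (comma);
#endif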
547
548 /* The instruction we're assembling. */
549 static i386_insn i;
550
551 /* Possible templates for current insn. */
552 static const templates *current_templates;
553
554 /* Per instruction expressionS buffers: max displacements & immediates. */
555 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
556 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
557
558 /* Current operand we are working on. */
559 static int this_operand = -1;
560
561 /* We support four different modes (.code16gcc is a variant of 16-bit
562    mode).  The FLAG_CODE variable is used to distinguish these.  */
563
564 enum flag_code {
565 CODE_32BIT,
566 CODE_16BIT,
567 CODE_64BIT };
568
569 static enum flag_code flag_code;
570 static unsigned int object_64bit;
571 static unsigned int disallow_64bit_reloc;
572 static int use_rela_relocations = 0;
573 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
574 static const char *tls_get_addr;
575
576 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
577 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
578 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
579
580 /* The ELF ABI to use. */
581 enum x86_elf_abi
582 {
583 I386_ABI,
584 X86_64_ABI,
585 X86_64_X32_ABI
586 };
587
588 static enum x86_elf_abi x86_elf_abi = I386_ABI;
589 #endif
590
591 #if defined (TE_PE) || defined (TE_PEP)
592 /* Use big object file format. */
593 static int use_big_obj = 0;
594 #endif
595
596 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
597 /* 1 if generating code for a shared library. */
598 static int shared = 0;
599 #endif
600
601 /* 1 for intel syntax,
602 0 if att syntax. */
603 static int intel_syntax = 0;
604
605 static enum x86_64_isa
606 {
607 amd64 = 1, /* AMD64 ISA. */
608 intel64 /* Intel64 ISA. */
609 } isa64;
610
611 /* 1 for intel mnemonic,
612 0 if att mnemonic. */
613 static int intel_mnemonic = !SYSV386_COMPAT;
614
615 /* 1 if pseudo registers are permitted. */
616 static int allow_pseudo_reg = 0;
617
618 /* 1 if register prefix % not required. */
619 static int allow_naked_reg = 0;
620
621 /* 1 if the assembler should add BND prefix for all control-transferring
622 instructions supporting it, even if this prefix wasn't specified
623 explicitly. */
624 static int add_bnd_prefix = 0;
625
626 /* 1 if pseudo index register, eiz/riz, is allowed.  */
627 static int allow_index_reg = 0;
628
629 /* 1 if the assembler should ignore LOCK prefix, even if it was
630 specified explicitly. */
631 static int omit_lock_prefix = 0;
632
633 /* 1 if the assembler should encode lfence, mfence, and sfence as
634 "lock addl $0, (%{re}sp)". */
635 static int avoid_fence = 0;
636
637 /* 1 if lfence should be inserted after every load. */
638 static int lfence_after_load = 0;
639
640 /* Non-zero if lfence should be inserted before indirect branch. */
641 static enum lfence_before_indirect_branch_kind
642 {
643 lfence_branch_none = 0,
644 lfence_branch_register,
645 lfence_branch_memory,
646 lfence_branch_all
647 }
648 lfence_before_indirect_branch;
649
650 /* Non-zero if lfence should be inserted before ret. */
651 static enum lfence_before_ret_kind
652 {
653 lfence_before_ret_none = 0,
654 lfence_before_ret_not,
655 lfence_before_ret_or,
656 lfence_before_ret_shl
657 }
658 lfence_before_ret;
659
660 /* Kind and location of the previous instruction: an ordinary insn, a directive such as .byte, or a prefix.  */
661 static struct
662 {
663 segT seg;
664 const char *file;
665 const char *name;
666 unsigned int line;
667 enum last_insn_kind
668 {
669 last_insn_other = 0,
670 last_insn_directive,
671 last_insn_prefix
672 } kind;
673 } last_insn;
674
675 /* 1 if the assembler should generate relax relocations. */
676
677 static int generate_relax_relocations
678 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
679
680 static enum check_kind
681 {
682 check_none = 0,
683 check_warning,
684 check_error
685 }
686 sse_check, operand_check = check_warning;
687
688 /* Non-zero if branches should be aligned within a power-of-2 boundary.  */
689 static int align_branch_power = 0;
690
691 /* Types of branches to align. */
692 enum align_branch_kind
693 {
694 align_branch_none = 0,
695 align_branch_jcc = 1,
696 align_branch_fused = 2,
697 align_branch_jmp = 3,
698 align_branch_call = 4,
699 align_branch_indirect = 5,
700 align_branch_ret = 6
701 };
702
703 /* Type bits of branches to align. */
704 enum align_branch_bit
705 {
706 align_branch_jcc_bit = 1 << align_branch_jcc,
707 align_branch_fused_bit = 1 << align_branch_fused,
708 align_branch_jmp_bit = 1 << align_branch_jmp,
709 align_branch_call_bit = 1 << align_branch_call,
710 align_branch_indirect_bit = 1 << align_branch_indirect,
711 align_branch_ret_bit = 1 << align_branch_ret
712 };
713
714 static unsigned int align_branch = (align_branch_jcc_bit
715 | align_branch_fused_bit
716 | align_branch_jmp_bit);
717
718 /* Types of condition jump used by macro-fusion. */
719 enum mf_jcc_kind
720 {
721 mf_jcc_jo = 0, /* base opcode 0x70 */
722 mf_jcc_jc, /* base opcode 0x72 */
723 mf_jcc_je, /* base opcode 0x74 */
724 mf_jcc_jna, /* base opcode 0x76 */
725 mf_jcc_js, /* base opcode 0x78 */
726 mf_jcc_jp, /* base opcode 0x7a */
727 mf_jcc_jl, /* base opcode 0x7c */
728 mf_jcc_jle, /* base opcode 0x7e */
729 };
730
731 /* Types of compare flag-modifying instructions used by macro-fusion.  */
732 enum mf_cmp_kind
733 {
734 mf_cmp_test_and, /* test/cmp */
735 mf_cmp_alu_cmp, /* add/sub/cmp */
736 mf_cmp_incdec /* inc/dec */
737 };
738
739 /* The maximum padding size for a fused jcc.  A CMP-like instruction
740    can be 9 bytes and a jcc can be 6 bytes.  Leave room just in case for
741 prefixes. */
742 #define MAX_FUSED_JCC_PADDING_SIZE 20
743
744 /* The maximum number of prefixes added for an instruction. */
745 static unsigned int align_branch_prefix_size = 5;
746
747 /* Optimization:
748 1. Clear the REX_W bit with register operand if possible.
749 2. Above plus use 128bit vector instruction to clear the full vector
750 register.
751 */
752 static int optimize = 0;
753
754 /* Optimization:
755 1. Clear the REX_W bit with register operand if possible.
756 2. Above plus use 128bit vector instruction to clear the full vector
757 register.
758 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
759 "testb $imm7,%r8".
760 */
761 static int optimize_for_space = 0;
762
763 /* Register prefix used for error message. */
764 static const char *register_prefix = "%";
765
766 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
767 leave, push, and pop instructions so that gcc has the same stack
768 frame as in 32 bit mode. */
769 static char stackop_size = '\0';
770
771 /* Non-zero to optimize code alignment. */
772 int optimize_align_code = 1;
773
774 /* Non-zero to quieten some warnings. */
775 static int quiet_warnings = 0;
776
777 /* CPU name. */
778 static const char *cpu_arch_name = NULL;
779 static char *cpu_sub_arch_name = NULL;
780
781 /* CPU feature flags. */
782 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
783
784 /* If we have selected a cpu we are generating instructions for. */
785 static int cpu_arch_tune_set = 0;
786
787 /* Cpu we are generating instructions for. */
788 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
789
790 /* CPU feature flags of cpu we are generating instructions for. */
791 static i386_cpu_flags cpu_arch_tune_flags;
792
793 /* CPU instruction set architecture used. */
794 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
795
796 /* CPU feature flags of instruction set architecture used. */
797 i386_cpu_flags cpu_arch_isa_flags;
798
799 /* If set, conditional jumps are not automatically promoted to handle
800 larger than a byte offset. */
801 static unsigned int no_cond_jump_promotion = 0;
802
803 /* Encode SSE instructions with VEX prefix. */
804 static unsigned int sse2avx;
805
806 /* Encode scalar AVX instructions with specific vector length. */
807 static enum
808 {
809 vex128 = 0,
810 vex256
811 } avxscalar;
812
813 /* Encode VEX WIG instructions with specific vex.w. */
814 static enum
815 {
816 vexw0 = 0,
817 vexw1
818 } vexwig;
819
820 /* Encode scalar EVEX LIG instructions with specific vector length. */
821 static enum
822 {
823 evexl128 = 0,
824 evexl256,
825 evexl512
826 } evexlig;
827
828 /* Encode EVEX WIG instructions with specific evex.w. */
829 static enum
830 {
831 evexw0 = 0,
832 evexw1
833 } evexwig;
834
835 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
836 static enum rc_type evexrcig = rne;
837
838 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
839 static symbolS *GOT_symbol;
840
841 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
842 unsigned int x86_dwarf2_return_column;
843
844 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
845 int x86_cie_data_alignment;
846
847 /* Interface to relax_segment.
848 There are 3 major relax states for 386 jump insns because the
849 different types of jumps add different sizes to frags when we're
850 figuring out what sort of jump to choose to reach a given label.
851
852 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
853 branches which are handled by md_estimate_size_before_relax() and
854 i386_generic_table_relax_frag(). */
855
856 /* Types. */
857 #define UNCOND_JUMP 0
858 #define COND_JUMP 1
859 #define COND_JUMP86 2
860 #define BRANCH_PADDING 3
861 #define BRANCH_PREFIX 4
862 #define FUSED_JCC_PADDING 5
863
864 /* Sizes. */
865 #define CODE16 1
866 #define SMALL 0
867 #define SMALL16 (SMALL | CODE16)
868 #define BIG 2
869 #define BIG16 (BIG | CODE16)
870
871 #ifndef INLINE
872 #ifdef __GNUC__
873 #define INLINE __inline__
874 #else
875 #define INLINE
876 #endif
877 #endif
878
879 #define ENCODE_RELAX_STATE(type, size) \
880 ((relax_substateT) (((type) << 2) | (size)))
881 #define TYPE_FROM_RELAX_STATE(s) \
882 ((s) >> 2)
883 #define DISP_SIZE_FROM_RELAX_STATE(s) \
884 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
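/* Worked example: ENCODE_RELAX_STATE (COND_JUMP, BIG) is (1 << 2) | 2,
   i.e. substate 6; TYPE_FROM_RELAX_STATE (6) recovers COND_JUMP, and
   DISP_SIZE_FROM_RELAX_STATE (6) yields 4 displacement bytes.  */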
885
886 /* This table is used by relax_frag to promote short jumps to long
887 ones where necessary. SMALL (short) jumps may be promoted to BIG
888 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
889 don't allow a short jump in a 32 bit code segment to be promoted to
890 a 16 bit offset jump because it's slower (requires data size
891    prefix), and doesn't work unless the destination is in the bottom
892    64k of the code segment (the top 16 bits of eip are zeroed).  */
893
894 const relax_typeS md_relax_table[] =
895 {
896 /* The fields are:
897 1) most positive reach of this state,
898 2) most negative reach of this state,
899 3) how many bytes this mode will have in the variable part of the frag
900 4) which index into the table to try if we can't fit into this one. */
901
902 /* UNCOND_JUMP states. */
903 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
904 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
905 /* dword jmp adds 4 bytes to frag:
906 0 extra opcode bytes, 4 displacement bytes. */
907 {0, 0, 4, 0},
908   /* word jmp adds 2 bytes to frag:
909 0 extra opcode bytes, 2 displacement bytes. */
910 {0, 0, 2, 0},
911
912 /* COND_JUMP states. */
913 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
914 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
915   /* dword conditionals add 5 bytes to frag:
916 1 extra opcode byte, 4 displacement bytes. */
917 {0, 0, 5, 0},
918 /* word conditionals add 3 bytes to frag:
919 1 extra opcode byte, 2 displacement bytes. */
920 {0, 0, 3, 0},
921
922 /* COND_JUMP86 states. */
923 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
924 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
925   /* dword conditionals add 5 bytes to frag:
926 1 extra opcode byte, 4 displacement bytes. */
927 {0, 0, 5, 0},
928 /* word conditionals add 4 bytes to frag:
929 1 displacement byte and a 3 byte long branch insn. */
930 {0, 0, 4, 0}
931 };
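/* Reading the table: a conditional jump starts in state
   ENCODE_RELAX_STATE (COND_JUMP, SMALL), with a reach of -127..+128
   bytes; if the target is farther away, relax_frag follows field 4) to
   ENCODE_RELAX_STATE (COND_JUMP, BIG), whose entry says the frag grows
   by 5 bytes (1 extra opcode byte plus a 4-byte displacement).  */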
932
933 static const arch_entry cpu_arch[] =
934 {
935 /* Do not replace the first two entries - i386_target_format()
936 relies on them being there in this order. */
937 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
938 CPU_GENERIC32_FLAGS, 0 },
939 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
940 CPU_GENERIC64_FLAGS, 0 },
941 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
942 CPU_NONE_FLAGS, 0 },
943 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
944 CPU_I186_FLAGS, 0 },
945 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
946 CPU_I286_FLAGS, 0 },
947 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
948 CPU_I386_FLAGS, 0 },
949 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
950 CPU_I486_FLAGS, 0 },
951 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
952 CPU_I586_FLAGS, 0 },
953 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
954 CPU_I686_FLAGS, 0 },
955 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
956 CPU_I586_FLAGS, 0 },
957 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
958 CPU_PENTIUMPRO_FLAGS, 0 },
959 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
960 CPU_P2_FLAGS, 0 },
961 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
962 CPU_P3_FLAGS, 0 },
963 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
964 CPU_P4_FLAGS, 0 },
965 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
966 CPU_CORE_FLAGS, 0 },
967 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
968 CPU_NOCONA_FLAGS, 0 },
969 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
970 CPU_CORE_FLAGS, 1 },
971 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
972 CPU_CORE_FLAGS, 0 },
973 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
974 CPU_CORE2_FLAGS, 1 },
975 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
976 CPU_CORE2_FLAGS, 0 },
977 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
978 CPU_COREI7_FLAGS, 0 },
979 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
980 CPU_L1OM_FLAGS, 0 },
981 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
982 CPU_K1OM_FLAGS, 0 },
983 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
984 CPU_IAMCU_FLAGS, 0 },
985 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
986 CPU_K6_FLAGS, 0 },
987 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
988 CPU_K6_2_FLAGS, 0 },
989 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
990 CPU_ATHLON_FLAGS, 0 },
991 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
992 CPU_K8_FLAGS, 1 },
993 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
994 CPU_K8_FLAGS, 0 },
995 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
996 CPU_K8_FLAGS, 0 },
997 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
998 CPU_AMDFAM10_FLAGS, 0 },
999 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
1000 CPU_BDVER1_FLAGS, 0 },
1001 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1002 CPU_BDVER2_FLAGS, 0 },
1003 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1004 CPU_BDVER3_FLAGS, 0 },
1005 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1006 CPU_BDVER4_FLAGS, 0 },
1007 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1008 CPU_ZNVER1_FLAGS, 0 },
1009 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1010 CPU_ZNVER2_FLAGS, 0 },
1011 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1012 CPU_BTVER1_FLAGS, 0 },
1013 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1014 CPU_BTVER2_FLAGS, 0 },
1015 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1016 CPU_8087_FLAGS, 0 },
1017 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1018 CPU_287_FLAGS, 0 },
1019 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1020 CPU_387_FLAGS, 0 },
1021 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1022 CPU_687_FLAGS, 0 },
1023 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1024 CPU_CMOV_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1026 CPU_FXSR_FLAGS, 0 },
1027 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1028 CPU_MMX_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1030 CPU_SSE_FLAGS, 0 },
1031 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1032 CPU_SSE2_FLAGS, 0 },
1033 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1034 CPU_SSE3_FLAGS, 0 },
1035 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1036 CPU_SSE4A_FLAGS, 0 },
1037 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1038 CPU_SSSE3_FLAGS, 0 },
1039 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1040 CPU_SSE4_1_FLAGS, 0 },
1041 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1042 CPU_SSE4_2_FLAGS, 0 },
1043 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1044 CPU_SSE4_2_FLAGS, 0 },
1045 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1046 CPU_AVX_FLAGS, 0 },
1047 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1048 CPU_AVX2_FLAGS, 0 },
1049 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1050 CPU_AVX512F_FLAGS, 0 },
1051 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1052 CPU_AVX512CD_FLAGS, 0 },
1053 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1054 CPU_AVX512ER_FLAGS, 0 },
1055 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1056 CPU_AVX512PF_FLAGS, 0 },
1057 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1058 CPU_AVX512DQ_FLAGS, 0 },
1059 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1060 CPU_AVX512BW_FLAGS, 0 },
1061 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1062 CPU_AVX512VL_FLAGS, 0 },
1063 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1064 CPU_VMX_FLAGS, 0 },
1065 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1066 CPU_VMFUNC_FLAGS, 0 },
1067 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1068 CPU_SMX_FLAGS, 0 },
1069 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1070 CPU_XSAVE_FLAGS, 0 },
1071 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1072 CPU_XSAVEOPT_FLAGS, 0 },
1073 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1074 CPU_XSAVEC_FLAGS, 0 },
1075 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1076 CPU_XSAVES_FLAGS, 0 },
1077 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1078 CPU_AES_FLAGS, 0 },
1079 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1080 CPU_PCLMUL_FLAGS, 0 },
1081 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1082 CPU_PCLMUL_FLAGS, 1 },
1083 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1084 CPU_FSGSBASE_FLAGS, 0 },
1085 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1086 CPU_RDRND_FLAGS, 0 },
1087 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1088 CPU_F16C_FLAGS, 0 },
1089 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1090 CPU_BMI2_FLAGS, 0 },
1091 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1092 CPU_FMA_FLAGS, 0 },
1093 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1094 CPU_FMA4_FLAGS, 0 },
1095 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1096 CPU_XOP_FLAGS, 0 },
1097 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1098 CPU_LWP_FLAGS, 0 },
1099 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1100 CPU_MOVBE_FLAGS, 0 },
1101 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1102 CPU_CX16_FLAGS, 0 },
1103 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1104 CPU_EPT_FLAGS, 0 },
1105 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1106 CPU_LZCNT_FLAGS, 0 },
1107 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1108 CPU_POPCNT_FLAGS, 0 },
1109 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1110 CPU_HLE_FLAGS, 0 },
1111 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1112 CPU_RTM_FLAGS, 0 },
1113 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1114 CPU_INVPCID_FLAGS, 0 },
1115 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1116 CPU_CLFLUSH_FLAGS, 0 },
1117 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1118 CPU_NOP_FLAGS, 0 },
1119 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1120 CPU_SYSCALL_FLAGS, 0 },
1121 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1122 CPU_RDTSCP_FLAGS, 0 },
1123 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1124 CPU_3DNOW_FLAGS, 0 },
1125 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1126 CPU_3DNOWA_FLAGS, 0 },
1127 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1128 CPU_PADLOCK_FLAGS, 0 },
1129 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1130 CPU_SVME_FLAGS, 1 },
1131 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1132 CPU_SVME_FLAGS, 0 },
1133 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1134 CPU_SSE4A_FLAGS, 0 },
1135 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1136 CPU_ABM_FLAGS, 0 },
1137 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1138 CPU_BMI_FLAGS, 0 },
1139 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1140 CPU_TBM_FLAGS, 0 },
1141 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1142 CPU_ADX_FLAGS, 0 },
1143 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1144 CPU_RDSEED_FLAGS, 0 },
1145 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1146 CPU_PRFCHW_FLAGS, 0 },
1147 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1148 CPU_SMAP_FLAGS, 0 },
1149 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1150 CPU_MPX_FLAGS, 0 },
1151 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1152 CPU_SHA_FLAGS, 0 },
1153 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1154 CPU_CLFLUSHOPT_FLAGS, 0 },
1155 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1156 CPU_PREFETCHWT1_FLAGS, 0 },
1157 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1158 CPU_SE1_FLAGS, 0 },
1159 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1160 CPU_CLWB_FLAGS, 0 },
1161 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1162 CPU_AVX512IFMA_FLAGS, 0 },
1163 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1164 CPU_AVX512VBMI_FLAGS, 0 },
1165 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1166 CPU_AVX512_4FMAPS_FLAGS, 0 },
1167 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1168 CPU_AVX512_4VNNIW_FLAGS, 0 },
1169 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1170 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1171 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1172 CPU_AVX512_VBMI2_FLAGS, 0 },
1173 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1174 CPU_AVX512_VNNI_FLAGS, 0 },
1175 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1176 CPU_AVX512_BITALG_FLAGS, 0 },
1177 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1178 CPU_CLZERO_FLAGS, 0 },
1179 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1180 CPU_MWAITX_FLAGS, 0 },
1181 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1182 CPU_OSPKE_FLAGS, 0 },
1183 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1184 CPU_RDPID_FLAGS, 0 },
1185 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1186 CPU_PTWRITE_FLAGS, 0 },
1187 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1188 CPU_IBT_FLAGS, 0 },
1189 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1190 CPU_SHSTK_FLAGS, 0 },
1191 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1192 CPU_GFNI_FLAGS, 0 },
1193 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1194 CPU_VAES_FLAGS, 0 },
1195 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1196 CPU_VPCLMULQDQ_FLAGS, 0 },
1197 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1198 CPU_WBNOINVD_FLAGS, 0 },
1199 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1200 CPU_PCONFIG_FLAGS, 0 },
1201 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1202 CPU_WAITPKG_FLAGS, 0 },
1203 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1204 CPU_CLDEMOTE_FLAGS, 0 },
1205 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1206 CPU_MOVDIRI_FLAGS, 0 },
1207 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1208 CPU_MOVDIR64B_FLAGS, 0 },
1209 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1210 CPU_AVX512_BF16_FLAGS, 0 },
1211 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1212 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1213 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1214 CPU_ENQCMD_FLAGS, 0 },
1215 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1216 CPU_SERIALIZE_FLAGS, 0 },
1217 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1218 CPU_RDPRU_FLAGS, 0 },
1219 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1220 CPU_MCOMMIT_FLAGS, 0 },
1221 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1222 CPU_SEV_ES_FLAGS, 0 },
1223 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1224 CPU_TSXLDTRK_FLAGS, 0 },
1225 };
1226
1227 static const noarch_entry cpu_noarch[] =
1228 {
1229 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1230 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1231 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1232 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1233 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1234 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1235 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1236 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1237 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1238 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1239 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1240 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1241 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1242 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1243 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1244 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1245 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1246 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1247 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1248 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1249 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1250 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1251 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1252 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1253 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1254 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1255 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1256 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1257 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1258 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1259 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1260 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1261 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1262 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1263 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1264 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1265 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1266 { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1267 CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1268 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1269 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1270 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1271 };
1272
1273 #ifdef I386COFF
1274 /* Like s_lcomm_internal in gas/read.c but the alignment argument
1275    may be omitted.  */
1276
1277 static symbolS *
1278 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1279 {
1280 addressT align = 0;
1281
1282 SKIP_WHITESPACE ();
1283
1284 if (needs_align
1285 && *input_line_pointer == ',')
1286 {
1287 align = parse_align (needs_align - 1);
1288
1289 if (align == (addressT) -1)
1290 return NULL;
1291 }
1292 else
1293 {
1294 if (size >= 8)
1295 align = 3;
1296 else if (size >= 4)
1297 align = 2;
1298 else if (size >= 2)
1299 align = 1;
1300 else
1301 align = 0;
1302 }
1303
1304 bss_alloc (symbolP, size, align);
1305 return symbolP;
1306 }
1307
1308 static void
1309 pe_lcomm (int needs_align)
1310 {
1311 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1312 }
1313 #endif
1314
1315 const pseudo_typeS md_pseudo_table[] =
1316 {
1317 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1318 {"align", s_align_bytes, 0},
1319 #else
1320 {"align", s_align_ptwo, 0},
1321 #endif
1322 {"arch", set_cpu_arch, 0},
1323 #ifndef I386COFF
1324 {"bss", s_bss, 0},
1325 #else
1326 {"lcomm", pe_lcomm, 1},
1327 #endif
1328 {"ffloat", float_cons, 'f'},
1329 {"dfloat", float_cons, 'd'},
1330 {"tfloat", float_cons, 'x'},
1331 {"value", cons, 2},
1332 {"slong", signed_cons, 4},
1333 {"noopt", s_ignore, 0},
1334 {"optim", s_ignore, 0},
1335 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1336 {"code16", set_code_flag, CODE_16BIT},
1337 {"code32", set_code_flag, CODE_32BIT},
1338 #ifdef BFD64
1339 {"code64", set_code_flag, CODE_64BIT},
1340 #endif
1341 {"intel_syntax", set_intel_syntax, 1},
1342 {"att_syntax", set_intel_syntax, 0},
1343 {"intel_mnemonic", set_intel_mnemonic, 1},
1344 {"att_mnemonic", set_intel_mnemonic, 0},
1345 {"allow_index_reg", set_allow_index_reg, 1},
1346 {"disallow_index_reg", set_allow_index_reg, 0},
1347 {"sse_check", set_check, 0},
1348 {"operand_check", set_check, 1},
1349 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1350 {"largecomm", handle_large_common, 0},
1351 #else
1352 {"file", dwarf2_directive_file, 0},
1353 {"loc", dwarf2_directive_loc, 0},
1354 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1355 #endif
1356 #ifdef TE_PE
1357 {"secrel32", pe_directive_secrel, 0},
1358 #endif
1359 {0, 0, 0}
1360 };
1361
1362 /* For interface with expression (). */
1363 extern char *input_line_pointer;
1364
1365 /* Hash table for instruction mnemonic lookup. */
1366 static struct hash_control *op_hash;
1367
1368 /* Hash table for register lookup. */
1369 static struct hash_control *reg_hash;
1370 \f
1371 /* Various efficient no-op patterns for aligning code labels.
1372 Note: Don't try to assemble the instructions in the comments.
1373 0L and 0w are not legal. */
1374 static const unsigned char f32_1[] =
1375 {0x90}; /* nop */
1376 static const unsigned char f32_2[] =
1377 {0x66,0x90}; /* xchg %ax,%ax */
1378 static const unsigned char f32_3[] =
1379 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1380 static const unsigned char f32_4[] =
1381 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1382 static const unsigned char f32_6[] =
1383 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1384 static const unsigned char f32_7[] =
1385 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1386 static const unsigned char f16_3[] =
1387 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1388 static const unsigned char f16_4[] =
1389 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1390 static const unsigned char jump_disp8[] =
1391 {0xeb}; /* jmp disp8 */
1392 static const unsigned char jump32_disp32[] =
1393 {0xe9}; /* jmp disp32 */
1394 static const unsigned char jump16_disp32[] =
1395 {0x66,0xe9}; /* jmp disp32 */
1396 /* 32-bit NOP patterns.  */
1397 static const unsigned char *const f32_patt[] = {
1398 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1399 };
1400 /* 16-bit NOP patterns.  */
1401 static const unsigned char *const f16_patt[] = {
1402 f32_1, f32_2, f16_3, f16_4
1403 };
1404 /* nopl (%[re]ax) */
1405 static const unsigned char alt_3[] =
1406 {0x0f,0x1f,0x00};
1407 /* nopl 0(%[re]ax) */
1408 static const unsigned char alt_4[] =
1409 {0x0f,0x1f,0x40,0x00};
1410 /* nopl 0(%[re]ax,%[re]ax,1) */
1411 static const unsigned char alt_5[] =
1412 {0x0f,0x1f,0x44,0x00,0x00};
1413 /* nopw 0(%[re]ax,%[re]ax,1) */
1414 static const unsigned char alt_6[] =
1415 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1416 /* nopl 0L(%[re]ax) */
1417 static const unsigned char alt_7[] =
1418 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1419 /* nopl 0L(%[re]ax,%[re]ax,1) */
1420 static const unsigned char alt_8[] =
1421 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1422 /* nopw 0L(%[re]ax,%[re]ax,1) */
1423 static const unsigned char alt_9[] =
1424 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1425 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1426 static const unsigned char alt_10[] =
1427 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1428 /* data16 nopw %cs:0L(%eax,%eax,1) */
1429 static const unsigned char alt_11[] =
1430 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1431 /* 32-bit and 64-bit NOP patterns.  */
1432 static const unsigned char *const alt_patt[] = {
1433 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1434 alt_9, alt_10, alt_11
1435 };
1436
1437 /* Generate COUNT bytes of NOPs to WHERE from PATT with the maximum
1438 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1439
1440 static void
1441 i386_output_nops (char *where, const unsigned char *const *patt,
1442 int count, int max_single_nop_size)
1444 {
1445 /* Place the longer NOP first. */
1446 int last;
1447 int offset;
1448 const unsigned char *nops;
1449
1450 if (max_single_nop_size < 1)
1451 {
1452 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1453 max_single_nop_size);
1454 return;
1455 }
1456
1457 nops = patt[max_single_nop_size - 1];
1458
1459   /* Use the smaller one if the requested one isn't available.  */
1460 if (nops == NULL)
1461 {
1462 max_single_nop_size--;
1463 nops = patt[max_single_nop_size - 1];
1464 }
1465
1466 last = count % max_single_nop_size;
1467
1468 count -= last;
1469 for (offset = 0; offset < count; offset += max_single_nop_size)
1470 memcpy (where + offset, nops, max_single_nop_size);
1471
1472 if (last)
1473 {
1474 nops = patt[last - 1];
1475 if (nops == NULL)
1476 {
1477 /* Use the smaller one plus one-byte NOP if the needed one
1478 isn't available. */
1479 last--;
1480 nops = patt[last - 1];
1481 memcpy (where + offset, nops, last);
1482 where[offset + last] = *patt[0];
1483 }
1484 else
1485 memcpy (where + offset, nops, last);
1486 }
1487 }
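/* Example: COUNT = 10 with MAX_SINGLE_NOP_SIZE = 4 emits two 4-byte NOPs
   followed by the 2-byte pattern.  When a requested length has no
   pattern (f32_patt[4] is NULL, as there is no 5-byte entry), the next
   smaller pattern is used, topped up with a one-byte NOP if needed.  */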
1488
1489 static INLINE int
1490 fits_in_imm7 (offsetT num)
1491 {
1492 return (num & 0x7f) == num;
1493 }
1494
1495 static INLINE int
1496 fits_in_imm31 (offsetT num)
1497 {
1498 return (num & 0x7fffffff) == num;
1499 }
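/* These are unsigned range checks: fits_in_imm7 (127) and
   fits_in_imm31 (0x7fffffff) hold, while negative values such as -1 do
   not, because masking strips the sign bits before the comparison.  */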
1500
1501 /* Generate COUNT bytes of NOPs to WHERE with the maximum size of a
1502 single NOP instruction LIMIT. */
1503
1504 void
1505 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1506 {
1507 const unsigned char *const *patt = NULL;
1508 int max_single_nop_size;
1509 /* Maximum number of NOPs before switching to jump over NOPs. */
1510 int max_number_of_nops;
1511
1512 switch (fragP->fr_type)
1513 {
1514 case rs_fill_nop:
1515 case rs_align_code:
1516 break;
1517 case rs_machine_dependent:
1518 /* Allow NOP padding for jumps and calls. */
1519 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1520 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1521 break;
1522 /* Fall through. */
1523 default:
1524 return;
1525 }
1526
1527 /* We need to decide which NOP sequence to use for 32bit and
1528 64bit. When -mtune= is used:
1529
1530 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1531 PROCESSOR_GENERIC32, f32_patt will be used.
1532 2. For the rest, alt_patt will be used.
1533
1534 When -mtune= isn't used, alt_patt will be used if
1535 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1536 be used.
1537
1538 When -march= or .arch is used, we can't use anything beyond
1539 cpu_arch_isa_flags. */
1540
1541 if (flag_code == CODE_16BIT)
1542 {
1543 patt = f16_patt;
1544 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1545 /* Limit number of NOPs to 2 in 16-bit mode. */
1546 max_number_of_nops = 2;
1547 }
1548 else
1549 {
1550 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1551 {
1552 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1553 switch (cpu_arch_tune)
1554 {
1555 case PROCESSOR_UNKNOWN:
1556 /* We use cpu_arch_isa_flags to check if we SHOULD
1557 optimize with nops. */
1558 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1559 patt = alt_patt;
1560 else
1561 patt = f32_patt;
1562 break;
1563 case PROCESSOR_PENTIUM4:
1564 case PROCESSOR_NOCONA:
1565 case PROCESSOR_CORE:
1566 case PROCESSOR_CORE2:
1567 case PROCESSOR_COREI7:
1568 case PROCESSOR_L1OM:
1569 case PROCESSOR_K1OM:
1570 case PROCESSOR_GENERIC64:
1571 case PROCESSOR_K6:
1572 case PROCESSOR_ATHLON:
1573 case PROCESSOR_K8:
1574 case PROCESSOR_AMDFAM10:
1575 case PROCESSOR_BD:
1576 case PROCESSOR_ZNVER:
1577 case PROCESSOR_BT:
1578 patt = alt_patt;
1579 break;
1580 case PROCESSOR_I386:
1581 case PROCESSOR_I486:
1582 case PROCESSOR_PENTIUM:
1583 case PROCESSOR_PENTIUMPRO:
1584 case PROCESSOR_IAMCU:
1585 case PROCESSOR_GENERIC32:
1586 patt = f32_patt;
1587 break;
1588 }
1589 }
1590 else
1591 {
1592 switch (fragP->tc_frag_data.tune)
1593 {
1594 case PROCESSOR_UNKNOWN:
1595 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1596 PROCESSOR_UNKNOWN. */
1597 abort ();
1598 break;
1599
1600 case PROCESSOR_I386:
1601 case PROCESSOR_I486:
1602 case PROCESSOR_PENTIUM:
1603 case PROCESSOR_IAMCU:
1604 case PROCESSOR_K6:
1605 case PROCESSOR_ATHLON:
1606 case PROCESSOR_K8:
1607 case PROCESSOR_AMDFAM10:
1608 case PROCESSOR_BD:
1609 case PROCESSOR_ZNVER:
1610 case PROCESSOR_BT:
1611 case PROCESSOR_GENERIC32:
1612 /* We use cpu_arch_isa_flags to check if we CAN optimize
1613 with nops. */
1614 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1615 patt = alt_patt;
1616 else
1617 patt = f32_patt;
1618 break;
1619 case PROCESSOR_PENTIUMPRO:
1620 case PROCESSOR_PENTIUM4:
1621 case PROCESSOR_NOCONA:
1622 case PROCESSOR_CORE:
1623 case PROCESSOR_CORE2:
1624 case PROCESSOR_COREI7:
1625 case PROCESSOR_L1OM:
1626 case PROCESSOR_K1OM:
1627 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1628 patt = alt_patt;
1629 else
1630 patt = f32_patt;
1631 break;
1632 case PROCESSOR_GENERIC64:
1633 patt = alt_patt;
1634 break;
1635 }
1636 }
1637
1638 if (patt == f32_patt)
1639 {
1640 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1641 /* Limit number of NOPs to 2 for older processors. */
1642 max_number_of_nops = 2;
1643 }
1644 else
1645 {
1646 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1647 /* Limit number of NOPs to 7 for newer processors. */
1648 max_number_of_nops = 7;
1649 }
1650 }
1651
1652 if (limit == 0)
1653 limit = max_single_nop_size;
1654
1655 if (fragP->fr_type == rs_fill_nop)
1656 {
1657 /* Output NOPs for .nop directive. */
1658 if (limit > max_single_nop_size)
1659 {
1660 as_bad_where (fragP->fr_file, fragP->fr_line,
1661 _("invalid single nop size: %d "
1662 "(expect within [0, %d])"),
1663 limit, max_single_nop_size);
1664 return;
1665 }
1666 }
1667 else if (fragP->fr_type != rs_machine_dependent)
1668 fragP->fr_var = count;
1669
1670 if ((count / max_single_nop_size) > max_number_of_nops)
1671 {
1672 /* Generate jump over NOPs. */
1673 offsetT disp = count - 2;
1674 if (fits_in_imm7 (disp))
1675 {
1676 /* Use "jmp disp8" if possible. */
1677 count = disp;
1678 where[0] = jump_disp8[0];
1679 where[1] = count;
1680 where += 2;
1681 }
1682 else
1683 {
1684 unsigned int size_of_jump;
1685
1686 if (flag_code == CODE_16BIT)
1687 {
1688 where[0] = jump16_disp32[0];
1689 where[1] = jump16_disp32[1];
1690 size_of_jump = 2;
1691 }
1692 else
1693 {
1694 where[0] = jump32_disp32[0];
1695 size_of_jump = 1;
1696 }
1697
1698 count -= size_of_jump + 4;
1699 if (!fits_in_imm31 (count))
1700 {
1701 as_bad_where (fragP->fr_file, fragP->fr_line,
1702 _("jump over nop padding out of range"));
1703 return;
1704 }
1705
1706 md_number_to_chars (where + size_of_jump, count, 4);
1707 where += size_of_jump + 4;
1708 }
1709 }
1710
1711 /* Generate multiple NOPs. */
1712 i386_output_nops (where, patt, count, limit);
1713 }
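/* Example of the jump-over path: with alt_patt (11-byte maximum, at most
   7 NOPs), a request for 100 bytes exceeds 7 * 11, so a two-byte
   "jmp disp8" (0xeb 0x62) is emitted first and the remaining 98 bytes
   are filled with NOPs that are never executed.  */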
1714
1715 static INLINE int
1716 operand_type_all_zero (const union i386_operand_type *x)
1717 {
1718 switch (ARRAY_SIZE(x->array))
1719 {
1720 case 3:
1721 if (x->array[2])
1722 return 0;
1723 /* Fall through. */
1724 case 2:
1725 if (x->array[1])
1726 return 0;
1727 /* Fall through. */
1728 case 1:
1729 return !x->array[0];
1730 default:
1731 abort ();
1732 }
1733 }
1734
1735 static INLINE void
1736 operand_type_set (union i386_operand_type *x, unsigned int v)
1737 {
1738 switch (ARRAY_SIZE(x->array))
1739 {
1740 case 3:
1741 x->array[2] = v;
1742 /* Fall through. */
1743 case 2:
1744 x->array[1] = v;
1745 /* Fall through. */
1746 case 1:
1747 x->array[0] = v;
1749       break;
1750 default:
1751 abort ();
1752 }
1753
1754 x->bitfield.class = ClassNone;
1755 x->bitfield.instance = InstanceNone;
1756 }
1757
1758 static INLINE int
1759 operand_type_equal (const union i386_operand_type *x,
1760 const union i386_operand_type *y)
1761 {
1762 switch (ARRAY_SIZE(x->array))
1763 {
1764 case 3:
1765 if (x->array[2] != y->array[2])
1766 return 0;
1767 /* Fall through. */
1768 case 2:
1769 if (x->array[1] != y->array[1])
1770 return 0;
1771 /* Fall through. */
1772 case 1:
1773 return x->array[0] == y->array[0];
1775 default:
1776 abort ();
1777 }
1778 }
1779
1780 static INLINE int
1781 cpu_flags_all_zero (const union i386_cpu_flags *x)
1782 {
1783 switch (ARRAY_SIZE(x->array))
1784 {
1785 case 4:
1786 if (x->array[3])
1787 return 0;
1788 /* Fall through. */
1789 case 3:
1790 if (x->array[2])
1791 return 0;
1792 /* Fall through. */
1793 case 2:
1794 if (x->array[1])
1795 return 0;
1796 /* Fall through. */
1797 case 1:
1798 return !x->array[0];
1799 default:
1800 abort ();
1801 }
1802 }
1803
1804 static INLINE int
1805 cpu_flags_equal (const union i386_cpu_flags *x,
1806 const union i386_cpu_flags *y)
1807 {
1808 switch (ARRAY_SIZE(x->array))
1809 {
1810 case 4:
1811 if (x->array[3] != y->array[3])
1812 return 0;
1813 /* Fall through. */
1814 case 3:
1815 if (x->array[2] != y->array[2])
1816 return 0;
1817 /* Fall through. */
1818 case 2:
1819 if (x->array[1] != y->array[1])
1820 return 0;
1821 /* Fall through. */
1822 case 1:
1823 return x->array[0] == y->array[0];
1825 default:
1826 abort ();
1827 }
1828 }
1829
1830 static INLINE int
1831 cpu_flags_check_cpu64 (i386_cpu_flags f)
1832 {
1833 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1834 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1835 }
1836
1837 static INLINE i386_cpu_flags
1838 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1839 {
1840 switch (ARRAY_SIZE (x.array))
1841 {
1842 case 4:
1843 x.array [3] &= y.array [3];
1844 /* Fall through. */
1845 case 3:
1846 x.array [2] &= y.array [2];
1847 /* Fall through. */
1848 case 2:
1849 x.array [1] &= y.array [1];
1850 /* Fall through. */
1851 case 1:
1852 x.array [0] &= y.array [0];
1853 break;
1854 default:
1855 abort ();
1856 }
1857 return x;
1858 }
1859
1860 static INLINE i386_cpu_flags
1861 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1862 {
1863 switch (ARRAY_SIZE (x.array))
1864 {
1865 case 4:
1866 x.array [3] |= y.array [3];
1867 /* Fall through. */
1868 case 3:
1869 x.array [2] |= y.array [2];
1870 /* Fall through. */
1871 case 2:
1872 x.array [1] |= y.array [1];
1873 /* Fall through. */
1874 case 1:
1875 x.array [0] |= y.array [0];
1876 break;
1877 default:
1878 abort ();
1879 }
1880 return x;
1881 }
1882
1883 static INLINE i386_cpu_flags
1884 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1885 {
1886 switch (ARRAY_SIZE (x.array))
1887 {
1888 case 4:
1889 x.array [3] &= ~y.array [3];
1890 /* Fall through. */
1891 case 3:
1892 x.array [2] &= ~y.array [2];
1893 /* Fall through. */
1894 case 2:
1895 x.array [1] &= ~y.array [1];
1896 /* Fall through. */
1897 case 1:
1898 x.array [0] &= ~y.array [0];
1899 break;
1900 default:
1901 abort ();
1902 }
1903 return x;
1904 }
1905
1906 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1907
1908 #define CPU_FLAGS_ARCH_MATCH 0x1
1909 #define CPU_FLAGS_64BIT_MATCH 0x2
1910
1911 #define CPU_FLAGS_PERFECT_MATCH \
1912 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1913
1914 /* Return CPU flags match bits. */
1915
1916 static int
1917 cpu_flags_match (const insn_template *t)
1918 {
1919 i386_cpu_flags x = t->cpu_flags;
1920 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1921
1922 x.bitfield.cpu64 = 0;
1923 x.bitfield.cpuno64 = 0;
1924
1925 if (cpu_flags_all_zero (&x))
1926 {
1927 /* This instruction is available on all archs. */
1928 match |= CPU_FLAGS_ARCH_MATCH;
1929 }
1930 else
1931 {
1932 /* This instruction is available only on some archs. */
1933 i386_cpu_flags cpu = cpu_arch_flags;
1934
1935 /* AVX512VL is not a standalone feature - match it and then strip it. */
1936 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1937 return match;
1938 x.bitfield.cpuavx512vl = 0;
1939
1940 cpu = cpu_flags_and (x, cpu);
1941 if (!cpu_flags_all_zero (&cpu))
1942 {
1943 if (x.bitfield.cpuavx)
1944 {
1945 /* We need to check a few extra flags with AVX. */
1946 if (cpu.bitfield.cpuavx
1947 && (!t->opcode_modifier.sse2avx
1948 || (sse2avx && !i.prefix[DATA_PREFIX]))
1949 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1950 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1951 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1952 match |= CPU_FLAGS_ARCH_MATCH;
1953 }
1954 else if (x.bitfield.cpuavx512f)
1955 {
1956 /* We need to check a few extra flags with AVX512F. */
1957 if (cpu.bitfield.cpuavx512f
1958 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1959 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1960 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1961 match |= CPU_FLAGS_ARCH_MATCH;
1962 }
1963 else
1964 match |= CPU_FLAGS_ARCH_MATCH;
1965 }
1966 }
1967 return match;
1968 }
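
/* For example (hypothetical invocations): a template requiring CpuAVX
matched under -march=core2 yields only CPU_FLAGS_64BIT_MATCH, while
the same template under -march=sandybridge in 64-bit mode yields
CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH, i.e.
CPU_FLAGS_PERFECT_MATCH. */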
1969
1970 static INLINE i386_operand_type
1971 operand_type_and (i386_operand_type x, i386_operand_type y)
1972 {
1973 if (x.bitfield.class != y.bitfield.class)
1974 x.bitfield.class = ClassNone;
1975 if (x.bitfield.instance != y.bitfield.instance)
1976 x.bitfield.instance = InstanceNone;
1977
1978 switch (ARRAY_SIZE (x.array))
1979 {
1980 case 3:
1981 x.array [2] &= y.array [2];
1982 /* Fall through. */
1983 case 2:
1984 x.array [1] &= y.array [1];
1985 /* Fall through. */
1986 case 1:
1987 x.array [0] &= y.array [0];
1988 break;
1989 default:
1990 abort ();
1991 }
1992 return x;
1993 }
1994
1995 static INLINE i386_operand_type
1996 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1997 {
1998 gas_assert (y.bitfield.class == ClassNone);
1999 gas_assert (y.bitfield.instance == InstanceNone);
2000
2001 switch (ARRAY_SIZE (x.array))
2002 {
2003 case 3:
2004 x.array [2] &= ~y.array [2];
2005 /* Fall through. */
2006 case 2:
2007 x.array [1] &= ~y.array [1];
2008 /* Fall through. */
2009 case 1:
2010 x.array [0] &= ~y.array [0];
2011 break;
2012 default:
2013 abort ();
2014 }
2015 return x;
2016 }
2017
2018 static INLINE i386_operand_type
2019 operand_type_or (i386_operand_type x, i386_operand_type y)
2020 {
2021 gas_assert (x.bitfield.class == ClassNone ||
2022 y.bitfield.class == ClassNone ||
2023 x.bitfield.class == y.bitfield.class);
2024 gas_assert (x.bitfield.instance == InstanceNone ||
2025 y.bitfield.instance == InstanceNone ||
2026 x.bitfield.instance == y.bitfield.instance);
2027
2028 switch (ARRAY_SIZE (x.array))
2029 {
2030 case 3:
2031 x.array [2] |= y.array [2];
2032 /* Fall through. */
2033 case 2:
2034 x.array [1] |= y.array [1];
2035 /* Fall through. */
2036 case 1:
2037 x.array [0] |= y.array [0];
2038 break;
2039 default:
2040 abort ();
2041 }
2042 return x;
2043 }
2044
2045 static INLINE i386_operand_type
2046 operand_type_xor (i386_operand_type x, i386_operand_type y)
2047 {
2048 gas_assert (y.bitfield.class == ClassNone);
2049 gas_assert (y.bitfield.instance == InstanceNone);
2050
2051 switch (ARRAY_SIZE (x.array))
2052 {
2053 case 3:
2054 x.array [2] ^= y.array [2];
2055 /* Fall through. */
2056 case 2:
2057 x.array [1] ^= y.array [1];
2058 /* Fall through. */
2059 case 1:
2060 x.array [0] ^= y.array [0];
2061 break;
2062 default:
2063 abort ();
2064 }
2065 return x;
2066 }
2067
2068 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2069 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2070 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2071 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2072 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2073 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2074 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2075 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2076 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2077 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2078 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2079 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2080 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2081 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2082 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2083 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2084 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2085
2086 enum operand_type
2087 {
2088 reg,
2089 imm,
2090 disp,
2091 anymem
2092 };
2093
2094 static INLINE int
2095 operand_type_check (i386_operand_type t, enum operand_type c)
2096 {
2097 switch (c)
2098 {
2099 case reg:
2100 return t.bitfield.class == Reg;
2101
2102 case imm:
2103 return (t.bitfield.imm8
2104 || t.bitfield.imm8s
2105 || t.bitfield.imm16
2106 || t.bitfield.imm32
2107 || t.bitfield.imm32s
2108 || t.bitfield.imm64);
2109
2110 case disp:
2111 return (t.bitfield.disp8
2112 || t.bitfield.disp16
2113 || t.bitfield.disp32
2114 || t.bitfield.disp32s
2115 || t.bitfield.disp64);
2116
2117 case anymem:
2118 return (t.bitfield.disp8
2119 || t.bitfield.disp16
2120 || t.bitfield.disp32
2121 || t.bitfield.disp32s
2122 || t.bitfield.disp64
2123 || t.bitfield.baseindex);
2124
2125 default:
2126 abort ();
2127 }
2128
2129 return 0;
2130 }
2131
2132 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2133 between operand GIVEN and operand WANTED for instruction template T. */
2134
2135 static INLINE int
2136 match_operand_size (const insn_template *t, unsigned int wanted,
2137 unsigned int given)
2138 {
2139 return !((i.types[given].bitfield.byte
2140 && !t->operand_types[wanted].bitfield.byte)
2141 || (i.types[given].bitfield.word
2142 && !t->operand_types[wanted].bitfield.word)
2143 || (i.types[given].bitfield.dword
2144 && !t->operand_types[wanted].bitfield.dword)
2145 || (i.types[given].bitfield.qword
2146 && !t->operand_types[wanted].bitfield.qword)
2147 || (i.types[given].bitfield.tbyte
2148 && !t->operand_types[wanted].bitfield.tbyte));
2149 }
2150
2151 /* Return 1 if there is no conflict in SIMD register between operand
2152 GIVEN and operand WANTED for instruction template T. */
2153
2154 static INLINE int
2155 match_simd_size (const insn_template *t, unsigned int wanted,
2156 unsigned int given)
2157 {
2158 return !((i.types[given].bitfield.xmmword
2159 && !t->operand_types[wanted].bitfield.xmmword)
2160 || (i.types[given].bitfield.ymmword
2161 && !t->operand_types[wanted].bitfield.ymmword)
2162 || (i.types[given].bitfield.zmmword
2163 && !t->operand_types[wanted].bitfield.zmmword));
2164 }
2165
2166 /* Return 1 if there is no conflict in any size between operand GIVEN
2167 and operand WANTED for instruction template T. */
2168
2169 static INLINE int
2170 match_mem_size (const insn_template *t, unsigned int wanted,
2171 unsigned int given)
2172 {
2173 return (match_operand_size (t, wanted, given)
2174 && !((i.types[given].bitfield.unspecified
2175 && !i.broadcast
2176 && !t->operand_types[wanted].bitfield.unspecified)
2177 || (i.types[given].bitfield.fword
2178 && !t->operand_types[wanted].bitfield.fword)
2179 /* For scalar opcode templates to allow register and memory
2180 operands at the same time, some special casing is needed
2181 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2182 down-conversion vpmov*. */
2183 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2184 && t->operand_types[wanted].bitfield.byte
2185 + t->operand_types[wanted].bitfield.word
2186 + t->operand_types[wanted].bitfield.dword
2187 + t->operand_types[wanted].bitfield.qword
2188 > !!t->opcode_modifier.broadcast)
2189 ? (i.types[given].bitfield.xmmword
2190 || i.types[given].bitfield.ymmword
2191 || i.types[given].bitfield.zmmword)
2192 : !match_simd_size(t, wanted, given))));
2193 }
2194
2195 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2196 operands for instruction template T, and it has MATCH_REVERSE set if there
2197 is no size conflict on any operands for the template with operands reversed
2198 (and the template allows for reversing in the first place). */
2199
2200 #define MATCH_STRAIGHT 1
2201 #define MATCH_REVERSE 2
2202
2203 static INLINE unsigned int
2204 operand_size_match (const insn_template *t)
2205 {
2206 unsigned int j, match = MATCH_STRAIGHT;
2207
2208 /* Don't check non-absolute jump instructions. */
2209 if (t->opcode_modifier.jump
2210 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2211 return match;
2212
2213 /* Check memory and accumulator operand size. */
2214 for (j = 0; j < i.operands; j++)
2215 {
2216 if (i.types[j].bitfield.class != Reg
2217 && i.types[j].bitfield.class != RegSIMD
2218 && t->opcode_modifier.anysize)
2219 continue;
2220
2221 if (t->operand_types[j].bitfield.class == Reg
2222 && !match_operand_size (t, j, j))
2223 {
2224 match = 0;
2225 break;
2226 }
2227
2228 if (t->operand_types[j].bitfield.class == RegSIMD
2229 && !match_simd_size (t, j, j))
2230 {
2231 match = 0;
2232 break;
2233 }
2234
2235 if (t->operand_types[j].bitfield.instance == Accum
2236 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2237 {
2238 match = 0;
2239 break;
2240 }
2241
2242 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2243 {
2244 match = 0;
2245 break;
2246 }
2247 }
2248
2249 if (!t->opcode_modifier.d)
2250 {
2251 mismatch:
2252 if (!match)
2253 i.error = operand_size_mismatch;
2254 return match;
2255 }
2256
2257 /* Check reverse. */
2258 gas_assert (i.operands >= 2 && i.operands <= 3);
2259
2260 for (j = 0; j < i.operands; j++)
2261 {
2262 unsigned int given = i.operands - j - 1;
2263
2264 if (t->operand_types[j].bitfield.class == Reg
2265 && !match_operand_size (t, j, given))
2266 goto mismatch;
2267
2268 if (t->operand_types[j].bitfield.class == RegSIMD
2269 && !match_simd_size (t, j, given))
2270 goto mismatch;
2271
2272 if (t->operand_types[j].bitfield.instance == Accum
2273 && (!match_operand_size (t, j, given)
2274 || !match_simd_size (t, j, given)))
2275 goto mismatch;
2276
2277 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2278 goto mismatch;
2279 }
2280
2281 return match | MATCH_REVERSE;
2282 }
2283
2284 static INLINE int
2285 operand_type_match (i386_operand_type overlap,
2286 i386_operand_type given)
2287 {
2288 i386_operand_type temp = overlap;
2289
2290 temp.bitfield.unspecified = 0;
2291 temp.bitfield.byte = 0;
2292 temp.bitfield.word = 0;
2293 temp.bitfield.dword = 0;
2294 temp.bitfield.fword = 0;
2295 temp.bitfield.qword = 0;
2296 temp.bitfield.tbyte = 0;
2297 temp.bitfield.xmmword = 0;
2298 temp.bitfield.ymmword = 0;
2299 temp.bitfield.zmmword = 0;
2300 if (operand_type_all_zero (&temp))
2301 goto mismatch;
2302
2303 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2304 return 1;
2305
2306 mismatch:
2307 i.error = operand_type_mismatch;
2308 return 0;
2309 }
2310
2311 /* If given types g0 and g1 are registers they must be of the same type
2312 unless the expected operand type register overlap is null.
2313 Some Intel syntax memory operand size checking also happens here. */
2314
2315 static INLINE int
2316 operand_type_register_match (i386_operand_type g0,
2317 i386_operand_type t0,
2318 i386_operand_type g1,
2319 i386_operand_type t1)
2320 {
2321 if (g0.bitfield.class != Reg
2322 && g0.bitfield.class != RegSIMD
2323 && (!operand_type_check (g0, anymem)
2324 || g0.bitfield.unspecified
2325 || (t0.bitfield.class != Reg
2326 && t0.bitfield.class != RegSIMD)))
2327 return 1;
2328
2329 if (g1.bitfield.class != Reg
2330 && g1.bitfield.class != RegSIMD
2331 && (!operand_type_check (g1, anymem)
2332 || g1.bitfield.unspecified
2333 || (t1.bitfield.class != Reg
2334 && t1.bitfield.class != RegSIMD)))
2335 return 1;
2336
2337 if (g0.bitfield.byte == g1.bitfield.byte
2338 && g0.bitfield.word == g1.bitfield.word
2339 && g0.bitfield.dword == g1.bitfield.dword
2340 && g0.bitfield.qword == g1.bitfield.qword
2341 && g0.bitfield.xmmword == g1.bitfield.xmmword
2342 && g0.bitfield.ymmword == g1.bitfield.ymmword
2343 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2344 return 1;
2345
2346 if (!(t0.bitfield.byte & t1.bitfield.byte)
2347 && !(t0.bitfield.word & t1.bitfield.word)
2348 && !(t0.bitfield.dword & t1.bitfield.dword)
2349 && !(t0.bitfield.qword & t1.bitfield.qword)
2350 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2351 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2352 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2353 return 1;
2354
2355 i.error = register_type_mismatch;
2356
2357 return 0;
2358 }
2359
2360 static INLINE unsigned int
2361 register_number (const reg_entry *r)
2362 {
2363 unsigned int nr = r->reg_num;
2364
2365 if (r->reg_flags & RegRex)
2366 nr += 8;
2367
2368 if (r->reg_flags & RegVRex)
2369 nr += 16;
2370
2371 return nr;
2372 }
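
/* For example, %r12 is stored as reg_num 4 with RegRex set and maps
to 12, while %xmm20 is stored as reg_num 4 with RegVRex set and
maps to 20. */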
2373
2374 static INLINE unsigned int
2375 mode_from_disp_size (i386_operand_type t)
2376 {
2377 if (t.bitfield.disp8)
2378 return 1;
2379 else if (t.bitfield.disp16
2380 || t.bitfield.disp32
2381 || t.bitfield.disp32s)
2382 return 2;
2383 else
2384 return 0;
2385 }
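
/* The value is the initial ModRM.mode guess: a Disp8 operand yields 1
(one trailing displacement byte), Disp16/Disp32/Disp32S yield 2 (a
two- or four-byte displacement, depending on address size), and 0
means no displacement at all. */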
2386
2387 static INLINE int
2388 fits_in_signed_byte (addressT num)
2389 {
2390 return num + 0x80 <= 0xff;
2391 }
2392
2393 static INLINE int
2394 fits_in_unsigned_byte (addressT num)
2395 {
2396 return num <= 0xff;
2397 }
2398
2399 static INLINE int
2400 fits_in_unsigned_word (addressT num)
2401 {
2402 return num <= 0xffff;
2403 }
2404
2405 static INLINE int
2406 fits_in_signed_word (addressT num)
2407 {
2408 return num + 0x8000 <= 0xffff;
2409 }
2410
2411 static INLINE int
2412 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2413 {
2414 #ifndef BFD64
2415 return 1;
2416 #else
2417 return num + 0x80000000 <= 0xffffffff;
2418 #endif
2419 } /* fits_in_signed_long() */
2420
2421 static INLINE int
2422 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2423 {
2424 #ifndef BFD64
2425 return 1;
2426 #else
2427 return num <= 0xffffffff;
2428 #endif
2429 } /* fits_in_unsigned_long() */
2430
2431 static INLINE int
2432 fits_in_disp8 (offsetT num)
2433 {
2434 int shift = i.memshift;
2435 unsigned int mask;
2436
2437 if (shift == -1)
2438 abort ();
2439
2440 mask = (1 << shift) - 1;
2441
2442 /* Return 0 if NUM isn't properly aligned. */
2443 if ((num & mask))
2444 return 0;
2445
2446 /* Check if NUM will fit in 8bit after shift. */
2447 return fits_in_signed_byte (num >> shift);
2448 }
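
/* Worked example: for an EVEX insn whose memory operand covers 64
bytes, i.memshift is 6. A displacement of 256 is aligned
(256 & 63 == 0) and 256 >> 6 == 4 fits in a signed byte, so it can
be emitted as the compressed disp8 value 4; a displacement of 260
fails the alignment check and needs a full disp32. */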
2449
2450 static INLINE int
2451 fits_in_imm4 (offsetT num)
2452 {
2453 return (num & 0xf) == num;
2454 }
2455
2456 static i386_operand_type
2457 smallest_imm_type (offsetT num)
2458 {
2459 i386_operand_type t;
2460
2461 operand_type_set (&t, 0);
2462 t.bitfield.imm64 = 1;
2463
2464 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2465 {
2466 /* This code is disabled on the 486 because all the Imm1 forms
2467 in the opcode table are slower on the i486. They're the
2468 versions with the implicitly specified single-position
2469 displacement, which has another syntax if you really want to
2470 use that form. */
2471 t.bitfield.imm1 = 1;
2472 t.bitfield.imm8 = 1;
2473 t.bitfield.imm8s = 1;
2474 t.bitfield.imm16 = 1;
2475 t.bitfield.imm32 = 1;
2476 t.bitfield.imm32s = 1;
2477 }
2478 else if (fits_in_signed_byte (num))
2479 {
2480 t.bitfield.imm8 = 1;
2481 t.bitfield.imm8s = 1;
2482 t.bitfield.imm16 = 1;
2483 t.bitfield.imm32 = 1;
2484 t.bitfield.imm32s = 1;
2485 }
2486 else if (fits_in_unsigned_byte (num))
2487 {
2488 t.bitfield.imm8 = 1;
2489 t.bitfield.imm16 = 1;
2490 t.bitfield.imm32 = 1;
2491 t.bitfield.imm32s = 1;
2492 }
2493 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2494 {
2495 t.bitfield.imm16 = 1;
2496 t.bitfield.imm32 = 1;
2497 t.bitfield.imm32s = 1;
2498 }
2499 else if (fits_in_signed_long (num))
2500 {
2501 t.bitfield.imm32 = 1;
2502 t.bitfield.imm32s = 1;
2503 }
2504 else if (fits_in_unsigned_long (num))
2505 t.bitfield.imm32 = 1;
2506
2507 return t;
2508 }
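
/* Sample classifications: 1 additionally gets Imm1 (except when
tuning for the i486); 0x80 fits an unsigned but not a signed byte,
so it gets imm8/imm16/imm32/imm32s but not imm8s; and 0x123456789
fits no 32-bit type and keeps only the initial imm64 bit. */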
2509
2510 static offsetT
2511 offset_in_range (offsetT val, int size)
2512 {
2513 addressT mask;
2514
2515 switch (size)
2516 {
2517 case 1: mask = ((addressT) 1 << 8) - 1; break;
2518 case 2: mask = ((addressT) 1 << 16) - 1; break;
2519 case 4: mask = ((addressT) 2 << 31) - 1; break;
2520 #ifdef BFD64
2521 case 8: mask = ((addressT) 2 << 63) - 1; break;
2522 #endif
2523 default: abort ();
2524 }
2525
2526 #ifdef BFD64
2527 /* If BFD64, sign extend val for 32bit address mode. */
2528 if (flag_code != CODE_64BIT
2529 || i.prefix[ADDR_PREFIX])
2530 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2531 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2532 #endif
2533
2534 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2535 {
2536 char buf1[40], buf2[40];
2537
2538 sprint_value (buf1, val);
2539 sprint_value (buf2, val & mask);
2540 as_warn (_("%s shortened to %s"), buf1, buf2);
2541 }
2542 return val & mask;
2543 }
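
/* For instance, offset_in_range (0x1234, 1) warns that 0x1234 was
shortened and returns 0x34, whereas offset_in_range (-1, 2) returns
0xffff silently because every discarded bit is a copy of the sign
bit. */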
2544
2545 enum PREFIX_GROUP
2546 {
2547 PREFIX_EXIST = 0,
2548 PREFIX_LOCK,
2549 PREFIX_REP,
2550 PREFIX_DS,
2551 PREFIX_OTHER
2552 };
2553
2554 /* Returns
2555 a. PREFIX_EXIST if attempting to add a prefix where one from the
2556 same class already exists.
2557 b. PREFIX_LOCK if lock prefix is added.
2558 c. PREFIX_REP if rep/repne prefix is added.
2559 d. PREFIX_DS if ds prefix is added.
2560 e. PREFIX_OTHER if other prefix is added.
2561 */
2562
2563 static enum PREFIX_GROUP
2564 add_prefix (unsigned int prefix)
2565 {
2566 enum PREFIX_GROUP ret = PREFIX_OTHER;
2567 unsigned int q;
2568
2569 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2570 && flag_code == CODE_64BIT)
2571 {
2572 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2573 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2574 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2575 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2576 ret = PREFIX_EXIST;
2577 q = REX_PREFIX;
2578 }
2579 else
2580 {
2581 switch (prefix)
2582 {
2583 default:
2584 abort ();
2585
2586 case DS_PREFIX_OPCODE:
2587 ret = PREFIX_DS;
2588 /* Fall through. */
2589 case CS_PREFIX_OPCODE:
2590 case ES_PREFIX_OPCODE:
2591 case FS_PREFIX_OPCODE:
2592 case GS_PREFIX_OPCODE:
2593 case SS_PREFIX_OPCODE:
2594 q = SEG_PREFIX;
2595 break;
2596
2597 case REPNE_PREFIX_OPCODE:
2598 case REPE_PREFIX_OPCODE:
2599 q = REP_PREFIX;
2600 ret = PREFIX_REP;
2601 break;
2602
2603 case LOCK_PREFIX_OPCODE:
2604 q = LOCK_PREFIX;
2605 ret = PREFIX_LOCK;
2606 break;
2607
2608 case FWAIT_OPCODE:
2609 q = WAIT_PREFIX;
2610 break;
2611
2612 case ADDR_PREFIX_OPCODE:
2613 q = ADDR_PREFIX;
2614 break;
2615
2616 case DATA_PREFIX_OPCODE:
2617 q = DATA_PREFIX;
2618 break;
2619 }
2620 if (i.prefix[q] != 0)
2621 ret = PREFIX_EXIST;
2622 }
2623
2624 if (ret)
2625 {
2626 if (!i.prefix[q])
2627 ++i.prefixes;
2628 i.prefix[q] |= prefix;
2629 }
2630 else
2631 as_bad (_("same type of prefix used twice"));
2632
2633 return ret;
2634 }
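
/* Usage sketch: add_prefix (LOCK_PREFIX_OPCODE) stores 0xf0 in
i.prefix[LOCK_PREFIX] and returns PREFIX_LOCK; a second call for
the same insn finds that slot occupied, emits "same type of prefix
used twice" and returns PREFIX_EXIST. */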
2635
2636 static void
2637 update_code_flag (int value, int check)
2638 {
2639 PRINTF_LIKE ((*as_error));
2640
2641 flag_code = (enum flag_code) value;
2642 if (flag_code == CODE_64BIT)
2643 {
2644 cpu_arch_flags.bitfield.cpu64 = 1;
2645 cpu_arch_flags.bitfield.cpuno64 = 0;
2646 }
2647 else
2648 {
2649 cpu_arch_flags.bitfield.cpu64 = 0;
2650 cpu_arch_flags.bitfield.cpuno64 = 1;
2651 }
2652 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2653 {
2654 if (check)
2655 as_error = as_fatal;
2656 else
2657 as_error = as_bad;
2658 (*as_error) (_("64bit mode not supported on `%s'."),
2659 cpu_arch_name ? cpu_arch_name : default_arch);
2660 }
2661 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2662 {
2663 if (check)
2664 as_error = as_fatal;
2665 else
2666 as_error = as_bad;
2667 (*as_error) (_("32bit mode not supported on `%s'."),
2668 cpu_arch_name ? cpu_arch_name : default_arch);
2669 }
2670 stackop_size = '\0';
2671 }
2672
2673 static void
2674 set_code_flag (int value)
2675 {
2676 update_code_flag (value, 0);
2677 }
2678
2679 static void
2680 set_16bit_gcc_code_flag (int new_code_flag)
2681 {
2682 flag_code = (enum flag_code) new_code_flag;
2683 if (flag_code != CODE_16BIT)
2684 abort ();
2685 cpu_arch_flags.bitfield.cpu64 = 0;
2686 cpu_arch_flags.bitfield.cpuno64 = 1;
2687 stackop_size = LONG_MNEM_SUFFIX;
2688 }
2689
2690 static void
2691 set_intel_syntax (int syntax_flag)
2692 {
2693 /* Find out if register prefixing is specified. */
2694 int ask_naked_reg = 0;
2695
2696 SKIP_WHITESPACE ();
2697 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2698 {
2699 char *string;
2700 int e = get_symbol_name (&string);
2701
2702 if (strcmp (string, "prefix") == 0)
2703 ask_naked_reg = 1;
2704 else if (strcmp (string, "noprefix") == 0)
2705 ask_naked_reg = -1;
2706 else
2707 as_bad (_("bad argument to syntax directive."));
2708 (void) restore_line_pointer (e);
2709 }
2710 demand_empty_rest_of_line ();
2711
2712 intel_syntax = syntax_flag;
2713
2714 if (ask_naked_reg == 0)
2715 allow_naked_reg = (intel_syntax
2716 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2717 else
2718 allow_naked_reg = (ask_naked_reg < 0);
2719
2720 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2721
2722 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2723 identifier_chars['$'] = intel_syntax ? '$' : 0;
2724 register_prefix = allow_naked_reg ? "" : "%";
2725 }
2726
2727 static void
2728 set_intel_mnemonic (int mnemonic_flag)
2729 {
2730 intel_mnemonic = mnemonic_flag;
2731 }
2732
2733 static void
2734 set_allow_index_reg (int flag)
2735 {
2736 allow_index_reg = flag;
2737 }
2738
2739 static void
2740 set_check (int what)
2741 {
2742 enum check_kind *kind;
2743 const char *str;
2744
2745 if (what)
2746 {
2747 kind = &operand_check;
2748 str = "operand";
2749 }
2750 else
2751 {
2752 kind = &sse_check;
2753 str = "sse";
2754 }
2755
2756 SKIP_WHITESPACE ();
2757
2758 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2759 {
2760 char *string;
2761 int e = get_symbol_name (&string);
2762
2763 if (strcmp (string, "none") == 0)
2764 *kind = check_none;
2765 else if (strcmp (string, "warning") == 0)
2766 *kind = check_warning;
2767 else if (strcmp (string, "error") == 0)
2768 *kind = check_error;
2769 else
2770 as_bad (_("bad argument to %s_check directive."), str);
2771 (void) restore_line_pointer (e);
2772 }
2773 else
2774 as_bad (_("missing argument for %s_check directive"), str);
2775
2776 demand_empty_rest_of_line ();
2777 }
2778
2779 static void
2780 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2781 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2782 {
2783 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2784 static const char *arch;
2785
2786 /* Intel L1OM is only supported on ELF. */
2787 if (!IS_ELF)
2788 return;
2789
2790 if (!arch)
2791 {
2792 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2793 use default_arch. */
2794 arch = cpu_arch_name;
2795 if (!arch)
2796 arch = default_arch;
2797 }
2798
2799 /* If we are targeting Intel MCU, we must enable it. */
2800 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2801 || new_flag.bitfield.cpuiamcu)
2802 return;
2803
2804 /* If we are targeting Intel L1OM, we must enable it. */
2805 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2806 || new_flag.bitfield.cpul1om)
2807 return;
2808
2809 /* If we are targeting Intel K1OM, we must enable it. */
2810 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2811 || new_flag.bitfield.cpuk1om)
2812 return;
2813
2814 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2815 #endif
2816 }
2817
2818 static void
2819 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2820 {
2821 SKIP_WHITESPACE ();
2822
2823 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2824 {
2825 char *string;
2826 int e = get_symbol_name (&string);
2827 unsigned int j;
2828 i386_cpu_flags flags;
2829
2830 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2831 {
2832 if (strcmp (string, cpu_arch[j].name) == 0)
2833 {
2834 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2835
2836 if (*string != '.')
2837 {
2838 cpu_arch_name = cpu_arch[j].name;
2839 cpu_sub_arch_name = NULL;
2840 cpu_arch_flags = cpu_arch[j].flags;
2841 if (flag_code == CODE_64BIT)
2842 {
2843 cpu_arch_flags.bitfield.cpu64 = 1;
2844 cpu_arch_flags.bitfield.cpuno64 = 0;
2845 }
2846 else
2847 {
2848 cpu_arch_flags.bitfield.cpu64 = 0;
2849 cpu_arch_flags.bitfield.cpuno64 = 1;
2850 }
2851 cpu_arch_isa = cpu_arch[j].type;
2852 cpu_arch_isa_flags = cpu_arch[j].flags;
2853 if (!cpu_arch_tune_set)
2854 {
2855 cpu_arch_tune = cpu_arch_isa;
2856 cpu_arch_tune_flags = cpu_arch_isa_flags;
2857 }
2858 break;
2859 }
2860
2861 flags = cpu_flags_or (cpu_arch_flags,
2862 cpu_arch[j].flags);
2863
2864 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2865 {
2866 if (cpu_sub_arch_name)
2867 {
2868 char *name = cpu_sub_arch_name;
2869 cpu_sub_arch_name = concat (name,
2870 cpu_arch[j].name,
2871 (const char *) NULL);
2872 free (name);
2873 }
2874 else
2875 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2876 cpu_arch_flags = flags;
2877 cpu_arch_isa_flags = flags;
2878 }
2879 else
2880 cpu_arch_isa_flags
2881 = cpu_flags_or (cpu_arch_isa_flags,
2882 cpu_arch[j].flags);
2883 (void) restore_line_pointer (e);
2884 demand_empty_rest_of_line ();
2885 return;
2886 }
2887 }
2888
2889 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2890 {
2891 /* Disable an ISA extension. */
2892 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2893 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2894 {
2895 flags = cpu_flags_and_not (cpu_arch_flags,
2896 cpu_noarch[j].flags);
2897 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2898 {
2899 if (cpu_sub_arch_name)
2900 {
2901 char *name = cpu_sub_arch_name;
2902 cpu_sub_arch_name = concat (name, string,
2903 (const char *) NULL);
2904 free (name);
2905 }
2906 else
2907 cpu_sub_arch_name = xstrdup (string);
2908 cpu_arch_flags = flags;
2909 cpu_arch_isa_flags = flags;
2910 }
2911 (void) restore_line_pointer (e);
2912 demand_empty_rest_of_line ();
2913 return;
2914 }
2915
2916 j = ARRAY_SIZE (cpu_arch);
2917 }
2918
2919 if (j >= ARRAY_SIZE (cpu_arch))
2920 as_bad (_("no such architecture: `%s'"), string);
2921
2922 *input_line_pointer = e;
2923 }
2924 else
2925 as_bad (_("missing cpu architecture"));
2926
2927 no_cond_jump_promotion = 0;
2928 if (*input_line_pointer == ','
2929 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2930 {
2931 char *string;
2932 char e;
2933
2934 ++input_line_pointer;
2935 e = get_symbol_name (&string);
2936
2937 if (strcmp (string, "nojumps") == 0)
2938 no_cond_jump_promotion = 1;
2939 else if (strcmp (string, "jumps") == 0)
2940 ;
2941 else
2942 as_bad (_("no such architecture modifier: `%s'"), string);
2943
2944 (void) restore_line_pointer (e);
2945 }
2946
2947 demand_empty_rest_of_line ();
2948 }
2949
2950 enum bfd_architecture
2951 i386_arch (void)
2952 {
2953 if (cpu_arch_isa == PROCESSOR_L1OM)
2954 {
2955 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2956 || flag_code != CODE_64BIT)
2957 as_fatal (_("Intel L1OM is 64bit ELF only"));
2958 return bfd_arch_l1om;
2959 }
2960 else if (cpu_arch_isa == PROCESSOR_K1OM)
2961 {
2962 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2963 || flag_code != CODE_64BIT)
2964 as_fatal (_("Intel K1OM is 64bit ELF only"));
2965 return bfd_arch_k1om;
2966 }
2967 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2968 {
2969 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2970 || flag_code == CODE_64BIT)
2971 as_fatal (_("Intel MCU is 32bit ELF only"));
2972 return bfd_arch_iamcu;
2973 }
2974 else
2975 return bfd_arch_i386;
2976 }
2977
2978 unsigned long
2979 i386_mach (void)
2980 {
2981 if (!strncmp (default_arch, "x86_64", 6))
2982 {
2983 if (cpu_arch_isa == PROCESSOR_L1OM)
2984 {
2985 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986 || default_arch[6] != '\0')
2987 as_fatal (_("Intel L1OM is 64bit ELF only"));
2988 return bfd_mach_l1om;
2989 }
2990 else if (cpu_arch_isa == PROCESSOR_K1OM)
2991 {
2992 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2993 || default_arch[6] != '\0')
2994 as_fatal (_("Intel K1OM is 64bit ELF only"));
2995 return bfd_mach_k1om;
2996 }
2997 else if (default_arch[6] == '\0')
2998 return bfd_mach_x86_64;
2999 else
3000 return bfd_mach_x64_32;
3001 }
3002 else if (!strcmp (default_arch, "i386")
3003 || !strcmp (default_arch, "iamcu"))
3004 {
3005 if (cpu_arch_isa == PROCESSOR_IAMCU)
3006 {
3007 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3008 as_fatal (_("Intel MCU is 32bit ELF only"));
3009 return bfd_mach_i386_iamcu;
3010 }
3011 else
3012 return bfd_mach_i386_i386;
3013 }
3014 else
3015 as_fatal (_("unknown architecture"));
3016 }
3017 \f
3018 void
3019 md_begin (void)
3020 {
3021 const char *hash_err;
3022
3023 /* Support pseudo prefixes like {disp32}. */
3024 lex_type ['{'] = LEX_BEGIN_NAME;
3025
3026 /* Initialize op_hash hash table. */
3027 op_hash = hash_new ();
3028
3029 {
3030 const insn_template *optab;
3031 templates *core_optab;
3032
3033 /* Setup for loop. */
3034 optab = i386_optab;
3035 core_optab = XNEW (templates);
3036 core_optab->start = optab;
3037
3038 while (1)
3039 {
3040 ++optab;
3041 if (optab->name == NULL
3042 || strcmp (optab->name, (optab - 1)->name) != 0)
3043 {
3044 /* different name --> ship out current template list;
3045 add to hash table; & begin anew. */
3046 core_optab->end = optab;
3047 hash_err = hash_insert (op_hash,
3048 (optab - 1)->name,
3049 (void *) core_optab);
3050 if (hash_err)
3051 {
3052 as_fatal (_("can't hash %s: %s"),
3053 (optab - 1)->name,
3054 hash_err);
3055 }
3056 if (optab->name == NULL)
3057 break;
3058 core_optab = XNEW (templates);
3059 core_optab->start = optab;
3060 }
3061 }
3062 }
3063
3064 /* Initialize reg_hash hash table. */
3065 reg_hash = hash_new ();
3066 {
3067 const reg_entry *regtab;
3068 unsigned int regtab_size = i386_regtab_size;
3069
3070 for (regtab = i386_regtab; regtab_size--; regtab++)
3071 {
3072 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3073 if (hash_err)
3074 as_fatal (_("can't hash %s: %s"),
3075 regtab->reg_name,
3076 hash_err);
3077 }
3078 }
3079
3080 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3081 {
3082 int c;
3083 char *p;
3084
3085 for (c = 0; c < 256; c++)
3086 {
3087 if (ISDIGIT (c))
3088 {
3089 digit_chars[c] = c;
3090 mnemonic_chars[c] = c;
3091 register_chars[c] = c;
3092 operand_chars[c] = c;
3093 }
3094 else if (ISLOWER (c))
3095 {
3096 mnemonic_chars[c] = c;
3097 register_chars[c] = c;
3098 operand_chars[c] = c;
3099 }
3100 else if (ISUPPER (c))
3101 {
3102 mnemonic_chars[c] = TOLOWER (c);
3103 register_chars[c] = mnemonic_chars[c];
3104 operand_chars[c] = c;
3105 }
3106 else if (c == '{' || c == '}')
3107 {
3108 mnemonic_chars[c] = c;
3109 operand_chars[c] = c;
3110 }
3111
3112 if (ISALPHA (c) || ISDIGIT (c))
3113 identifier_chars[c] = c;
3114 else if (c >= 128)
3115 {
3116 identifier_chars[c] = c;
3117 operand_chars[c] = c;
3118 }
3119 }
3120
3121 #ifdef LEX_AT
3122 identifier_chars['@'] = '@';
3123 #endif
3124 #ifdef LEX_QM
3125 identifier_chars['?'] = '?';
3126 operand_chars['?'] = '?';
3127 #endif
3128 digit_chars['-'] = '-';
3129 mnemonic_chars['_'] = '_';
3130 mnemonic_chars['-'] = '-';
3131 mnemonic_chars['.'] = '.';
3132 identifier_chars['_'] = '_';
3133 identifier_chars['.'] = '.';
3134
3135 for (p = operand_special_chars; *p != '\0'; p++)
3136 operand_chars[(unsigned char) *p] = *p;
3137 }
3138
3139 if (flag_code == CODE_64BIT)
3140 {
3141 #if defined (OBJ_COFF) && defined (TE_PE)
3142 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3143 ? 32 : 16);
3144 #else
3145 x86_dwarf2_return_column = 16;
3146 #endif
3147 x86_cie_data_alignment = -8;
3148 }
3149 else
3150 {
3151 x86_dwarf2_return_column = 8;
3152 x86_cie_data_alignment = -4;
3153 }
3154
3155 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3156 can be turned into BRANCH_PREFIX frag. */
3157 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3158 abort ();
3159 }
3160
3161 void
3162 i386_print_statistics (FILE *file)
3163 {
3164 hash_print_statistics (file, "i386 opcode", op_hash);
3165 hash_print_statistics (file, "i386 register", reg_hash);
3166 }
3167 \f
3168 #ifdef DEBUG386
3169
3170 /* Debugging routines for md_assemble. */
3171 static void pte (insn_template *);
3172 static void pt (i386_operand_type);
3173 static void pe (expressionS *);
3174 static void ps (symbolS *);
3175
3176 static void
3177 pi (const char *line, i386_insn *x)
3178 {
3179 unsigned int j;
3180
3181 fprintf (stdout, "%s: template ", line);
3182 pte (&x->tm);
3183 fprintf (stdout, " address: base %s index %s scale %x\n",
3184 x->base_reg ? x->base_reg->reg_name : "none",
3185 x->index_reg ? x->index_reg->reg_name : "none",
3186 x->log2_scale_factor);
3187 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3188 x->rm.mode, x->rm.reg, x->rm.regmem);
3189 fprintf (stdout, " sib: base %x index %x scale %x\n",
3190 x->sib.base, x->sib.index, x->sib.scale);
3191 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3192 (x->rex & REX_W) != 0,
3193 (x->rex & REX_R) != 0,
3194 (x->rex & REX_X) != 0,
3195 (x->rex & REX_B) != 0);
3196 for (j = 0; j < x->operands; j++)
3197 {
3198 fprintf (stdout, " #%d: ", j + 1);
3199 pt (x->types[j]);
3200 fprintf (stdout, "\n");
3201 if (x->types[j].bitfield.class == Reg
3202 || x->types[j].bitfield.class == RegMMX
3203 || x->types[j].bitfield.class == RegSIMD
3204 || x->types[j].bitfield.class == RegMask
3205 || x->types[j].bitfield.class == SReg
3206 || x->types[j].bitfield.class == RegCR
3207 || x->types[j].bitfield.class == RegDR
3208 || x->types[j].bitfield.class == RegTR
3209 || x->types[j].bitfield.class == RegBND)
3210 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3211 if (operand_type_check (x->types[j], imm))
3212 pe (x->op[j].imms);
3213 if (operand_type_check (x->types[j], disp))
3214 pe (x->op[j].disps);
3215 }
3216 }
3217
3218 static void
3219 pte (insn_template *t)
3220 {
3221 unsigned int j;
3222 fprintf (stdout, " %d operands ", t->operands);
3223 fprintf (stdout, "opcode %x ", t->base_opcode);
3224 if (t->extension_opcode != None)
3225 fprintf (stdout, "ext %x ", t->extension_opcode);
3226 if (t->opcode_modifier.d)
3227 fprintf (stdout, "D");
3228 if (t->opcode_modifier.w)
3229 fprintf (stdout, "W");
3230 fprintf (stdout, "\n");
3231 for (j = 0; j < t->operands; j++)
3232 {
3233 fprintf (stdout, " #%d type ", j + 1);
3234 pt (t->operand_types[j]);
3235 fprintf (stdout, "\n");
3236 }
3237 }
3238
3239 static void
3240 pe (expressionS *e)
3241 {
3242 fprintf (stdout, " operation %d\n", e->X_op);
3243 fprintf (stdout, " add_number %ld (%lx)\n",
3244 (long) e->X_add_number, (long) e->X_add_number);
3245 if (e->X_add_symbol)
3246 {
3247 fprintf (stdout, " add_symbol ");
3248 ps (e->X_add_symbol);
3249 fprintf (stdout, "\n");
3250 }
3251 if (e->X_op_symbol)
3252 {
3253 fprintf (stdout, " op_symbol ");
3254 ps (e->X_op_symbol);
3255 fprintf (stdout, "\n");
3256 }
3257 }
3258
3259 static void
3260 ps (symbolS *s)
3261 {
3262 fprintf (stdout, "%s type %s%s",
3263 S_GET_NAME (s),
3264 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3265 segment_name (S_GET_SEGMENT (s)));
3266 }
3267
3268 static struct type_name
3269 {
3270 i386_operand_type mask;
3271 const char *name;
3272 }
3273 const type_names[] =
3274 {
3275 { OPERAND_TYPE_REG8, "r8" },
3276 { OPERAND_TYPE_REG16, "r16" },
3277 { OPERAND_TYPE_REG32, "r32" },
3278 { OPERAND_TYPE_REG64, "r64" },
3279 { OPERAND_TYPE_ACC8, "acc8" },
3280 { OPERAND_TYPE_ACC16, "acc16" },
3281 { OPERAND_TYPE_ACC32, "acc32" },
3282 { OPERAND_TYPE_ACC64, "acc64" },
3283 { OPERAND_TYPE_IMM8, "i8" },
3284 { OPERAND_TYPE_IMM8S, "i8s" },
3285 { OPERAND_TYPE_IMM16, "i16" },
3286 { OPERAND_TYPE_IMM32, "i32" },
3287 { OPERAND_TYPE_IMM32S, "i32s" },
3288 { OPERAND_TYPE_IMM64, "i64" },
3289 { OPERAND_TYPE_IMM1, "i1" },
3290 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3291 { OPERAND_TYPE_DISP8, "d8" },
3292 { OPERAND_TYPE_DISP16, "d16" },
3293 { OPERAND_TYPE_DISP32, "d32" },
3294 { OPERAND_TYPE_DISP32S, "d32s" },
3295 { OPERAND_TYPE_DISP64, "d64" },
3296 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3297 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3298 { OPERAND_TYPE_CONTROL, "control reg" },
3299 { OPERAND_TYPE_TEST, "test reg" },
3300 { OPERAND_TYPE_DEBUG, "debug reg" },
3301 { OPERAND_TYPE_FLOATREG, "FReg" },
3302 { OPERAND_TYPE_FLOATACC, "FAcc" },
3303 { OPERAND_TYPE_SREG, "SReg" },
3304 { OPERAND_TYPE_REGMMX, "rMMX" },
3305 { OPERAND_TYPE_REGXMM, "rXMM" },
3306 { OPERAND_TYPE_REGYMM, "rYMM" },
3307 { OPERAND_TYPE_REGZMM, "rZMM" },
3308 { OPERAND_TYPE_REGMASK, "Mask reg" },
3309 };
3310
3311 static void
3312 pt (i386_operand_type t)
3313 {
3314 unsigned int j;
3315 i386_operand_type a;
3316
3317 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3318 {
3319 a = operand_type_and (t, type_names[j].mask);
3320 if (operand_type_equal (&a, &type_names[j].mask))
3321 fprintf (stdout, "%s, ", type_names[j].name);
3322 }
3323 fflush (stdout);
3324 }
3325
3326 #endif /* DEBUG386 */
3327 \f
3328 static bfd_reloc_code_real_type
3329 reloc (unsigned int size,
3330 int pcrel,
3331 int sign,
3332 bfd_reloc_code_real_type other)
3333 {
3334 if (other != NO_RELOC)
3335 {
3336 reloc_howto_type *rel;
3337
3338 if (size == 8)
3339 switch (other)
3340 {
3341 case BFD_RELOC_X86_64_GOT32:
3342 return BFD_RELOC_X86_64_GOT64;
3344 case BFD_RELOC_X86_64_GOTPLT64:
3345 return BFD_RELOC_X86_64_GOTPLT64;
3347 case BFD_RELOC_X86_64_PLTOFF64:
3348 return BFD_RELOC_X86_64_PLTOFF64;
3350 case BFD_RELOC_X86_64_GOTPC32:
3351 other = BFD_RELOC_X86_64_GOTPC64;
3352 break;
3353 case BFD_RELOC_X86_64_GOTPCREL:
3354 other = BFD_RELOC_X86_64_GOTPCREL64;
3355 break;
3356 case BFD_RELOC_X86_64_TPOFF32:
3357 other = BFD_RELOC_X86_64_TPOFF64;
3358 break;
3359 case BFD_RELOC_X86_64_DTPOFF32:
3360 other = BFD_RELOC_X86_64_DTPOFF64;
3361 break;
3362 default:
3363 break;
3364 }
3365
3366 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3367 if (other == BFD_RELOC_SIZE32)
3368 {
3369 if (size == 8)
3370 other = BFD_RELOC_SIZE64;
3371 if (pcrel)
3372 {
3373 as_bad (_("there are no pc-relative size relocations"));
3374 return NO_RELOC;
3375 }
3376 }
3377 #endif
3378
3379 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3380 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3381 sign = -1;
3382
3383 rel = bfd_reloc_type_lookup (stdoutput, other);
3384 if (!rel)
3385 as_bad (_("unknown relocation (%u)"), other);
3386 else if (size != bfd_get_reloc_size (rel))
3387 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3388 bfd_get_reloc_size (rel),
3389 size);
3390 else if (pcrel && !rel->pc_relative)
3391 as_bad (_("non-pc-relative relocation for pc-relative field"));
3392 else if ((rel->complain_on_overflow == complain_overflow_signed
3393 && !sign)
3394 || (rel->complain_on_overflow == complain_overflow_unsigned
3395 && sign > 0))
3396 as_bad (_("relocated field and relocation type differ in signedness"));
3397 else
3398 return other;
3399 return NO_RELOC;
3400 }
3401
3402 if (pcrel)
3403 {
3404 if (!sign)
3405 as_bad (_("there are no unsigned pc-relative relocations"));
3406 switch (size)
3407 {
3408 case 1: return BFD_RELOC_8_PCREL;
3409 case 2: return BFD_RELOC_16_PCREL;
3410 case 4: return BFD_RELOC_32_PCREL;
3411 case 8: return BFD_RELOC_64_PCREL;
3412 }
3413 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3414 }
3415 else
3416 {
3417 if (sign > 0)
3418 switch (size)
3419 {
3420 case 4: return BFD_RELOC_X86_64_32S;
3421 }
3422 else
3423 switch (size)
3424 {
3425 case 1: return BFD_RELOC_8;
3426 case 2: return BFD_RELOC_16;
3427 case 4: return BFD_RELOC_32;
3428 case 8: return BFD_RELOC_64;
3429 }
3430 as_bad (_("cannot do %s %u byte relocation"),
3431 sign > 0 ? "signed" : "unsigned", size);
3432 }
3433
3434 return NO_RELOC;
3435 }
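
/* Examples of the fallback mapping when OTHER is NO_RELOC: a signed
4-byte pc-relative fixup becomes BFD_RELOC_32_PCREL, a signed
4-byte absolute fixup becomes BFD_RELOC_X86_64_32S, and an unsigned
4-byte absolute fixup becomes BFD_RELOC_32. */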
3436
3437 /* Here we decide which fixups can be adjusted to make them relative to
3438 the beginning of the section instead of the symbol. Basically we need
3439 to make sure that the dynamic relocations are done correctly, so in
3440 some cases we force the original symbol to be used. */
3441
3442 int
3443 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3444 {
3445 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3446 if (!IS_ELF)
3447 return 1;
3448
3449 /* Don't adjust pc-relative references to merge sections in 64-bit
3450 mode. */
3451 if (use_rela_relocations
3452 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3453 && fixP->fx_pcrel)
3454 return 0;
3455
3456 /* x86_64 GOTPCREL relocations are represented as 32bit PCrel
3457 relocations and changed later by validate_fix. */
3458 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3459 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3460 return 0;
3461
3462 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3463 for size relocations. */
3464 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3465 || fixP->fx_r_type == BFD_RELOC_SIZE64
3466 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3467 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3468 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3469 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3470 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3471 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3472 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3473 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3474 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3475 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3476 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3477 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3478 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3479 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3480 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3481 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3482 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3483 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3484 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3485 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3486 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3487 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3488 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3489 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3490 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3491 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3492 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3493 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3494 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3495 return 0;
3496 #endif
3497 return 1;
3498 }
3499
3500 static int
3501 intel_float_operand (const char *mnemonic)
3502 {
3503 /* Note that the value returned is meaningful only for opcodes with (memory)
3504 operands, hence the code here is free to improperly handle opcodes that
3505 have no operands (for better performance and smaller code). */
3506
3507 if (mnemonic[0] != 'f')
3508 return 0; /* non-math */
3509
3510 switch (mnemonic[1])
3511 {
3512 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3513 the fs segment override prefix are not currently handled because
3514 no call path can make opcodes without operands get here. */
3515 case 'i':
3516 return 2 /* integer op */;
3517 case 'l':
3518 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3519 return 3; /* fldcw/fldenv */
3520 break;
3521 case 'n':
3522 if (mnemonic[2] != 'o' /* fnop */)
3523 return 3; /* non-waiting control op */
3524 break;
3525 case 'r':
3526 if (mnemonic[2] == 's')
3527 return 3; /* frstor/frstpm */
3528 break;
3529 case 's':
3530 if (mnemonic[2] == 'a')
3531 return 3; /* fsave */
3532 if (mnemonic[2] == 't')
3533 {
3534 switch (mnemonic[3])
3535 {
3536 case 'c': /* fstcw */
3537 case 'd': /* fstdw */
3538 case 'e': /* fstenv */
3539 case 's': /* fsts[gw] */
3540 return 3;
3541 }
3542 }
3543 break;
3544 case 'x':
3545 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3546 return 0; /* fxsave/fxrstor are not really math ops */
3547 break;
3548 }
3549
3550 return 1;
3551 }
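
/* Sample classifications: "fadd" returns 1 (plain FPU math op),
"fiadd" returns 2 (integer operand), "fldcw" returns 3 (control
op), and "fxsave" returns 0 since it is not treated as a math
op. */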
3552
3553 /* Build the VEX prefix. */
3554
3555 static void
3556 build_vex_prefix (const insn_template *t)
3557 {
3558 unsigned int register_specifier;
3559 unsigned int implied_prefix;
3560 unsigned int vector_length;
3561 unsigned int w;
3562
3563 /* Check register specifier. */
3564 if (i.vex.register_specifier)
3565 {
3566 register_specifier =
3567 ~register_number (i.vex.register_specifier) & 0xf;
3568 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3569 }
3570 else
3571 register_specifier = 0xf;
3572
3573 /* Use 2-byte VEX prefix by swapping destination and source operand
3574 if there is more than one register operand. */
3575 if (i.reg_operands > 1
3576 && i.vec_encoding != vex_encoding_vex3
3577 && i.dir_encoding == dir_encoding_default
3578 && i.operands == i.reg_operands
3579 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3580 && i.tm.opcode_modifier.vexopcode == VEX0F
3581 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3582 && i.rex == REX_B)
3583 {
3584 unsigned int xchg = i.operands - 1;
3585 union i386_op temp_op;
3586 i386_operand_type temp_type;
3587
3588 temp_type = i.types[xchg];
3589 i.types[xchg] = i.types[0];
3590 i.types[0] = temp_type;
3591 temp_op = i.op[xchg];
3592 i.op[xchg] = i.op[0];
3593 i.op[0] = temp_op;
3594
3595 gas_assert (i.rm.mode == 3);
3596
3597 i.rex = REX_R;
3598 xchg = i.rm.regmem;
3599 i.rm.regmem = i.rm.reg;
3600 i.rm.reg = xchg;
3601
3602 if (i.tm.opcode_modifier.d)
3603 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3604 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3605 else /* Use the next insn. */
3606 i.tm = t[1];
3607 }
3608
3609 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3610 are no memory operands and at least 3 register ones. */
3611 if (i.reg_operands >= 3
3612 && i.vec_encoding != vex_encoding_vex3
3613 && i.reg_operands == i.operands - i.imm_operands
3614 && i.tm.opcode_modifier.vex
3615 && i.tm.opcode_modifier.commutative
3616 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3617 && i.rex == REX_B
3618 && i.vex.register_specifier
3619 && !(i.vex.register_specifier->reg_flags & RegRex))
3620 {
3621 unsigned int xchg = i.operands - i.reg_operands;
3622 union i386_op temp_op;
3623 i386_operand_type temp_type;
3624
3625 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3626 gas_assert (!i.tm.opcode_modifier.sae);
3627 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3628 &i.types[i.operands - 3]));
3629 gas_assert (i.rm.mode == 3);
3630
3631 temp_type = i.types[xchg];
3632 i.types[xchg] = i.types[xchg + 1];
3633 i.types[xchg + 1] = temp_type;
3634 temp_op = i.op[xchg];
3635 i.op[xchg] = i.op[xchg + 1];
3636 i.op[xchg + 1] = temp_op;
3637
3638 i.rex = 0;
3639 xchg = i.rm.regmem | 8;
3640 i.rm.regmem = ~register_specifier & 0xf;
3641 gas_assert (!(i.rm.regmem & 8));
3642 i.vex.register_specifier += xchg - i.rm.regmem;
3643 register_specifier = ~xchg & 0xf;
3644 }
3645
3646 if (i.tm.opcode_modifier.vex == VEXScalar)
3647 vector_length = avxscalar;
3648 else if (i.tm.opcode_modifier.vex == VEX256)
3649 vector_length = 1;
3650 else
3651 {
3652 unsigned int op;
3653
3654 /* Determine vector length from the last multi-length vector
3655 operand. */
3656 vector_length = 0;
3657 for (op = t->operands; op--;)
3658 if (t->operand_types[op].bitfield.xmmword
3659 && t->operand_types[op].bitfield.ymmword
3660 && i.types[op].bitfield.ymmword)
3661 {
3662 vector_length = 1;
3663 break;
3664 }
3665 }
3666
3667 switch ((i.tm.base_opcode >> 8) & 0xff)
3668 {
3669 case 0:
3670 implied_prefix = 0;
3671 break;
3672 case DATA_PREFIX_OPCODE:
3673 implied_prefix = 1;
3674 break;
3675 case REPE_PREFIX_OPCODE:
3676 implied_prefix = 2;
3677 break;
3678 case REPNE_PREFIX_OPCODE:
3679 implied_prefix = 3;
3680 break;
3681 default:
3682 abort ();
3683 }
3684
3685 /* Check the REX.W bit and VEXW. */
3686 if (i.tm.opcode_modifier.vexw == VEXWIG)
3687 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3688 else if (i.tm.opcode_modifier.vexw)
3689 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3690 else
3691 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3692
3693 /* Use 2-byte VEX prefix if possible. */
3694 if (w == 0
3695 && i.vec_encoding != vex_encoding_vex3
3696 && i.tm.opcode_modifier.vexopcode == VEX0F
3697 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3698 {
3699 /* 2-byte VEX prefix. */
3700 unsigned int r;
3701
3702 i.vex.length = 2;
3703 i.vex.bytes[0] = 0xc5;
3704
3705 /* Check the REX.R bit. */
3706 r = (i.rex & REX_R) ? 0 : 1;
3707 i.vex.bytes[1] = (r << 7
3708 | register_specifier << 3
3709 | vector_length << 2
3710 | implied_prefix);
3711 }
3712 else
3713 {
3714 /* 3-byte VEX prefix. */
3715 unsigned int m;
3716
3717 i.vex.length = 3;
3718
3719 switch (i.tm.opcode_modifier.vexopcode)
3720 {
3721 case VEX0F:
3722 m = 0x1;
3723 i.vex.bytes[0] = 0xc4;
3724 break;
3725 case VEX0F38:
3726 m = 0x2;
3727 i.vex.bytes[0] = 0xc4;
3728 break;
3729 case VEX0F3A:
3730 m = 0x3;
3731 i.vex.bytes[0] = 0xc4;
3732 break;
3733 case XOP08:
3734 m = 0x8;
3735 i.vex.bytes[0] = 0x8f;
3736 break;
3737 case XOP09:
3738 m = 0x9;
3739 i.vex.bytes[0] = 0x8f;
3740 break;
3741 case XOP0A:
3742 m = 0xa;
3743 i.vex.bytes[0] = 0x8f;
3744 break;
3745 default:
3746 abort ();
3747 }
3748
3749 /* The high 3 bits of the second VEX byte are the one's complement
3750 of the RXB bits from REX. */
3751 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3752
3753 i.vex.bytes[2] = (w << 7
3754 | register_specifier << 3
3755 | vector_length << 2
3756 | implied_prefix);
3757 }
3758 }
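
/* Worked 2-byte VEX encoding (for illustration): vaddps %ymm2, %ymm1,
%ymm0 assembles to C5 F4 58 C2. C5 selects the 2-byte form; F4 is
R=1 (no REX.R, stored inverted), vvvv=1110 (one's complement of
register 1, %ymm1), L=1 (256-bit) and pp=00 (no implied prefix);
58 is the VADDPS opcode and C2 the ModRM byte. */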
3759
3760 static INLINE bfd_boolean
3761 is_evex_encoding (const insn_template *t)
3762 {
3763 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3764 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3765 || t->opcode_modifier.sae;
3766 }
3767
3768 static INLINE bfd_boolean
3769 is_any_vex_encoding (const insn_template *t)
3770 {
3771 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3772 || is_evex_encoding (t);
3773 }
3774
3775 /* Build the EVEX prefix. */
3776
3777 static void
3778 build_evex_prefix (void)
3779 {
3780 unsigned int register_specifier;
3781 unsigned int implied_prefix;
3782 unsigned int m, w;
3783 rex_byte vrex_used = 0;
3784
3785 /* Check register specifier. */
3786 if (i.vex.register_specifier)
3787 {
3788 gas_assert ((i.vrex & REX_X) == 0);
3789
3790 register_specifier = i.vex.register_specifier->reg_num;
3791 if ((i.vex.register_specifier->reg_flags & RegRex))
3792 register_specifier += 8;
3793 /* The upper 16 registers are encoded in the fourth byte of the
3794 EVEX prefix. */
3795 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3796 i.vex.bytes[3] = 0x8;
3797 register_specifier = ~register_specifier & 0xf;
3798 }
3799 else
3800 {
3801 register_specifier = 0xf;
3802
3803 /* Encode upper 16 vector index register in the fourth byte of
3804 the EVEX prefix. */
3805 if (!(i.vrex & REX_X))
3806 i.vex.bytes[3] = 0x8;
3807 else
3808 vrex_used |= REX_X;
3809 }
3810
3811 switch ((i.tm.base_opcode >> 8) & 0xff)
3812 {
3813 case 0:
3814 implied_prefix = 0;
3815 break;
3816 case DATA_PREFIX_OPCODE:
3817 implied_prefix = 1;
3818 break;
3819 case REPE_PREFIX_OPCODE:
3820 implied_prefix = 2;
3821 break;
3822 case REPNE_PREFIX_OPCODE:
3823 implied_prefix = 3;
3824 break;
3825 default:
3826 abort ();
3827 }
3828
3829 /* 4 byte EVEX prefix. */
3830 i.vex.length = 4;
3831 i.vex.bytes[0] = 0x62;
3832
3833 /* mmmm bits. */
3834 switch (i.tm.opcode_modifier.vexopcode)
3835 {
3836 case VEX0F:
3837 m = 1;
3838 break;
3839 case VEX0F38:
3840 m = 2;
3841 break;
3842 case VEX0F3A:
3843 m = 3;
3844 break;
3845 default:
3846 abort ();
3847 break;
3848 }
3849
3850 /* The high 3 bits of the second EVEX byte are the one's complement
3851 of the RXB bits from REX. */
3852 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3853
3854 /* The fifth bit of the second EVEX byte is the one's complement of
3855 the REX_R bit in VREX. */
3856 if (!(i.vrex & REX_R))
3857 i.vex.bytes[1] |= 0x10;
3858 else
3859 vrex_used |= REX_R;
3860
3861 if ((i.reg_operands + i.imm_operands) == i.operands)
3862 {
3863 /* When all operands are registers, the REX_X bit in REX is not
3864 used. We reuse it to encode the upper 16 registers, which is
3865 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3866 as the one's complement. */
3867 if ((i.vrex & REX_B))
3868 {
3869 vrex_used |= REX_B;
3870 i.vex.bytes[1] &= ~0x40;
3871 }
3872 }
3873
3874 /* EVEX instructions shouldn't need the REX prefix. */
3875 i.vrex &= ~vrex_used;
3876 gas_assert (i.vrex == 0);
3877
3878 /* Check the REX.W bit and VEXW. */
3879 if (i.tm.opcode_modifier.vexw == VEXWIG)
3880 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3881 else if (i.tm.opcode_modifier.vexw)
3882 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3883 else
3884 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3885
3886 /* Encode the U bit. */
3887 implied_prefix |= 0x4;
3888
3889 /* The third byte of the EVEX prefix. */
3890 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3891
3892 /* The fourth byte of the EVEX prefix. */
3893 /* The zeroing-masking bit. */
3894 if (i.mask && i.mask->zeroing)
3895 i.vex.bytes[3] |= 0x80;
3896
3897 /* Encode the vector length and broadcast bit only if there is no RC. */
3898 if (!i.rounding)
3899 {
3900 /* Encode the vector length. */
3901 unsigned int vec_length;
3902
3903 if (!i.tm.opcode_modifier.evex
3904 || i.tm.opcode_modifier.evex == EVEXDYN)
3905 {
3906 unsigned int op;
3907
3908 /* Determine vector length from the last multi-length vector
3909 operand. */
3910 for (op = i.operands; op--;)
3911 if (i.tm.operand_types[op].bitfield.xmmword
3912 + i.tm.operand_types[op].bitfield.ymmword
3913 + i.tm.operand_types[op].bitfield.zmmword > 1)
3914 {
3915 if (i.types[op].bitfield.zmmword)
3916 {
3917 i.tm.opcode_modifier.evex = EVEX512;
3918 break;
3919 }
3920 else if (i.types[op].bitfield.ymmword)
3921 {
3922 i.tm.opcode_modifier.evex = EVEX256;
3923 break;
3924 }
3925 else if (i.types[op].bitfield.xmmword)
3926 {
3927 i.tm.opcode_modifier.evex = EVEX128;
3928 break;
3929 }
3930 else if (i.broadcast && (int) op == i.broadcast->operand)
3931 {
3932 switch (i.broadcast->bytes)
3933 {
3934 case 64:
3935 i.tm.opcode_modifier.evex = EVEX512;
3936 break;
3937 case 32:
3938 i.tm.opcode_modifier.evex = EVEX256;
3939 break;
3940 case 16:
3941 i.tm.opcode_modifier.evex = EVEX128;
3942 break;
3943 default:
3944 abort ();
3945 }
3946 break;
3947 }
3948 }
3949
3950 if (op >= MAX_OPERANDS)
3951 abort ();
3952 }
3953
3954 switch (i.tm.opcode_modifier.evex)
3955 {
3956 case EVEXLIG: /* LL' is ignored */
3957 vec_length = evexlig << 5;
3958 break;
3959 case EVEX128:
3960 vec_length = 0 << 5;
3961 break;
3962 case EVEX256:
3963 vec_length = 1 << 5;
3964 break;
3965 case EVEX512:
3966 vec_length = 2 << 5;
3967 break;
3968 default:
3969 abort ();
3970 break;
3971 }
3972 i.vex.bytes[3] |= vec_length;
3973 /* Encode the broadcast bit. */
3974 if (i.broadcast)
3975 i.vex.bytes[3] |= 0x10;
3976 }
3977 else
3978 {
3979 if (i.rounding->type != saeonly)
3980 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3981 else
3982 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3983 }
3984
3985 if (i.mask && i.mask->mask)
3986 i.vex.bytes[3] |= i.mask->mask->reg_num;
3987 }
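
/* Illustrative worked example (a reader's sketch, not code the
   assembler runs): assuming the AT&T input "vaddps %zmm1, %zmm2,
   %zmm3", the four EVEX bytes built above come out as
     0x62   fixed first byte
     0xf1   RXB=111 R'=1 mm=01 (0F map), REX bits in inverted form
     0x6c   W=0 vvvv=1101 (inverted %zmm2) fixed-1 pp=00
     0x48   z=0 L'L=10 (512-bit) b=0 V'=1 aaa=000
   followed by the opcode 0x58 and ModRM 0xd9 for %zmm3, %zmm1.  */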
3988
3989 static void
3990 process_immext (void)
3991 {
3992 expressionS *exp;
3993
3994 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3995 which is coded in the same place as an 8-bit immediate field
3996 would be. Here we fake an 8-bit immediate operand from the
3997 opcode suffix stored in tm.extension_opcode.
3998
3999 AVX instructions also use this encoding, for some of the
4000 3-argument instructions. */
4001
4002 gas_assert (i.imm_operands <= 1
4003 && (i.operands <= 2
4004 || (is_any_vex_encoding (&i.tm)
4005 && i.operands <= 4)));
4006
4007 exp = &im_expressions[i.imm_operands++];
4008 i.op[i.operands].imms = exp;
4009 i.types[i.operands] = imm8;
4010 i.operands++;
4011 exp->X_op = O_constant;
4012 exp->X_add_number = i.tm.extension_opcode;
4013 i.tm.extension_opcode = None;
4014 }
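
/* For instance (illustrative only): the 3DNow! insn "pswapd %mm1, %mm0"
   has the fixed opcode 0x0f0f and keeps its real opcode byte, 0xbb, in
   tm.extension_opcode, so after the fake imm8 operand is attached above
   it is emitted as 0f 0f c1 bb.  */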
4015
4016
4017 static int
4018 check_hle (void)
4019 {
4020 switch (i.tm.opcode_modifier.hleprefixok)
4021 {
4022 default:
4023 abort ();
4024 case HLEPrefixNone:
4025 as_bad (_("invalid instruction `%s' after `%s'"),
4026 i.tm.name, i.hle_prefix);
4027 return 0;
4028 case HLEPrefixLock:
4029 if (i.prefix[LOCK_PREFIX])
4030 return 1;
4031 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4032 return 0;
4033 case HLEPrefixAny:
4034 return 1;
4035 case HLEPrefixRelease:
4036 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4037 {
4038 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4039 i.tm.name);
4040 return 0;
4041 }
4042 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4043 {
4044 as_bad (_("memory destination needed for instruction `%s'"
4045 " after `xrelease'"), i.tm.name);
4046 return 0;
4047 }
4048 return 1;
4049 }
4050 }
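
/* A few illustrative inputs for the checks above (not exhaustive):
     xacquire lock incl (%rax)    accepted (HLEPrefixLock, lock present)
     xacquire incl (%rax)         rejected, missing `lock'
     xrelease movl $1, (%rax)     accepted (HLEPrefixRelease, memory
                                  destination)
     xrelease movl (%rax), %eax   rejected, no memory destination  */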
4051
4052 /* Try the shortest encoding by shortening operand size. */
4053
4054 static void
4055 optimize_encoding (void)
4056 {
4057 unsigned int j;
4058
4059 if (optimize_for_space
4060 && !is_any_vex_encoding (&i.tm)
4061 && i.reg_operands == 1
4062 && i.imm_operands == 1
4063 && !i.types[1].bitfield.byte
4064 && i.op[0].imms->X_op == O_constant
4065 && fits_in_imm7 (i.op[0].imms->X_add_number)
4066 && (i.tm.base_opcode == 0xa8
4067 || (i.tm.base_opcode == 0xf6
4068 && i.tm.extension_opcode == 0x0)))
4069 {
4070 /* Optimize: -Os:
4071 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4072 */
4073 unsigned int base_regnum = i.op[1].regs->reg_num;
4074 if (flag_code == CODE_64BIT || base_regnum < 4)
4075 {
4076 i.types[1].bitfield.byte = 1;
4077 /* Ignore the suffix. */
4078 i.suffix = 0;
4079 /* Convert to byte registers. */
4080 if (i.types[1].bitfield.word)
4081 j = 16;
4082 else if (i.types[1].bitfield.dword)
4083 j = 32;
4084 else
4085 j = 48;
4086 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4087 j += 8;
4088 i.op[1].regs -= j;
4089 }
4090 }
4091 else if (flag_code == CODE_64BIT
4092 && !is_any_vex_encoding (&i.tm)
4093 && ((i.types[1].bitfield.qword
4094 && i.reg_operands == 1
4095 && i.imm_operands == 1
4096 && i.op[0].imms->X_op == O_constant
4097 && ((i.tm.base_opcode == 0xb8
4098 && i.tm.extension_opcode == None
4099 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4100 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4101 && ((i.tm.base_opcode == 0x24
4102 || i.tm.base_opcode == 0xa8)
4103 || (i.tm.base_opcode == 0x80
4104 && i.tm.extension_opcode == 0x4)
4105 || ((i.tm.base_opcode == 0xf6
4106 || (i.tm.base_opcode | 1) == 0xc7)
4107 && i.tm.extension_opcode == 0x0)))
4108 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4109 && i.tm.base_opcode == 0x83
4110 && i.tm.extension_opcode == 0x4)))
4111 || (i.types[0].bitfield.qword
4112 && ((i.reg_operands == 2
4113 && i.op[0].regs == i.op[1].regs
4114 && (i.tm.base_opcode == 0x30
4115 || i.tm.base_opcode == 0x28))
4116 || (i.reg_operands == 1
4117 && i.operands == 1
4118 && i.tm.base_opcode == 0x30)))))
4119 {
4120 /* Optimize: -O:
4121 andq $imm31, %r64 -> andl $imm31, %r32
4122 andq $imm7, %r64 -> andl $imm7, %r32
4123 testq $imm31, %r64 -> testl $imm31, %r32
4124 xorq %r64, %r64 -> xorl %r32, %r32
4125 subq %r64, %r64 -> subl %r32, %r32
4126 movq $imm31, %r64 -> movl $imm31, %r32
4127 movq $imm32, %r64 -> movl $imm32, %r32
4128 */
4129 i.tm.opcode_modifier.norex64 = 1;
4130 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4131 {
4132 /* Handle
4133 movq $imm31, %r64 -> movl $imm31, %r32
4134 movq $imm32, %r64 -> movl $imm32, %r32
4135 */
4136 i.tm.operand_types[0].bitfield.imm32 = 1;
4137 i.tm.operand_types[0].bitfield.imm32s = 0;
4138 i.tm.operand_types[0].bitfield.imm64 = 0;
4139 i.types[0].bitfield.imm32 = 1;
4140 i.types[0].bitfield.imm32s = 0;
4141 i.types[0].bitfield.imm64 = 0;
4142 i.types[1].bitfield.dword = 1;
4143 i.types[1].bitfield.qword = 0;
4144 if ((i.tm.base_opcode | 1) == 0xc7)
4145 {
4146 /* Handle
4147 movq $imm31, %r64 -> movl $imm31, %r32
4148 */
4149 i.tm.base_opcode = 0xb8;
4150 i.tm.extension_opcode = None;
4151 i.tm.opcode_modifier.w = 0;
4152 i.tm.opcode_modifier.modrm = 0;
4153 }
4154 }
4155 }
4156 else if (optimize > 1
4157 && !optimize_for_space
4158 && !is_any_vex_encoding (&i.tm)
4159 && i.reg_operands == 2
4160 && i.op[0].regs == i.op[1].regs
4161 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4162 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4163 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4164 {
4165 /* Optimize: -O2:
4166 andb %rN, %rN -> testb %rN, %rN
4167 andw %rN, %rN -> testw %rN, %rN
4168 andq %rN, %rN -> testq %rN, %rN
4169 orb %rN, %rN -> testb %rN, %rN
4170 orw %rN, %rN -> testw %rN, %rN
4171 orq %rN, %rN -> testq %rN, %rN
4172
4173 and outside of 64-bit mode
4174
4175 andl %rN, %rN -> testl %rN, %rN
4176 orl %rN, %rN -> testl %rN, %rN
4177 */
4178 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4179 }
4180 else if (i.reg_operands == 3
4181 && i.op[0].regs == i.op[1].regs
4182 && !i.types[2].bitfield.xmmword
4183 && (i.tm.opcode_modifier.vex
4184 || ((!i.mask || i.mask->zeroing)
4185 && !i.rounding
4186 && is_evex_encoding (&i.tm)
4187 && (i.vec_encoding != vex_encoding_evex
4188 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4189 || i.tm.cpu_flags.bitfield.cpuavx512vl
4190 || (i.tm.operand_types[2].bitfield.zmmword
4191 && i.types[2].bitfield.ymmword))))
4192 && ((i.tm.base_opcode == 0x55
4193 || i.tm.base_opcode == 0x6655
4194 || i.tm.base_opcode == 0x66df
4195 || i.tm.base_opcode == 0x57
4196 || i.tm.base_opcode == 0x6657
4197 || i.tm.base_opcode == 0x66ef
4198 || i.tm.base_opcode == 0x66f8
4199 || i.tm.base_opcode == 0x66f9
4200 || i.tm.base_opcode == 0x66fa
4201 || i.tm.base_opcode == 0x66fb
4202 || i.tm.base_opcode == 0x42
4203 || i.tm.base_opcode == 0x6642
4204 || i.tm.base_opcode == 0x47
4205 || i.tm.base_opcode == 0x6647)
4206 && i.tm.extension_opcode == None))
4207 {
4208 /* Optimize: -O1:
4209 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4210 vpsubq and vpsubw:
4211 EVEX VOP %zmmM, %zmmM, %zmmN
4212 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4213 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4214 EVEX VOP %ymmM, %ymmM, %ymmN
4215 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4216 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4217 VEX VOP %ymmM, %ymmM, %ymmN
4218 -> VEX VOP %xmmM, %xmmM, %xmmN
4219 VOP, one of vpandn and vpxor:
4220 VEX VOP %ymmM, %ymmM, %ymmN
4221 -> VEX VOP %xmmM, %xmmM, %xmmN
4222 VOP, one of vpandnd and vpandnq:
4223 EVEX VOP %zmmM, %zmmM, %zmmN
4224 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4225 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4226 EVEX VOP %ymmM, %ymmM, %ymmN
4227 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4228 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4229 VOP, one of vpxord and vpxorq:
4230 EVEX VOP %zmmM, %zmmM, %zmmN
4231 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4232 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4233 EVEX VOP %ymmM, %ymmM, %ymmN
4234 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4235 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4236 VOP, one of kxord and kxorq:
4237 VEX VOP %kM, %kM, %kN
4238 -> VEX kxorw %kM, %kM, %kN
4239 VOP, one of kandnd and kandnq:
4240 VEX VOP %kM, %kM, %kN
4241 -> VEX kandnw %kM, %kM, %kN
4242 */
4243 if (is_evex_encoding (&i.tm))
4244 {
4245 if (i.vec_encoding != vex_encoding_evex)
4246 {
4247 i.tm.opcode_modifier.vex = VEX128;
4248 i.tm.opcode_modifier.vexw = VEXW0;
4249 i.tm.opcode_modifier.evex = 0;
4250 }
4251 else if (optimize > 1)
4252 i.tm.opcode_modifier.evex = EVEX128;
4253 else
4254 return;
4255 }
4256 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4257 {
4258 i.tm.base_opcode &= 0xff;
4259 i.tm.opcode_modifier.vexw = VEXW0;
4260 }
4261 else
4262 i.tm.opcode_modifier.vex = VEX128;
4263
4264 if (i.tm.opcode_modifier.vex)
4265 for (j = 0; j < 3; j++)
4266 {
4267 i.types[j].bitfield.xmmword = 1;
4268 i.types[j].bitfield.ymmword = 0;
4269 }
4270 }
4271 else if (i.vec_encoding != vex_encoding_evex
4272 && !i.types[0].bitfield.zmmword
4273 && !i.types[1].bitfield.zmmword
4274 && !i.mask
4275 && !i.broadcast
4276 && is_evex_encoding (&i.tm)
4277 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4278 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4279 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4280 || (i.tm.base_opcode & ~4) == 0x66db
4281 || (i.tm.base_opcode & ~4) == 0x66eb)
4282 && i.tm.extension_opcode == None)
4283 {
4284 /* Optimize: -O1:
4285 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4286 vmovdqu32 and vmovdqu64:
4287 EVEX VOP %xmmM, %xmmN
4288 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4289 EVEX VOP %ymmM, %ymmN
4290 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4291 EVEX VOP %xmmM, mem
4292 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4293 EVEX VOP %ymmM, mem
4294 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4295 EVEX VOP mem, %xmmN
4296 -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4297 EVEX VOP mem, %ymmN
4298 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4299 VOP, one of vpand, vpandn, vpor, vpxor:
4300 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4301 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4302 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4303 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4304 EVEX VOP{d,q} mem, %xmmM, %xmmN
4305 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4306 EVEX VOP{d,q} mem, %ymmM, %ymmN
4307 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4308 */
4309 for (j = 0; j < i.operands; j++)
4310 if (operand_type_check (i.types[j], disp)
4311 && i.op[j].disps->X_op == O_constant)
4312 {
4313 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4314 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4315 bytes, we choose EVEX Disp8 over VEX Disp32. */
4316 int evex_disp8, vex_disp8;
4317 unsigned int memshift = i.memshift;
4318 offsetT n = i.op[j].disps->X_add_number;
4319
4320 evex_disp8 = fits_in_disp8 (n);
4321 i.memshift = 0;
4322 vex_disp8 = fits_in_disp8 (n);
4323 if (evex_disp8 != vex_disp8)
4324 {
4325 i.memshift = memshift;
4326 return;
4327 }
4328
4329 i.types[j].bitfield.disp8 = vex_disp8;
4330 break;
4331 }
4332 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4333 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4334 i.tm.opcode_modifier.vex
4335 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4336 i.tm.opcode_modifier.vexw = VEXW0;
4337 /* VPAND, VPOR, and VPXOR are commutative. */
4338 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4339 i.tm.opcode_modifier.commutative = 1;
4340 i.tm.opcode_modifier.evex = 0;
4341 i.tm.opcode_modifier.masking = 0;
4342 i.tm.opcode_modifier.broadcast = 0;
4343 i.tm.opcode_modifier.disp8memshift = 0;
4344 i.memshift = 0;
4345 if (j < i.operands)
4346 i.types[j].bitfield.disp8
4347 = fits_in_disp8 (i.op[j].disps->X_add_number);
4348 }
4349 }
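
/* Byte counts for one of the transforms above, as a sanity check
   (sketch, 64-bit mode):
     xorq %rax, %rax    48 31 c0    3 bytes
     xorl %eax, %eax       31 c0    2 bytes
   Dropping REX.W is safe because a write to %eax zero-extends into
   %rax anyway.  */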
4350
4351 /* Return non-zero for load instruction. */
4352
4353 static int
4354 load_insn_p (void)
4355 {
4356 unsigned int dest;
4357 int any_vex_p = is_any_vex_encoding (&i.tm);
4358 unsigned int base_opcode = i.tm.base_opcode | 1;
4359
4360 if (!any_vex_p)
4361 {
4362 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4363 prefetcht1, prefetcht2, prefetchw, bndmk, bndcl, bndcu, bndcn,
4364 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4365 if (i.tm.opcode_modifier.anysize)
4366 return 0;
4367
4368 /* pop, popf, popa. */
4369 if (strcmp (i.tm.name, "pop") == 0
4370 || i.tm.base_opcode == 0x9d
4371 || i.tm.base_opcode == 0x61)
4372 return 1;
4373
4374 /* movs, cmps, lods, scas. */
4375 if ((i.tm.base_opcode | 0xb) == 0xaf)
4376 return 1;
4377
4378 /* outs, xlatb. */
4379 if (base_opcode == 0x6f
4380 || i.tm.base_opcode == 0xd7)
4381 return 1;
4382 /* NB: AMD-specific insns with implicit memory operands are
4383 intentionally not covered. */
4384 }
4385
4386 /* No memory operand. */
4387 if (!i.mem_operands)
4388 return 0;
4389
4390 if (any_vex_p)
4391 {
4392 /* vldmxcsr. */
4393 if (i.tm.base_opcode == 0xae
4394 && i.tm.opcode_modifier.vex
4395 && i.tm.opcode_modifier.vexopcode == VEX0F
4396 && i.tm.extension_opcode == 2)
4397 return 1;
4398 }
4399 else
4400 {
4401 /* test, not, neg, mul, imul, div, idiv. */
4402 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4403 && i.tm.extension_opcode != 1)
4404 return 1;
4405
4406 /* inc, dec. */
4407 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4408 return 1;
4409
4410 /* add, or, adc, sbb, and, sub, xor, cmp. */
4411 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4412 return 1;
4413
4414 /* bt, bts, btr, btc. */
4415 if (i.tm.base_opcode == 0xfba
4416 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4417 return 1;
4418
4419 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4420 if ((base_opcode == 0xc1
4421 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4422 && i.tm.extension_opcode != 6)
4423 return 1;
4424
4425 /* cmpxchg8b, cmpxchg16b, xrstors. */
4426 if (i.tm.base_opcode == 0xfc7
4427 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4428 return 1;
4429
4430 /* fxrstor, ldmxcsr, xrstor. */
4431 if (i.tm.base_opcode == 0xfae
4432 && (i.tm.extension_opcode == 1
4433 || i.tm.extension_opcode == 2
4434 || i.tm.extension_opcode == 5))
4435 return 1;
4436
4437 /* lgdt, lidt, lmsw. */
4438 if (i.tm.base_opcode == 0xf01
4439 && (i.tm.extension_opcode == 2
4440 || i.tm.extension_opcode == 3
4441 || i.tm.extension_opcode == 6))
4442 return 1;
4443
4444 /* vmptrld */
4445 if (i.tm.base_opcode == 0xfc7
4446 && i.tm.extension_opcode == 6)
4447 return 1;
4448
4449 /* Check for x87 instructions. */
4450 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4451 {
4452 /* Skip fst, fstp, fstenv, fstcw. */
4453 if (i.tm.base_opcode == 0xd9
4454 && (i.tm.extension_opcode == 2
4455 || i.tm.extension_opcode == 3
4456 || i.tm.extension_opcode == 6
4457 || i.tm.extension_opcode == 7))
4458 return 0;
4459
4460 /* Skip fisttp, fist, fistp, fstp. */
4461 if (i.tm.base_opcode == 0xdb
4462 && (i.tm.extension_opcode == 1
4463 || i.tm.extension_opcode == 2
4464 || i.tm.extension_opcode == 3
4465 || i.tm.extension_opcode == 7))
4466 return 0;
4467
4468 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4469 if (i.tm.base_opcode == 0xdd
4470 && (i.tm.extension_opcode == 1
4471 || i.tm.extension_opcode == 2
4472 || i.tm.extension_opcode == 3
4473 || i.tm.extension_opcode == 6
4474 || i.tm.extension_opcode == 7))
4475 return 0;
4476
4477 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4478 if (i.tm.base_opcode == 0xdf
4479 && (i.tm.extension_opcode == 1
4480 || i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 6
4483 || i.tm.extension_opcode == 7))
4484 return 0;
4485
4486 return 1;
4487 }
4488 }
4489
4490 dest = i.operands - 1;
4491
4492 /* Check fake imm8 operand and 3 source operands. */
4493 if ((i.tm.opcode_modifier.immext
4494 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4495 && i.types[dest].bitfield.imm8)
4496 dest--;
4497
4498 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4499 if (!any_vex_p
4500 && (base_opcode == 0x1
4501 || base_opcode == 0x9
4502 || base_opcode == 0x11
4503 || base_opcode == 0x19
4504 || base_opcode == 0x21
4505 || base_opcode == 0x29
4506 || base_opcode == 0x31
4507 || base_opcode == 0x39
4508 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4509 || base_opcode == 0xfc1))
4510 return 1;
4511
4512 /* Check for load instruction. */
4513 return (i.types[dest].bitfield.class != ClassNone
4514 || i.types[dest].bitfield.instance == Accum);
4515 }
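
/* Illustrative classifications from the logic above:
     movl (%rax), %ebx    load (register destination)
     addl %ebx, (%rax)    load (read-modify-write on memory)
     movl %ebx, (%rax)    not a load (plain store)  */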
4516
4517 /* Output lfence, 0xfaee8, after instruction. */
4518
4519 static void
4520 insert_lfence_after (void)
4521 {
4522 if (lfence_after_load && load_insn_p ())
4523 {
4524 /* There are also two REP string instructions that require
4525 special treatment. Specifically, the compare string (CMPS)
4526 and scan string (SCAS) instructions set EFLAGS in a manner
4527 that depends on the data being compared/scanned. When used
4528 with a REP prefix, the number of iterations may therefore
4529 vary depending on this data. If the data is a program secret
4530 chosen by the adversary using an LVI method,
4531 then this data-dependent behavior may leak some aspect
4532 of the secret. */
4533 if (((i.tm.base_opcode | 0x1) == 0xa7
4534 || (i.tm.base_opcode | 0x1) == 0xaf)
4535 && i.prefix[REP_PREFIX])
4536 {
4537 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4538 i.tm.name);
4539 }
4540 char *p = frag_more (3);
4541 *p++ = 0xf;
4542 *p++ = 0xae;
4543 *p = 0xe8;
4544 }
4545 }
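
/* E.g. with -mlfence-after-load=yes, "movl (%rax), %ebx" is followed
   by the three lfence bytes (sketch):
     8b 18       movl (%rax), %ebx
     0f ae e8    lfence  */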
4546
4547 /* Output lfence, 0xfaee8, before instruction. */
4548
4549 static void
4550 insert_lfence_before (void)
4551 {
4552 char *p;
4553
4554 if (is_any_vex_encoding (&i.tm))
4555 return;
4556
4557 if (i.tm.base_opcode == 0xff
4558 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4559 {
4560 /* Insert lfence before indirect branch if needed. */
4561
4562 if (lfence_before_indirect_branch == lfence_branch_none)
4563 return;
4564
4565 if (i.operands != 1)
4566 abort ();
4567
4568 if (i.reg_operands == 1)
4569 {
4570 /* Indirect branch via register. Don't insert lfence with
4571 -mlfence-after-load=yes. */
4572 if (lfence_after_load
4573 || lfence_before_indirect_branch == lfence_branch_memory)
4574 return;
4575 }
4576 else if (i.mem_operands == 1
4577 && lfence_before_indirect_branch != lfence_branch_register)
4578 {
4579 as_warn (_("indirect `%s` with memory operand should be avoided"),
4580 i.tm.name);
4581 return;
4582 }
4583 else
4584 return;
4585
4586 if (last_insn.kind != last_insn_other
4587 && last_insn.seg == now_seg)
4588 {
4589 as_warn_where (last_insn.file, last_insn.line,
4590 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4591 last_insn.name, i.tm.name);
4592 return;
4593 }
4594
4595 p = frag_more (3);
4596 *p++ = 0xf;
4597 *p++ = 0xae;
4598 *p = 0xe8;
4599 return;
4600 }
4601
4602 /* Output or/not/shl and lfence before near ret. */
4603 if (lfence_before_ret != lfence_before_ret_none
4604 && (i.tm.base_opcode == 0xc2
4605 || i.tm.base_opcode == 0xc3))
4606 {
4607 if (last_insn.kind != last_insn_other
4608 && last_insn.seg == now_seg)
4609 {
4610 as_warn_where (last_insn.file, last_insn.line,
4611 _("`%s` skips -mlfence-before-ret on `%s`"),
4612 last_insn.name, i.tm.name);
4613 return;
4614 }
4615
4616 /* A near ret ignores the operand size override under CPU64. */
4617 char prefix = flag_code == CODE_64BIT
4618 ? 0x48
4619 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4620
4621 if (lfence_before_ret == lfence_before_ret_not)
4622 {
4623 /* not: 0xf71424, may add prefix
4624 for operand size override or 64-bit code. */
4625 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4626 if (prefix)
4627 *p++ = prefix;
4628 *p++ = 0xf7;
4629 *p++ = 0x14;
4630 *p++ = 0x24;
4631 if (prefix)
4632 *p++ = prefix;
4633 *p++ = 0xf7;
4634 *p++ = 0x14;
4635 *p++ = 0x24;
4636 }
4637 else
4638 {
4639 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4640 if (prefix)
4641 *p++ = prefix;
4642 if (lfence_before_ret == lfence_before_ret_or)
4643 {
4644 /* or: 0x830c2400, may add prefix
4645 for operand size override or 64-bit code. */
4646 *p++ = 0x83;
4647 *p++ = 0x0c;
4648 }
4649 else
4650 {
4651 /* shl: 0xc1242400, may add prefix
4652 for operand size override or 64-bit code. */
4653 *p++ = 0xc1;
4654 *p++ = 0x24;
4655 }
4656
4657 *p++ = 0x24;
4658 *p++ = 0x0;
4659 }
4660
4661 *p++ = 0xf;
4662 *p++ = 0xae;
4663 *p = 0xe8;
4664 }
4665 }
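
/* Example output (sketch, 64-bit mode, -mlfence-before-ret=or): a
   plain "ret" is emitted as
     48 83 0c 24 00    orq $0x0, (%rsp)
     0f ae e8          lfence
     c3                ret
   so the return address is refreshed on the stack and an lfence is
   placed immediately before the ret that consumes it.  */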
4666
4667 /* This is the guts of the machine-dependent assembler. LINE points to a
4668 machine dependent instruction. This function is supposed to emit
4669 the frags/bytes it assembles to. */
4670
4671 void
4672 md_assemble (char *line)
4673 {
4674 unsigned int j;
4675 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4676 const insn_template *t;
4677
4678 /* Initialize globals. */
4679 memset (&i, '\0', sizeof (i));
4680 for (j = 0; j < MAX_OPERANDS; j++)
4681 i.reloc[j] = NO_RELOC;
4682 memset (disp_expressions, '\0', sizeof (disp_expressions));
4683 memset (im_expressions, '\0', sizeof (im_expressions));
4684 save_stack_p = save_stack;
4685
4686 /* First parse an instruction mnemonic & call i386_operand for the operands.
4687 We assume that the scrubber has arranged it so that line[0] is the valid
4688 start of a (possibly prefixed) mnemonic. */
4689
4690 line = parse_insn (line, mnemonic);
4691 if (line == NULL)
4692 return;
4693 mnem_suffix = i.suffix;
4694
4695 line = parse_operands (line, mnemonic);
4696 this_operand = -1;
4697 xfree (i.memop1_string);
4698 i.memop1_string = NULL;
4699 if (line == NULL)
4700 return;
4701
4702 /* Now we've parsed the mnemonic into a set of templates, and have the
4703 operands at hand. */
4704
4705 /* All Intel opcodes have reversed operands except for "bound", "enter",
4706 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4707 intersegment "jmp" and "call" instructions with 2 immediate operands so
4708 that the immediate segment precedes the offset, as it does when in AT&T
4709 mode. */
4710 if (intel_syntax
4711 && i.operands > 1
4712 && (strcmp (mnemonic, "bound") != 0)
4713 && (strcmp (mnemonic, "invlpga") != 0)
4714 && (strncmp (mnemonic, "monitor", 7) != 0)
4715 && (strncmp (mnemonic, "mwait", 5) != 0)
4716 && (strcmp (mnemonic, "tpause") != 0)
4717 && (strcmp (mnemonic, "umwait") != 0)
4718 && !(operand_type_check (i.types[0], imm)
4719 && operand_type_check (i.types[1], imm)))
4720 swap_operands ();
4721
4722 /* The order of the immediates should be reversed
4723 for 2 immediates extrq and insertq instructions */
4724 if (i.imm_operands == 2
4725 && (strcmp (mnemonic, "extrq") == 0
4726 || strcmp (mnemonic, "insertq") == 0))
4727 swap_2_operands (0, 1);
4728
4729 if (i.imm_operands)
4730 optimize_imm ();
4731
4732 /* Don't optimize displacement for movabs since it only takes 64bit
4733 displacement. */
4734 if (i.disp_operands
4735 && i.disp_encoding != disp_encoding_32bit
4736 && (flag_code != CODE_64BIT
4737 || strcmp (mnemonic, "movabs") != 0))
4738 optimize_disp ();
4739
4740 /* Next, we find a template that matches the given insn,
4741 making sure the overlap of the given operands types is consistent
4742 with the template operand types. */
4743
4744 if (!(t = match_template (mnem_suffix)))
4745 return;
4746
4747 if (sse_check != check_none
4748 && !i.tm.opcode_modifier.noavx
4749 && !i.tm.cpu_flags.bitfield.cpuavx
4750 && !i.tm.cpu_flags.bitfield.cpuavx512f
4751 && (i.tm.cpu_flags.bitfield.cpusse
4752 || i.tm.cpu_flags.bitfield.cpusse2
4753 || i.tm.cpu_flags.bitfield.cpusse3
4754 || i.tm.cpu_flags.bitfield.cpussse3
4755 || i.tm.cpu_flags.bitfield.cpusse4_1
4756 || i.tm.cpu_flags.bitfield.cpusse4_2
4757 || i.tm.cpu_flags.bitfield.cpupclmul
4758 || i.tm.cpu_flags.bitfield.cpuaes
4759 || i.tm.cpu_flags.bitfield.cpusha
4760 || i.tm.cpu_flags.bitfield.cpugfni))
4761 {
4762 (sse_check == check_warning
4763 ? as_warn
4764 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4765 }
4766
4767 if (i.tm.opcode_modifier.fwait)
4768 if (!add_prefix (FWAIT_OPCODE))
4769 return;
4770
4771 /* Check if REP prefix is OK. */
4772 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4773 {
4774 as_bad (_("invalid instruction `%s' after `%s'"),
4775 i.tm.name, i.rep_prefix);
4776 return;
4777 }
4778
4779 /* Check for lock without a lockable instruction. Destination operand
4780 must be memory unless it is xchg (0x86). */
4781 if (i.prefix[LOCK_PREFIX]
4782 && (!i.tm.opcode_modifier.islockable
4783 || i.mem_operands == 0
4784 || (i.tm.base_opcode != 0x86
4785 && !(i.flags[i.operands - 1] & Operand_Mem))))
4786 {
4787 as_bad (_("expecting lockable instruction after `lock'"));
4788 return;
4789 }
4790
4791 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4792 if (i.prefix[DATA_PREFIX]
4793 && (is_any_vex_encoding (&i.tm)
4794 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4795 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4796 {
4797 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4798 return;
4799 }
4800
4801 /* Check if HLE prefix is OK. */
4802 if (i.hle_prefix && !check_hle ())
4803 return;
4804
4805 /* Check BND prefix. */
4806 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4807 as_bad (_("expecting valid branch instruction after `bnd'"));
4808
4809 /* Check NOTRACK prefix. */
4810 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4811 as_bad (_("expecting indirect branch instruction after `notrack'"));
4812
4813 if (i.tm.cpu_flags.bitfield.cpumpx)
4814 {
4815 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4816 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4817 else if (flag_code != CODE_16BIT
4818 ? i.prefix[ADDR_PREFIX]
4819 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4820 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4821 }
4822
4823 /* Insert BND prefix. */
4824 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4825 {
4826 if (!i.prefix[BND_PREFIX])
4827 add_prefix (BND_PREFIX_OPCODE);
4828 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4829 {
4830 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4831 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4832 }
4833 }
4834
4835 /* Check string instruction segment overrides. */
4836 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4837 {
4838 gas_assert (i.mem_operands);
4839 if (!check_string ())
4840 return;
4841 i.disp_operands = 0;
4842 }
4843
4844 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4845 optimize_encoding ();
4846
4847 if (!process_suffix ())
4848 return;
4849
4850 /* Update operand types. */
4851 for (j = 0; j < i.operands; j++)
4852 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4853
4854 /* Make still unresolved immediate matches conform to size of immediate
4855 given in i.suffix. */
4856 if (!finalize_imm ())
4857 return;
4858
4859 if (i.types[0].bitfield.imm1)
4860 i.imm_operands = 0; /* kludge for shift insns. */
4861
4862 /* We only need to check those implicit registers for instructions
4863 with 3 operands or less. */
4864 if (i.operands <= 3)
4865 for (j = 0; j < i.operands; j++)
4866 if (i.types[j].bitfield.instance != InstanceNone
4867 && !i.types[j].bitfield.xmmword)
4868 i.reg_operands--;
4869
4870 /* For insns with operands there are more diddles to do to the opcode. */
4871 if (i.operands)
4872 {
4873 if (!process_operands ())
4874 return;
4875 }
4876 else
4877 {
4878 if (i.tm.opcode_modifier.immext)
4879 process_immext ();
4880
4881 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4882 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4883 as_warn (_("translating to `%sp'"), i.tm.name);
4884 }
4885
4886 if (is_any_vex_encoding (&i.tm))
4887 {
4888 if (!cpu_arch_flags.bitfield.cpui286)
4889 {
4890 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4891 i.tm.name);
4892 return;
4893 }
4894
4895 /* Check for explicit REX prefix. */
4896 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4897 {
4898 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4899 return;
4900 }
4901
4902 if (i.tm.opcode_modifier.vex)
4903 build_vex_prefix (t);
4904 else
4905 build_evex_prefix ();
4906
4907 /* The individual REX.RXBW bits got consumed. */
4908 i.rex &= REX_OPCODE;
4909 }
4910
4911 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4912 instructions may define INT_OPCODE as well, so avoid this corner
4913 case for those instructions that use MODRM. */
4914 if (i.tm.base_opcode == INT_OPCODE
4915 && !i.tm.opcode_modifier.modrm
4916 && i.op[0].imms->X_add_number == 3)
4917 {
4918 i.tm.base_opcode = INT3_OPCODE;
4919 i.imm_operands = 0;
4920 }
4921
4922 if ((i.tm.opcode_modifier.jump == JUMP
4923 || i.tm.opcode_modifier.jump == JUMP_BYTE
4924 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4925 && i.op[0].disps->X_op == O_constant)
4926 {
4927 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4928 the absolute address given by the constant. Since ix86 jumps and
4929 calls are pc relative, we need to generate a reloc. */
4930 i.op[0].disps->X_add_symbol = &abs_symbol;
4931 i.op[0].disps->X_op = O_symbol;
4932 }
4933
4934 /* For 8 bit registers we need an empty rex prefix. Also if the
4935 instruction already has a prefix, we need to convert old
4936 registers to new ones. */
4937
4938 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4939 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4940 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4941 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4942 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4943 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4944 && i.rex != 0))
4945 {
4946 int x;
4947
4948 i.rex |= REX_OPCODE;
4949 for (x = 0; x < 2; x++)
4950 {
4951 /* Look for 8 bit operand that uses old registers. */
4952 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4953 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4954 {
4955 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4956 /* In case it is a "hi" register, give up. */
4957 if (i.op[x].regs->reg_num > 3)
4958 as_bad (_("can't encode register '%s%s' in an "
4959 "instruction requiring REX prefix."),
4960 register_prefix, i.op[x].regs->reg_name);
4961
4962 /* Otherwise it is equivalent to the extended register.
4963 Since the encoding doesn't change this is merely
4964 cosmetic cleanup for debug output. */
4965
4966 i.op[x].regs = i.op[x].regs + 8;
4967 }
4968 }
4969 }
4970
4971 if (i.rex == 0 && i.rex_encoding)
4972 {
4973 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4974 that uses legacy register. If it is "hi" register, don't add
4975 the REX_OPCODE byte. */
4976 int x;
4977 for (x = 0; x < 2; x++)
4978 if (i.types[x].bitfield.class == Reg
4979 && i.types[x].bitfield.byte
4980 && (i.op[x].regs->reg_flags & RegRex64) == 0
4981 && i.op[x].regs->reg_num > 3)
4982 {
4983 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4984 i.rex_encoding = FALSE;
4985 break;
4986 }
4987
4988 if (i.rex_encoding)
4989 i.rex = REX_OPCODE;
4990 }
4991
4992 if (i.rex != 0)
4993 add_prefix (REX_OPCODE | i.rex);
4994
4995 insert_lfence_before ();
4996
4997 /* We are ready to output the insn. */
4998 output_insn ();
4999
5000 insert_lfence_after ();
5001
5002 last_insn.seg = now_seg;
5003
5004 if (i.tm.opcode_modifier.isprefix)
5005 {
5006 last_insn.kind = last_insn_prefix;
5007 last_insn.name = i.tm.name;
5008 last_insn.file = as_where (&last_insn.line);
5009 }
5010 else
5011 last_insn.kind = last_insn_other;
5012 }
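
/* Rough pass order driven by md_assemble above: parse_insn,
   parse_operands, optimize_imm / optimize_disp, match_template, the
   prefix and operand checks, optional optimize_encoding,
   process_suffix, process_operands, VEX/EVEX prefix building, and
   finally output_insn bracketed by the lfence insertion hooks.  */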
5013
5014 static char *
5015 parse_insn (char *line, char *mnemonic)
5016 {
5017 char *l = line;
5018 char *token_start = l;
5019 char *mnem_p;
5020 int supported;
5021 const insn_template *t;
5022 char *dot_p = NULL;
5023
5024 while (1)
5025 {
5026 mnem_p = mnemonic;
5027 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5028 {
5029 if (*mnem_p == '.')
5030 dot_p = mnem_p;
5031 mnem_p++;
5032 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5033 {
5034 as_bad (_("no such instruction: `%s'"), token_start);
5035 return NULL;
5036 }
5037 l++;
5038 }
5039 if (!is_space_char (*l)
5040 && *l != END_OF_INSN
5041 && (intel_syntax
5042 || (*l != PREFIX_SEPARATOR
5043 && *l != ',')))
5044 {
5045 as_bad (_("invalid character %s in mnemonic"),
5046 output_invalid (*l));
5047 return NULL;
5048 }
5049 if (token_start == l)
5050 {
5051 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5052 as_bad (_("expecting prefix; got nothing"));
5053 else
5054 as_bad (_("expecting mnemonic; got nothing"));
5055 return NULL;
5056 }
5057
5058 /* Look up instruction (or prefix) via hash table. */
5059 current_templates = (const templates *) hash_find (op_hash, mnemonic);
5060
5061 if (*l != END_OF_INSN
5062 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5063 && current_templates
5064 && current_templates->start->opcode_modifier.isprefix)
5065 {
5066 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5067 {
5068 as_bad ((flag_code != CODE_64BIT
5069 ? _("`%s' is only supported in 64-bit mode")
5070 : _("`%s' is not supported in 64-bit mode")),
5071 current_templates->start->name);
5072 return NULL;
5073 }
5074 /* If we are in 16-bit mode, do not allow addr16 or data16.
5075 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5076 if ((current_templates->start->opcode_modifier.size == SIZE16
5077 || current_templates->start->opcode_modifier.size == SIZE32)
5078 && flag_code != CODE_64BIT
5079 && ((current_templates->start->opcode_modifier.size == SIZE32)
5080 ^ (flag_code == CODE_16BIT)))
5081 {
5082 as_bad (_("redundant %s prefix"),
5083 current_templates->start->name);
5084 return NULL;
5085 }
5086 if (current_templates->start->opcode_length == 0)
5087 {
5088 /* Handle pseudo prefixes. */
5089 switch (current_templates->start->base_opcode)
5090 {
5091 case 0x0:
5092 /* {disp8} */
5093 i.disp_encoding = disp_encoding_8bit;
5094 break;
5095 case 0x1:
5096 /* {disp32} */
5097 i.disp_encoding = disp_encoding_32bit;
5098 break;
5099 case 0x2:
5100 /* {load} */
5101 i.dir_encoding = dir_encoding_load;
5102 break;
5103 case 0x3:
5104 /* {store} */
5105 i.dir_encoding = dir_encoding_store;
5106 break;
5107 case 0x4:
5108 /* {vex} */
5109 i.vec_encoding = vex_encoding_vex;
5110 break;
5111 case 0x5:
5112 /* {vex3} */
5113 i.vec_encoding = vex_encoding_vex3;
5114 break;
5115 case 0x6:
5116 /* {evex} */
5117 i.vec_encoding = vex_encoding_evex;
5118 break;
5119 case 0x7:
5120 /* {rex} */
5121 i.rex_encoding = TRUE;
5122 break;
5123 case 0x8:
5124 /* {nooptimize} */
5125 i.no_optimize = TRUE;
5126 break;
5127 default:
5128 abort ();
5129 }
5130 }
5131 else
5132 {
5133 /* Add prefix, checking for repeated prefixes. */
5134 switch (add_prefix (current_templates->start->base_opcode))
5135 {
5136 case PREFIX_EXIST:
5137 return NULL;
5138 case PREFIX_DS:
5139 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5140 i.notrack_prefix = current_templates->start->name;
5141 break;
5142 case PREFIX_REP:
5143 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5144 i.hle_prefix = current_templates->start->name;
5145 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5146 i.bnd_prefix = current_templates->start->name;
5147 else
5148 i.rep_prefix = current_templates->start->name;
5149 break;
5150 default:
5151 break;
5152 }
5153 }
5154 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5155 token_start = ++l;
5156 }
5157 else
5158 break;
5159 }
5160
5161 if (!current_templates)
5162 {
5163 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5164 Check if we should swap operands or force a 32bit displacement in
5165 encoding. */
5166 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5167 i.dir_encoding = dir_encoding_swap;
5168 else if (mnem_p - 3 == dot_p
5169 && dot_p[1] == 'd'
5170 && dot_p[2] == '8')
5171 i.disp_encoding = disp_encoding_8bit;
5172 else if (mnem_p - 4 == dot_p
5173 && dot_p[1] == 'd'
5174 && dot_p[2] == '3'
5175 && dot_p[3] == '2')
5176 i.disp_encoding = disp_encoding_32bit;
5177 else
5178 goto check_suffix;
5179 mnem_p = dot_p;
5180 *dot_p = '\0';
5181 current_templates = (const templates *) hash_find (op_hash, mnemonic);
5182 }
5183
5184 if (!current_templates)
5185 {
5186 check_suffix:
5187 if (mnem_p > mnemonic)
5188 {
5189 /* See if we can get a match by trimming off a suffix. */
5190 switch (mnem_p[-1])
5191 {
5192 case WORD_MNEM_SUFFIX:
5193 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5194 i.suffix = SHORT_MNEM_SUFFIX;
5195 else
5196 /* Fall through. */
5197 case BYTE_MNEM_SUFFIX:
5198 case QWORD_MNEM_SUFFIX:
5199 i.suffix = mnem_p[-1];
5200 mnem_p[-1] = '\0';
5201 current_templates = (const templates *) hash_find (op_hash,
5202 mnemonic);
5203 break;
5204 case SHORT_MNEM_SUFFIX:
5205 case LONG_MNEM_SUFFIX:
5206 if (!intel_syntax)
5207 {
5208 i.suffix = mnem_p[-1];
5209 mnem_p[-1] = '\0';
5210 current_templates = (const templates *) hash_find (op_hash,
5211 mnemonic);
5212 }
5213 break;
5214
5215 /* Intel Syntax. */
5216 case 'd':
5217 if (intel_syntax)
5218 {
5219 if (intel_float_operand (mnemonic) == 1)
5220 i.suffix = SHORT_MNEM_SUFFIX;
5221 else
5222 i.suffix = LONG_MNEM_SUFFIX;
5223 mnem_p[-1] = '\0';
5224 current_templates = (const templates *) hash_find (op_hash,
5225 mnemonic);
5226 }
5227 break;
5228 }
5229 }
5230
5231 if (!current_templates)
5232 {
5233 as_bad (_("no such instruction: `%s'"), token_start);
5234 return NULL;
5235 }
5236 }
5237
5238 if (current_templates->start->opcode_modifier.jump == JUMP
5239 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5240 {
5241 /* Check for a branch hint. We allow ",pt" and ",pn" for
5242 predict taken and predict not taken respectively.
5243 I'm not sure that branch hints actually do anything on loop
5244 and jcxz insns (JumpByte) for current Pentium4 chips. They
5245 may work in the future and it doesn't hurt to accept them
5246 now. */
5247 if (l[0] == ',' && l[1] == 'p')
5248 {
5249 if (l[2] == 't')
5250 {
5251 if (!add_prefix (DS_PREFIX_OPCODE))
5252 return NULL;
5253 l += 3;
5254 }
5255 else if (l[2] == 'n')
5256 {
5257 if (!add_prefix (CS_PREFIX_OPCODE))
5258 return NULL;
5259 l += 3;
5260 }
5261 }
5262 }
5263 /* Any other comma loses. */
5264 if (*l == ',')
5265 {
5266 as_bad (_("invalid character %s in mnemonic"),
5267 output_invalid (*l));
5268 return NULL;
5269 }
5270
5271 /* Check if instruction is supported on specified architecture. */
5272 supported = 0;
5273 for (t = current_templates->start; t < current_templates->end; ++t)
5274 {
5275 supported |= cpu_flags_match (t);
5276 if (supported == CPU_FLAGS_PERFECT_MATCH)
5277 {
5278 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5279 as_warn (_("use .code16 to ensure correct addressing mode"));
5280
5281 return l;
5282 }
5283 }
5284
5285 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5286 as_bad (flag_code == CODE_64BIT
5287 ? _("`%s' is not supported in 64-bit mode")
5288 : _("`%s' is only supported in 64-bit mode"),
5289 current_templates->start->name);
5290 else
5291 as_bad (_("`%s' is not supported on `%s%s'"),
5292 current_templates->start->name,
5293 cpu_arch_name ? cpu_arch_name : default_arch,
5294 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5295
5296 return NULL;
5297 }
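
/* Illustrative inputs handled by parse_insn:
     rep movsb          `rep' matched as a prefix template
     {vex} vpaddd ...   pseudo prefix, sets i.vec_encoding
     addl $1, %eax      `add' found after trimming the `l' suffix
     jz,pt target       branch hint, adds the DS segment prefix  */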
5298
5299 static char *
5300 parse_operands (char *l, const char *mnemonic)
5301 {
5302 char *token_start;
5303
5304 /* 1 if operand is pending after ','. */
5305 unsigned int expecting_operand = 0;
5306
5307 /* Non-zero if operand parens not balanced. */
5308 unsigned int paren_not_balanced;
5309
5310 while (*l != END_OF_INSN)
5311 {
5312 /* Skip optional white space before operand. */
5313 if (is_space_char (*l))
5314 ++l;
5315 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5316 {
5317 as_bad (_("invalid character %s before operand %d"),
5318 output_invalid (*l),
5319 i.operands + 1);
5320 return NULL;
5321 }
5322 token_start = l; /* After white space. */
5323 paren_not_balanced = 0;
5324 while (paren_not_balanced || *l != ',')
5325 {
5326 if (*l == END_OF_INSN)
5327 {
5328 if (paren_not_balanced)
5329 {
5330 if (!intel_syntax)
5331 as_bad (_("unbalanced parenthesis in operand %d."),
5332 i.operands + 1);
5333 else
5334 as_bad (_("unbalanced brackets in operand %d."),
5335 i.operands + 1);
5336 return NULL;
5337 }
5338 else
5339 break; /* we are done */
5340 }
5341 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5342 {
5343 as_bad (_("invalid character %s in operand %d"),
5344 output_invalid (*l),
5345 i.operands + 1);
5346 return NULL;
5347 }
5348 if (!intel_syntax)
5349 {
5350 if (*l == '(')
5351 ++paren_not_balanced;
5352 if (*l == ')')
5353 --paren_not_balanced;
5354 }
5355 else
5356 {
5357 if (*l == '[')
5358 ++paren_not_balanced;
5359 if (*l == ']')
5360 --paren_not_balanced;
5361 }
5362 l++;
5363 }
5364 if (l != token_start)
5365 { /* Yes, we've read in another operand. */
5366 unsigned int operand_ok;
5367 this_operand = i.operands++;
5368 if (i.operands > MAX_OPERANDS)
5369 {
5370 as_bad (_("spurious operands; (%d operands/instruction max)"),
5371 MAX_OPERANDS);
5372 return NULL;
5373 }
5374 i.types[this_operand].bitfield.unspecified = 1;
5375 /* Now parse operand adding info to 'i' as we go along. */
5376 END_STRING_AND_SAVE (l);
5377
5378 if (i.mem_operands > 1)
5379 {
5380 as_bad (_("too many memory references for `%s'"),
5381 mnemonic);
5382 return 0;
5383 }
5384
5385 if (intel_syntax)
5386 operand_ok =
5387 i386_intel_operand (token_start,
5388 intel_float_operand (mnemonic));
5389 else
5390 operand_ok = i386_att_operand (token_start);
5391
5392 RESTORE_END_STRING (l);
5393 if (!operand_ok)
5394 return NULL;
5395 }
5396 else
5397 {
5398 if (expecting_operand)
5399 {
5400 expecting_operand_after_comma:
5401 as_bad (_("expecting operand after ','; got nothing"));
5402 return NULL;
5403 }
5404 if (*l == ',')
5405 {
5406 as_bad (_("expecting operand before ','; got nothing"));
5407 return NULL;
5408 }
5409 }
5410
5411 /* Now *l must be either ',' or END_OF_INSN. */
5412 if (*l == ',')
5413 {
5414 if (*++l == END_OF_INSN)
5415 {
5416 /* Just skip it; if it's \n, complain. */
5417 goto expecting_operand_after_comma;
5418 }
5419 expecting_operand = 1;
5420 }
5421 }
5422 return l;
5423 }
5424
5425 static void
5426 swap_2_operands (int xchg1, int xchg2)
5427 {
5428 union i386_op temp_op;
5429 i386_operand_type temp_type;
5430 unsigned int temp_flags;
5431 enum bfd_reloc_code_real temp_reloc;
5432
5433 temp_type = i.types[xchg2];
5434 i.types[xchg2] = i.types[xchg1];
5435 i.types[xchg1] = temp_type;
5436
5437 temp_flags = i.flags[xchg2];
5438 i.flags[xchg2] = i.flags[xchg1];
5439 i.flags[xchg1] = temp_flags;
5440
5441 temp_op = i.op[xchg2];
5442 i.op[xchg2] = i.op[xchg1];
5443 i.op[xchg1] = temp_op;
5444
5445 temp_reloc = i.reloc[xchg2];
5446 i.reloc[xchg2] = i.reloc[xchg1];
5447 i.reloc[xchg1] = temp_reloc;
5448
5449 if (i.mask)
5450 {
5451 if (i.mask->operand == xchg1)
5452 i.mask->operand = xchg2;
5453 else if (i.mask->operand == xchg2)
5454 i.mask->operand = xchg1;
5455 }
5456 if (i.broadcast)
5457 {
5458 if (i.broadcast->operand == xchg1)
5459 i.broadcast->operand = xchg2;
5460 else if (i.broadcast->operand == xchg2)
5461 i.broadcast->operand = xchg1;
5462 }
5463 if (i.rounding)
5464 {
5465 if (i.rounding->operand == xchg1)
5466 i.rounding->operand = xchg2;
5467 else if (i.rounding->operand == xchg2)
5468 i.rounding->operand = xchg1;
5469 }
5470 }
5471
5472 static void
5473 swap_operands (void)
5474 {
5475 switch (i.operands)
5476 {
5477 case 5:
5478 case 4:
5479 swap_2_operands (1, i.operands - 2);
5480 /* Fall through. */
5481 case 3:
5482 case 2:
5483 swap_2_operands (0, i.operands - 1);
5484 break;
5485 default:
5486 abort ();
5487 }
5488
5489 if (i.mem_operands == 2)
5490 {
5491 const seg_entry *temp_seg;
5492 temp_seg = i.seg[0];
5493 i.seg[0] = i.seg[1];
5494 i.seg[1] = temp_seg;
5495 }
5496 }
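
/* E.g. in Intel mode "add eax, ebx" is parsed destination-first and
   then swapped here, so internally operand 0 is the %ebx source and
   operand 1 the %eax destination, the same order AT&T
   "addl %ebx, %eax" yields directly (illustrative).  */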
5497
5498 /* Try to ensure constant immediates are represented in the smallest
5499 opcode possible. */
5500 static void
5501 optimize_imm (void)
5502 {
5503 char guess_suffix = 0;
5504 int op;
5505
5506 if (i.suffix)
5507 guess_suffix = i.suffix;
5508 else if (i.reg_operands)
5509 {
5510 /* Figure out a suffix from the last register operand specified.
5511 We can't do this properly yet, i.e. excluding special register
5512 instances, but the following works for instructions with
5513 immediates. In any case, we can't set i.suffix yet. */
5514 for (op = i.operands; --op >= 0;)
5515 if (i.types[op].bitfield.class != Reg)
5516 continue;
5517 else if (i.types[op].bitfield.byte)
5518 {
5519 guess_suffix = BYTE_MNEM_SUFFIX;
5520 break;
5521 }
5522 else if (i.types[op].bitfield.word)
5523 {
5524 guess_suffix = WORD_MNEM_SUFFIX;
5525 break;
5526 }
5527 else if (i.types[op].bitfield.dword)
5528 {
5529 guess_suffix = LONG_MNEM_SUFFIX;
5530 break;
5531 }
5532 else if (i.types[op].bitfield.qword)
5533 {
5534 guess_suffix = QWORD_MNEM_SUFFIX;
5535 break;
5536 }
5537 }
5538 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5539 guess_suffix = WORD_MNEM_SUFFIX;
5540
5541 for (op = i.operands; --op >= 0;)
5542 if (operand_type_check (i.types[op], imm))
5543 {
5544 switch (i.op[op].imms->X_op)
5545 {
5546 case O_constant:
5547 /* If a suffix is given, this operand may be shortened. */
5548 switch (guess_suffix)
5549 {
5550 case LONG_MNEM_SUFFIX:
5551 i.types[op].bitfield.imm32 = 1;
5552 i.types[op].bitfield.imm64 = 1;
5553 break;
5554 case WORD_MNEM_SUFFIX:
5555 i.types[op].bitfield.imm16 = 1;
5556 i.types[op].bitfield.imm32 = 1;
5557 i.types[op].bitfield.imm32s = 1;
5558 i.types[op].bitfield.imm64 = 1;
5559 break;
5560 case BYTE_MNEM_SUFFIX:
5561 i.types[op].bitfield.imm8 = 1;
5562 i.types[op].bitfield.imm8s = 1;
5563 i.types[op].bitfield.imm16 = 1;
5564 i.types[op].bitfield.imm32 = 1;
5565 i.types[op].bitfield.imm32s = 1;
5566 i.types[op].bitfield.imm64 = 1;
5567 break;
5568 }
5569
5570 /* If this operand is at most 16 bits, convert it
5571 to a signed 16 bit number before trying to see
5572 whether it will fit in an even smaller size.
5573 This allows a 16-bit operand such as $0xffe0 to
5574 be recognised as within Imm8S range. */
5575 if ((i.types[op].bitfield.imm16)
5576 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5577 {
5578 i.op[op].imms->X_add_number =
5579 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5580 }
5581 #ifdef BFD64
5582 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5583 if ((i.types[op].bitfield.imm32)
5584 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5585 == 0))
5586 {
5587 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5588 ^ ((offsetT) 1 << 31))
5589 - ((offsetT) 1 << 31));
5590 }
5591 #endif
5592 i.types[op]
5593 = operand_type_or (i.types[op],
5594 smallest_imm_type (i.op[op].imms->X_add_number));
5595
5596 /* We must avoid matching of Imm32 templates when 64bit
5597 only immediate is available. */
5598 if (guess_suffix == QWORD_MNEM_SUFFIX)
5599 i.types[op].bitfield.imm32 = 0;
5600 break;
5601
5602 case O_absent:
5603 case O_register:
5604 abort ();
5605
5606 /* Symbols and expressions. */
5607 default:
5608 /* Convert symbolic operand to proper sizes for matching, but don't
5609 prevent matching a set of insns that only supports sizes other
5610 than those matching the insn suffix. */
5611 {
5612 i386_operand_type mask, allowed;
5613 const insn_template *t;
5614
5615 operand_type_set (&mask, 0);
5616 operand_type_set (&allowed, 0);
5617
5618 for (t = current_templates->start;
5619 t < current_templates->end;
5620 ++t)
5621 {
5622 allowed = operand_type_or (allowed, t->operand_types[op]);
5623 allowed = operand_type_and (allowed, anyimm);
5624 }
5625 switch (guess_suffix)
5626 {
5627 case QWORD_MNEM_SUFFIX:
5628 mask.bitfield.imm64 = 1;
5629 mask.bitfield.imm32s = 1;
5630 break;
5631 case LONG_MNEM_SUFFIX:
5632 mask.bitfield.imm32 = 1;
5633 break;
5634 case WORD_MNEM_SUFFIX:
5635 mask.bitfield.imm16 = 1;
5636 break;
5637 case BYTE_MNEM_SUFFIX:
5638 mask.bitfield.imm8 = 1;
5639 break;
5640 default:
5641 break;
5642 }
5643 allowed = operand_type_and (mask, allowed);
5644 if (!operand_type_all_zero (&allowed))
5645 i.types[op] = operand_type_and (i.types[op], mask);
5646 }
5647 break;
5648 }
5649 }
5650 }
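
/* Worked example for the 16-bit sign conversion above (sketch, 32-
   or 64-bit code): in "addw $0xffe0, %bx" the immediate becomes the
   signed value -0x20, which also fits Imm8S, so the 4-byte form
   66 83 c3 e0 can be chosen over the 5-byte 66 81 c3 e0 ff.  */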
5651
5652 /* Try to use the smallest displacement type too. */
5653 static void
5654 optimize_disp (void)
5655 {
5656 int op;
5657
5658 for (op = i.operands; --op >= 0;)
5659 if (operand_type_check (i.types[op], disp))
5660 {
5661 if (i.op[op].disps->X_op == O_constant)
5662 {
5663 offsetT op_disp = i.op[op].disps->X_add_number;
5664
5665 if (i.types[op].bitfield.disp16
5666 && (op_disp & ~(offsetT) 0xffff) == 0)
5667 {
5668 /* If this operand is at most 16 bits, convert
5669 to a signed 16 bit number and don't use 64bit
5670 displacement. */
5671 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5672 i.types[op].bitfield.disp64 = 0;
5673 }
5674 #ifdef BFD64
5675 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5676 if (i.types[op].bitfield.disp32
5677 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5678 {
5679 /* If this operand is at most 32 bits, convert
5680 to a signed 32 bit number and don't use 64bit
5681 displacement. */
5682 op_disp &= (((offsetT) 2 << 31) - 1);
5683 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5684 i.types[op].bitfield.disp64 = 0;
5685 }
5686 #endif
5687 if (!op_disp && i.types[op].bitfield.baseindex)
5688 {
5689 i.types[op].bitfield.disp8 = 0;
5690 i.types[op].bitfield.disp16 = 0;
5691 i.types[op].bitfield.disp32 = 0;
5692 i.types[op].bitfield.disp32s = 0;
5693 i.types[op].bitfield.disp64 = 0;
5694 i.op[op].disps = 0;
5695 i.disp_operands--;
5696 }
5697 else if (flag_code == CODE_64BIT)
5698 {
5699 if (fits_in_signed_long (op_disp))
5700 {
5701 i.types[op].bitfield.disp64 = 0;
5702 i.types[op].bitfield.disp32s = 1;
5703 }
5704 if (i.prefix[ADDR_PREFIX]
5705 && fits_in_unsigned_long (op_disp))
5706 i.types[op].bitfield.disp32 = 1;
5707 }
5708 if ((i.types[op].bitfield.disp32
5709 || i.types[op].bitfield.disp32s
5710 || i.types[op].bitfield.disp16)
5711 && fits_in_disp8 (op_disp))
5712 i.types[op].bitfield.disp8 = 1;
5713 }
5714 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5715 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5716 {
5717 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5718 i.op[op].disps, 0, i.reloc[op]);
5719 i.types[op].bitfield.disp8 = 0;
5720 i.types[op].bitfield.disp16 = 0;
5721 i.types[op].bitfield.disp32 = 0;
5722 i.types[op].bitfield.disp32s = 0;
5723 i.types[op].bitfield.disp64 = 0;
5724 }
5725 else
5726 /* We only support 64bit displacement on constants. */
5727 i.types[op].bitfield.disp64 = 0;
5728 }
5729 }
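
/* E.g. for "movl 4(%rax), %ebx" the constant displacement passes
   fits_in_disp8, so disp8 is set and the insn can be emitted as
   8b 58 04 instead of using a 4-byte displacement (illustrative).  */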
5730
5731 /* Return 1 if there is a match in broadcast bytes between operand
5732 GIVEN and instruction template T. */
5733
5734 static INLINE int
5735 match_broadcast_size (const insn_template *t, unsigned int given)
5736 {
5737 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5738 && i.types[given].bitfield.byte)
5739 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5740 && i.types[given].bitfield.word)
5741 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5742 && i.types[given].bitfield.dword)
5743 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5744 && i.types[given].bitfield.qword));
5745 }
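
/* E.g. a DWORD_BROADCAST template matches the dword memory operand in
   "vaddps (%rax){1to16}, %zmm1, %zmm2", where one dword is replicated
   across all sixteen elements (illustrative).  */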
5746
5747 /* Check if operands are valid for the instruction. */
5748
5749 static int
5750 check_VecOperands (const insn_template *t)
5751 {
5752 unsigned int op;
5753 i386_cpu_flags cpu;
5754
5755 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5756 any one operand implicitly require AVX512VL support if the actual
5757 operand size is YMMword or XMMword. Since this function runs after
5758 template matching, there's no need to check for YMMword/XMMword in
5759 the template. */
5760 cpu = cpu_flags_and (t->cpu_flags, avx512);
5761 if (!cpu_flags_all_zero (&cpu)
5762 && !t->cpu_flags.bitfield.cpuavx512vl
5763 && !cpu_arch_flags.bitfield.cpuavx512vl)
5764 {
5765 for (op = 0; op < t->operands; ++op)
5766 {
5767 if (t->operand_types[op].bitfield.zmmword
5768 && (i.types[op].bitfield.ymmword
5769 || i.types[op].bitfield.xmmword))
5770 {
5771 i.error = unsupported;
5772 return 1;
5773 }
5774 }
5775 }
5776
5777 /* Without VSIB byte, we can't have a vector register for index. */
5778 if (!t->opcode_modifier.sib
5779 && i.index_reg
5780 && (i.index_reg->reg_type.bitfield.xmmword
5781 || i.index_reg->reg_type.bitfield.ymmword
5782 || i.index_reg->reg_type.bitfield.zmmword))
5783 {
5784 i.error = unsupported_vector_index_register;
5785 return 1;
5786 }
5787
5788 /* Check if default mask is allowed. */
5789 if (t->opcode_modifier.nodefmask
5790 && (!i.mask || i.mask->mask->reg_num == 0))
5791 {
5792 i.error = no_default_mask;
5793 return 1;
5794 }
5795
5796 /* For VSIB byte, we need a vector register for index, and all vector
5797 registers must be distinct. */
5798 if (t->opcode_modifier.sib)
5799 {
5800 if (!i.index_reg
5801 || !((t->opcode_modifier.sib == VECSIB128
5802 && i.index_reg->reg_type.bitfield.xmmword)
5803 || (t->opcode_modifier.sib == VECSIB256
5804 && i.index_reg->reg_type.bitfield.ymmword)
5805 || (t->opcode_modifier.sib == VECSIB512
5806 && i.index_reg->reg_type.bitfield.zmmword)))
5807 {
5808 i.error = invalid_vsib_address;
5809 return 1;
5810 }
5811
5812 gas_assert (i.reg_operands == 2 || i.mask);
5813 if (i.reg_operands == 2 && !i.mask)
5814 {
5815 gas_assert (i.types[0].bitfield.class == RegSIMD);
5816 gas_assert (i.types[0].bitfield.xmmword
5817 || i.types[0].bitfield.ymmword);
5818 gas_assert (i.types[2].bitfield.class == RegSIMD);
5819 gas_assert (i.types[2].bitfield.xmmword
5820 || i.types[2].bitfield.ymmword);
5821 if (operand_check == check_none)
5822 return 0;
5823 if (register_number (i.op[0].regs)
5824 != register_number (i.index_reg)
5825 && register_number (i.op[2].regs)
5826 != register_number (i.index_reg)
5827 && register_number (i.op[0].regs)
5828 != register_number (i.op[2].regs))
5829 return 0;
5830 if (operand_check == check_error)
5831 {
5832 i.error = invalid_vector_register_set;
5833 return 1;
5834 }
5835 as_warn (_("mask, index, and destination registers should be distinct"));
5836 }
5837 else if (i.reg_operands == 1 && i.mask)
5838 {
5839 if (i.types[1].bitfield.class == RegSIMD
5840 && (i.types[1].bitfield.xmmword
5841 || i.types[1].bitfield.ymmword
5842 || i.types[1].bitfield.zmmword)
5843 && (register_number (i.op[1].regs)
5844 == register_number (i.index_reg)))
5845 {
5846 if (operand_check == check_error)
5847 {
5848 i.error = invalid_vector_register_set;
5849 return 1;
5850 }
5851 if (operand_check != check_none)
5852 as_warn (_("index and destination registers should be distinct"));
5853 }
5854 }
5855 }
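/* Illustration (example ours): in `vgatherdps %xmm1, (%rax,%xmm1,4),
%xmm2' the mask register equals the index register, so the checks
above warn or error depending on the operand-check setting. */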
5856
5857 /* Check if broadcast is supported by the instruction and is applied
5858 to the memory operand. */
5859 if (i.broadcast)
5860 {
5861 i386_operand_type type, overlap;
5862
5863 /* Check if specified broadcast is supported in this instruction,
5864 and its broadcast bytes match the memory operand. */
5865 op = i.broadcast->operand;
5866 if (!t->opcode_modifier.broadcast
5867 || !(i.flags[op] & Operand_Mem)
5868 || (!i.types[op].bitfield.unspecified
5869 && !match_broadcast_size (t, op)))
5870 {
5871 bad_broadcast:
5872 i.error = unsupported_broadcast;
5873 return 1;
5874 }
5875
5876 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5877 * i.broadcast->type);
5878 operand_type_set (&type, 0);
5879 switch (i.broadcast->bytes)
5880 {
5881 case 2:
5882 type.bitfield.word = 1;
5883 break;
5884 case 4:
5885 type.bitfield.dword = 1;
5886 break;
5887 case 8:
5888 type.bitfield.qword = 1;
5889 break;
5890 case 16:
5891 type.bitfield.xmmword = 1;
5892 break;
5893 case 32:
5894 type.bitfield.ymmword = 1;
5895 break;
5896 case 64:
5897 type.bitfield.zmmword = 1;
5898 break;
5899 default:
5900 goto bad_broadcast;
5901 }
5902
5903 overlap = operand_type_and (type, t->operand_types[op]);
5904 if (t->operand_types[op].bitfield.class == RegSIMD
5905 && t->operand_types[op].bitfield.byte
5906 + t->operand_types[op].bitfield.word
5907 + t->operand_types[op].bitfield.dword
5908 + t->operand_types[op].bitfield.qword > 1)
5909 {
5910 overlap.bitfield.xmmword = 0;
5911 overlap.bitfield.ymmword = 0;
5912 overlap.bitfield.zmmword = 0;
5913 }
5914 if (operand_type_all_zero (&overlap))
5915 goto bad_broadcast;
5916
5917 if (t->opcode_modifier.checkregsize)
5918 {
5919 unsigned int j;
5920
5921 type.bitfield.baseindex = 1;
5922 for (j = 0; j < i.operands; ++j)
5923 {
5924 if (j != op
5925 && !operand_type_register_match(i.types[j],
5926 t->operand_types[j],
5927 type,
5928 t->operand_types[op]))
5929 goto bad_broadcast;
5930 }
5931 }
5932 }
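/* Worked example: `vaddps (%rax){1to16}, %zmm1, %zmm2' broadcasts a
dword element, so i.broadcast->bytes is 4 * 16 == 64 and the type
computed above is ZMMword. */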
5933 /* If broadcast is supported in this instruction, we need to check that
5934 an operand of one-element size isn't specified without broadcast. */
5935 else if (t->opcode_modifier.broadcast && i.mem_operands)
5936 {
5937 /* Find memory operand. */
5938 for (op = 0; op < i.operands; op++)
5939 if (i.flags[op] & Operand_Mem)
5940 break;
5941 gas_assert (op < i.operands);
5942 /* Check size of the memory operand. */
5943 if (match_broadcast_size (t, op))
5944 {
5945 i.error = broadcast_needed;
5946 return 1;
5947 }
5948 }
5949 else
5950 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5951
5952 /* Check if requested masking is supported. */
5953 if (i.mask)
5954 {
5955 switch (t->opcode_modifier.masking)
5956 {
5957 case BOTH_MASKING:
5958 break;
5959 case MERGING_MASKING:
5960 if (i.mask->zeroing)
5961 {
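/* N.B.: the `case 0' label below deliberately jumps into this block,
so templates supporting no masking at all share this error path. */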
5962 case 0:
5963 i.error = unsupported_masking;
5964 return 1;
5965 }
5966 break;
5967 case DYNAMIC_MASKING:
5968 /* Memory destinations allow only merging masking. */
5969 if (i.mask->zeroing && i.mem_operands)
5970 {
5971 /* Find memory operand. */
5972 for (op = 0; op < i.operands; op++)
5973 if (i.flags[op] & Operand_Mem)
5974 break;
5975 gas_assert (op < i.operands);
5976 if (op == i.operands - 1)
5977 {
5978 i.error = unsupported_masking;
5979 return 1;
5980 }
5981 }
5982 break;
5983 default:
5984 abort ();
5985 }
5986 }
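/* Illustration (example ours): `vmovdqu32 %zmm0, (%rax){%k1}{z}' is
rejected by the DYNAMIC_MASKING case above, since a memory destination
permits only merging masking. */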
5987
5988 /* Check if masking is applied to dest operand. */
5989 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5990 {
5991 i.error = mask_not_on_destination;
5992 return 1;
5993 }
5994
5995 /* Check RC/SAE. */
5996 if (i.rounding)
5997 {
5998 if (!t->opcode_modifier.sae
5999 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6000 {
6001 i.error = unsupported_rc_sae;
6002 return 1;
6003 }
6004 /* If the instruction has several immediate operands and one of
6005 them is the rounding operand, it must be the last
6006 immediate operand. */
6007 if (i.imm_operands > 1
6008 && i.rounding->operand != (int) (i.imm_operands - 1))
6009 {
6010 i.error = rc_sae_operand_not_last_imm;
6011 return 1;
6012 }
6013 }
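/* In AT&T syntax the RC/SAE operand comes first, e.g.
`vaddps {rn-sae}, %zmm1, %zmm2, %zmm3'; templates with SAE but without
StaticRounding accept only the plain `{sae}' form. */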
6014
6015 /* Check the special Imm4 cases; the immediate must be the first operand. */
6016 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6017 {
6018 if (i.op[0].imms->X_op != O_constant
6019 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6020 {
6021 i.error = bad_imm4;
6022 return 1;
6023 }
6024
6025 /* Turn off Imm<N> so that update_imm won't complain. */
6026 operand_type_set (&i.types[0], 0);
6027 }
6028
6029 /* Check vector Disp8 operand. */
6030 if (t->opcode_modifier.disp8memshift
6031 && i.disp_encoding != disp_encoding_32bit)
6032 {
6033 if (i.broadcast)
6034 i.memshift = t->opcode_modifier.broadcast - 1;
6035 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6036 i.memshift = t->opcode_modifier.disp8memshift;
6037 else
6038 {
6039 const i386_operand_type *type = NULL;
6040
6041 i.memshift = 0;
6042 for (op = 0; op < i.operands; op++)
6043 if (i.flags[op] & Operand_Mem)
6044 {
6045 if (t->opcode_modifier.evex == EVEXLIG)
6046 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6047 else if (t->operand_types[op].bitfield.xmmword
6048 + t->operand_types[op].bitfield.ymmword
6049 + t->operand_types[op].bitfield.zmmword <= 1)
6050 type = &t->operand_types[op];
6051 else if (!i.types[op].bitfield.unspecified)
6052 type = &i.types[op];
6053 }
6054 else if (i.types[op].bitfield.class == RegSIMD
6055 && t->opcode_modifier.evex != EVEXLIG)
6056 {
6057 if (i.types[op].bitfield.zmmword)
6058 i.memshift = 6;
6059 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6060 i.memshift = 5;
6061 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6062 i.memshift = 4;
6063 }
6064
6065 if (type)
6066 {
6067 if (type->bitfield.zmmword)
6068 i.memshift = 6;
6069 else if (type->bitfield.ymmword)
6070 i.memshift = 5;
6071 else if (type->bitfield.xmmword)
6072 i.memshift = 4;
6073 }
6074
6075 /* For the check in fits_in_disp8(). */
6076 if (i.memshift == 0)
6077 i.memshift = -1;
6078 }
6079
6080 for (op = 0; op < i.operands; op++)
6081 if (operand_type_check (i.types[op], disp)
6082 && i.op[op].disps->X_op == O_constant)
6083 {
6084 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6085 {
6086 i.types[op].bitfield.disp8 = 1;
6087 return 0;
6088 }
6089 i.types[op].bitfield.disp8 = 0;
6090 }
6091 }
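/* The EVEX compressed displacement divides the byte displacement by
2**memshift; e.g. a 128-byte displacement on a ZMMword access
(memshift == 6) is emitted as disp8 == 2. */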
6092
6093 i.memshift = 0;
6094
6095 return 0;
6096 }
6097
6098 /* Check if encoding requirements are met by the instruction. */
6099
6100 static int
6101 VEX_check_encoding (const insn_template *t)
6102 {
6103 if (i.vec_encoding == vex_encoding_error)
6104 {
6105 i.error = unsupported;
6106 return 1;
6107 }
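/* i.vec_encoding is set from the {vex}/{vex3}/{evex} pseudo prefixes;
e.g. `{evex} vaddpd %xmm1, %xmm2, %xmm3' fails the VEX-only AVX
template below, steering template matching to the AVX512VL one. */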
6108
6109 if (i.vec_encoding == vex_encoding_evex)
6110 {
6111 /* This instruction must be encoded with EVEX prefix. */
6112 if (!is_evex_encoding (t))
6113 {
6114 i.error = unsupported;
6115 return 1;
6116 }
6117 return 0;
6118 }
6119
6120 if (!t->opcode_modifier.vex)
6121 {
6122 /* This instruction template doesn't have VEX prefix. */
6123 if (i.vec_encoding != vex_encoding_default)
6124 {
6125 i.error = unsupported;
6126 return 1;
6127 }
6128 return 0;
6129 }
6130
6131 return 0;
6132 }
6133
6134 static const insn_template *
6135 match_template (char mnem_suffix)
6136 {
6137 /* Points to template once we've found it. */
6138 const insn_template *t;
6139 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6140 i386_operand_type overlap4;
6141 unsigned int found_reverse_match;
6142 i386_opcode_modifier suffix_check;
6143 i386_operand_type operand_types [MAX_OPERANDS];
6144 int addr_prefix_disp;
6145 unsigned int j, size_match, check_register;
6146 enum i386_error specific_error = 0;
6147
6148 #if MAX_OPERANDS != 5
6149 # error "MAX_OPERANDS must be 5."
6150 #endif
6151
6152 found_reverse_match = 0;
6153 addr_prefix_disp = -1;
6154
6155 /* Prepare for mnemonic suffix check. */
6156 memset (&suffix_check, 0, sizeof (suffix_check));
6157 switch (mnem_suffix)
6158 {
6159 case BYTE_MNEM_SUFFIX:
6160 suffix_check.no_bsuf = 1;
6161 break;
6162 case WORD_MNEM_SUFFIX:
6163 suffix_check.no_wsuf = 1;
6164 break;
6165 case SHORT_MNEM_SUFFIX:
6166 suffix_check.no_ssuf = 1;
6167 break;
6168 case LONG_MNEM_SUFFIX:
6169 suffix_check.no_lsuf = 1;
6170 break;
6171 case QWORD_MNEM_SUFFIX:
6172 suffix_check.no_qsuf = 1;
6173 break;
6174 default:
6175 /* NB: In Intel syntax, normally we can check for memory operand
6176 size when there is no mnemonic suffix. But jmp and call have
6177 2 different encodings with Dword memory operand size, one with
6178 No_ldSuf and the other without. i.suffix is set to
6179 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6180 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6181 suffix_check.no_ldsuf = 1;
6182 }
6183
6184 /* Must have right number of operands. */
6185 i.error = number_of_operands_mismatch;
6186
6187 for (t = current_templates->start; t < current_templates->end; t++)
6188 {
6189 addr_prefix_disp = -1;
6190 found_reverse_match = 0;
6191
6192 if (i.operands != t->operands)
6193 continue;
6194
6195 /* Check processor support. */
6196 i.error = unsupported;
6197 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6198 continue;
6199
6200 /* Check AT&T mnemonic. */
6201 i.error = unsupported_with_intel_mnemonic;
6202 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6203 continue;
6204
6205 /* Check AT&T/Intel syntax. */
6206 i.error = unsupported_syntax;
6207 if ((intel_syntax && t->opcode_modifier.attsyntax)
6208 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6209 continue;
6210
6211 /* Check Intel64/AMD64 ISA. */
6212 switch (isa64)
6213 {
6214 default:
6215 /* Default: Don't accept Intel64. */
6216 if (t->opcode_modifier.isa64 == INTEL64)
6217 continue;
6218 break;
6219 case amd64:
6220 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6221 if (t->opcode_modifier.isa64 >= INTEL64)
6222 continue;
6223 break;
6224 case intel64:
6225 /* -mintel64: Don't accept AMD64. */
6226 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6227 continue;
6228 break;
6229 }
6230
6231 /* Check the suffix. */
6232 i.error = invalid_instruction_suffix;
6233 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6234 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6235 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6236 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6237 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6238 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6239 continue;
6240
6241 size_match = operand_size_match (t);
6242 if (!size_match)
6243 continue;
6244
6245 /* This is intentionally not
6246
6247 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6248
6249 as the case of a missing * on the operand is accepted (perhaps with
6250 a warning, issued further down). */
6251 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6252 {
6253 i.error = operand_type_mismatch;
6254 continue;
6255 }
6256
6257 for (j = 0; j < MAX_OPERANDS; j++)
6258 operand_types[j] = t->operand_types[j];
6259
6260 /* In general, don't allow
6261 - 64-bit operands outside of 64-bit mode,
6262 - 32-bit operands on pre-386. */
6263 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6264 if (((i.suffix == QWORD_MNEM_SUFFIX
6265 && flag_code != CODE_64BIT
6266 && (t->base_opcode != 0x0fc7
6267 || t->extension_opcode != 1 /* cmpxchg8b */))
6268 || (i.suffix == LONG_MNEM_SUFFIX
6269 && !cpu_arch_flags.bitfield.cpui386))
6270 && (intel_syntax
6271 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6272 && !intel_float_operand (t->name))
6273 : intel_float_operand (t->name) != 2)
6274 && (t->operands == i.imm_operands
6275 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6276 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6277 && operand_types[i.imm_operands].bitfield.class != RegMask)
6278 || (operand_types[j].bitfield.class != RegMMX
6279 && operand_types[j].bitfield.class != RegSIMD
6280 && operand_types[j].bitfield.class != RegMask))
6281 && !t->opcode_modifier.sib)
6282 continue;
6283
6284 /* Do not verify operands when there are none. */
6285 if (!t->operands)
6286 {
6287 if (VEX_check_encoding (t))
6288 {
6289 specific_error = i.error;
6290 continue;
6291 }
6292
6293 /* We've found a match; break out of loop. */
6294 break;
6295 }
6296
6297 if (!t->opcode_modifier.jump
6298 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6299 {
6300 /* There should be only one Disp operand. */
6301 for (j = 0; j < MAX_OPERANDS; j++)
6302 if (operand_type_check (operand_types[j], disp))
6303 break;
6304 if (j < MAX_OPERANDS)
6305 {
6306 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6307
6308 addr_prefix_disp = j;
6309
6310 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6311 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6312 switch (flag_code)
6313 {
6314 case CODE_16BIT:
6315 override = !override;
6316 /* Fall through. */
6317 case CODE_32BIT:
6318 if (operand_types[j].bitfield.disp32
6319 && operand_types[j].bitfield.disp16)
6320 {
6321 operand_types[j].bitfield.disp16 = override;
6322 operand_types[j].bitfield.disp32 = !override;
6323 }
6324 operand_types[j].bitfield.disp32s = 0;
6325 operand_types[j].bitfield.disp64 = 0;
6326 break;
6327
6328 case CODE_64BIT:
6329 if (operand_types[j].bitfield.disp32s
6330 || operand_types[j].bitfield.disp64)
6331 {
6332 operand_types[j].bitfield.disp64 &= !override;
6333 operand_types[j].bitfield.disp32s &= !override;
6334 operand_types[j].bitfield.disp32 = override;
6335 }
6336 operand_types[j].bitfield.disp16 = 0;
6337 break;
6338 }
6339 }
6340 }
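/* Illustration: in 32-bit code, `addr16 mov foo, %eax' flips the
template's Disp32 to Disp16 here, so the displacement is emitted in
two bytes. */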
6341
6342 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6343 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6344 continue;
6345
6346 /* We check register size if needed. */
6347 if (t->opcode_modifier.checkregsize)
6348 {
6349 check_register = (1 << t->operands) - 1;
6350 if (i.broadcast)
6351 check_register &= ~(1 << i.broadcast->operand);
6352 }
6353 else
6354 check_register = 0;
6355
6356 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6357 switch (t->operands)
6358 {
6359 case 1:
6360 if (!operand_type_match (overlap0, i.types[0]))
6361 continue;
6362 break;
6363 case 2:
6364 /* xchg %eax, %eax is a special case. It is an alias for nop
6365 only in 32bit mode and we can use opcode 0x90. In 64bit
6366 mode, we can't use 0x90 for xchg %eax, %eax since it should
6367 zero-extend %eax to %rax. */
6368 if (flag_code == CODE_64BIT
6369 && t->base_opcode == 0x90
6370 && i.types[0].bitfield.instance == Accum
6371 && i.types[0].bitfield.dword
6372 && i.types[1].bitfield.instance == Accum
6373 && i.types[1].bitfield.dword)
6374 continue;
6375 /* xrelease mov %eax, <disp> is another special case. It must not
6376 match the accumulator-only encoding of mov. */
6377 if (flag_code != CODE_64BIT
6378 && i.hle_prefix
6379 && t->base_opcode == 0xa0
6380 && i.types[0].bitfield.instance == Accum
6381 && (i.flags[1] & Operand_Mem))
6382 continue;
6383 /* Fall through. */
6384
6385 case 3:
6386 if (!(size_match & MATCH_STRAIGHT))
6387 goto check_reverse;
6388 /* Reverse direction of operands if swapping is possible in the first
6389 place (operands need to be symmetric) and
6390 - the load form is requested, and the template is a store form,
6391 - the store form is requested, and the template is a load form,
6392 - the non-default (swapped) form is requested. */
6393 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6394 if (t->opcode_modifier.d && i.reg_operands == i.operands
6395 && !operand_type_all_zero (&overlap1))
6396 switch (i.dir_encoding)
6397 {
6398 case dir_encoding_load:
6399 if (operand_type_check (operand_types[i.operands - 1], anymem)
6400 || t->opcode_modifier.regmem)
6401 goto check_reverse;
6402 break;
6403
6404 case dir_encoding_store:
6405 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6406 && !t->opcode_modifier.regmem)
6407 goto check_reverse;
6408 break;
6409
6410 case dir_encoding_swap:
6411 goto check_reverse;
6412
6413 case dir_encoding_default:
6414 break;
6415 }
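/* i.dir_encoding reflects the {load}/{store} pseudo prefixes (or the
`.s' suffix for swapping); e.g. `{store} mov %eax, %edx' selects the
0x89 form of MOV while `{load} mov %eax, %edx' selects 0x8b. */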
6416 /* If we want the store form, we skip the current load template. */
6417 if ((i.dir_encoding == dir_encoding_store
6418 || i.dir_encoding == dir_encoding_swap)
6419 && i.mem_operands == 0
6420 && t->opcode_modifier.load)
6421 continue;
6422 /* Fall through. */
6423 case 4:
6424 case 5:
6425 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6426 if (!operand_type_match (overlap0, i.types[0])
6427 || !operand_type_match (overlap1, i.types[1])
6428 || ((check_register & 3) == 3
6429 && !operand_type_register_match (i.types[0],
6430 operand_types[0],
6431 i.types[1],
6432 operand_types[1])))
6433 {
6434 /* Check if other direction is valid ... */
6435 if (!t->opcode_modifier.d)
6436 continue;
6437
6438 check_reverse:
6439 if (!(size_match & MATCH_REVERSE))
6440 continue;
6441 /* Try reversing direction of operands. */
6442 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6443 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6444 if (!operand_type_match (overlap0, i.types[0])
6445 || !operand_type_match (overlap1, i.types[i.operands - 1])
6446 || (check_register
6447 && !operand_type_register_match (i.types[0],
6448 operand_types[i.operands - 1],
6449 i.types[i.operands - 1],
6450 operand_types[0])))
6451 {
6452 /* Does not match either direction. */
6453 continue;
6454 }
6455 /* found_reverse_match holds which of D or FloatR
6456 we've found. */
6457 if (!t->opcode_modifier.d)
6458 found_reverse_match = 0;
6459 else if (operand_types[0].bitfield.tbyte)
6460 found_reverse_match = Opcode_FloatD;
6461 else if (operand_types[0].bitfield.xmmword
6462 || operand_types[i.operands - 1].bitfield.xmmword
6463 || operand_types[0].bitfield.class == RegMMX
6464 || operand_types[i.operands - 1].bitfield.class == RegMMX
6465 || is_any_vex_encoding(t))
6466 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6467 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6468 else
6469 found_reverse_match = Opcode_D;
6470 if (t->opcode_modifier.floatr)
6471 found_reverse_match |= Opcode_FloatR;
6472 }
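/* E.g. plain GPR MOV toggles 0x88 <-> 0x8a via Opcode_D, MOVAPS
toggles 0x0f28 <-> 0x0f29 via the SIMD float direction bit, and the
0x6e/0x7e MOVD-style opcodes singled out by the 0xee mask toggle via
the SIMD integer direction bit (0x10). */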
6473 else
6474 {
6475 /* Found a forward 2 operand match here. */
6476 switch (t->operands)
6477 {
6478 case 5:
6479 overlap4 = operand_type_and (i.types[4],
6480 operand_types[4]);
6481 /* Fall through. */
6482 case 4:
6483 overlap3 = operand_type_and (i.types[3],
6484 operand_types[3]);
6485 /* Fall through. */
6486 case 3:
6487 overlap2 = operand_type_and (i.types[2],
6488 operand_types[2]);
6489 break;
6490 }
6491
6492 switch (t->operands)
6493 {
6494 case 5:
6495 if (!operand_type_match (overlap4, i.types[4])
6496 || !operand_type_register_match (i.types[3],
6497 operand_types[3],
6498 i.types[4],
6499 operand_types[4]))
6500 continue;
6501 /* Fall through. */
6502 case 4:
6503 if (!operand_type_match (overlap3, i.types[3])
6504 || ((check_register & 0xa) == 0xa
6505 && !operand_type_register_match (i.types[1],
6506 operand_types[1],
6507 i.types[3],
6508 operand_types[3]))
6509 || ((check_register & 0xc) == 0xc
6510 && !operand_type_register_match (i.types[2],
6511 operand_types[2],
6512 i.types[3],
6513 operand_types[3])))
6514 continue;
6515 /* Fall through. */
6516 case 3:
6517 /* Here we make use of the fact that there are no
6518 reverse match 3 operand instructions. */
6519 if (!operand_type_match (overlap2, i.types[2])
6520 || ((check_register & 5) == 5
6521 && !operand_type_register_match (i.types[0],
6522 operand_types[0],
6523 i.types[2],
6524 operand_types[2]))
6525 || ((check_register & 6) == 6
6526 && !operand_type_register_match (i.types[1],
6527 operand_types[1],
6528 i.types[2],
6529 operand_types[2])))
6530 continue;
6531 break;
6532 }
6533 }
6534 /* Found either forward/reverse 2, 3 or 4 operand match here:
6535 slip through to break. */
6536 }
6537
6538 /* Check if vector operands are valid. */
6539 if (check_VecOperands (t))
6540 {
6541 specific_error = i.error;
6542 continue;
6543 }
6544
6545 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6546 if (VEX_check_encoding (t))
6547 {
6548 specific_error = i.error;
6549 continue;
6550 }
6551
6552 /* We've found a match; break out of loop. */
6553 break;
6554 }
6555
6556 if (t == current_templates->end)
6557 {
6558 /* We found no match. */
6559 const char *err_msg;
6560 switch (specific_error ? specific_error : i.error)
6561 {
6562 default:
6563 abort ();
6564 case operand_size_mismatch:
6565 err_msg = _("operand size mismatch");
6566 break;
6567 case operand_type_mismatch:
6568 err_msg = _("operand type mismatch");
6569 break;
6570 case register_type_mismatch:
6571 err_msg = _("register type mismatch");
6572 break;
6573 case number_of_operands_mismatch:
6574 err_msg = _("number of operands mismatch");
6575 break;
6576 case invalid_instruction_suffix:
6577 err_msg = _("invalid instruction suffix");
6578 break;
6579 case bad_imm4:
6580 err_msg = _("constant doesn't fit in 4 bits");
6581 break;
6582 case unsupported_with_intel_mnemonic:
6583 err_msg = _("unsupported with Intel mnemonic");
6584 break;
6585 case unsupported_syntax:
6586 err_msg = _("unsupported syntax");
6587 break;
6588 case unsupported:
6589 as_bad (_("unsupported instruction `%s'"),
6590 current_templates->start->name);
6591 return NULL;
6592 case invalid_vsib_address:
6593 err_msg = _("invalid VSIB address");
6594 break;
6595 case invalid_vector_register_set:
6596 err_msg = _("mask, index, and destination registers must be distinct");
6597 break;
6598 case unsupported_vector_index_register:
6599 err_msg = _("unsupported vector index register");
6600 break;
6601 case unsupported_broadcast:
6602 err_msg = _("unsupported broadcast");
6603 break;
6604 case broadcast_needed:
6605 err_msg = _("broadcast is needed for operand of such type");
6606 break;
6607 case unsupported_masking:
6608 err_msg = _("unsupported masking");
6609 break;
6610 case mask_not_on_destination:
6611 err_msg = _("mask not on destination operand");
6612 break;
6613 case no_default_mask:
6614 err_msg = _("default mask isn't allowed");
6615 break;
6616 case unsupported_rc_sae:
6617 err_msg = _("unsupported static rounding/sae");
6618 break;
6619 case rc_sae_operand_not_last_imm:
6620 if (intel_syntax)
6621 err_msg = _("RC/SAE operand must precede immediate operands");
6622 else
6623 err_msg = _("RC/SAE operand must follow immediate operands");
6624 break;
6625 case invalid_register_operand:
6626 err_msg = _("invalid register operand");
6627 break;
6628 }
6629 as_bad (_("%s for `%s'"), err_msg,
6630 current_templates->start->name);
6631 return NULL;
6632 }
6633
6634 if (!quiet_warnings)
6635 {
6636 if (!intel_syntax
6637 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6638 as_warn (_("indirect %s without `*'"), t->name);
6639
6640 if (t->opcode_modifier.isprefix
6641 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6642 {
6643 /* Warn them that a data or address size prefix doesn't
6644 affect assembly of the next line of code. */
6645 as_warn (_("stand-alone `%s' prefix"), t->name);
6646 }
6647 }
6648
6649 /* Copy the template we found. */
6650 i.tm = *t;
6651
6652 if (addr_prefix_disp != -1)
6653 i.tm.operand_types[addr_prefix_disp]
6654 = operand_types[addr_prefix_disp];
6655
6656 if (found_reverse_match)
6657 {
6658 /* If we found a reverse match we must alter the opcode direction
6659 bit and clear/flip the regmem modifier one. found_reverse_match
6660 holds bits to change (different for int & float insns). */
6661
6662 i.tm.base_opcode ^= found_reverse_match;
6663
6664 i.tm.operand_types[0] = operand_types[i.operands - 1];
6665 i.tm.operand_types[i.operands - 1] = operand_types[0];
6666
6667 /* Certain SIMD insns have their load forms specified in the opcode
6668 table, and hence we need to _set_ RegMem instead of clearing it.
6669 We need to avoid setting the bit though on insns like KMOVW. */
6670 i.tm.opcode_modifier.regmem
6671 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6672 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6673 && !i.tm.opcode_modifier.regmem;
6674 }
6675
6676 return t;
6677 }
6678
6679 static int
6680 check_string (void)
6681 {
6682 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6683 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6684
6685 if (i.seg[op] != NULL && i.seg[op] != &es)
6686 {
6687 as_bad (_("`%s' operand %u must use `%ses' segment"),
6688 i.tm.name,
6689 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6690 register_prefix);
6691 return 0;
6692 }
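/* Illustration: `stos %eax, %fs:(%edi)' fails above, since the
destination of a string store is architecturally fixed to
%es:(%edi). */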
6693
6694 /* There's only ever one segment override allowed per instruction.
6695 This instruction possibly has a legal segment override on the
6696 second operand, so copy the segment to where non-string
6697 instructions store it, allowing common code. */
6698 i.seg[op] = i.seg[1];
6699
6700 return 1;
6701 }
6702
6703 static int
6704 process_suffix (void)
6705 {
6706 /* If matched instruction specifies an explicit instruction mnemonic
6707 suffix, use it. */
6708 if (i.tm.opcode_modifier.size == SIZE16)
6709 i.suffix = WORD_MNEM_SUFFIX;
6710 else if (i.tm.opcode_modifier.size == SIZE32)
6711 i.suffix = LONG_MNEM_SUFFIX;
6712 else if (i.tm.opcode_modifier.size == SIZE64)
6713 i.suffix = QWORD_MNEM_SUFFIX;
6714 else if (i.reg_operands
6715 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6716 && !i.tm.opcode_modifier.addrprefixopreg)
6717 {
6718 unsigned int numop = i.operands;
6719
6720 /* movsx/movzx want only their source operand considered here, for the
6721 ambiguity checking below. The suffix will be replaced afterwards
6722 to represent the destination (register). */
6723 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6724 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6725 --i.operands;
6726
6727 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6728 if (i.tm.base_opcode == 0xf20f38f0
6729 && i.tm.operand_types[1].bitfield.qword)
6730 i.rex |= REX_W;
6731
6732 /* If there's no instruction mnemonic suffix we try to invent one
6733 based on GPR operands. */
6734 if (!i.suffix)
6735 {
6736 /* We take i.suffix from the last register operand specified.
6737 Destination register type is more significant than source
6738 register type. crc32 in SSE4.2 prefers source register
6739 type. */
6740 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6741
6742 while (op--)
6743 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6744 || i.tm.operand_types[op].bitfield.instance == Accum)
6745 {
6746 if (i.types[op].bitfield.class != Reg)
6747 continue;
6748 if (i.types[op].bitfield.byte)
6749 i.suffix = BYTE_MNEM_SUFFIX;
6750 else if (i.types[op].bitfield.word)
6751 i.suffix = WORD_MNEM_SUFFIX;
6752 else if (i.types[op].bitfield.dword)
6753 i.suffix = LONG_MNEM_SUFFIX;
6754 else if (i.types[op].bitfield.qword)
6755 i.suffix = QWORD_MNEM_SUFFIX;
6756 else
6757 continue;
6758 break;
6759 }
6760
6761 /* As an exception, movsx/movzx silently default to a byte source
6762 in AT&T mode. */
6763 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6764 && !i.suffix && !intel_syntax)
6765 i.suffix = BYTE_MNEM_SUFFIX;
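/* Hence a bare `movzx (%rax), %eax' in AT&T mode assembles as
`movzbl' instead of being rejected as ambiguous. */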
6766 }
6767 else if (i.suffix == BYTE_MNEM_SUFFIX)
6768 {
6769 if (intel_syntax
6770 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6771 && i.tm.opcode_modifier.no_bsuf)
6772 i.suffix = 0;
6773 else if (!check_byte_reg ())
6774 return 0;
6775 }
6776 else if (i.suffix == LONG_MNEM_SUFFIX)
6777 {
6778 if (intel_syntax
6779 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6780 && i.tm.opcode_modifier.no_lsuf
6781 && !i.tm.opcode_modifier.todword
6782 && !i.tm.opcode_modifier.toqword)
6783 i.suffix = 0;
6784 else if (!check_long_reg ())
6785 return 0;
6786 }
6787 else if (i.suffix == QWORD_MNEM_SUFFIX)
6788 {
6789 if (intel_syntax
6790 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6791 && i.tm.opcode_modifier.no_qsuf
6792 && !i.tm.opcode_modifier.todword
6793 && !i.tm.opcode_modifier.toqword)
6794 i.suffix = 0;
6795 else if (!check_qword_reg ())
6796 return 0;
6797 }
6798 else if (i.suffix == WORD_MNEM_SUFFIX)
6799 {
6800 if (intel_syntax
6801 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6802 && i.tm.opcode_modifier.no_wsuf)
6803 i.suffix = 0;
6804 else if (!check_word_reg ())
6805 return 0;
6806 }
6807 else if (intel_syntax
6808 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6809 /* Do nothing if the instruction is going to ignore the prefix. */
6810 ;
6811 else
6812 abort ();
6813
6814 /* Undo the movsx/movzx change done above. */
6815 i.operands = numop;
6816 }
6817 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6818 && !i.suffix)
6819 {
6820 i.suffix = stackop_size;
6821 if (stackop_size == LONG_MNEM_SUFFIX)
6822 {
6823 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6824 .code16gcc directive to support 16-bit mode with
6825 32-bit address. For IRET without a suffix, generate
6826 16-bit IRET (opcode 0xcf) to return from an interrupt
6827 handler. */
6828 if (i.tm.base_opcode == 0xcf)
6829 {
6830 i.suffix = WORD_MNEM_SUFFIX;
6831 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6832 }
6833 /* Warn about changed behavior for segment register push/pop. */
6834 else if ((i.tm.base_opcode | 1) == 0x07)
6835 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6836 i.tm.name);
6837 }
6838 }
6839 else if (!i.suffix
6840 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6841 || i.tm.opcode_modifier.jump == JUMP_BYTE
6842 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6843 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6844 && i.tm.extension_opcode <= 3)))
6845 {
6846 switch (flag_code)
6847 {
6848 case CODE_64BIT:
6849 if (!i.tm.opcode_modifier.no_qsuf)
6850 {
6851 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6852 || i.tm.opcode_modifier.no_lsuf)
6853 i.suffix = QWORD_MNEM_SUFFIX;
6854 break;
6855 }
6856 /* Fall through. */
6857 case CODE_32BIT:
6858 if (!i.tm.opcode_modifier.no_lsuf)
6859 i.suffix = LONG_MNEM_SUFFIX;
6860 break;
6861 case CODE_16BIT:
6862 if (!i.tm.opcode_modifier.no_wsuf)
6863 i.suffix = WORD_MNEM_SUFFIX;
6864 break;
6865 }
6866 }
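/* E.g. a suffix-less indirect `jmp *(%rax)' defaults to the `q' form
in 64-bit code and to the `l' form in 32-bit code. */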
6867
6868 if (!i.suffix
6869 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6870 /* Also cover lret/retf/iret in 64-bit mode. */
6871 || (flag_code == CODE_64BIT
6872 && !i.tm.opcode_modifier.no_lsuf
6873 && !i.tm.opcode_modifier.no_qsuf))
6874 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6875 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6876 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6877 /* Accept FLDENV et al without suffix. */
6878 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6879 {
6880 unsigned int suffixes, evex = 0;
6881
6882 suffixes = !i.tm.opcode_modifier.no_bsuf;
6883 if (!i.tm.opcode_modifier.no_wsuf)
6884 suffixes |= 1 << 1;
6885 if (!i.tm.opcode_modifier.no_lsuf)
6886 suffixes |= 1 << 2;
6887 if (!i.tm.opcode_modifier.no_ldsuf)
6888 suffixes |= 1 << 3;
6889 if (!i.tm.opcode_modifier.no_ssuf)
6890 suffixes |= 1 << 4;
6891 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6892 suffixes |= 1 << 5;
6893
6894 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6895 also suitable for AT&T syntax mode, it was requested that this be
6896 restricted to just Intel syntax. */
6897 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6898 {
6899 unsigned int op;
6900
6901 for (op = 0; op < i.tm.operands; ++op)
6902 {
6903 if (is_evex_encoding (&i.tm)
6904 && !cpu_arch_flags.bitfield.cpuavx512vl)
6905 {
6906 if (i.tm.operand_types[op].bitfield.ymmword)
6907 i.tm.operand_types[op].bitfield.xmmword = 0;
6908 if (i.tm.operand_types[op].bitfield.zmmword)
6909 i.tm.operand_types[op].bitfield.ymmword = 0;
6910 if (!i.tm.opcode_modifier.evex
6911 || i.tm.opcode_modifier.evex == EVEXDYN)
6912 i.tm.opcode_modifier.evex = EVEX512;
6913 }
6914
6915 if (i.tm.operand_types[op].bitfield.xmmword
6916 + i.tm.operand_types[op].bitfield.ymmword
6917 + i.tm.operand_types[op].bitfield.zmmword < 2)
6918 continue;
6919
6920 /* Any properly sized operand disambiguates the insn. */
6921 if (i.types[op].bitfield.xmmword
6922 || i.types[op].bitfield.ymmword
6923 || i.types[op].bitfield.zmmword)
6924 {
6925 suffixes &= ~(7 << 6);
6926 evex = 0;
6927 break;
6928 }
6929
6930 if ((i.flags[op] & Operand_Mem)
6931 && i.tm.operand_types[op].bitfield.unspecified)
6932 {
6933 if (i.tm.operand_types[op].bitfield.xmmword)
6934 suffixes |= 1 << 6;
6935 if (i.tm.operand_types[op].bitfield.ymmword)
6936 suffixes |= 1 << 7;
6937 if (i.tm.operand_types[op].bitfield.zmmword)
6938 suffixes |= 1 << 8;
6939 if (is_evex_encoding (&i.tm))
6940 evex = EVEX512;
6941 }
6942 }
6943 }
6944
6945 /* Are multiple suffixes / operand sizes allowed? */
6946 if (suffixes & (suffixes - 1))
6947 {
6948 if (intel_syntax
6949 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6950 || operand_check == check_error))
6951 {
6952 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6953 return 0;
6954 }
6955 if (operand_check == check_error)
6956 {
6957 as_bad (_("no instruction mnemonic suffix given and "
6958 "no register operands; can't size `%s'"), i.tm.name);
6959 return 0;
6960 }
6961 if (operand_check == check_warning)
6962 as_warn (_("%s; using default for `%s'"),
6963 intel_syntax
6964 ? _("ambiguous operand size")
6965 : _("no instruction mnemonic suffix given and "
6966 "no register operands"),
6967 i.tm.name);
6968
6969 if (i.tm.opcode_modifier.floatmf)
6970 i.suffix = SHORT_MNEM_SUFFIX;
6971 else if ((i.tm.base_opcode | 8) == 0xfbe
6972 || (i.tm.base_opcode == 0x63
6973 && i.tm.cpu_flags.bitfield.cpu64))
6974 /* handled below */;
6975 else if (evex)
6976 i.tm.opcode_modifier.evex = evex;
6977 else if (flag_code == CODE_16BIT)
6978 i.suffix = WORD_MNEM_SUFFIX;
6979 else if (!i.tm.opcode_modifier.no_lsuf)
6980 i.suffix = LONG_MNEM_SUFFIX;
6981 else
6982 i.suffix = QWORD_MNEM_SUFFIX;
6983 }
6984 }
6985
6986 if ((i.tm.base_opcode | 8) == 0xfbe
6987 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6988 {
6989 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6990 In AT&T syntax, if there is no suffix (warned about above), the default
6991 will be byte extension. */
6992 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6993 i.tm.base_opcode |= 1;
6994
6995 /* For further processing, the suffix should represent the destination
6996 (register). This is already the case when one was used with
6997 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6998 no suffix to begin with. */
6999 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7000 {
7001 if (i.types[1].bitfield.word)
7002 i.suffix = WORD_MNEM_SUFFIX;
7003 else if (i.types[1].bitfield.qword)
7004 i.suffix = QWORD_MNEM_SUFFIX;
7005 else
7006 i.suffix = LONG_MNEM_SUFFIX;
7007
7008 i.tm.opcode_modifier.w = 0;
7009 }
7010 }
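/* E.g. `movzx %ax, %rcx' was matched using the `w' (source) size;
from here on i.suffix is `q', the destination size, so REX.W is
derived correctly below. */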
7011
7012 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7013 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7014 != (i.tm.operand_types[1].bitfield.class == Reg);
7015
7016 /* Change the opcode based on the operand size given by i.suffix. */
7017 switch (i.suffix)
7018 {
7019 /* Size floating point instruction. */
7020 case LONG_MNEM_SUFFIX:
7021 if (i.tm.opcode_modifier.floatmf)
7022 {
7023 i.tm.base_opcode ^= 4;
7024 break;
7025 }
7026 /* fall through */
7027 case WORD_MNEM_SUFFIX:
7028 case QWORD_MNEM_SUFFIX:
7029 /* It's not a byte, select word/dword operation. */
7030 if (i.tm.opcode_modifier.w)
7031 {
7032 if (i.short_form)
7033 i.tm.base_opcode |= 8;
7034 else
7035 i.tm.base_opcode |= 1;
7036 }
7037 /* fall through */
7038 case SHORT_MNEM_SUFFIX:
7039 /* Now select between word & dword operations via the operand
7040 size prefix, except for instructions that will ignore this
7041 prefix anyway. */
7042 if (i.suffix != QWORD_MNEM_SUFFIX
7043 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7044 && !i.tm.opcode_modifier.floatmf
7045 && !is_any_vex_encoding (&i.tm)
7046 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7047 || (flag_code == CODE_64BIT
7048 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7049 {
7050 unsigned int prefix = DATA_PREFIX_OPCODE;
7051
7052 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7053 prefix = ADDR_PREFIX_OPCODE;
7054
7055 if (!add_prefix (prefix))
7056 return 0;
7057 }
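/* E.g. `addw %ax, %bx' in 32-bit code receives the 0x66 data size
prefix here, while a sized `loop' gets 0x67 instead: it is the address
size prefix that selects between %cx/%ecx/%rcx as the count
register. */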
7058
7059 /* Set REX.W (64-bit operand size) for the operand. */
7060 if (i.suffix == QWORD_MNEM_SUFFIX
7061 && flag_code == CODE_64BIT
7062 && !i.tm.opcode_modifier.norex64
7063 && !i.tm.opcode_modifier.vexw
7064 /* Special case for xchg %rax,%rax. It is a NOP and doesn't
7065 need rex64. */
7066 && ! (i.operands == 2
7067 && i.tm.base_opcode == 0x90
7068 && i.tm.extension_opcode == None
7069 && i.types[0].bitfield.instance == Accum
7070 && i.types[0].bitfield.qword
7071 && i.types[1].bitfield.instance == Accum
7072 && i.types[1].bitfield.qword))
7073 i.rex |= REX_W;
7074
7075 break;
7076
7077 case 0:
7078 /* Select word/dword/qword operation with explicit data sizing prefix
7079 when there are no suitable register operands. */
7080 if (i.tm.opcode_modifier.w
7081 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7082 && (!i.reg_operands
7083 || (i.reg_operands == 1
7084 /* ShiftCount */
7085 && (i.tm.operand_types[0].bitfield.instance == RegC
7086 /* InOutPortReg */
7087 || i.tm.operand_types[0].bitfield.instance == RegD
7088 || i.tm.operand_types[1].bitfield.instance == RegD
7089 /* CRC32 */
7090 || i.tm.base_opcode == 0xf20f38f0))))
7091 i.tm.base_opcode |= 1;
7092 break;
7093 }
7094
7095 if (i.tm.opcode_modifier.addrprefixopreg)
7096 {
7097 gas_assert (!i.suffix);
7098 gas_assert (i.reg_operands);
7099
7100 if (i.tm.operand_types[0].bitfield.instance == Accum
7101 || i.operands == 1)
7102 {
7103 /* The address size override prefix changes the size of the
7104 first operand. */
7105 if (flag_code == CODE_64BIT
7106 && i.op[0].regs->reg_type.bitfield.word)
7107 {
7108 as_bad (_("16-bit addressing unavailable for `%s'"),
7109 i.tm.name);
7110 return 0;
7111 }
7112
7113 if ((flag_code == CODE_32BIT
7114 ? i.op[0].regs->reg_type.bitfield.word
7115 : i.op[0].regs->reg_type.bitfield.dword)
7116 && !add_prefix (ADDR_PREFIX_OPCODE))
7117 return 0;
7118 }
7119 else
7120 {
7121 /* Check for invalid register operands when the address size override
7122 prefix changes the size of register operands. */
7123 unsigned int op;
7124 enum { need_word, need_dword, need_qword } need;
7125
7126 if (flag_code == CODE_32BIT)
7127 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7128 else if (i.prefix[ADDR_PREFIX])
7129 need = need_dword;
7130 else
7131 need = flag_code == CODE_64BIT ? need_qword : need_word;
7132
7133 for (op = 0; op < i.operands; op++)
7134 {
7135 if (i.types[op].bitfield.class != Reg)
7136 continue;
7137
7138 switch (need)
7139 {
7140 case need_word:
7141 if (i.op[op].regs->reg_type.bitfield.word)
7142 continue;
7143 break;
7144 case need_dword:
7145 if (i.op[op].regs->reg_type.bitfield.dword)
7146 continue;
7147 break;
7148 case need_qword:
7149 if (i.op[op].regs->reg_type.bitfield.qword)
7150 continue;
7151 break;
7152 }
7153
7154 as_bad (_("invalid register operand size for `%s'"),
7155 i.tm.name);
7156 return 0;
7157 }
7158 }
7159 }
7160
7161 return 1;
7162 }
7163
7164 static int
7165 check_byte_reg (void)
7166 {
7167 int op;
7168
7169 for (op = i.operands; --op >= 0;)
7170 {
7171 /* Skip non-register operands. */
7172 if (i.types[op].bitfield.class != Reg)
7173 continue;
7174
7175 /* If this is an eight bit register, it's OK. If it's the 16 or
7176 32 bit version of an eight bit register, we will just use the
7177 low portion, and that's OK too. */
7178 if (i.types[op].bitfield.byte)
7179 continue;
7180
7181 /* I/O port address operands are OK too. */
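/* (E.g. the %dx of `inb %dx, %al'.) */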
7182 if (i.tm.operand_types[op].bitfield.instance == RegD
7183 && i.tm.operand_types[op].bitfield.word)
7184 continue;
7185
7186 /* crc32 only wants its source operand checked here. */
7187 if (i.tm.base_opcode == 0xf20f38f0 && op)
7188 continue;
7189
7190 /* Any other register is bad. */
7191 as_bad (_("`%s%s' not allowed with `%s%c'"),
7192 register_prefix, i.op[op].regs->reg_name,
7193 i.tm.name, i.suffix);
7194 return 0;
7195 }
7196 return 1;
7197 }
7198
7199 static int
7200 check_long_reg (void)
7201 {
7202 int op;
7203
7204 for (op = i.operands; --op >= 0;)
7205 /* Skip non-register operands. */
7206 if (i.types[op].bitfield.class != Reg)
7207 continue;
7208 /* Reject eight bit registers, except where the template requires
7209 them. (e.g. movzb) */
7210 else if (i.types[op].bitfield.byte
7211 && (i.tm.operand_types[op].bitfield.class == Reg
7212 || i.tm.operand_types[op].bitfield.instance == Accum)
7213 && (i.tm.operand_types[op].bitfield.word
7214 || i.tm.operand_types[op].bitfield.dword))
7215 {
7216 as_bad (_("`%s%s' not allowed with `%s%c'"),
7217 register_prefix,
7218 i.op[op].regs->reg_name,
7219 i.tm.name,
7220 i.suffix);
7221 return 0;
7222 }
7223 /* Error if the e prefix on a general reg is missing. */
7224 else if (i.types[op].bitfield.word
7225 && (i.tm.operand_types[op].bitfield.class == Reg
7226 || i.tm.operand_types[op].bitfield.instance == Accum)
7227 && i.tm.operand_types[op].bitfield.dword)
7228 {
7229 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7230 register_prefix, i.op[op].regs->reg_name,
7231 i.suffix);
7232 return 0;
7233 }
7234 /* Warn if the r prefix on a general reg is present. */
7235 else if (i.types[op].bitfield.qword
7236 && (i.tm.operand_types[op].bitfield.class == Reg
7237 || i.tm.operand_types[op].bitfield.instance == Accum)
7238 && i.tm.operand_types[op].bitfield.dword)
7239 {
7240 if (intel_syntax
7241 && i.tm.opcode_modifier.toqword
7242 && i.types[0].bitfield.class != RegSIMD)
7243 {
7244 /* Convert to QWORD. We want REX byte. */
7245 i.suffix = QWORD_MNEM_SUFFIX;
7246 }
7247 else
7248 {
7249 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7250 register_prefix, i.op[op].regs->reg_name,
7251 i.suffix);
7252 return 0;
7253 }
7254 }
7255 return 1;
7256 }
7257
7258 static int
7259 check_qword_reg (void)
7260 {
7261 int op;
7262
7263 for (op = i.operands; --op >= 0; )
7264 /* Skip non-register operands. */
7265 if (i.types[op].bitfield.class != Reg)
7266 continue;
7267 /* Reject eight bit registers, except where the template requires
7268 them. (e.g. movzb) */
7269 else if (i.types[op].bitfield.byte
7270 && (i.tm.operand_types[op].bitfield.class == Reg
7271 || i.tm.operand_types[op].bitfield.instance == Accum)
7272 && (i.tm.operand_types[op].bitfield.word
7273 || i.tm.operand_types[op].bitfield.dword))
7274 {
7275 as_bad (_("`%s%s' not allowed with `%s%c'"),
7276 register_prefix,
7277 i.op[op].regs->reg_name,
7278 i.tm.name,
7279 i.suffix);
7280 return 0;
7281 }
7282 /* Warn if the r prefix on a general reg is missing. */
7283 else if ((i.types[op].bitfield.word
7284 || i.types[op].bitfield.dword)
7285 && (i.tm.operand_types[op].bitfield.class == Reg
7286 || i.tm.operand_types[op].bitfield.instance == Accum)
7287 && i.tm.operand_types[op].bitfield.qword)
7288 {
7289 /* Prohibit these changes in 64bit mode, since the
7290 lowering is more complicated. */
7291 if (intel_syntax
7292 && i.tm.opcode_modifier.todword
7293 && i.types[0].bitfield.class != RegSIMD)
7294 {
7295 /* Convert to DWORD. We don't want REX byte. */
7296 i.suffix = LONG_MNEM_SUFFIX;
7297 }
7298 else
7299 {
7300 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7301 register_prefix, i.op[op].regs->reg_name,
7302 i.suffix);
7303 return 0;
7304 }
7305 }
7306 return 1;
7307 }
7308
7309 static int
7310 check_word_reg (void)
7311 {
7312 int op;
7313 for (op = i.operands; --op >= 0;)
7314 /* Skip non-register operands. */
7315 if (i.types[op].bitfield.class != Reg)
7316 continue;
7317 /* Reject eight bit registers, except where the template requires
7318 them. (e.g. movzb) */
7319 else if (i.types[op].bitfield.byte
7320 && (i.tm.operand_types[op].bitfield.class == Reg
7321 || i.tm.operand_types[op].bitfield.instance == Accum)
7322 && (i.tm.operand_types[op].bitfield.word
7323 || i.tm.operand_types[op].bitfield.dword))
7324 {
7325 as_bad (_("`%s%s' not allowed with `%s%c'"),
7326 register_prefix,
7327 i.op[op].regs->reg_name,
7328 i.tm.name,
7329 i.suffix);
7330 return 0;
7331 }
7332 /* Error if the e or r prefix on a general reg is present. */
7333 else if ((i.types[op].bitfield.dword
7334 || i.types[op].bitfield.qword)
7335 && (i.tm.operand_types[op].bitfield.class == Reg
7336 || i.tm.operand_types[op].bitfield.instance == Accum)
7337 && i.tm.operand_types[op].bitfield.word)
7338 {
7339 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7340 register_prefix, i.op[op].regs->reg_name,
7341 i.suffix);
7342 return 0;
7343 }
7344 return 1;
7345 }
7346
7347 static int
7348 update_imm (unsigned int j)
7349 {
7350 i386_operand_type overlap = i.types[j];
7351 if ((overlap.bitfield.imm8
7352 || overlap.bitfield.imm8s
7353 || overlap.bitfield.imm16
7354 || overlap.bitfield.imm32
7355 || overlap.bitfield.imm32s
7356 || overlap.bitfield.imm64)
7357 && !operand_type_equal (&overlap, &imm8)
7358 && !operand_type_equal (&overlap, &imm8s)
7359 && !operand_type_equal (&overlap, &imm16)
7360 && !operand_type_equal (&overlap, &imm32)
7361 && !operand_type_equal (&overlap, &imm32s)
7362 && !operand_type_equal (&overlap, &imm64))
7363 {
7364 if (i.suffix)
7365 {
7366 i386_operand_type temp;
7367
7368 operand_type_set (&temp, 0);
7369 if (i.suffix == BYTE_MNEM_SUFFIX)
7370 {
7371 temp.bitfield.imm8 = overlap.bitfield.imm8;
7372 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7373 }
7374 else if (i.suffix == WORD_MNEM_SUFFIX)
7375 temp.bitfield.imm16 = overlap.bitfield.imm16;
7376 else if (i.suffix == QWORD_MNEM_SUFFIX)
7377 {
7378 temp.bitfield.imm64 = overlap.bitfield.imm64;
7379 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7380 }
7381 else
7382 temp.bitfield.imm32 = overlap.bitfield.imm32;
7383 overlap = temp;
7384 }
7385 else if (operand_type_equal (&overlap, &imm16_32_32s)
7386 || operand_type_equal (&overlap, &imm16_32)
7387 || operand_type_equal (&overlap, &imm16_32s))
7388 {
7389 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7390 overlap = imm16;
7391 else
7392 overlap = imm32s;
7393 }
7394 else if (i.prefix[REX_PREFIX] & REX_W)
7395 overlap = operand_type_and (overlap, imm32s);
7396 else if (i.prefix[DATA_PREFIX])
7397 overlap = operand_type_and (overlap,
7398 flag_code != CODE_16BIT ? imm16 : imm32);
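/* Illustration (example ours): an explicit `data16 push $imm' outside
16-bit mode takes the branch above, narrowing the immediate to 16
bits. */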
7399 if (!operand_type_equal (&overlap, &imm8)
7400 && !operand_type_equal (&overlap, &imm8s)
7401 && !operand_type_equal (&overlap, &imm16)
7402 && !operand_type_equal (&overlap, &imm32)
7403 && !operand_type_equal (&overlap, &imm32s)
7404 && !operand_type_equal (&overlap, &imm64))
7405 {
7406 as_bad (_("no instruction mnemonic suffix given; "
7407 "can't determine immediate size"));
7408 return 0;
7409 }
7410 }
7411 i.types[j] = overlap;
7412
7413 return 1;
7414 }
7415
7416 static int
7417 finalize_imm (void)
7418 {
7419 unsigned int j, n;
7420
7421 /* Update the first 2 immediate operands. */
7422 n = i.operands > 2 ? 2 : i.operands;
7423 if (n)
7424 {
7425 for (j = 0; j < n; j++)
7426 if (update_imm (j) == 0)
7427 return 0;
7428
7429 /* The 3rd operand can't be an immediate operand. */
7430 gas_assert (operand_type_check (i.types[2], imm) == 0);
7431 }
7432
7433 return 1;
7434 }
7435
7436 static int
7437 process_operands (void)
7438 {
7439 /* Default segment register this instruction will use for memory
7440 accesses. 0 means unknown. This is only for optimizing out
7441 unnecessary segment overrides. */
7442 const seg_entry *default_seg = 0;
7443
7444 if (i.tm.opcode_modifier.sse2avx)
7445 {
7446 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7447 need converting. */
7448 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7449 i.prefix[REX_PREFIX] = 0;
7450 i.rex_encoding = 0;
7451 }
7452 /* ImmExt should be processed after SSE2AVX. */
7453 else if (i.tm.opcode_modifier.immext)
7454 process_immext ();
7455
7456 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7457 {
7458 unsigned int dupl = i.operands;
7459 unsigned int dest = dupl - 1;
7460 unsigned int j;
7461
7462 /* The destination must be an xmm register. */
7463 gas_assert (i.reg_operands
7464 && MAX_OPERANDS > dupl
7465 && operand_type_equal (&i.types[dest], &regxmm));
7466
7467 if (i.tm.operand_types[0].bitfield.instance == Accum
7468 && i.tm.operand_types[0].bitfield.xmmword)
7469 {
7470 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7471 {
7472 /* Keep xmm0 for instructions with VEX prefix and 3
7473 sources. */
7474 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7475 i.tm.operand_types[0].bitfield.class = RegSIMD;
7476 goto duplicate;
7477 }
7478 else
7479 {
7480 /* We drop the explicit first xmm0 by shifting the remaining
7481 operands down one slot while keeping i.operands unchanged,
7482 which in effect duplicates the destination in the top slot. */
7483 for (j = 1; j < i.operands; j++)
7484 {
7485 i.op[j - 1] = i.op[j];
7486 i.types[j - 1] = i.types[j];
7487 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7488 i.flags[j - 1] = i.flags[j];
7489 }
7490 }
7491 }
7492 else if (i.tm.opcode_modifier.implicit1stxmm0)
7493 {
7494 gas_assert ((MAX_OPERANDS - 1) > dupl
7495 && (i.tm.opcode_modifier.vexsources
7496 == VEX3SOURCES));
7497
7498 /* Add the implicit xmm0 for instructions with VEX prefix
7499 and 3 sources. */
7500 for (j = i.operands; j > 0; j--)
7501 {
7502 i.op[j] = i.op[j - 1];
7503 i.types[j] = i.types[j - 1];
7504 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7505 i.flags[j] = i.flags[j - 1];
7506 }
7507 i.op[0].regs
7508 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7509 i.types[0] = regxmm;
7510 i.tm.operand_types[0] = regxmm;
7511
7512 i.operands += 2;
7513 i.reg_operands += 2;
7514 i.tm.operands += 2;
7515
7516 dupl++;
7517 dest++;
7518 i.op[dupl] = i.op[dest];
7519 i.types[dupl] = i.types[dest];
7520 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7521 i.flags[dupl] = i.flags[dest];
7522 }
7523 else
7524 {
7525 duplicate:
7526 i.operands++;
7527 i.reg_operands++;
7528 i.tm.operands++;
7529
7530 i.op[dupl] = i.op[dest];
7531 i.types[dupl] = i.types[dest];
7532 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7533 i.flags[dupl] = i.flags[dest];
7534 }
7535
7536 if (i.tm.opcode_modifier.immext)
7537 process_immext ();
7538 }
7539 else if (i.tm.operand_types[0].bitfield.instance == Accum
7540 && i.tm.operand_types[0].bitfield.xmmword)
7541 {
7542 unsigned int j;
7543
7544 for (j = 1; j < i.operands; j++)
7545 {
7546 i.op[j - 1] = i.op[j];
7547 i.types[j - 1] = i.types[j];
7548
7549 /* We need to adjust fields in i.tm since they are used by
7550 build_modrm_byte. */
7551 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7552
7553 i.flags[j - 1] = i.flags[j];
7554 }
7555
7556 i.operands--;
7557 i.reg_operands--;
7558 i.tm.operands--;
7559 }
7560 else if (i.tm.opcode_modifier.implicitquadgroup)
7561 {
7562 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7563
7564 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7565 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7566 regnum = register_number (i.op[1].regs);
7567 first_reg_in_group = regnum & ~3;
7568 last_reg_in_group = first_reg_in_group + 3;
7569 if (regnum != first_reg_in_group)
7570 as_warn (_("source register `%s%s' implicitly denotes"
7571 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7572 register_prefix, i.op[1].regs->reg_name,
7573 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7574 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7575 i.tm.name);
7576 }
7577 else if (i.tm.opcode_modifier.regkludge)
7578 {
7579 /* The imul $imm, %reg instruction is converted into
7580 imul $imm, %reg, %reg, and the clr %reg instruction
7581 is converted into xor %reg, %reg. */
7582
7583 unsigned int first_reg_op;
7584
7585 if (operand_type_check (i.types[0], reg))
7586 first_reg_op = 0;
7587 else
7588 first_reg_op = 1;
7589 /* Pretend we saw the extra register operand. */
7590 gas_assert (i.reg_operands == 1
7591 && i.op[first_reg_op + 1].regs == 0);
7592 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7593 i.types[first_reg_op + 1] = i.types[first_reg_op];
7594 i.operands++;
7595 i.reg_operands++;
7596 }
7597
7598 if (i.tm.opcode_modifier.modrm)
7599 {
7600 /* The opcode is completed (modulo i.tm.extension_opcode which
7601 must be put into the modrm byte). Now, we make the modrm and
7602 index base bytes based on all the info we've collected. */
7603
7604 default_seg = build_modrm_byte ();
7605 }
7606 else if (i.types[0].bitfield.class == SReg)
7607 {
7608 if (flag_code != CODE_64BIT
7609 ? i.tm.base_opcode == POP_SEG_SHORT
7610 && i.op[0].regs->reg_num == 1
7611 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7612 && i.op[0].regs->reg_num < 4)
7613 {
7614 as_bad (_("you can't `%s %s%s'"),
7615 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7616 return 0;
7617 }
7618 if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7619 {
7620 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7621 i.tm.opcode_length = 2;
7622 }
7623 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7624 }
7625 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7626 {
7627 default_seg = &ds;
7628 }
7629 else if (i.tm.opcode_modifier.isstring)
7630 {
7631 /* For the string instructions that allow a segment override
7632 on one of their operands, the default segment is ds. */
7633 default_seg = &ds;
7634 }
7635 else if (i.short_form)
7636 {
7637 /* The register or float register operand is in operand
7638 0 or 1. */
7639 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7640
7641 /* Register goes in low 3 bits of opcode. */
7642 i.tm.base_opcode |= i.op[op].regs->reg_num;
7643 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7644 i.rex |= REX_B;
7645 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7646 {
7647 /* Warn about some common errors, but press on regardless.
7648 The first case can be generated by gcc (<= 2.8.1). */
7649 if (i.operands == 2)
7650 {
7651 /* Reversed arguments on faddp, fsubp, etc. */
7652 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7653 register_prefix, i.op[!intel_syntax].regs->reg_name,
7654 register_prefix, i.op[intel_syntax].regs->reg_name);
7655 }
7656 else
7657 {
7658 /* Extraneous `l' suffix on fp insn. */
7659 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7660 register_prefix, i.op[0].regs->reg_name);
7661 }
7662 }
7663 }
7664
7665 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7666 && i.tm.base_opcode == 0x8d /* lea */
7667 && !is_any_vex_encoding(&i.tm))
7668 {
7669 if (!quiet_warnings)
7670 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7671 if (optimize)
7672 {
7673 i.seg[0] = NULL;
7674 i.prefix[SEG_PREFIX] = 0;
7675 }
7676 }
7677
7678 /* If a segment was explicitly specified, and the specified segment
7679 is neither the default nor the one already recorded from a prefix,
7680 use an opcode prefix to select it. If we never figured out what
7681 the default segment is, then default_seg will be zero at this
7682 point, and the specified segment prefix will always be used. */
7683 if (i.seg[0]
7684 && i.seg[0] != default_seg
7685 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7686 {
7687 if (!add_prefix (i.seg[0]->seg_prefix))
7688 return 0;
7689 }
7690 return 1;
7691 }
7692
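/* Record the REX/VREX extension bit for register R: diagnose a doubled
explicit REX prefix, and, when converting under SSE2AVX with the bit
already supplied by an explicit REX prefix, redirect the VEX register
specifier to its REX-extended counterpart (reg_entry + 8). */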
7693 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7694 bfd_boolean do_sse2avx)
7695 {
7696 if (r->reg_flags & RegRex)
7697 {
7698 if (i.rex & rex_bit)
7699 as_bad (_("same type of prefix used twice"));
7700 i.rex |= rex_bit;
7701 }
7702 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7703 {
7704 gas_assert (i.vex.register_specifier == r);
7705 i.vex.register_specifier += 8;
7706 }
7707
7708 if (r->reg_flags & RegVRex)
7709 i.vrex |= rex_bit;
7710 }
7711
7712 static const seg_entry *
7713 build_modrm_byte (void)
7714 {
7715 const seg_entry *default_seg = 0;
7716 unsigned int source, dest;
7717 int vex_3_sources;
7718
7719 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7720 if (vex_3_sources)
7721 {
7722 unsigned int nds, reg_slot;
7723 expressionS *exp;
7724
7725 dest = i.operands - 1;
7726 nds = dest - 1;
7727
7728 /* There are 2 kinds of instructions:
7729 1. 5 operands: 4 register operands or 3 register operands
7730 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7731 VexW0 or VexW1. The destination must be either XMM, YMM or
7732 ZMM register.
7733 2. 4 operands: 4 register operands or 3 register operands
7734 plus 1 memory operand, with VexXDS. */
7735 gas_assert ((i.reg_operands == 4
7736 || (i.reg_operands == 3 && i.mem_operands == 1))
7737 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7738 && i.tm.opcode_modifier.vexw
7739 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7740
7741 /* If VexW1 is set, the first non-immediate operand is the source and
7742 the second non-immediate one is encoded in the immediate operand. */
7743 if (i.tm.opcode_modifier.vexw == VEXW1)
7744 {
7745 source = i.imm_operands;
7746 reg_slot = i.imm_operands + 1;
7747 }
7748 else
7749 {
7750 source = i.imm_operands + 1;
7751 reg_slot = i.imm_operands;
7752 }
7753
7754 if (i.imm_operands == 0)
7755 {
7756 /* When there is no immediate operand, generate an 8bit
7757 immediate operand to encode the first operand. */
7758 exp = &im_expressions[i.imm_operands++];
7759 i.op[i.operands].imms = exp;
7760 i.types[i.operands] = imm8;
7761 i.operands++;
7762
7763 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7764 exp->X_op = O_constant;
7765 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7766 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7767 }
7768 else
7769 {
7770 gas_assert (i.imm_operands == 1);
7771 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7772 gas_assert (!i.tm.opcode_modifier.immext);
7773
7774 /* Turn on Imm8 again so that output_imm will generate it. */
7775 i.types[0].bitfield.imm8 = 1;
7776
7777 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7778 i.op[0].imms->X_add_number
7779 |= register_number (i.op[reg_slot].regs) << 4;
7780 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7781 }
7782
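      /* Either way the register from REG_SLOT ends up in bits 7:4 of
	 the immediate byte, the usual "is4" encoding used by, e.g.,
	 vblendvps.  */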
7783 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7784 i.vex.register_specifier = i.op[nds].regs;
7785 }
7786 else
7787 source = dest = 0;
7788
7789 /* i.reg_operands MUST be the number of real register operands;
7790 implicit registers do not count. If there are 3 register
7791 	 operands, it must be an instruction with VexNDS.  For an
7792 	 instruction with VexNDD, the destination register is encoded
7793 	 in the VEX prefix.  If there are 4 register operands, it must
7794 	 be an instruction with a VEX prefix and 3 sources.  */
7795 if (i.mem_operands == 0
7796 && ((i.reg_operands == 2
7797 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7798 || (i.reg_operands == 3
7799 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7800 || (i.reg_operands == 4 && vex_3_sources)))
7801 {
7802 switch (i.operands)
7803 {
7804 case 2:
7805 source = 0;
7806 break;
7807 case 3:
7808 	  /* When there are 3 operands, one of them may be immediate,
7809 	     which may be the first or the last operand.  Otherwise,
7810 	     the first operand must be the shift count register (%cl),
7811 	     or it is an instruction with VexNDS.  */
7812 gas_assert (i.imm_operands == 1
7813 || (i.imm_operands == 0
7814 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7815 || (i.types[0].bitfield.instance == RegC
7816 && i.types[0].bitfield.byte))));
7817 if (operand_type_check (i.types[0], imm)
7818 || (i.types[0].bitfield.instance == RegC
7819 && i.types[0].bitfield.byte))
7820 source = 1;
7821 else
7822 source = 0;
7823 break;
7824 case 4:
7825 /* When there are 4 operands, the first two must be 8bit
7826 immediate operands. The source operand will be the 3rd
7827 one.
7828
7829 	     For instructions with VexNDS, if the first operand is an
7830 	     imm8, the source operand is the 2nd one.  If the last
7831 	     operand is imm8, the source operand is the first one.  */
7832 gas_assert ((i.imm_operands == 2
7833 && i.types[0].bitfield.imm8
7834 && i.types[1].bitfield.imm8)
7835 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7836 && i.imm_operands == 1
7837 && (i.types[0].bitfield.imm8
7838 || i.types[i.operands - 1].bitfield.imm8
7839 || i.rounding)));
7840 if (i.imm_operands == 2)
7841 source = 2;
7842 else
7843 {
7844 if (i.types[0].bitfield.imm8)
7845 source = 1;
7846 else
7847 source = 0;
7848 }
7849 break;
7850 case 5:
7851 if (is_evex_encoding (&i.tm))
7852 {
7853 	      /* For EVEX instructions, when there are 5 operands, the
7854 		 first one must be an immediate operand.  If the second
7855 		 one is an immediate operand, the source operand is the
7856 		 3rd one.  If the last one is an immediate operand, the
7857 		 source operand is the 2nd one.  */
7858 gas_assert (i.imm_operands == 2
7859 && i.tm.opcode_modifier.sae
7860 && operand_type_check (i.types[0], imm));
7861 if (operand_type_check (i.types[1], imm))
7862 source = 2;
7863 else if (operand_type_check (i.types[4], imm))
7864 source = 1;
7865 else
7866 abort ();
7867 }
7868 break;
7869 default:
7870 abort ();
7871 }
7872
7873 if (!vex_3_sources)
7874 {
7875 dest = source + 1;
7876
7877 /* RC/SAE operand could be between DEST and SRC. That happens
7878 when one operand is GPR and the other one is XMM/YMM/ZMM
7879 register. */
7880 if (i.rounding && i.rounding->operand == (int) dest)
7881 dest++;
7882
7883 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7884 {
7885 /* For instructions with VexNDS, the register-only source
7886 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7887 register. It is encoded in VEX prefix. */
7888
7889 i386_operand_type op;
7890 unsigned int vvvv;
7891
7892 /* Check register-only source operand when two source
7893 operands are swapped. */
7894 if (!i.tm.operand_types[source].bitfield.baseindex
7895 && i.tm.operand_types[dest].bitfield.baseindex)
7896 {
7897 vvvv = source;
7898 source = dest;
7899 }
7900 else
7901 vvvv = dest;
7902
7903 op = i.tm.operand_types[vvvv];
7904 if ((dest + 1) >= i.operands
7905 || ((op.bitfield.class != Reg
7906 || (!op.bitfield.dword && !op.bitfield.qword))
7907 && op.bitfield.class != RegSIMD
7908 && !operand_type_equal (&op, &regmask)))
7909 abort ();
7910 i.vex.register_specifier = i.op[vvvv].regs;
7911 dest++;
7912 }
7913 }
7914
7915 i.rm.mode = 3;
7916 /* One of the register operands will be encoded in the i.rm.reg
7917 field, the other in the combined i.rm.mode and i.rm.regmem
7918 fields. If no form of this instruction supports a memory
7919 destination operand, then we assume the source operand may
7920 sometimes be a memory operand and so we need to store the
7921 destination in the i.rm.reg field. */
7922 if (!i.tm.opcode_modifier.regmem
7923 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7924 {
7925 i.rm.reg = i.op[dest].regs->reg_num;
7926 i.rm.regmem = i.op[source].regs->reg_num;
7927 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7928 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7929 i.has_regmmx = TRUE;
7930 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7931 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7932 {
7933 if (i.types[dest].bitfield.zmmword
7934 || i.types[source].bitfield.zmmword)
7935 i.has_regzmm = TRUE;
7936 else if (i.types[dest].bitfield.ymmword
7937 || i.types[source].bitfield.ymmword)
7938 i.has_regymm = TRUE;
7939 else
7940 i.has_regxmm = TRUE;
7941 }
7942 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7943 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
7944 }
7945 else
7946 {
7947 i.rm.reg = i.op[source].regs->reg_num;
7948 i.rm.regmem = i.op[dest].regs->reg_num;
7949 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
7950 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
7951 }
7952 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7953 {
7954 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7955 abort ();
7956 i.rex &= ~REX_R;
7957 add_prefix (LOCK_PREFIX_OPCODE);
7958 }
7959 }
7960 else
7961 { /* If it's not 2 reg operands... */
7962 unsigned int mem;
7963
7964 if (i.mem_operands)
7965 {
7966 unsigned int fake_zero_displacement = 0;
7967 unsigned int op;
7968
7969 for (op = 0; op < i.operands; op++)
7970 if (i.flags[op] & Operand_Mem)
7971 break;
7972 gas_assert (op < i.operands);
7973
7974 if (i.tm.opcode_modifier.sib)
7975 {
7976 if (i.index_reg->reg_num == RegIZ)
7977 abort ();
7978
7979 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7980 if (!i.base_reg)
7981 {
7982 i.sib.base = NO_BASE_REGISTER;
7983 i.sib.scale = i.log2_scale_factor;
7984 i.types[op].bitfield.disp8 = 0;
7985 i.types[op].bitfield.disp16 = 0;
7986 i.types[op].bitfield.disp64 = 0;
7987 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7988 {
7989 /* Must be 32 bit */
7990 i.types[op].bitfield.disp32 = 1;
7991 i.types[op].bitfield.disp32s = 0;
7992 }
7993 else
7994 {
7995 i.types[op].bitfield.disp32 = 0;
7996 i.types[op].bitfield.disp32s = 1;
7997 }
7998 }
7999 i.sib.index = i.index_reg->reg_num;
8000 set_rex_vrex (i.index_reg, REX_X, FALSE);
8001 }
8002
8003 default_seg = &ds;
8004
8005 if (i.base_reg == 0)
8006 {
8007 i.rm.mode = 0;
8008 if (!i.disp_operands)
8009 fake_zero_displacement = 1;
8010 if (i.index_reg == 0)
8011 {
8012 i386_operand_type newdisp;
8013
8014 gas_assert (!i.tm.opcode_modifier.sib);
8015 /* Operand is just <disp> */
8016 if (flag_code == CODE_64BIT)
8017 {
8018 		      /* In 64-bit mode RIP-relative addressing replaces
8019 			 the 32-bit absolute form, so absolute addressing
8020 			 has to be encoded by one of the redundant SIB
8021 			 forms.  */
8022 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8023 i.sib.base = NO_BASE_REGISTER;
8024 i.sib.index = NO_INDEX_REGISTER;
8025 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8026 }
8027 else if ((flag_code == CODE_16BIT)
8028 ^ (i.prefix[ADDR_PREFIX] != 0))
8029 {
8030 i.rm.regmem = NO_BASE_REGISTER_16;
8031 newdisp = disp16;
8032 }
8033 else
8034 {
8035 i.rm.regmem = NO_BASE_REGISTER;
8036 newdisp = disp32;
8037 }
8038 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8039 i.types[op] = operand_type_or (i.types[op], newdisp);
8040 }
8041 else if (!i.tm.opcode_modifier.sib)
8042 {
8043 /* !i.base_reg && i.index_reg */
8044 if (i.index_reg->reg_num == RegIZ)
8045 i.sib.index = NO_INDEX_REGISTER;
8046 else
8047 i.sib.index = i.index_reg->reg_num;
8048 i.sib.base = NO_BASE_REGISTER;
8049 i.sib.scale = i.log2_scale_factor;
8050 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8051 i.types[op].bitfield.disp8 = 0;
8052 i.types[op].bitfield.disp16 = 0;
8053 i.types[op].bitfield.disp64 = 0;
8054 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8055 {
8056 /* Must be 32 bit */
8057 i.types[op].bitfield.disp32 = 1;
8058 i.types[op].bitfield.disp32s = 0;
8059 }
8060 else
8061 {
8062 i.types[op].bitfield.disp32 = 0;
8063 i.types[op].bitfield.disp32s = 1;
8064 }
8065 if ((i.index_reg->reg_flags & RegRex) != 0)
8066 i.rex |= REX_X;
8067 }
8068 }
8069 /* RIP addressing for 64bit mode. */
8070 else if (i.base_reg->reg_num == RegIP)
8071 {
8072 gas_assert (!i.tm.opcode_modifier.sib);
8073 i.rm.regmem = NO_BASE_REGISTER;
8074 i.types[op].bitfield.disp8 = 0;
8075 i.types[op].bitfield.disp16 = 0;
8076 i.types[op].bitfield.disp32 = 0;
8077 i.types[op].bitfield.disp32s = 1;
8078 i.types[op].bitfield.disp64 = 0;
8079 i.flags[op] |= Operand_PCrel;
8080 if (! i.disp_operands)
8081 fake_zero_displacement = 1;
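	      /* For example, "mov foo(%rip), %rax" uses mode 00 with
		 regmem 101 and a 32-bit displacement; a bare "(%rip)"
		 operand gets the fake zero displacement added below.  */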
8082 }
8083 else if (i.base_reg->reg_type.bitfield.word)
8084 {
8085 gas_assert (!i.tm.opcode_modifier.sib);
8086 switch (i.base_reg->reg_num)
8087 {
8088 case 3: /* (%bx) */
8089 if (i.index_reg == 0)
8090 i.rm.regmem = 7;
8091 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8092 i.rm.regmem = i.index_reg->reg_num - 6;
8093 break;
8094 case 5: /* (%bp) */
8095 default_seg = &ss;
8096 if (i.index_reg == 0)
8097 {
8098 i.rm.regmem = 6;
8099 if (operand_type_check (i.types[op], disp) == 0)
8100 {
8101 /* fake (%bp) into 0(%bp) */
8102 i.types[op].bitfield.disp8 = 1;
8103 fake_zero_displacement = 1;
8104 }
8105 }
8106 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8107 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8108 break;
8109 default: /* (%si) -> 4 or (%di) -> 5 */
8110 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8111 }
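	      /* The cases above reproduce the 16-bit r/m table:
		 0 (%bx,%si), 1 (%bx,%di), 2 (%bp,%si), 3 (%bp,%di),
		 4 (%si), 5 (%di), 6 disp16 or disp(%bp), 7 (%bx).  */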
8112 i.rm.mode = mode_from_disp_size (i.types[op]);
8113 }
8114 else /* i.base_reg and 32/64 bit mode */
8115 {
8116 if (flag_code == CODE_64BIT
8117 && operand_type_check (i.types[op], disp))
8118 {
8119 i.types[op].bitfield.disp16 = 0;
8120 i.types[op].bitfield.disp64 = 0;
8121 if (i.prefix[ADDR_PREFIX] == 0)
8122 {
8123 i.types[op].bitfield.disp32 = 0;
8124 i.types[op].bitfield.disp32s = 1;
8125 }
8126 else
8127 {
8128 i.types[op].bitfield.disp32 = 1;
8129 i.types[op].bitfield.disp32s = 0;
8130 }
8131 }
8132
8133 if (!i.tm.opcode_modifier.sib)
8134 i.rm.regmem = i.base_reg->reg_num;
8135 if ((i.base_reg->reg_flags & RegRex) != 0)
8136 i.rex |= REX_B;
8137 i.sib.base = i.base_reg->reg_num;
8138 /* x86-64 ignores REX prefix bit here to avoid decoder
8139 complications. */
8140 if (!(i.base_reg->reg_flags & RegRex)
8141 && (i.base_reg->reg_num == EBP_REG_NUM
8142 || i.base_reg->reg_num == ESP_REG_NUM))
8143 default_seg = &ss;
8144 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8145 {
8146 fake_zero_displacement = 1;
8147 i.types[op].bitfield.disp8 = 1;
8148 }
8149 i.sib.scale = i.log2_scale_factor;
8150 if (i.index_reg == 0)
8151 {
8152 gas_assert (!i.tm.opcode_modifier.sib);
8153 /* <disp>(%esp) becomes two byte modrm with no index
8154 register. We've already stored the code for esp
8155 		     in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8156 Any base register besides %esp will not use the
8157 extra modrm byte. */
8158 i.sib.index = NO_INDEX_REGISTER;
8159 }
8160 else if (!i.tm.opcode_modifier.sib)
8161 {
8162 if (i.index_reg->reg_num == RegIZ)
8163 i.sib.index = NO_INDEX_REGISTER;
8164 else
8165 i.sib.index = i.index_reg->reg_num;
8166 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8167 if ((i.index_reg->reg_flags & RegRex) != 0)
8168 i.rex |= REX_X;
8169 }
8170
8171 if (i.disp_operands
8172 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8173 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8174 i.rm.mode = 0;
8175 else
8176 {
8177 if (!fake_zero_displacement
8178 && !i.disp_operands
8179 && i.disp_encoding)
8180 {
8181 fake_zero_displacement = 1;
8182 if (i.disp_encoding == disp_encoding_8bit)
8183 i.types[op].bitfield.disp8 = 1;
8184 else
8185 i.types[op].bitfield.disp32 = 1;
8186 }
8187 i.rm.mode = mode_from_disp_size (i.types[op]);
8188 }
8189 }
8190
8191 if (fake_zero_displacement)
8192 {
8193 /* Fakes a zero displacement assuming that i.types[op]
8194 holds the correct displacement size. */
8195 expressionS *exp;
8196
8197 gas_assert (i.op[op].disps == 0);
8198 exp = &disp_expressions[i.disp_operands++];
8199 i.op[op].disps = exp;
8200 exp->X_op = O_constant;
8201 exp->X_add_number = 0;
8202 exp->X_add_symbol = (symbolS *) 0;
8203 exp->X_op_symbol = (symbolS *) 0;
8204 }
8205
8206 mem = op;
8207 }
8208 else
8209 mem = ~0;
8210
8211 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8212 {
8213 if (operand_type_check (i.types[0], imm))
8214 i.vex.register_specifier = NULL;
8215 else
8216 {
8217 /* VEX.vvvv encodes one of the sources when the first
8218 operand is not an immediate. */
8219 if (i.tm.opcode_modifier.vexw == VEXW0)
8220 i.vex.register_specifier = i.op[0].regs;
8221 else
8222 i.vex.register_specifier = i.op[1].regs;
8223 }
8224
8225 /* Destination is a XMM register encoded in the ModRM.reg
8226 and VEX.R bit. */
8227 i.rm.reg = i.op[2].regs->reg_num;
8228 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8229 i.rex |= REX_R;
8230
8231 /* ModRM.rm and VEX.B encodes the other source. */
8232 if (!i.mem_operands)
8233 {
8234 i.rm.mode = 3;
8235
8236 if (i.tm.opcode_modifier.vexw == VEXW0)
8237 i.rm.regmem = i.op[1].regs->reg_num;
8238 else
8239 i.rm.regmem = i.op[0].regs->reg_num;
8240
8241 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8242 i.rex |= REX_B;
8243 }
8244 }
8245 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8246 {
8247 i.vex.register_specifier = i.op[2].regs;
8248 if (!i.mem_operands)
8249 {
8250 i.rm.mode = 3;
8251 i.rm.regmem = i.op[1].regs->reg_num;
8252 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8253 i.rex |= REX_B;
8254 }
8255 }
8256 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8257 (if any) based on i.tm.extension_opcode. Again, we must be
8258 careful to make sure that segment/control/debug/test/MMX
8259 registers are coded into the i.rm.reg field. */
8260 else if (i.reg_operands)
8261 {
8262 unsigned int op;
8263 unsigned int vex_reg = ~0;
8264
8265 for (op = 0; op < i.operands; op++)
8266 {
8267 if (i.types[op].bitfield.class == Reg
8268 || i.types[op].bitfield.class == RegBND
8269 || i.types[op].bitfield.class == RegMask
8270 || i.types[op].bitfield.class == SReg
8271 || i.types[op].bitfield.class == RegCR
8272 || i.types[op].bitfield.class == RegDR
8273 || i.types[op].bitfield.class == RegTR)
8274 break;
8275 if (i.types[op].bitfield.class == RegSIMD)
8276 {
8277 if (i.types[op].bitfield.zmmword)
8278 i.has_regzmm = TRUE;
8279 else if (i.types[op].bitfield.ymmword)
8280 i.has_regymm = TRUE;
8281 else
8282 i.has_regxmm = TRUE;
8283 break;
8284 }
8285 if (i.types[op].bitfield.class == RegMMX)
8286 {
8287 i.has_regmmx = TRUE;
8288 break;
8289 }
8290 }
8291
8292 if (vex_3_sources)
8293 op = dest;
8294 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8295 {
8296 /* For instructions with VexNDS, the register-only
8297 source operand is encoded in VEX prefix. */
8298 gas_assert (mem != (unsigned int) ~0);
8299
8300 if (op > mem)
8301 {
8302 vex_reg = op++;
8303 gas_assert (op < i.operands);
8304 }
8305 else
8306 {
8307 /* Check register-only source operand when two source
8308 operands are swapped. */
8309 if (!i.tm.operand_types[op].bitfield.baseindex
8310 && i.tm.operand_types[op + 1].bitfield.baseindex)
8311 {
8312 vex_reg = op;
8313 op += 2;
8314 gas_assert (mem == (vex_reg + 1)
8315 && op < i.operands);
8316 }
8317 else
8318 {
8319 vex_reg = op + 1;
8320 gas_assert (vex_reg < i.operands);
8321 }
8322 }
8323 }
8324 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8325 {
8326 /* For instructions with VexNDD, the register destination
8327 is encoded in VEX prefix. */
8328 if (i.mem_operands == 0)
8329 {
8330 /* There is no memory operand. */
8331 gas_assert ((op + 2) == i.operands);
8332 vex_reg = op + 1;
8333 }
8334 else
8335 {
8336 /* There are only 2 non-immediate operands. */
8337 gas_assert (op < i.imm_operands + 2
8338 && i.operands == i.imm_operands + 2);
8339 vex_reg = i.imm_operands + 1;
8340 }
8341 }
8342 else
8343 gas_assert (op < i.operands);
8344
8345 if (vex_reg != (unsigned int) ~0)
8346 {
8347 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8348
8349 if ((type->bitfield.class != Reg
8350 || (!type->bitfield.dword && !type->bitfield.qword))
8351 && type->bitfield.class != RegSIMD
8352 && !operand_type_equal (type, &regmask))
8353 abort ();
8354
8355 i.vex.register_specifier = i.op[vex_reg].regs;
8356 }
8357
8358 /* Don't set OP operand twice. */
8359 if (vex_reg != op)
8360 {
8361 /* If there is an extension opcode to put here, the
8362 register number must be put into the regmem field. */
8363 if (i.tm.extension_opcode != None)
8364 {
8365 i.rm.regmem = i.op[op].regs->reg_num;
8366 set_rex_vrex (i.op[op].regs, REX_B,
8367 i.tm.opcode_modifier.sse2avx);
8368 }
8369 else
8370 {
8371 i.rm.reg = i.op[op].regs->reg_num;
8372 set_rex_vrex (i.op[op].regs, REX_R,
8373 i.tm.opcode_modifier.sse2avx);
8374 }
8375 }
8376
8377 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8378 must set it to 3 to indicate this is a register operand
8379 in the regmem field. */
8380 if (!i.mem_operands)
8381 i.rm.mode = 3;
8382 }
8383
8384 /* Fill in i.rm.reg field with extension opcode (if any). */
8385 if (i.tm.extension_opcode != None)
8386 i.rm.reg = i.tm.extension_opcode;
8387 }
8388 return default_seg;
8389 }
8390
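/* Return CODE16 if an operand-size prefix actually flips the branch
   displacement between 16 and 32 bits for this template; REX.W pins
   the displacement to 32 bits, so no flip happens then.  */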
8391 static unsigned int
8392 flip_code16 (unsigned int code16)
8393 {
8394 gas_assert (i.tm.operands == 1);
8395
8396 return !(i.prefix[REX_PREFIX] & REX_W)
8397 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8398 || i.tm.operand_types[0].bitfield.disp32s
8399 : i.tm.operand_types[0].bitfield.disp16)
8400 ? CODE16 : 0;
8401 }
8402
8403 static void
8404 output_branch (void)
8405 {
8406 char *p;
8407 int size;
8408 int code16;
8409 int prefix;
8410 relax_substateT subtype;
8411 symbolS *sym;
8412 offsetT off;
8413
8414 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8415 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8416
8417 prefix = 0;
8418 if (i.prefix[DATA_PREFIX] != 0)
8419 {
8420 prefix = 1;
8421 i.prefixes -= 1;
8422 code16 ^= flip_code16(code16);
8423 }
8424 /* Pentium4 branch hints. */
8425 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8426 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8427 {
8428 prefix++;
8429 i.prefixes--;
8430 }
8431 if (i.prefix[REX_PREFIX] != 0)
8432 {
8433 prefix++;
8434 i.prefixes--;
8435 }
8436
8437 /* BND prefixed jump. */
8438 if (i.prefix[BND_PREFIX] != 0)
8439 {
8440 prefix++;
8441 i.prefixes--;
8442 }
8443
8444 if (i.prefixes != 0)
8445 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8446
8447   /* It's always a symbol; end the frag & set up for relax.
8448 Make sure there is enough room in this frag for the largest
8449 instruction we may generate in md_convert_frag. This is 2
8450 bytes for the opcode and room for the prefix and largest
8451 displacement. */
8452 frag_grow (prefix + 2 + 4);
8453 /* Prefix and 1 opcode byte go in fr_fix. */
8454 p = frag_more (prefix + 1);
8455 if (i.prefix[DATA_PREFIX] != 0)
8456 *p++ = DATA_PREFIX_OPCODE;
8457 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8458 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8459 *p++ = i.prefix[SEG_PREFIX];
8460 if (i.prefix[BND_PREFIX] != 0)
8461 *p++ = BND_PREFIX_OPCODE;
8462 if (i.prefix[REX_PREFIX] != 0)
8463 *p++ = i.prefix[REX_PREFIX];
8464 *p = i.tm.base_opcode;
8465
8466 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8467 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8468 else if (cpu_arch_flags.bitfield.cpui386)
8469 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8470 else
8471 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8472 subtype |= code16;
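  /* For example, a "je target" comes through here as the short form
     0x74 with an 8-bit displacement; if the target turns out to be too
     far away, md_convert_frag relaxes it to 0x0f 0x84 with a 32-bit
     displacement (or a 16-bit one with CODE16).  */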
8473
8474 sym = i.op[0].disps->X_add_symbol;
8475 off = i.op[0].disps->X_add_number;
8476
8477 if (i.op[0].disps->X_op != O_constant
8478 && i.op[0].disps->X_op != O_symbol)
8479 {
8480 /* Handle complex expressions. */
8481 sym = make_expr_symbol (i.op[0].disps);
8482 off = 0;
8483 }
8484
8485 /* 1 possible extra opcode + 4 byte displacement go in var part.
8486 Pass reloc in fr_var. */
8487 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8488 }
8489
8490 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8491 /* Return TRUE iff PLT32 relocation should be used for branching to
8492 symbol S. */
8493
8494 static bfd_boolean
8495 need_plt32_p (symbolS *s)
8496 {
8497 /* PLT32 relocation is ELF only. */
8498 if (!IS_ELF)
8499 return FALSE;
8500
8501 #ifdef TE_SOLARIS
8502 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8503 krtld support it. */
8504 return FALSE;
8505 #endif
8506
8507 /* Since there is no need to prepare for PLT branch on x86-64, we
8508 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8509 be used as a marker for 32-bit PC-relative branches. */
8510 if (!object_64bit)
8511 return FALSE;
8512
8513   /* Weak or undefined symbols need a PLT32 relocation.  */
8514 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8515 return TRUE;
8516
8517   /* A non-global symbol doesn't need a PLT32 relocation.  */
8518 if (! S_IS_EXTERNAL (s))
8519 return FALSE;
8520
8521   /* Other global symbols need a PLT32 relocation.  NB: Symbols with
8522      non-default visibility are treated as normal global symbols so
8523      that PLT32 relocation can be used as a marker for 32-bit
8524      PC-relative branches.  This is useful for linker relaxation.  */
8525 return TRUE;
8526 }
8527 #endif
8528
8529 static void
8530 output_jump (void)
8531 {
8532 char *p;
8533 int size;
8534 fixS *fixP;
8535 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8536
8537 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8538 {
8539 /* This is a loop or jecxz type instruction. */
8540 size = 1;
8541 if (i.prefix[ADDR_PREFIX] != 0)
8542 {
8543 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8544 i.prefixes -= 1;
8545 }
8546 /* Pentium4 branch hints. */
8547 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8548 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8549 {
8550 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8551 i.prefixes--;
8552 }
8553 }
8554 else
8555 {
8556 int code16;
8557
8558 code16 = 0;
8559 if (flag_code == CODE_16BIT)
8560 code16 = CODE16;
8561
8562 if (i.prefix[DATA_PREFIX] != 0)
8563 {
8564 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8565 i.prefixes -= 1;
8566 code16 ^= flip_code16(code16);
8567 }
8568
8569 size = 4;
8570 if (code16)
8571 size = 2;
8572 }
8573
8574 /* BND prefixed jump. */
8575 if (i.prefix[BND_PREFIX] != 0)
8576 {
8577 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8578 i.prefixes -= 1;
8579 }
8580
8581 if (i.prefix[REX_PREFIX] != 0)
8582 {
8583 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8584 i.prefixes -= 1;
8585 }
8586
8587 if (i.prefixes != 0)
8588 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8589
8590 p = frag_more (i.tm.opcode_length + size);
8591 switch (i.tm.opcode_length)
8592 {
8593 case 2:
8594 *p++ = i.tm.base_opcode >> 8;
8595 /* Fall through. */
8596 case 1:
8597 *p++ = i.tm.base_opcode;
8598 break;
8599 default:
8600 abort ();
8601 }
8602
8603 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8604 if (size == 4
8605 && jump_reloc == NO_RELOC
8606 && need_plt32_p (i.op[0].disps->X_add_symbol))
8607 jump_reloc = BFD_RELOC_X86_64_PLT32;
8608 #endif
8609
8610 jump_reloc = reloc (size, 1, 1, jump_reloc);
8611
8612 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8613 i.op[0].disps, 1, jump_reloc);
8614
8615 /* All jumps handled here are signed, but don't use a signed limit
8616 check for 32 and 16 bit jumps as we want to allow wrap around at
8617 4G and 64k respectively. */
8618 if (size == 1)
8619 fixP->fx_signed = 1;
8620 }
8621
8622 static void
8623 output_interseg_jump (void)
8624 {
8625 char *p;
8626 int size;
8627 int prefix;
8628 int code16;
8629
8630 code16 = 0;
8631 if (flag_code == CODE_16BIT)
8632 code16 = CODE16;
8633
8634 prefix = 0;
8635 if (i.prefix[DATA_PREFIX] != 0)
8636 {
8637 prefix = 1;
8638 i.prefixes -= 1;
8639 code16 ^= CODE16;
8640 }
8641
8642 gas_assert (!i.prefix[REX_PREFIX]);
8643
8644 size = 4;
8645 if (code16)
8646 size = 2;
8647
8648 if (i.prefixes != 0)
8649 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8650
8651 /* 1 opcode; 2 segment; offset */
8652 p = frag_more (prefix + 1 + 2 + size);
8653
8654 if (i.prefix[DATA_PREFIX] != 0)
8655 *p++ = DATA_PREFIX_OPCODE;
8656
8657 if (i.prefix[REX_PREFIX] != 0)
8658 *p++ = i.prefix[REX_PREFIX];
8659
8660 *p++ = i.tm.base_opcode;
8661 if (i.op[1].imms->X_op == O_constant)
8662 {
8663 offsetT n = i.op[1].imms->X_add_number;
8664
8665 if (size == 2
8666 && !fits_in_unsigned_word (n)
8667 && !fits_in_signed_word (n))
8668 {
8669 as_bad (_("16-bit jump out of range"));
8670 return;
8671 }
8672 md_number_to_chars (p, n, size);
8673 }
8674 else
8675 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8676 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8677 if (i.op[0].imms->X_op != O_constant)
8678 as_bad (_("can't handle non absolute segment in `%s'"),
8679 i.tm.name);
8680 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8681 }
8682
8683 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8684 void
8685 x86_cleanup (void)
8686 {
8687 char *p;
8688 asection *seg = now_seg;
8689 subsegT subseg = now_subseg;
8690 asection *sec;
8691 unsigned int alignment, align_size_1;
8692 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8693 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8694 unsigned int padding;
8695
8696 if (!IS_ELF || !x86_used_note)
8697 return;
8698
8699 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8700
8701 /* The .note.gnu.property section layout:
8702
8703 Field Length Contents
8704 ---- ---- ----
8705 n_namsz 4 4
8706 n_descsz 4 The note descriptor size
8707 n_type 4 NT_GNU_PROPERTY_TYPE_0
8708 n_name 4 "GNU"
8709 n_desc n_descsz The program property array
8710 .... .... ....
8711 */
8712
8713 /* Create the .note.gnu.property section. */
8714 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8715 bfd_set_section_flags (sec,
8716 (SEC_ALLOC
8717 | SEC_LOAD
8718 | SEC_DATA
8719 | SEC_HAS_CONTENTS
8720 | SEC_READONLY));
8721
8722 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8723 {
8724 align_size_1 = 7;
8725 alignment = 3;
8726 }
8727 else
8728 {
8729 align_size_1 = 3;
8730 alignment = 2;
8731 }
8732
8733 bfd_set_section_alignment (sec, alignment);
8734 elf_section_type (sec) = SHT_NOTE;
8735
8736 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8737 + 4-byte data */
8738 isa_1_descsz_raw = 4 + 4 + 4;
8739 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8740 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8741
8742 feature_2_descsz_raw = isa_1_descsz;
8743 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8744 + 4-byte data */
8745 feature_2_descsz_raw += 4 + 4 + 4;
8746 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8747 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8748 & ~align_size_1);
8749
8750 descsz = feature_2_descsz;
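  /* With ELFCLASS64 alignment (8 bytes) this works out to descsz 32
     (two 16-byte properties); with ELFCLASS32 (4 bytes) to descsz 24
     (two 12-byte properties).  */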
8751 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8752 p = frag_more (4 + 4 + 4 + 4 + descsz);
8753
8754 /* Write n_namsz. */
8755 md_number_to_chars (p, (valueT) 4, 4);
8756
8757 /* Write n_descsz. */
8758 md_number_to_chars (p + 4, (valueT) descsz, 4);
8759
8760 /* Write n_type. */
8761 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8762
8763 /* Write n_name. */
8764 memcpy (p + 4 * 3, "GNU", 4);
8765
8766 /* Write 4-byte type. */
8767 md_number_to_chars (p + 4 * 4,
8768 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8769
8770 /* Write 4-byte data size. */
8771 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8772
8773 /* Write 4-byte data. */
8774 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8775
8776 /* Zero out paddings. */
8777 padding = isa_1_descsz - isa_1_descsz_raw;
8778 if (padding)
8779 memset (p + 4 * 7, 0, padding);
8780
8781 /* Write 4-byte type. */
8782 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8783 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8784
8785 /* Write 4-byte data size. */
8786 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8787
8788 /* Write 4-byte data. */
8789 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8790 (valueT) x86_feature_2_used, 4);
8791
8792 /* Zero out paddings. */
8793 padding = feature_2_descsz - feature_2_descsz_raw;
8794 if (padding)
8795 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8796
8797 /* We probably can't restore the current segment, for there likely
8798 isn't one yet... */
8799 if (seg && subseg)
8800 subseg_set (seg, subseg);
8801 }
8802 #endif
8803
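/* Return the number of instruction bytes emitted so far: everything
   from START_OFF in START_FRAG up to FRAG_NOW_PTR in the current frag,
   including the fixed parts of any frags in between.  */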
8804 static unsigned int
8805 encoding_length (const fragS *start_frag, offsetT start_off,
8806 const char *frag_now_ptr)
8807 {
8808 unsigned int len = 0;
8809
8810 if (start_frag != frag_now)
8811 {
8812 const fragS *fr = start_frag;
8813
8814 do {
8815 len += fr->fr_fix;
8816 fr = fr->fr_next;
8817 } while (fr && fr != frag_now);
8818 }
8819
8820 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8821 }
8822
8823 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8824 be macro-fused with conditional jumps.
8825    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP-relative address,
8826    or has one of the following formats:
8827
8828 cmp m, imm
8829 add m, imm
8830 sub m, imm
8831 test m, imm
8832 and m, imm
8833 inc m
8834 dec m
8835
8836    it cannot be fused.  */
8837
8838 static int
8839 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8840 {
8841 /* No RIP address. */
8842 if (i.base_reg && i.base_reg->reg_num == RegIP)
8843 return 0;
8844
8845 /* No VEX/EVEX encoding. */
8846 if (is_any_vex_encoding (&i.tm))
8847 return 0;
8848
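  /* In the checks below, (base_opcode | 3) == 0x83 matches the whole
     immediate group 1 (opcodes 0x80..0x83); the extension opcode then
     picks add (/0), and (/4), sub (/5) or cmp (/7).  */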
8849 /* add, sub without add/sub m, imm. */
8850 if (i.tm.base_opcode <= 5
8851 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8852 || ((i.tm.base_opcode | 3) == 0x83
8853 && (i.tm.extension_opcode == 0x5
8854 || i.tm.extension_opcode == 0x0)))
8855 {
8856 *mf_cmp_p = mf_cmp_alu_cmp;
8857 return !(i.mem_operands && i.imm_operands);
8858 }
8859
8860 /* and without and m, imm. */
8861 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8862 || ((i.tm.base_opcode | 3) == 0x83
8863 && i.tm.extension_opcode == 0x4))
8864 {
8865 *mf_cmp_p = mf_cmp_test_and;
8866 return !(i.mem_operands && i.imm_operands);
8867 }
8868
8869   /* test without test m, imm.  */
8870 if ((i.tm.base_opcode | 1) == 0x85
8871 || (i.tm.base_opcode | 1) == 0xa9
8872 || ((i.tm.base_opcode | 1) == 0xf7
8873 && i.tm.extension_opcode == 0))
8874 {
8875 *mf_cmp_p = mf_cmp_test_and;
8876 return !(i.mem_operands && i.imm_operands);
8877 }
8878
8879 /* cmp without cmp m, imm. */
8880 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8881 || ((i.tm.base_opcode | 3) == 0x83
8882 && (i.tm.extension_opcode == 0x7)))
8883 {
8884 *mf_cmp_p = mf_cmp_alu_cmp;
8885 return !(i.mem_operands && i.imm_operands);
8886 }
8887
8888 /* inc, dec without inc/dec m. */
8889 if ((i.tm.cpu_flags.bitfield.cpuno64
8890 && (i.tm.base_opcode | 0xf) == 0x4f)
8891 || ((i.tm.base_opcode | 1) == 0xff
8892 && i.tm.extension_opcode <= 0x1))
8893 {
8894 *mf_cmp_p = mf_cmp_incdec;
8895 return !i.mem_operands;
8896 }
8897
8898 return 0;
8899 }
8900
8901 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8902
8903 static int
8904 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
8905 {
8906   /* NB: This does not work with COND_JUMP86 without i386.  */
8907 if (!align_branch_power
8908 || now_seg == absolute_section
8909 || !cpu_arch_flags.bitfield.cpui386
8910 || !(align_branch & align_branch_fused_bit))
8911 return 0;
8912
8913 if (maybe_fused_with_jcc_p (mf_cmp_p))
8914 {
8915 if (last_insn.kind == last_insn_other
8916 || last_insn.seg != now_seg)
8917 return 1;
8918 if (flag_debug)
8919 as_warn_where (last_insn.file, last_insn.line,
8920 _("`%s` skips -malign-branch-boundary on `%s`"),
8921 last_insn.name, i.tm.name);
8922 }
8923
8924 return 0;
8925 }
8926
8927 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8928
8929 static int
8930 add_branch_prefix_frag_p (void)
8931 {
8932   /* NB: This does not work with COND_JUMP86 without i386.  Don't add
8933      a prefix to PadLock instructions since they include prefixes in
8934      the opcode.  */
8934 if (!align_branch_power
8935 || !align_branch_prefix_size
8936 || now_seg == absolute_section
8937 || i.tm.cpu_flags.bitfield.cpupadlock
8938 || !cpu_arch_flags.bitfield.cpui386)
8939 return 0;
8940
8941   /* Don't add a prefix if the instruction is itself a prefix, or if
8942      there is no operand, in case the segment prefix is special.  */
8943 if (!i.operands || i.tm.opcode_modifier.isprefix)
8944 return 0;
8945
8946 if (last_insn.kind == last_insn_other
8947 || last_insn.seg != now_seg)
8948 return 1;
8949
8950 if (flag_debug)
8951 as_warn_where (last_insn.file, last_insn.line,
8952 _("`%s` skips -malign-branch-boundary on `%s`"),
8953 last_insn.name, i.tm.name);
8954
8955 return 0;
8956 }
8957
8958 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8959
8960 static int
8961 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
8962 enum mf_jcc_kind *mf_jcc_p)
8963 {
8964 int add_padding;
8965
8966   /* NB: This does not work with COND_JUMP86 without i386.  */
8967 if (!align_branch_power
8968 || now_seg == absolute_section
8969 || !cpu_arch_flags.bitfield.cpui386)
8970 return 0;
8971
8972 add_padding = 0;
8973
8974 /* Check for jcc and direct jmp. */
8975 if (i.tm.opcode_modifier.jump == JUMP)
8976 {
8977 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8978 {
8979 *branch_p = align_branch_jmp;
8980 add_padding = align_branch & align_branch_jmp_bit;
8981 }
8982 else
8983 {
8984 	  /* Because J<cc> and JN<cc> share the same group in the
8985 	     macro-fusible table, ignore the lowest bit.  */
8986 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
8987 *branch_p = align_branch_jcc;
8988 if ((align_branch & align_branch_jcc_bit))
8989 add_padding = 1;
8990 }
8991 }
8992 else if (is_any_vex_encoding (&i.tm))
8993 return 0;
8994 else if ((i.tm.base_opcode | 1) == 0xc3)
8995 {
8996 /* Near ret. */
8997 *branch_p = align_branch_ret;
8998 if ((align_branch & align_branch_ret_bit))
8999 add_padding = 1;
9000 }
9001 else
9002 {
9003 /* Check for indirect jmp, direct and indirect calls. */
9004 if (i.tm.base_opcode == 0xe8)
9005 {
9006 /* Direct call. */
9007 *branch_p = align_branch_call;
9008 if ((align_branch & align_branch_call_bit))
9009 add_padding = 1;
9010 }
9011 else if (i.tm.base_opcode == 0xff
9012 && (i.tm.extension_opcode == 2
9013 || i.tm.extension_opcode == 4))
9014 {
9015 /* Indirect call and jmp. */
9016 *branch_p = align_branch_indirect;
9017 if ((align_branch & align_branch_indirect_bit))
9018 add_padding = 1;
9019 }
9020
9021 if (add_padding
9022 && i.disp_operands
9023 && tls_get_addr
9024 && (i.op[0].disps->X_op == O_symbol
9025 || (i.op[0].disps->X_op == O_subtract
9026 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9027 {
9028 symbolS *s = i.op[0].disps->X_add_symbol;
9029 /* No padding to call to global or undefined tls_get_addr. */
9030 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9031 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9032 return 0;
9033 }
9034 }
9035
9036 if (add_padding
9037 && last_insn.kind != last_insn_other
9038 && last_insn.seg == now_seg)
9039 {
9040 if (flag_debug)
9041 as_warn_where (last_insn.file, last_insn.line,
9042 _("`%s` skips -malign-branch-boundary on `%s`"),
9043 last_insn.name, i.tm.name);
9044 return 0;
9045 }
9046
9047 return add_padding;
9048 }
9049
9050 static void
9051 output_insn (void)
9052 {
9053 fragS *insn_start_frag;
9054 offsetT insn_start_off;
9055 fragS *fragP = NULL;
9056 enum align_branch_kind branch = align_branch_none;
9057   /* The initializer is arbitrary, just to avoid an uninitialized-use
9058      error; it's actually either assigned in add_branch_padding_frag_p
9059      or never used.  */
9060 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9061
9062 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9063 if (IS_ELF && x86_used_note)
9064 {
9065 if (i.tm.cpu_flags.bitfield.cpucmov)
9066 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9067 if (i.tm.cpu_flags.bitfield.cpusse)
9068 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9069 if (i.tm.cpu_flags.bitfield.cpusse2)
9070 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9071 if (i.tm.cpu_flags.bitfield.cpusse3)
9072 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9073 if (i.tm.cpu_flags.bitfield.cpussse3)
9074 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9075 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9076 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9077 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9078 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9079 if (i.tm.cpu_flags.bitfield.cpuavx)
9080 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9081 if (i.tm.cpu_flags.bitfield.cpuavx2)
9082 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9083 if (i.tm.cpu_flags.bitfield.cpufma)
9084 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9085 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9086 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9087 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9088 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9089 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9090 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9091 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9092 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9093 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9094 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9095 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9096 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9097 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9098 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9099 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9100 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9101 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9102 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9103 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9104 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9105 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9106 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9107 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9108 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9109 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9110 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9111 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9112 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
9113 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9114 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
9115
9116 if (i.tm.cpu_flags.bitfield.cpu8087
9117 || i.tm.cpu_flags.bitfield.cpu287
9118 || i.tm.cpu_flags.bitfield.cpu387
9119 || i.tm.cpu_flags.bitfield.cpu687
9120 || i.tm.cpu_flags.bitfield.cpufisttp)
9121 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9122 if (i.has_regmmx
9123 || i.tm.base_opcode == 0xf77 /* emms */
9124 || i.tm.base_opcode == 0xf0e /* femms */
9125 || i.tm.base_opcode == 0xf2a /* cvtpi2ps */
9126 || i.tm.base_opcode == 0x660f2a /* cvtpi2pd */)
9127 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9128 if (i.has_regxmm)
9129 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9130 if (i.has_regymm)
9131 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9132 if (i.has_regzmm)
9133 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9134 if (i.tm.cpu_flags.bitfield.cpufxsr)
9135 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9136 if (i.tm.cpu_flags.bitfield.cpuxsave)
9137 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9138 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9139 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9140 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9141 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9142 }
9143 #endif
9144
9145 /* Tie dwarf2 debug info to the address at the start of the insn.
9146 We can't do this after the insn has been output as the current
9147      frag may have been closed off, e.g. by frag_var.  */
9148 dwarf2_emit_insn (0);
9149
9150 insn_start_frag = frag_now;
9151 insn_start_off = frag_now_fix ();
9152
9153 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9154 {
9155 char *p;
9156 /* Branch can be 8 bytes. Leave some room for prefixes. */
9157 unsigned int max_branch_padding_size = 14;
9158
9159 /* Align section to boundary. */
9160 record_alignment (now_seg, align_branch_power);
9161
9162 /* Make room for padding. */
9163 frag_grow (max_branch_padding_size);
9164
9165 /* Start of the padding. */
9166 p = frag_more (0);
9167
9168 fragP = frag_now;
9169
9170 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9171 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9172 NULL, 0, p);
9173
9174 fragP->tc_frag_data.mf_type = mf_jcc;
9175 fragP->tc_frag_data.branch_type = branch;
9176 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9177 }
9178
9179 /* Output jumps. */
9180 if (i.tm.opcode_modifier.jump == JUMP)
9181 output_branch ();
9182 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9183 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9184 output_jump ();
9185 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9186 output_interseg_jump ();
9187 else
9188 {
9189 /* Output normal instructions here. */
9190 char *p;
9191 unsigned char *q;
9192 unsigned int j;
9193 unsigned int prefix;
9194 enum mf_cmp_kind mf_cmp;
9195
9196 if (avoid_fence
9197 && (i.tm.base_opcode == 0xfaee8
9198 || i.tm.base_opcode == 0xfaef0
9199 || i.tm.base_opcode == 0xfaef8))
9200 {
9201 /* Encode lfence, mfence, and sfence as
9202 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9203 offsetT val = 0x240483f0ULL;
9204 p = frag_more (5);
9205 md_number_to_chars (p, val, 5);
9206 return;
9207 }
9208
9209       /* Some processors fail on the LOCK prefix.  This option makes
9210 	 the assembler ignore the LOCK prefix and serves as a workaround.  */
9211 if (omit_lock_prefix)
9212 {
9213 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9214 return;
9215 i.prefix[LOCK_PREFIX] = 0;
9216 }
9217
9218 if (branch)
9219 /* Skip if this is a branch. */
9220 ;
9221 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9222 {
9223 /* Make room for padding. */
9224 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9225 p = frag_more (0);
9226
9227 fragP = frag_now;
9228
9229 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9230 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9231 NULL, 0, p);
9232
9233 fragP->tc_frag_data.mf_type = mf_cmp;
9234 fragP->tc_frag_data.branch_type = align_branch_fused;
9235 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9236 }
9237 else if (add_branch_prefix_frag_p ())
9238 {
9239 unsigned int max_prefix_size = align_branch_prefix_size;
9240
9241 /* Make room for padding. */
9242 frag_grow (max_prefix_size);
9243 p = frag_more (0);
9244
9245 fragP = frag_now;
9246
9247 frag_var (rs_machine_dependent, max_prefix_size, 0,
9248 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9249 NULL, 0, p);
9250
9251 fragP->tc_frag_data.max_bytes = max_prefix_size;
9252 }
9253
9254 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9255 don't need the explicit prefix. */
9256 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9257 {
9258 switch (i.tm.opcode_length)
9259 {
9260 case 3:
9261 if (i.tm.base_opcode & 0xff000000)
9262 {
9263 prefix = (i.tm.base_opcode >> 24) & 0xff;
9264 if (!i.tm.cpu_flags.bitfield.cpupadlock
9265 || prefix != REPE_PREFIX_OPCODE
9266 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9267 add_prefix (prefix);
9268 }
9269 break;
9270 case 2:
9271 if ((i.tm.base_opcode & 0xff0000) != 0)
9272 {
9273 prefix = (i.tm.base_opcode >> 16) & 0xff;
9274 add_prefix (prefix);
9275 }
9276 break;
9277 case 1:
9278 break;
9279 case 0:
9280 /* Check for pseudo prefixes. */
9281 as_bad_where (insn_start_frag->fr_file,
9282 insn_start_frag->fr_line,
9283 _("pseudo prefix without instruction"));
9284 return;
9285 default:
9286 abort ();
9287 }
9288
9289 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9290 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9291 R_X86_64_GOTTPOFF relocation so that linker can safely
9292 perform IE->LE optimization. A dummy REX_OPCODE prefix
9293 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9294 relocation for GDesc -> IE/LE optimization. */
9295 if (x86_elf_abi == X86_64_X32_ABI
9296 && i.operands == 2
9297 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9298 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9299 && i.prefix[REX_PREFIX] == 0)
9300 add_prefix (REX_OPCODE);
9301 #endif
9302
9303 /* The prefix bytes. */
9304 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9305 if (*q)
9306 FRAG_APPEND_1_CHAR (*q);
9307 }
9308 else
9309 {
9310 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9311 if (*q)
9312 switch (j)
9313 {
9314 case SEG_PREFIX:
9315 case ADDR_PREFIX:
9316 FRAG_APPEND_1_CHAR (*q);
9317 break;
9318 default:
9319 /* There should be no other prefixes for instructions
9320 with VEX prefix. */
9321 abort ();
9322 }
9323
9324 /* For EVEX instructions i.vrex should become 0 after
9325 build_evex_prefix. For VEX instructions upper 16 registers
9326 aren't available, so VREX should be 0. */
9327 if (i.vrex)
9328 abort ();
9329 /* Now the VEX prefix. */
9330 p = frag_more (i.vex.length);
9331 for (j = 0; j < i.vex.length; j++)
9332 p[j] = i.vex.bytes[j];
9333 }
9334
9335 /* Now the opcode; be careful about word order here! */
9336 if (i.tm.opcode_length == 1)
9337 {
9338 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9339 }
9340 else
9341 {
9342 switch (i.tm.opcode_length)
9343 {
9344 case 4:
9345 p = frag_more (4);
9346 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9347 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9348 break;
9349 case 3:
9350 p = frag_more (3);
9351 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9352 break;
9353 case 2:
9354 p = frag_more (2);
9355 break;
9356 default:
9357 abort ();
9358 break;
9359 }
9360
9361 /* Put out high byte first: can't use md_number_to_chars! */
9362 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9363 *p = i.tm.base_opcode & 0xff;
9364 }
9365
9366 /* Now the modrm byte and sib byte (if present). */
9367 if (i.tm.opcode_modifier.modrm)
9368 {
9369 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
9370 | i.rm.reg << 3
9371 | i.rm.mode << 6));
9372 /* If i.rm.regmem == ESP (4)
9373 && i.rm.mode != (Register mode)
9374 && not 16 bit
9375 ==> need second modrm byte. */
9376 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9377 && i.rm.mode != 3
9378 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9379 FRAG_APPEND_1_CHAR ((i.sib.base << 0
9380 | i.sib.index << 3
9381 | i.sib.scale << 6));
9382 }
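      /* As a concrete example, "movl %eax, (%ebx,%esi,4)" emits opcode
	 0x89, ModRM 0x04 (mode 00, reg 000 = %eax, regmem 100 = SIB
	 follows) and SIB 0xb3 (scale 10 = *4, index 110 = %esi,
	 base 011 = %ebx).  */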
9383
9384 if (i.disp_operands)
9385 output_disp (insn_start_frag, insn_start_off);
9386
9387 if (i.imm_operands)
9388 output_imm (insn_start_frag, insn_start_off);
9389
9390       /*
9391        * frag_now_fix () returns plain abs_section_offset when we're in
9392        * the absolute section, and abs_section_offset does not get
9393        * updated as data gets added to the frag; that would break the
9394        * logic below.
9395        */
9395 if (now_seg != absolute_section)
9396 {
9397 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9398 if (j > 15)
9399 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9400 j);
9401 else if (fragP)
9402 {
9403 /* NB: Don't add prefix with GOTPC relocation since
9404 output_disp() above depends on the fixed encoding
9405 length. Can't add prefix with TLS relocation since
9406 it breaks TLS linker optimization. */
9407 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9408 /* Prefix count on the current instruction. */
9409 unsigned int count = i.vex.length;
9410 unsigned int k;
9411 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9412 /* REX byte is encoded in VEX/EVEX prefix. */
9413 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9414 count++;
9415
9416 /* Count prefixes for extended opcode maps. */
9417 if (!i.vex.length)
9418 switch (i.tm.opcode_length)
9419 {
9420 case 3:
9421 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9422 {
9423 count++;
9424 switch ((i.tm.base_opcode >> 8) & 0xff)
9425 {
9426 case 0x38:
9427 case 0x3a:
9428 count++;
9429 break;
9430 default:
9431 break;
9432 }
9433 }
9434 break;
9435 case 2:
9436 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9437 count++;
9438 break;
9439 case 1:
9440 break;
9441 default:
9442 abort ();
9443 }
9444
9445 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9446 == BRANCH_PREFIX)
9447 {
9448 /* Set the maximum prefix size in BRANCH_PREFIX
9449 frag. */
9450 if (fragP->tc_frag_data.max_bytes > max)
9451 fragP->tc_frag_data.max_bytes = max;
9452 if (fragP->tc_frag_data.max_bytes > count)
9453 fragP->tc_frag_data.max_bytes -= count;
9454 else
9455 fragP->tc_frag_data.max_bytes = 0;
9456 }
9457 else
9458 {
9459 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9460 frag. */
9461 unsigned int max_prefix_size;
9462 if (align_branch_prefix_size > max)
9463 max_prefix_size = max;
9464 else
9465 max_prefix_size = align_branch_prefix_size;
9466 if (max_prefix_size > count)
9467 fragP->tc_frag_data.max_prefix_length
9468 = max_prefix_size - count;
9469 }
9470
9471 /* Use existing segment prefix if possible. Use CS
9472 segment prefix in 64-bit mode. In 32-bit mode, use SS
9473 segment prefix with ESP/EBP base register and use DS
9474 segment prefix without ESP/EBP base register. */
9475 if (i.prefix[SEG_PREFIX])
9476 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9477 else if (flag_code == CODE_64BIT)
9478 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9479 else if (i.base_reg
9480 && (i.base_reg->reg_num == 4
9481 || i.base_reg->reg_num == 5))
9482 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9483 else
9484 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9485 }
9486 }
9487 }
9488
9489   /* NB: This does not work with COND_JUMP86 without i386.  */
9490 if (align_branch_power
9491 && now_seg != absolute_section
9492 && cpu_arch_flags.bitfield.cpui386)
9493 {
9494 /* Terminate each frag so that we can add prefix and check for
9495 fused jcc. */
9496 frag_wane (frag_now);
9497 frag_new (0);
9498 }
9499
9500 #ifdef DEBUG386
9501 if (flag_debug)
9502 {
9503 pi ("" /*line*/, &i);
9504 }
9505 #endif /* DEBUG386 */
9506 }
9507
9508 /* Return the size of the displacement operand N. */
9509
9510 static int
9511 disp_size (unsigned int n)
9512 {
9513 int size = 4;
9514
9515 if (i.types[n].bitfield.disp64)
9516 size = 8;
9517 else if (i.types[n].bitfield.disp8)
9518 size = 1;
9519 else if (i.types[n].bitfield.disp16)
9520 size = 2;
9521 return size;
9522 }
9523
9524 /* Return the size of the immediate operand N. */
9525
9526 static int
9527 imm_size (unsigned int n)
9528 {
9529 int size = 4;
9530 if (i.types[n].bitfield.imm64)
9531 size = 8;
9532 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9533 size = 1;
9534 else if (i.types[n].bitfield.imm16)
9535 size = 2;
9536 return size;
9537 }
9538
9539 static void
9540 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9541 {
9542 char *p;
9543 unsigned int n;
9544
9545 for (n = 0; n < i.operands; n++)
9546 {
9547 if (operand_type_check (i.types[n], disp))
9548 {
9549 if (i.op[n].disps->X_op == O_constant)
9550 {
9551 int size = disp_size (n);
9552 offsetT val = i.op[n].disps->X_add_number;
9553
9554 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9555 size);
9556 p = frag_more (size);
9557 md_number_to_chars (p, val, size);
9558 }
9559 else
9560 {
9561 enum bfd_reloc_code_real reloc_type;
9562 int size = disp_size (n);
9563 int sign = i.types[n].bitfield.disp32s;
9564 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9565 fixS *fixP;
9566
9567 /* We can't have 8 bit displacement here. */
9568 gas_assert (!i.types[n].bitfield.disp8);
9569
9570 	      /* The PC relative address is computed relative
9571 		 to the instruction boundary, so if immediate
9572 		 fields follow, we need to adjust the value.  */
9573 if (pcrel && i.imm_operands)
9574 {
9575 unsigned int n1;
9576 int sz = 0;
9577
9578 for (n1 = 0; n1 < i.operands; n1++)
9579 if (operand_type_check (i.types[n1], imm))
9580 {
9581 		      /* Only one immediate is allowed for a
9582 			 PC-relative address.  */
9583 gas_assert (sz == 0);
9584 sz = imm_size (n1);
9585 i.op[n].disps->X_add_number -= sz;
9586 }
9587 /* We should find the immediate. */
9588 gas_assert (sz != 0);
9589 }
9590
9591 p = frag_more (size);
9592 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9593 if (GOT_symbol
9594 && GOT_symbol == i.op[n].disps->X_add_symbol
9595 && (((reloc_type == BFD_RELOC_32
9596 || reloc_type == BFD_RELOC_X86_64_32S
9597 || (reloc_type == BFD_RELOC_64
9598 && object_64bit))
9599 && (i.op[n].disps->X_op == O_symbol
9600 || (i.op[n].disps->X_op == O_add
9601 && ((symbol_get_value_expression
9602 (i.op[n].disps->X_op_symbol)->X_op)
9603 == O_subtract))))
9604 || reloc_type == BFD_RELOC_32_PCREL))
9605 {
9606 if (!object_64bit)
9607 {
9608 reloc_type = BFD_RELOC_386_GOTPC;
9609 i.has_gotpc_tls_reloc = TRUE;
9610 i.op[n].imms->X_add_number +=
9611 encoding_length (insn_start_frag, insn_start_off, p);
9612 }
9613 else if (reloc_type == BFD_RELOC_64)
9614 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9615 else
9616 /* Don't do the adjustment for x86-64, as there
9617 the pcrel addressing is relative to the _next_
9618 insn, and that is taken care of in other code. */
9619 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9620 }
9621 else if (align_branch_power)
9622 {
9623 switch (reloc_type)
9624 {
9625 case BFD_RELOC_386_TLS_GD:
9626 case BFD_RELOC_386_TLS_LDM:
9627 case BFD_RELOC_386_TLS_IE:
9628 case BFD_RELOC_386_TLS_IE_32:
9629 case BFD_RELOC_386_TLS_GOTIE:
9630 case BFD_RELOC_386_TLS_GOTDESC:
9631 case BFD_RELOC_386_TLS_DESC_CALL:
9632 case BFD_RELOC_X86_64_TLSGD:
9633 case BFD_RELOC_X86_64_TLSLD:
9634 case BFD_RELOC_X86_64_GOTTPOFF:
9635 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9636 case BFD_RELOC_X86_64_TLSDESC_CALL:
9637 i.has_gotpc_tls_reloc = TRUE;
9638 default:
9639 break;
9640 }
9641 }
9642 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9643 size, i.op[n].disps, pcrel,
9644 reloc_type);
9645 /* Check for "call/jmp *mem", "mov mem, %reg",
9646 "test %reg, mem" and "binop mem, %reg" where binop
9647 is one of adc, add, and, cmp, or, sbb, sub, xor
9648 instructions without data prefix. Always generate
9649 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9650 if (i.prefix[DATA_PREFIX] == 0
9651 && (generate_relax_relocations
9652 || (!object_64bit
9653 && i.rm.mode == 0
9654 && i.rm.regmem == 5))
9655 && (i.rm.mode == 2
9656 || (i.rm.mode == 0 && i.rm.regmem == 5))
9657 && !is_any_vex_encoding(&i.tm)
9658 && ((i.operands == 1
9659 && i.tm.base_opcode == 0xff
9660 && (i.rm.reg == 2 || i.rm.reg == 4))
9661 || (i.operands == 2
9662 && (i.tm.base_opcode == 0x8b
9663 || i.tm.base_opcode == 0x85
9664 || (i.tm.base_opcode & ~0x38) == 0x03))))
9665 {
9666 if (object_64bit)
9667 {
9668 fixP->fx_tcbit = i.rex != 0;
9669 if (i.base_reg
9670 && (i.base_reg->reg_num == RegIP))
9671 fixP->fx_tcbit2 = 1;
9672 }
9673 else
9674 fixP->fx_tcbit2 = 1;
9675 }
9676 }
9677 }
9678 }
9679 }
9680
9681 static void
9682 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9683 {
9684 char *p;
9685 unsigned int n;
9686
9687 for (n = 0; n < i.operands; n++)
9688 {
9689      /* Skip the SAE/RC immediate operand in EVEX; it has already been handled.  */
9690 if (i.rounding && (int) n == i.rounding->operand)
9691 continue;
9692
9693 if (operand_type_check (i.types[n], imm))
9694 {
9695 if (i.op[n].imms->X_op == O_constant)
9696 {
9697 int size = imm_size (n);
9698 offsetT val;
9699
9700 val = offset_in_range (i.op[n].imms->X_add_number,
9701 size);
9702 p = frag_more (size);
9703 md_number_to_chars (p, val, size);
9704 }
9705 else
9706 {
9707 /* Not absolute_section.
9708 Need a 32-bit fixup (don't support 8bit
9709 non-absolute imms). Try to support other
9710 sizes ... */
9711 enum bfd_reloc_code_real reloc_type;
9712 int size = imm_size (n);
9713 int sign;
9714
9715 if (i.types[n].bitfield.imm32s
9716 && (i.suffix == QWORD_MNEM_SUFFIX
9717 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9718 sign = 1;
9719 else
9720 sign = 0;
9721
9722 p = frag_more (size);
9723 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9724
9725 /* This is tough to explain. We end up with this one if we
9726 * have operands that look like
9727 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9728 * obtain the absolute address of the GOT, and it is strongly
9729 * preferable from a performance point of view to avoid using
9730 * a runtime relocation for this. The actual sequence of
9731		 * instructions often looks something like:
9732 *
9733 * call .L66
9734 * .L66:
9735 * popl %ebx
9736 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9737 *
9738 * The call and pop essentially return the absolute address
9739 * of the label .L66 and store it in %ebx. The linker itself
9740 * will ultimately change the first operand of the addl so
9741 * that %ebx points to the GOT, but to keep things simple, the
9742 * .o file must have this operand set so that it generates not
9743 * the absolute address of .L66, but the absolute address of
9744		 * itself.  This allows the linker to simply treat a GOTPC
9745 * relocation as asking for a pcrel offset to the GOT to be
9746 * added in, and the addend of the relocation is stored in the
9747 * operand field for the instruction itself.
9748 *
9749 * Our job here is to fix the operand so that it would add
9750 * the correct offset so that %ebx would point to itself. The
9751 * thing that is tricky is that .-.L66 will point to the
9752 * beginning of the instruction, so we need to further modify
9753 * the operand so that it will point to itself. There are
9754 * other cases where you have something like:
9755 *
9756 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9757 *
9758 * and here no correction would be required. Internally in
9759 * the assembler we treat operands of this form as not being
9760 * pcrel since the '.' is explicitly mentioned, and I wonder
9761 * whether it would simplify matters to do it this way. Who
9762 * knows. In earlier versions of the PIC patches, the
9763 * pcrel_adjust field was used to store the correction, but
9764 * since the expression is not pcrel, I felt it would be
9765 * confusing to do it this way. */
9766
9767 if ((reloc_type == BFD_RELOC_32
9768 || reloc_type == BFD_RELOC_X86_64_32S
9769 || reloc_type == BFD_RELOC_64)
9770 && GOT_symbol
9771 && GOT_symbol == i.op[n].imms->X_add_symbol
9772 && (i.op[n].imms->X_op == O_symbol
9773 || (i.op[n].imms->X_op == O_add
9774 && ((symbol_get_value_expression
9775 (i.op[n].imms->X_op_symbol)->X_op)
9776 == O_subtract))))
9777 {
9778 if (!object_64bit)
9779 reloc_type = BFD_RELOC_386_GOTPC;
9780 else if (size == 4)
9781 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9782 else if (size == 8)
9783 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9784 i.has_gotpc_tls_reloc = TRUE;
9785 i.op[n].imms->X_add_number +=
9786 encoding_length (insn_start_frag, insn_start_off, p);
9787 }
9788 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9789 i.op[n].imms, 0, reloc_type);
9790 }
9791 }
9792 }
9793 }
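
/* Editorial aside: a sketch (not GAS code) of the GOTPC addend bias
   applied above.  Assuming encoding_length () returns the number of
   bytes of the current insn already emitted before the immediate
   field, the bias makes "addl $_GLOBAL_OFFSET_TABLE_+[.-.L66], %ebx"
   store an addend relative to the immediate field itself rather than
   to the insn start -- for the 81 /0 form, two opcode/modrm bytes
   precede the imm32.  */
#if 0 /* Illustration only.  */
static long
gotpc_addend (long dot_minus_l66, long bytes_before_imm)
{
  /* ".-.L66" evaluates to the insn start; the immediate field lives
     bytes_before_imm further on.  */
  return dot_minus_l66 + bytes_before_imm;
}
#endif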
9794 \f
9795 /* x86_cons_fix_new is called via the expression parsing code when a
9796 reloc is needed. We use this hook to get the correct .got reloc. */
9797 static int cons_sign = -1;
9798
9799 void
9800 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9801 expressionS *exp, bfd_reloc_code_real_type r)
9802 {
9803 r = reloc (len, 0, cons_sign, r);
9804
9805 #ifdef TE_PE
9806 if (exp->X_op == O_secrel)
9807 {
9808 exp->X_op = O_symbol;
9809 r = BFD_RELOC_32_SECREL;
9810 }
9811 #endif
9812
9813 fix_new_exp (frag, off, len, exp, 0, r);
9814 }
9815
9816 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9817 purpose of the `.dc.a' internal pseudo-op. */
9818
9819 int
9820 x86_address_bytes (void)
9821 {
9822 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9823 return 4;
9824 return stdoutput->arch_info->bits_per_address / 8;
9825 }
9826
9827 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9828 || defined (LEX_AT)
9829 # define lex_got(reloc, adjust, types) NULL
9830 #else
9831 /* Parse operands of the form
9832 <symbol>@GOTOFF+<nnn>
9833 and similar .plt or .got references.
9834
9835 If we find one, set up the correct relocation in RELOC and copy the
9836 input string, minus the `@GOTOFF' into a malloc'd buffer for
9837 parsing by the calling routine. Return this buffer, and if ADJUST
9838 is non-null set it to the length of the string we removed from the
9839 input line. Otherwise return NULL. */
9840 static char *
9841 lex_got (enum bfd_reloc_code_real *rel,
9842 int *adjust,
9843 i386_operand_type *types)
9844 {
9845   /* Some of the relocations depend on the size of the field to be
9846      relocated.  But in our callers i386_immediate and i386_displacement
9847 we don't yet know the operand size (this will be set by insn
9848 matching). Hence we record the word32 relocation here,
9849 and adjust the reloc according to the real size in reloc(). */
9850 static const struct {
9851 const char *str;
9852 int len;
9853 const enum bfd_reloc_code_real rel[2];
9854 const i386_operand_type types64;
9855 } gotrel[] = {
9856 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9857 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9858 BFD_RELOC_SIZE32 },
9859 OPERAND_TYPE_IMM32_64 },
9860 #endif
9861 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9862 BFD_RELOC_X86_64_PLTOFF64 },
9863 OPERAND_TYPE_IMM64 },
9864 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9865 BFD_RELOC_X86_64_PLT32 },
9866 OPERAND_TYPE_IMM32_32S_DISP32 },
9867 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9868 BFD_RELOC_X86_64_GOTPLT64 },
9869 OPERAND_TYPE_IMM64_DISP64 },
9870 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9871 BFD_RELOC_X86_64_GOTOFF64 },
9872 OPERAND_TYPE_IMM64_DISP64 },
9873 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9874 BFD_RELOC_X86_64_GOTPCREL },
9875 OPERAND_TYPE_IMM32_32S_DISP32 },
9876 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9877 BFD_RELOC_X86_64_TLSGD },
9878 OPERAND_TYPE_IMM32_32S_DISP32 },
9879 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9880 _dummy_first_bfd_reloc_code_real },
9881 OPERAND_TYPE_NONE },
9882 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9883 BFD_RELOC_X86_64_TLSLD },
9884 OPERAND_TYPE_IMM32_32S_DISP32 },
9885 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9886 BFD_RELOC_X86_64_GOTTPOFF },
9887 OPERAND_TYPE_IMM32_32S_DISP32 },
9888 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9889 BFD_RELOC_X86_64_TPOFF32 },
9890 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9891 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9892 _dummy_first_bfd_reloc_code_real },
9893 OPERAND_TYPE_NONE },
9894 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9895 BFD_RELOC_X86_64_DTPOFF32 },
9896 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9897 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9898 _dummy_first_bfd_reloc_code_real },
9899 OPERAND_TYPE_NONE },
9900 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9901 _dummy_first_bfd_reloc_code_real },
9902 OPERAND_TYPE_NONE },
9903 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9904 BFD_RELOC_X86_64_GOT32 },
9905 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9906 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9907 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9908 OPERAND_TYPE_IMM32_32S_DISP32 },
9909 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9910 BFD_RELOC_X86_64_TLSDESC_CALL },
9911 OPERAND_TYPE_IMM32_32S_DISP32 },
9912 };
9913 char *cp;
9914 unsigned int j;
9915
9916 #if defined (OBJ_MAYBE_ELF)
9917 if (!IS_ELF)
9918 return NULL;
9919 #endif
9920
9921 for (cp = input_line_pointer; *cp != '@'; cp++)
9922 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9923 return NULL;
9924
9925 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9926 {
9927 int len = gotrel[j].len;
9928 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9929 {
9930 if (gotrel[j].rel[object_64bit] != 0)
9931 {
9932 int first, second;
9933 char *tmpbuf, *past_reloc;
9934
9935 *rel = gotrel[j].rel[object_64bit];
9936
9937 if (types)
9938 {
9939 if (flag_code != CODE_64BIT)
9940 {
9941 types->bitfield.imm32 = 1;
9942 types->bitfield.disp32 = 1;
9943 }
9944 else
9945 *types = gotrel[j].types64;
9946 }
9947
9948 if (j != 0 && GOT_symbol == NULL)
9949 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9950
9951 /* The length of the first part of our input line. */
9952 first = cp - input_line_pointer;
9953
9954 /* The second part goes from after the reloc token until
9955 (and including) an end_of_line char or comma. */
9956 past_reloc = cp + 1 + len;
9957 cp = past_reloc;
9958 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9959 ++cp;
9960 second = cp + 1 - past_reloc;
9961
9962 /* Allocate and copy string. The trailing NUL shouldn't
9963 be necessary, but be safe. */
9964 tmpbuf = XNEWVEC (char, first + second + 2);
9965 memcpy (tmpbuf, input_line_pointer, first);
9966 if (second != 0 && *past_reloc != ' ')
9967 /* Replace the relocation token with ' ', so that
9968 errors like foo@GOTOFF1 will be detected. */
9969 tmpbuf[first++] = ' ';
9970 else
9971 /* Increment length by 1 if the relocation token is
9972 removed. */
9973 len++;
9974 if (adjust)
9975 *adjust = len;
9976 memcpy (tmpbuf + first, past_reloc, second);
9977 tmpbuf[first + second] = '\0';
9978 return tmpbuf;
9979 }
9980
9981 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9982 gotrel[j].str, 1 << (5 + object_64bit));
9983 return NULL;
9984 }
9985 }
9986
9987 /* Might be a symbol version string. Don't as_bad here. */
9988 return NULL;
9989 }
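
/* Editorial aside: the buffer surgery above, reduced to a standalone
   sketch (not GAS code; simplified -- the real routine also handles a
   space already following the token).  Given "foo@GOTOFF+4" it yields
   "foo +4": the reloc token becomes a single space, so junk such as
   "foo@GOTOFF1" still fails to parse later.  */
#if 0 /* Illustration only.  */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <strings.h>

static char *
strip_reloc_token (const char *line, const char *token)
{
  const char *at = strchr (line, '@');
  size_t first, tlen = strlen (token), second;
  char *buf;

  if (at == NULL || strncasecmp (at + 1, token, tlen) != 0)
    return NULL;
  first = at - line;
  second = strlen (at + 1 + tlen);
  buf = malloc (first + second + 2);
  memcpy (buf, line, first);
  buf[first++] = ' ';
  memcpy (buf + first, at + 1 + tlen, second + 1);
  return buf;
}

int
main (void)
{
  char *s = strip_reloc_token ("foo@GOTOFF+4", "GOTOFF");
  puts (s ? s : "(no reloc)");	/* prints "foo +4" */
  free (s);
  return 0;
}
#endif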
9990 #endif
9991
9992 #ifdef TE_PE
9993 #ifdef lex_got
9994 #undef lex_got
9995 #endif
9996 /* Parse operands of the form
9997 <symbol>@SECREL32+<nnn>
9998
9999 If we find one, set up the correct relocation in RELOC and copy the
10000 input string, minus the `@SECREL32' into a malloc'd buffer for
10001 parsing by the calling routine. Return this buffer, and if ADJUST
10002 is non-null set it to the length of the string we removed from the
10003 input line. Otherwise return NULL.
10004
10005    This function is copied from the ELF version above, adjusted for PE targets.  */
10006
10007 static char *
10008 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10009 int *adjust ATTRIBUTE_UNUSED,
10010 i386_operand_type *types)
10011 {
10012 static const struct
10013 {
10014 const char *str;
10015 int len;
10016 const enum bfd_reloc_code_real rel[2];
10017 const i386_operand_type types64;
10018 }
10019 gotrel[] =
10020 {
10021 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10022 BFD_RELOC_32_SECREL },
10023 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10024 };
10025
10026 char *cp;
10027 unsigned j;
10028
10029 for (cp = input_line_pointer; *cp != '@'; cp++)
10030 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10031 return NULL;
10032
10033 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10034 {
10035 int len = gotrel[j].len;
10036
10037 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10038 {
10039 if (gotrel[j].rel[object_64bit] != 0)
10040 {
10041 int first, second;
10042 char *tmpbuf, *past_reloc;
10043
10044 *rel = gotrel[j].rel[object_64bit];
10045 if (adjust)
10046 *adjust = len;
10047
10048 if (types)
10049 {
10050 if (flag_code != CODE_64BIT)
10051 {
10052 types->bitfield.imm32 = 1;
10053 types->bitfield.disp32 = 1;
10054 }
10055 else
10056 *types = gotrel[j].types64;
10057 }
10058
10059 /* The length of the first part of our input line. */
10060 first = cp - input_line_pointer;
10061
10062 /* The second part goes from after the reloc token until
10063 (and including) an end_of_line char or comma. */
10064 past_reloc = cp + 1 + len;
10065 cp = past_reloc;
10066 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10067 ++cp;
10068 second = cp + 1 - past_reloc;
10069
10070 /* Allocate and copy string. The trailing NUL shouldn't
10071 be necessary, but be safe. */
10072 tmpbuf = XNEWVEC (char, first + second + 2);
10073 memcpy (tmpbuf, input_line_pointer, first);
10074 if (second != 0 && *past_reloc != ' ')
10075 /* Replace the relocation token with ' ', so that
10076		     errors like foo@SECREL321 will be detected.  */
10077 tmpbuf[first++] = ' ';
10078 memcpy (tmpbuf + first, past_reloc, second);
10079 tmpbuf[first + second] = '\0';
10080 return tmpbuf;
10081 }
10082
10083 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10084 gotrel[j].str, 1 << (5 + object_64bit));
10085 return NULL;
10086 }
10087 }
10088
10089 /* Might be a symbol version string. Don't as_bad here. */
10090 return NULL;
10091 }
10092
10093 #endif /* TE_PE */
10094
10095 bfd_reloc_code_real_type
10096 x86_cons (expressionS *exp, int size)
10097 {
10098 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10099
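  /* Negate intel_syntax around expression parsing: its sign lets the
     Intel-mode expression helpers tell a data directive like .long
     apart from an insn operand (the matching un-negation follows
     below).  */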
10100 intel_syntax = -intel_syntax;
10101
10102 exp->X_md = 0;
10103 if (size == 4 || (object_64bit && size == 8))
10104 {
10105 /* Handle @GOTOFF and the like in an expression. */
10106 char *save;
10107 char *gotfree_input_line;
10108 int adjust = 0;
10109
10110 save = input_line_pointer;
10111 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10112 if (gotfree_input_line)
10113 input_line_pointer = gotfree_input_line;
10114
10115 expression (exp);
10116
10117 if (gotfree_input_line)
10118 {
10119 /* expression () has merrily parsed up to the end of line,
10120 or a comma - in the wrong buffer. Transfer how far
10121 input_line_pointer has moved to the right buffer. */
10122 input_line_pointer = (save
10123 + (input_line_pointer - gotfree_input_line)
10124 + adjust);
10125 free (gotfree_input_line);
10126 if (exp->X_op == O_constant
10127 || exp->X_op == O_absent
10128 || exp->X_op == O_illegal
10129 || exp->X_op == O_register
10130 || exp->X_op == O_big)
10131 {
10132 char c = *input_line_pointer;
10133 *input_line_pointer = 0;
10134 as_bad (_("missing or invalid expression `%s'"), save);
10135 *input_line_pointer = c;
10136 }
10137 else if ((got_reloc == BFD_RELOC_386_PLT32
10138 || got_reloc == BFD_RELOC_X86_64_PLT32)
10139 && exp->X_op != O_symbol)
10140 {
10141 char c = *input_line_pointer;
10142 *input_line_pointer = 0;
10143 as_bad (_("invalid PLT expression `%s'"), save);
10144 *input_line_pointer = c;
10145 }
10146 }
10147 }
10148 else
10149 expression (exp);
10150
10151 intel_syntax = -intel_syntax;
10152
10153 if (intel_syntax)
10154 i386_intel_simplify (exp);
10155
10156 return got_reloc;
10157 }
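
/* Editorial aside: the pointer transfer in x86_cons above, in
   isolation (not GAS code).  expression () advanced input_line_pointer
   inside the temporary reloc-stripped copy; the same distance, plus
   the bytes removed together with the @RELOC token, must be skipped in
   the original buffer.  */
#if 0 /* Illustration only.  */
static char *
transfer_pointer (char *save, const char *copy_start,
		  const char *copy_pos, int adjust)
{
  return save + (copy_pos - copy_start) + adjust;
}
#endif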
10158
10159 static void
10160 signed_cons (int size)
10161 {
10162 if (flag_code == CODE_64BIT)
10163 cons_sign = 1;
10164 cons (size);
10165 cons_sign = -1;
10166 }
10167
10168 #ifdef TE_PE
10169 static void
10170 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10171 {
10172 expressionS exp;
10173
10174 do
10175 {
10176 expression (&exp);
10177 if (exp.X_op == O_symbol)
10178 exp.X_op = O_secrel;
10179
10180 emit_expr (&exp, 4);
10181 }
10182 while (*input_line_pointer++ == ',');
10183
10184 input_line_pointer--;
10185 demand_empty_rest_of_line ();
10186 }
10187 #endif
10188
10189 /* Handle Vector operations. */
10190
10191 static char *
10192 check_VecOperations (char *op_string, char *op_end)
10193 {
10194 const reg_entry *mask;
10195 const char *saved;
10196 char *end_op;
10197
10198 while (*op_string
10199 && (op_end == NULL || op_string < op_end))
10200 {
10201 saved = op_string;
10202 if (*op_string == '{')
10203 {
10204 op_string++;
10205
10206 /* Check broadcasts. */
10207 if (strncmp (op_string, "1to", 3) == 0)
10208 {
10209 int bcst_type;
10210
10211 if (i.broadcast)
10212 goto duplicated_vec_op;
10213
10214 op_string += 3;
10215 if (*op_string == '8')
10216 bcst_type = 8;
10217 else if (*op_string == '4')
10218 bcst_type = 4;
10219 else if (*op_string == '2')
10220 bcst_type = 2;
10221 else if (*op_string == '1'
10222 && *(op_string+1) == '6')
10223 {
10224 bcst_type = 16;
10225 op_string++;
10226 }
10227 else
10228 {
10229 as_bad (_("Unsupported broadcast: `%s'"), saved);
10230 return NULL;
10231 }
10232 op_string++;
10233
10234 broadcast_op.type = bcst_type;
10235 broadcast_op.operand = this_operand;
10236 broadcast_op.bytes = 0;
10237 i.broadcast = &broadcast_op;
10238 }
10239 /* Check masking operation. */
10240 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10241 {
10242 if (mask == &bad_reg)
10243 return NULL;
10244
10245 /* k0 can't be used for write mask. */
10246 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10247 {
10248 as_bad (_("`%s%s' can't be used for write mask"),
10249 register_prefix, mask->reg_name);
10250 return NULL;
10251 }
10252
10253 if (!i.mask)
10254 {
10255 mask_op.mask = mask;
10256 mask_op.zeroing = 0;
10257 mask_op.operand = this_operand;
10258 i.mask = &mask_op;
10259 }
10260 else
10261 {
10262 if (i.mask->mask)
10263 goto duplicated_vec_op;
10264
10265 i.mask->mask = mask;
10266
10267 /* Only "{z}" is allowed here. No need to check
10268 zeroing mask explicitly. */
10269 if (i.mask->operand != this_operand)
10270 {
10271 as_bad (_("invalid write mask `%s'"), saved);
10272 return NULL;
10273 }
10274 }
10275
10276 op_string = end_op;
10277 }
10278 /* Check zeroing-flag for masking operation. */
10279 else if (*op_string == 'z')
10280 {
10281 if (!i.mask)
10282 {
10283 mask_op.mask = NULL;
10284 mask_op.zeroing = 1;
10285 mask_op.operand = this_operand;
10286 i.mask = &mask_op;
10287 }
10288 else
10289 {
10290 if (i.mask->zeroing)
10291 {
10292 duplicated_vec_op:
10293 as_bad (_("duplicated `%s'"), saved);
10294 return NULL;
10295 }
10296
10297 i.mask->zeroing = 1;
10298
10299 /* Only "{%k}" is allowed here. No need to check mask
10300 register explicitly. */
10301 if (i.mask->operand != this_operand)
10302 {
10303 as_bad (_("invalid zeroing-masking `%s'"),
10304 saved);
10305 return NULL;
10306 }
10307 }
10308
10309 op_string++;
10310 }
10311 else
10312 goto unknown_vec_op;
10313
10314 if (*op_string != '}')
10315 {
10316 as_bad (_("missing `}' in `%s'"), saved);
10317 return NULL;
10318 }
10319 op_string++;
10320
10321 /* Strip whitespace since the addition of pseudo prefixes
10322 changed how the scrubber treats '{'. */
10323 if (is_space_char (*op_string))
10324 ++op_string;
10325
10326 continue;
10327 }
10328 unknown_vec_op:
10329 /* We don't know this one. */
10330 as_bad (_("unknown vector operation: `%s'"), saved);
10331 return NULL;
10332 }
10333
10334 if (i.mask && i.mask->zeroing && !i.mask->mask)
10335 {
10336 as_bad (_("zeroing-masking only allowed with write mask"));
10337 return NULL;
10338 }
10339
10340 return op_string;
10341 }
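
/* Editorial aside: a standalone sketch (not GAS code) of the
   broadcast-token recognition above.  In AT&T input the tokens appear
   as e.g. "vaddps (%rax){1to16}, %zmm1, %zmm2".  */
#if 0 /* Illustration only.  */
#include <string.h>

static int
parse_1to (const char *s)
{
  /* Longest token first, so "1to16" isn't taken as "1to1" plus junk.  */
  static const struct { const char *tok; int n; } tab[] = {
    { "1to16", 16 }, { "1to8", 8 }, { "1to4", 4 }, { "1to2", 2 },
  };
  unsigned int j;

  for (j = 0; j < sizeof tab / sizeof tab[0]; j++)
    if (strncmp (s, tab[j].tok, strlen (tab[j].tok)) == 0)
      return tab[j].n;
  return 0;
}
#endif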
10342
10343 static int
10344 i386_immediate (char *imm_start)
10345 {
10346 char *save_input_line_pointer;
10347 char *gotfree_input_line;
10348 segT exp_seg = 0;
10349 expressionS *exp;
10350 i386_operand_type types;
10351
10352 operand_type_set (&types, ~0);
10353
10354 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10355 {
10356 as_bad (_("at most %d immediate operands are allowed"),
10357 MAX_IMMEDIATE_OPERANDS);
10358 return 0;
10359 }
10360
10361 exp = &im_expressions[i.imm_operands++];
10362 i.op[this_operand].imms = exp;
10363
10364 if (is_space_char (*imm_start))
10365 ++imm_start;
10366
10367 save_input_line_pointer = input_line_pointer;
10368 input_line_pointer = imm_start;
10369
10370 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10371 if (gotfree_input_line)
10372 input_line_pointer = gotfree_input_line;
10373
10374 exp_seg = expression (exp);
10375
10376 SKIP_WHITESPACE ();
10377
10378 /* Handle vector operations. */
10379 if (*input_line_pointer == '{')
10380 {
10381 input_line_pointer = check_VecOperations (input_line_pointer,
10382 NULL);
10383 if (input_line_pointer == NULL)
10384 return 0;
10385 }
10386
10387 if (*input_line_pointer)
10388 as_bad (_("junk `%s' after expression"), input_line_pointer);
10389
10390 input_line_pointer = save_input_line_pointer;
10391 if (gotfree_input_line)
10392 {
10393 free (gotfree_input_line);
10394
10395 if (exp->X_op == O_constant || exp->X_op == O_register)
10396 exp->X_op = O_illegal;
10397 }
10398
10399 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10400 }
10401
10402 static int
10403 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10404 i386_operand_type types, const char *imm_start)
10405 {
10406 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10407 {
10408 if (imm_start)
10409 as_bad (_("missing or invalid immediate expression `%s'"),
10410 imm_start);
10411 return 0;
10412 }
10413 else if (exp->X_op == O_constant)
10414 {
10415 /* Size it properly later. */
10416 i.types[this_operand].bitfield.imm64 = 1;
10417 /* If not 64bit, sign extend val. */
10418 if (flag_code != CODE_64BIT
10419 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10420 exp->X_add_number
10421 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10422 }
10423 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10424 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10425 && exp_seg != absolute_section
10426 && exp_seg != text_section
10427 && exp_seg != data_section
10428 && exp_seg != bss_section
10429 && exp_seg != undefined_section
10430 && !bfd_is_com_section (exp_seg))
10431 {
10432 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10433 return 0;
10434 }
10435 #endif
10436 else if (!intel_syntax && exp_seg == reg_section)
10437 {
10438 if (imm_start)
10439 as_bad (_("illegal immediate register operand %s"), imm_start);
10440 return 0;
10441 }
10442 else
10443 {
10444 /* This is an address. The size of the address will be
10445 determined later, depending on destination register,
10446 suffix, or the default for the section. */
10447 i.types[this_operand].bitfield.imm8 = 1;
10448 i.types[this_operand].bitfield.imm16 = 1;
10449 i.types[this_operand].bitfield.imm32 = 1;
10450 i.types[this_operand].bitfield.imm32s = 1;
10451 i.types[this_operand].bitfield.imm64 = 1;
10452 i.types[this_operand] = operand_type_and (i.types[this_operand],
10453 types);
10454 }
10455
10456 return 1;
10457 }
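
/* Editorial aside: the XOR/subtract idiom used above for 32-bit sign
   extension, in isolation (not GAS code).  */
#if 0 /* Illustration only.  */
#include <assert.h>

static unsigned long long
sext32 (unsigned long long x)
{
  x &= 0xffffffffULL;
  return (x ^ 0x80000000ULL) - 0x80000000ULL;
}

int
main (void)
{
  assert (sext32 (0x7fffffffULL) == 0x7fffffffULL);
  assert (sext32 (0x80000000ULL) == 0xffffffff80000000ULL);
  return 0;
}
#endif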
10458
10459 static char *
10460 i386_scale (char *scale)
10461 {
10462 offsetT val;
10463 char *save = input_line_pointer;
10464
10465 input_line_pointer = scale;
10466 val = get_absolute_expression ();
10467
10468 switch (val)
10469 {
10470 case 1:
10471 i.log2_scale_factor = 0;
10472 break;
10473 case 2:
10474 i.log2_scale_factor = 1;
10475 break;
10476 case 4:
10477 i.log2_scale_factor = 2;
10478 break;
10479 case 8:
10480 i.log2_scale_factor = 3;
10481 break;
10482 default:
10483 {
10484 char sep = *input_line_pointer;
10485
10486 *input_line_pointer = '\0';
10487 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10488 scale);
10489 *input_line_pointer = sep;
10490 input_line_pointer = save;
10491 return NULL;
10492 }
10493 }
10494 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10495 {
10496 as_warn (_("scale factor of %d without an index register"),
10497 1 << i.log2_scale_factor);
10498 i.log2_scale_factor = 0;
10499 }
10500 scale = input_line_pointer;
10501 input_line_pointer = save;
10502 return scale;
10503 }
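
/* Editorial aside (not GAS code): where log2_scale_factor eventually
   lands -- it becomes the two-bit "ss" field of an x86 SIB byte, next
   to the 3-bit index and base register numbers.  */
#if 0 /* Illustration only.  */
static unsigned char
make_sib (unsigned int log2_scale, unsigned int index, unsigned int base)
{
  return (unsigned char) (((log2_scale & 3) << 6)
			  | ((index & 7) << 3)
			  | (base & 7));
}
#endif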
10504
10505 static int
10506 i386_displacement (char *disp_start, char *disp_end)
10507 {
10508 expressionS *exp;
10509 segT exp_seg = 0;
10510 char *save_input_line_pointer;
10511 char *gotfree_input_line;
10512 int override;
10513 i386_operand_type bigdisp, types = anydisp;
10514 int ret;
10515
10516 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10517 {
10518 as_bad (_("at most %d displacement operands are allowed"),
10519 MAX_MEMORY_OPERANDS);
10520 return 0;
10521 }
10522
10523 operand_type_set (&bigdisp, 0);
10524 if (i.jumpabsolute
10525 || i.types[this_operand].bitfield.baseindex
10526 || (current_templates->start->opcode_modifier.jump != JUMP
10527 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10528 {
10529 i386_addressing_mode ();
10530 override = (i.prefix[ADDR_PREFIX] != 0);
10531 if (flag_code == CODE_64BIT)
10532 {
10533 if (!override)
10534 {
10535 bigdisp.bitfield.disp32s = 1;
10536 bigdisp.bitfield.disp64 = 1;
10537 }
10538 else
10539 bigdisp.bitfield.disp32 = 1;
10540 }
10541 else if ((flag_code == CODE_16BIT) ^ override)
10542 bigdisp.bitfield.disp16 = 1;
10543 else
10544 bigdisp.bitfield.disp32 = 1;
10545 }
10546 else
10547 {
10548 /* For PC-relative branches, the width of the displacement may be
10549 dependent upon data size, but is never dependent upon address size.
10550 Also make sure to not unintentionally match against a non-PC-relative
10551 branch template. */
10552 static templates aux_templates;
10553 const insn_template *t = current_templates->start;
10554 bfd_boolean has_intel64 = FALSE;
10555
10556 aux_templates.start = t;
10557 while (++t < current_templates->end)
10558 {
10559 if (t->opcode_modifier.jump
10560 != current_templates->start->opcode_modifier.jump)
10561 break;
10562 if ((t->opcode_modifier.isa64 >= INTEL64))
10563 has_intel64 = TRUE;
10564 }
10565 if (t < current_templates->end)
10566 {
10567 aux_templates.end = t;
10568 current_templates = &aux_templates;
10569 }
10570
10571 override = (i.prefix[DATA_PREFIX] != 0);
10572 if (flag_code == CODE_64BIT)
10573 {
10574 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10575 && (!intel64 || !has_intel64))
10576 bigdisp.bitfield.disp16 = 1;
10577 else
10578 bigdisp.bitfield.disp32s = 1;
10579 }
10580 else
10581 {
10582 if (!override)
10583 override = (i.suffix == (flag_code != CODE_16BIT
10584 ? WORD_MNEM_SUFFIX
10585 : LONG_MNEM_SUFFIX));
10586 bigdisp.bitfield.disp32 = 1;
10587 if ((flag_code == CODE_16BIT) ^ override)
10588 {
10589 bigdisp.bitfield.disp32 = 0;
10590 bigdisp.bitfield.disp16 = 1;
10591 }
10592 }
10593 }
10594 i.types[this_operand] = operand_type_or (i.types[this_operand],
10595 bigdisp);
10596
10597 exp = &disp_expressions[i.disp_operands];
10598 i.op[this_operand].disps = exp;
10599 i.disp_operands++;
10600 save_input_line_pointer = input_line_pointer;
10601 input_line_pointer = disp_start;
10602 END_STRING_AND_SAVE (disp_end);
10603
10604 #ifndef GCC_ASM_O_HACK
10605 #define GCC_ASM_O_HACK 0
10606 #endif
10607 #if GCC_ASM_O_HACK
10608 END_STRING_AND_SAVE (disp_end + 1);
10609   if (i.types[this_operand].bitfield.baseindex
10610       && disp_end[-1] == '+')
10611 {
10612 /* This hack is to avoid a warning when using the "o"
10613 constraint within gcc asm statements.
10614 For instance:
10615
10616 #define _set_tssldt_desc(n,addr,limit,type) \
10617 __asm__ __volatile__ ( \
10618 "movw %w2,%0\n\t" \
10619 "movw %w1,2+%0\n\t" \
10620 "rorl $16,%1\n\t" \
10621 "movb %b1,4+%0\n\t" \
10622 "movb %4,5+%0\n\t" \
10623 "movb $0,6+%0\n\t" \
10624 "movb %h1,7+%0\n\t" \
10625 "rorl $16,%1" \
10626 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10627
10628 This works great except that the output assembler ends
10629 up looking a bit weird if it turns out that there is
10630 no offset. You end up producing code that looks like:
10631
10632 #APP
10633 movw $235,(%eax)
10634 movw %dx,2+(%eax)
10635 rorl $16,%edx
10636 movb %dl,4+(%eax)
10637 movb $137,5+(%eax)
10638 movb $0,6+(%eax)
10639 movb %dh,7+(%eax)
10640 rorl $16,%edx
10641 #NO_APP
10642
10643 So here we provide the missing zero. */
10644
10645       *disp_end = '0';
10646 }
10647 #endif
10648 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10649 if (gotfree_input_line)
10650 input_line_pointer = gotfree_input_line;
10651
10652 exp_seg = expression (exp);
10653
10654 SKIP_WHITESPACE ();
10655 if (*input_line_pointer)
10656 as_bad (_("junk `%s' after expression"), input_line_pointer);
10657 #if GCC_ASM_O_HACK
10658 RESTORE_END_STRING (disp_end + 1);
10659 #endif
10660 input_line_pointer = save_input_line_pointer;
10661 if (gotfree_input_line)
10662 {
10663 free (gotfree_input_line);
10664
10665 if (exp->X_op == O_constant || exp->X_op == O_register)
10666 exp->X_op = O_illegal;
10667 }
10668
10669 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10670
10671 RESTORE_END_STRING (disp_end);
10672
10673 return ret;
10674 }
10675
10676 static int
10677 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10678 i386_operand_type types, const char *disp_start)
10679 {
10680 i386_operand_type bigdisp;
10681 int ret = 1;
10682
10683 /* We do this to make sure that the section symbol is in
10684 the symbol table. We will ultimately change the relocation
10685 to be relative to the beginning of the section. */
10686 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10687 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10688 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10689 {
10690 if (exp->X_op != O_symbol)
10691 goto inv_disp;
10692
10693 if (S_IS_LOCAL (exp->X_add_symbol)
10694 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10695 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10696 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10697 exp->X_op = O_subtract;
10698 exp->X_op_symbol = GOT_symbol;
10699 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10700 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10701 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10702 i.reloc[this_operand] = BFD_RELOC_64;
10703 else
10704 i.reloc[this_operand] = BFD_RELOC_32;
10705 }
10706
10707 else if (exp->X_op == O_absent
10708 || exp->X_op == O_illegal
10709 || exp->X_op == O_big)
10710 {
10711 inv_disp:
10712 as_bad (_("missing or invalid displacement expression `%s'"),
10713 disp_start);
10714 ret = 0;
10715 }
10716
10717 else if (flag_code == CODE_64BIT
10718 && !i.prefix[ADDR_PREFIX]
10719 && exp->X_op == O_constant)
10720 {
10721       /* Since the displacement is sign-extended to 64 bits, don't allow
10722	 disp32, and turn off disp32s if the value is out of range.  */
10723 i.types[this_operand].bitfield.disp32 = 0;
10724 if (!fits_in_signed_long (exp->X_add_number))
10725 {
10726 i.types[this_operand].bitfield.disp32s = 0;
10727 if (i.types[this_operand].bitfield.baseindex)
10728 {
10729	      as_bad (_("0x%lx out of range of signed 32bit displacement"),
10730 (long) exp->X_add_number);
10731 ret = 0;
10732 }
10733 }
10734 }
10735
10736 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10737 else if (exp->X_op != O_constant
10738 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10739 && exp_seg != absolute_section
10740 && exp_seg != text_section
10741 && exp_seg != data_section
10742 && exp_seg != bss_section
10743 && exp_seg != undefined_section
10744 && !bfd_is_com_section (exp_seg))
10745 {
10746 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10747 ret = 0;
10748 }
10749 #endif
10750
10751 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10752 /* Constants get taken care of by optimize_disp(). */
10753 && exp->X_op != O_constant)
10754 i.types[this_operand].bitfield.disp8 = 1;
10755
10756 /* Check if this is a displacement only operand. */
10757 bigdisp = i.types[this_operand];
10758 bigdisp.bitfield.disp8 = 0;
10759 bigdisp.bitfield.disp16 = 0;
10760 bigdisp.bitfield.disp32 = 0;
10761 bigdisp.bitfield.disp32s = 0;
10762 bigdisp.bitfield.disp64 = 0;
10763 if (operand_type_all_zero (&bigdisp))
10764 i.types[this_operand] = operand_type_and (i.types[this_operand],
10765 types);
10766
10767 return ret;
10768 }
10769
10770 /* Return the active addressing mode, taking address override and
10771 registers forming the address into consideration. Update the
10772 address override prefix if necessary. */
10773
10774 static enum flag_code
10775 i386_addressing_mode (void)
10776 {
10777 enum flag_code addr_mode;
10778
10779 if (i.prefix[ADDR_PREFIX])
10780 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10781 else if (flag_code == CODE_16BIT
10782 && current_templates->start->cpu_flags.bitfield.cpumpx
10783 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10784 from md_assemble() by "is not a valid base/index expression"
10785 when there is a base and/or index. */
10786 && !i.types[this_operand].bitfield.baseindex)
10787 {
10788 /* MPX insn memory operands with neither base nor index must be forced
10789 to use 32-bit addressing in 16-bit mode. */
10790 addr_mode = CODE_32BIT;
10791 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10792 ++i.prefixes;
10793 gas_assert (!i.types[this_operand].bitfield.disp16);
10794 gas_assert (!i.types[this_operand].bitfield.disp32);
10795 }
10796 else
10797 {
10798 addr_mode = flag_code;
10799
10800 #if INFER_ADDR_PREFIX
10801 if (i.mem_operands == 0)
10802 {
10803 /* Infer address prefix from the first memory operand. */
10804 const reg_entry *addr_reg = i.base_reg;
10805
10806 if (addr_reg == NULL)
10807 addr_reg = i.index_reg;
10808
10809 if (addr_reg)
10810 {
10811 if (addr_reg->reg_type.bitfield.dword)
10812 addr_mode = CODE_32BIT;
10813 else if (flag_code != CODE_64BIT
10814 && addr_reg->reg_type.bitfield.word)
10815 addr_mode = CODE_16BIT;
10816
10817 if (addr_mode != flag_code)
10818 {
10819 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10820 i.prefixes += 1;
10821 /* Change the size of any displacement too. At most one
10822 of Disp16 or Disp32 is set.
10823 FIXME. There doesn't seem to be any real need for
10824 separate Disp16 and Disp32 flags. The same goes for
10825 Imm16 and Imm32. Removing them would probably clean
10826 up the code quite a lot. */
10827 if (flag_code != CODE_64BIT
10828 && (i.types[this_operand].bitfield.disp16
10829 || i.types[this_operand].bitfield.disp32))
10830 i.types[this_operand]
10831 = operand_type_xor (i.types[this_operand], disp16_32);
10832 }
10833 }
10834 }
10835 #endif
10836 }
10837
10838 return addr_mode;
10839 }
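
/* Editorial aside: the inference rule above, reduced to a one-liner
   (not GAS code; 64-bit mode, where 16-bit addressing is unavailable,
   is left out).  In 32-bit code "mov (%si), %ax" needs the 0x67
   address-size prefix because its address registers are 16-bit; in
   16-bit code "mov (%esi), %ax" needs it for the opposite reason.  */
#if 0 /* Illustration only.  */
static int
needs_addr_prefix (int code_is_16bit, int addr_reg_is_16bit)
{
  return code_is_16bit != addr_reg_is_16bit;
}
#endif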
10840
10841 /* Make sure the memory operand we've been dealt is valid.
10842 Return 1 on success, 0 on a failure. */
10843
10844 static int
10845 i386_index_check (const char *operand_string)
10846 {
10847 const char *kind = "base/index";
10848 enum flag_code addr_mode = i386_addressing_mode ();
10849
10850 if (current_templates->start->opcode_modifier.isstring
10851 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10852 && (current_templates->end[-1].opcode_modifier.isstring
10853 || i.mem_operands))
10854 {
10855 /* Memory operands of string insns are special in that they only allow
10856 a single register (rDI, rSI, or rBX) as their memory address. */
10857 const reg_entry *expected_reg;
10858 static const char *di_si[][2] =
10859 {
10860 { "esi", "edi" },
10861 { "si", "di" },
10862 { "rsi", "rdi" }
10863 };
10864 static const char *bx[] = { "ebx", "bx", "rbx" };
10865
10866 kind = "string address";
10867
10868 if (current_templates->start->opcode_modifier.repprefixok)
10869 {
10870 int es_op = current_templates->end[-1].opcode_modifier.isstring
10871 - IS_STRING_ES_OP0;
10872 int op = 0;
10873
10874 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10875 || ((!i.mem_operands != !intel_syntax)
10876 && current_templates->end[-1].operand_types[1]
10877 .bitfield.baseindex))
10878 op = 1;
10879 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10880 }
10881 else
10882 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10883
10884 if (i.base_reg != expected_reg
10885 || i.index_reg
10886 || operand_type_check (i.types[this_operand], disp))
10887 {
10888 /* The second memory operand must have the same size as
10889 the first one. */
10890 if (i.mem_operands
10891 && i.base_reg
10892 && !((addr_mode == CODE_64BIT
10893 && i.base_reg->reg_type.bitfield.qword)
10894 || (addr_mode == CODE_32BIT
10895 ? i.base_reg->reg_type.bitfield.dword
10896 : i.base_reg->reg_type.bitfield.word)))
10897 goto bad_address;
10898
10899 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10900 operand_string,
10901 intel_syntax ? '[' : '(',
10902 register_prefix,
10903 expected_reg->reg_name,
10904 intel_syntax ? ']' : ')');
10905 return 1;
10906 }
10907 else
10908 return 1;
10909
10910 bad_address:
10911 as_bad (_("`%s' is not a valid %s expression"),
10912 operand_string, kind);
10913 return 0;
10914 }
10915 else
10916 {
10917 if (addr_mode != CODE_16BIT)
10918 {
10919 /* 32-bit/64-bit checks. */
10920 if ((i.base_reg
10921 && ((addr_mode == CODE_64BIT
10922 ? !i.base_reg->reg_type.bitfield.qword
10923 : !i.base_reg->reg_type.bitfield.dword)
10924 || (i.index_reg && i.base_reg->reg_num == RegIP)
10925 || i.base_reg->reg_num == RegIZ))
10926 || (i.index_reg
10927 && !i.index_reg->reg_type.bitfield.xmmword
10928 && !i.index_reg->reg_type.bitfield.ymmword
10929 && !i.index_reg->reg_type.bitfield.zmmword
10930 && ((addr_mode == CODE_64BIT
10931 ? !i.index_reg->reg_type.bitfield.qword
10932 : !i.index_reg->reg_type.bitfield.dword)
10933 || !i.index_reg->reg_type.bitfield.baseindex)))
10934 goto bad_address;
10935
10936 /* bndmk, bndldx, and bndstx have special restrictions. */
10937 if (current_templates->start->base_opcode == 0xf30f1b
10938 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10939 {
10940 /* They cannot use RIP-relative addressing. */
10941 if (i.base_reg && i.base_reg->reg_num == RegIP)
10942 {
10943 as_bad (_("`%s' cannot be used here"), operand_string);
10944 return 0;
10945 }
10946
10947 /* bndldx and bndstx ignore their scale factor. */
10948 if (current_templates->start->base_opcode != 0xf30f1b
10949 && i.log2_scale_factor)
10950 as_warn (_("register scaling is being ignored here"));
10951 }
10952 }
10953 else
10954 {
10955 /* 16-bit checks. */
10956 if ((i.base_reg
10957 && (!i.base_reg->reg_type.bitfield.word
10958 || !i.base_reg->reg_type.bitfield.baseindex))
10959 || (i.index_reg
10960 && (!i.index_reg->reg_type.bitfield.word
10961 || !i.index_reg->reg_type.bitfield.baseindex
10962 || !(i.base_reg
10963 && i.base_reg->reg_num < 6
10964 && i.index_reg->reg_num >= 6
10965 && i.log2_scale_factor == 0))))
10966 goto bad_address;
10967 }
10968 }
10969 return 1;
10970 }
10971
10972 /* Handle vector immediates. */
10973
10974 static int
10975 RC_SAE_immediate (const char *imm_start)
10976 {
10977 unsigned int match_found, j;
10978 const char *pstr = imm_start;
10979 expressionS *exp;
10980
10981 if (*pstr != '{')
10982 return 0;
10983
10984 pstr++;
10985 match_found = 0;
10986 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10987 {
10988 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10989 {
10990 if (!i.rounding)
10991 {
10992 rc_op.type = RC_NamesTable[j].type;
10993 rc_op.operand = this_operand;
10994 i.rounding = &rc_op;
10995 }
10996 else
10997 {
10998 as_bad (_("duplicated `%s'"), imm_start);
10999 return 0;
11000 }
11001 pstr += RC_NamesTable[j].len;
11002 match_found = 1;
11003 break;
11004 }
11005 }
11006 if (!match_found)
11007 return 0;
11008
11009 if (*pstr++ != '}')
11010 {
11011 as_bad (_("Missing '}': '%s'"), imm_start);
11012 return 0;
11013 }
11014   /* RC/SAE immediate string should contain nothing more.  */
11015 if (*pstr != 0)
11016 {
11017 as_bad (_("Junk after '}': '%s'"), imm_start);
11018 return 0;
11019 }
11020
11021 exp = &im_expressions[i.imm_operands++];
11022 i.op[this_operand].imms = exp;
11023
11024 exp->X_op = O_constant;
11025 exp->X_add_number = 0;
11026 exp->X_add_symbol = (symbolS *) 0;
11027 exp->X_op_symbol = (symbolS *) 0;
11028
11029 i.types[this_operand].bitfield.imm8 = 1;
11030 return 1;
11031 }
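
/* Editorial aside: a standalone matcher (not GAS code) for the
   rounding/SAE tokens handled above; the real table, RC_NamesTable,
   is defined earlier in this file.  Example input:
   "vaddps {rz-sae}, %zmm1, %zmm2, %zmm3".  */
#if 0 /* Illustration only.  */
#include <string.h>

static const char *
match_rc_sae (const char *op)
{
  static const char *const names[] =
    { "rn-sae", "rd-sae", "ru-sae", "rz-sae", "sae" };
  unsigned int j;

  if (*op++ != '{')
    return NULL;
  for (j = 0; j < sizeof names / sizeof names[0]; j++)
    {
      size_t len = strlen (names[j]);

      if (strncmp (op, names[j], len) == 0
	  && op[len] == '}' && op[len + 1] == '\0')
	return names[j];
    }
  return NULL;
}
#endif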
11032
11033 /* Only string instructions can have a second memory operand, so
11034 reduce current_templates to just those if it contains any. */
11035 static int
11036 maybe_adjust_templates (void)
11037 {
11038 const insn_template *t;
11039
11040 gas_assert (i.mem_operands == 1);
11041
11042 for (t = current_templates->start; t < current_templates->end; ++t)
11043 if (t->opcode_modifier.isstring)
11044 break;
11045
11046 if (t < current_templates->end)
11047 {
11048 static templates aux_templates;
11049 bfd_boolean recheck;
11050
11051 aux_templates.start = t;
11052 for (; t < current_templates->end; ++t)
11053 if (!t->opcode_modifier.isstring)
11054 break;
11055 aux_templates.end = t;
11056
11057 /* Determine whether to re-check the first memory operand. */
11058 recheck = (aux_templates.start != current_templates->start
11059 || t != current_templates->end);
11060
11061 current_templates = &aux_templates;
11062
11063 if (recheck)
11064 {
11065 i.mem_operands = 0;
11066 if (i.memop1_string != NULL
11067 && i386_index_check (i.memop1_string) == 0)
11068 return 0;
11069 i.mem_operands = 1;
11070 }
11071 }
11072
11073 return 1;
11074 }
11075
11076 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11077 on error. */
11078
11079 static int
11080 i386_att_operand (char *operand_string)
11081 {
11082 const reg_entry *r;
11083 char *end_op;
11084 char *op_string = operand_string;
11085
11086 if (is_space_char (*op_string))
11087 ++op_string;
11088
11089 /* We check for an absolute prefix (differentiating,
11090      for example, 'jmp pc_relative_label' from 'jmp *absolute_label').  */
11091 if (*op_string == ABSOLUTE_PREFIX)
11092 {
11093 ++op_string;
11094 if (is_space_char (*op_string))
11095 ++op_string;
11096 i.jumpabsolute = TRUE;
11097 }
11098
11099 /* Check if operand is a register. */
11100 if ((r = parse_register (op_string, &end_op)) != NULL)
11101 {
11102 i386_operand_type temp;
11103
11104 if (r == &bad_reg)
11105 return 0;
11106
11107 /* Check for a segment override by searching for ':' after a
11108 segment register. */
11109 op_string = end_op;
11110 if (is_space_char (*op_string))
11111 ++op_string;
11112 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11113 {
11114 switch (r->reg_num)
11115 {
11116 case 0:
11117 i.seg[i.mem_operands] = &es;
11118 break;
11119 case 1:
11120 i.seg[i.mem_operands] = &cs;
11121 break;
11122 case 2:
11123 i.seg[i.mem_operands] = &ss;
11124 break;
11125 case 3:
11126 i.seg[i.mem_operands] = &ds;
11127 break;
11128 case 4:
11129 i.seg[i.mem_operands] = &fs;
11130 break;
11131 case 5:
11132 i.seg[i.mem_operands] = &gs;
11133 break;
11134 }
11135
11136 /* Skip the ':' and whitespace. */
11137 ++op_string;
11138 if (is_space_char (*op_string))
11139 ++op_string;
11140
11141 if (!is_digit_char (*op_string)
11142 && !is_identifier_char (*op_string)
11143 && *op_string != '('
11144 && *op_string != ABSOLUTE_PREFIX)
11145 {
11146 as_bad (_("bad memory operand `%s'"), op_string);
11147 return 0;
11148 }
11149 /* Handle case of %es:*foo. */
11150 if (*op_string == ABSOLUTE_PREFIX)
11151 {
11152 ++op_string;
11153 if (is_space_char (*op_string))
11154 ++op_string;
11155 i.jumpabsolute = TRUE;
11156 }
11157 goto do_memory_reference;
11158 }
11159
11160 /* Handle vector operations. */
11161 if (*op_string == '{')
11162 {
11163 op_string = check_VecOperations (op_string, NULL);
11164 if (op_string == NULL)
11165 return 0;
11166 }
11167
11168 if (*op_string)
11169 {
11170 as_bad (_("junk `%s' after register"), op_string);
11171 return 0;
11172 }
11173 temp = r->reg_type;
11174 temp.bitfield.baseindex = 0;
11175 i.types[this_operand] = operand_type_or (i.types[this_operand],
11176 temp);
11177 i.types[this_operand].bitfield.unspecified = 0;
11178 i.op[this_operand].regs = r;
11179 i.reg_operands++;
11180 }
11181 else if (*op_string == REGISTER_PREFIX)
11182 {
11183 as_bad (_("bad register name `%s'"), op_string);
11184 return 0;
11185 }
11186 else if (*op_string == IMMEDIATE_PREFIX)
11187 {
11188 ++op_string;
11189 if (i.jumpabsolute)
11190 {
11191 as_bad (_("immediate operand illegal with absolute jump"));
11192 return 0;
11193 }
11194 if (!i386_immediate (op_string))
11195 return 0;
11196 }
11197 else if (RC_SAE_immediate (operand_string))
11198 {
11199 /* If it is a RC or SAE immediate, do nothing. */
11200 ;
11201 }
11202 else if (is_digit_char (*op_string)
11203 || is_identifier_char (*op_string)
11204 || *op_string == '"'
11205 || *op_string == '(')
11206 {
11207 /* This is a memory reference of some sort. */
11208 char *base_string;
11209
11210 /* Start and end of displacement string expression (if found). */
11211 char *displacement_string_start;
11212 char *displacement_string_end;
11213 char *vop_start;
11214
11215 do_memory_reference:
11216 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11217 return 0;
11218 if ((i.mem_operands == 1
11219 && !current_templates->start->opcode_modifier.isstring)
11220 || i.mem_operands == 2)
11221 {
11222 as_bad (_("too many memory references for `%s'"),
11223 current_templates->start->name);
11224 return 0;
11225 }
11226
11227 /* Check for base index form. We detect the base index form by
11228 looking for an ')' at the end of the operand, searching
11229 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11230 after the '('. */
11231 base_string = op_string + strlen (op_string);
11232
11233 /* Handle vector operations. */
11234 vop_start = strchr (op_string, '{');
11235 if (vop_start && vop_start < base_string)
11236 {
11237 if (check_VecOperations (vop_start, base_string) == NULL)
11238 return 0;
11239 base_string = vop_start;
11240 }
11241
11242 --base_string;
11243 if (is_space_char (*base_string))
11244 --base_string;
11245
11246      /* If we only have a displacement, set up for it to be parsed later.  */
11247 displacement_string_start = op_string;
11248 displacement_string_end = base_string + 1;
11249
11250 if (*base_string == ')')
11251 {
11252 char *temp_string;
11253 unsigned int parens_balanced = 1;
11254 /* We've already checked that the number of left & right ()'s are
11255 equal, so this loop will not be infinite. */
11256 do
11257 {
11258 base_string--;
11259 if (*base_string == ')')
11260 parens_balanced++;
11261 if (*base_string == '(')
11262 parens_balanced--;
11263 }
11264 while (parens_balanced);
11265
11266 temp_string = base_string;
11267
11268 /* Skip past '(' and whitespace. */
11269 ++base_string;
11270 if (is_space_char (*base_string))
11271 ++base_string;
11272
11273 if (*base_string == ','
11274 || ((i.base_reg = parse_register (base_string, &end_op))
11275 != NULL))
11276 {
11277 displacement_string_end = temp_string;
11278
11279 i.types[this_operand].bitfield.baseindex = 1;
11280
11281 if (i.base_reg)
11282 {
11283 if (i.base_reg == &bad_reg)
11284 return 0;
11285 base_string = end_op;
11286 if (is_space_char (*base_string))
11287 ++base_string;
11288 }
11289
11290 /* There may be an index reg or scale factor here. */
11291 if (*base_string == ',')
11292 {
11293 ++base_string;
11294 if (is_space_char (*base_string))
11295 ++base_string;
11296
11297 if ((i.index_reg = parse_register (base_string, &end_op))
11298 != NULL)
11299 {
11300 if (i.index_reg == &bad_reg)
11301 return 0;
11302 base_string = end_op;
11303 if (is_space_char (*base_string))
11304 ++base_string;
11305 if (*base_string == ',')
11306 {
11307 ++base_string;
11308 if (is_space_char (*base_string))
11309 ++base_string;
11310 }
11311 else if (*base_string != ')')
11312 {
11313 as_bad (_("expecting `,' or `)' "
11314 "after index register in `%s'"),
11315 operand_string);
11316 return 0;
11317 }
11318 }
11319 else if (*base_string == REGISTER_PREFIX)
11320 {
11321 end_op = strchr (base_string, ',');
11322 if (end_op)
11323 *end_op = '\0';
11324 as_bad (_("bad register name `%s'"), base_string);
11325 return 0;
11326 }
11327
11328 /* Check for scale factor. */
11329 if (*base_string != ')')
11330 {
11331 char *end_scale = i386_scale (base_string);
11332
11333 if (!end_scale)
11334 return 0;
11335
11336 base_string = end_scale;
11337 if (is_space_char (*base_string))
11338 ++base_string;
11339 if (*base_string != ')')
11340 {
11341 as_bad (_("expecting `)' "
11342 "after scale factor in `%s'"),
11343 operand_string);
11344 return 0;
11345 }
11346 }
11347 else if (!i.index_reg)
11348 {
11349 as_bad (_("expecting index register or scale factor "
11350 "after `,'; got '%c'"),
11351 *base_string);
11352 return 0;
11353 }
11354 }
11355 else if (*base_string != ')')
11356 {
11357 as_bad (_("expecting `,' or `)' "
11358 "after base register in `%s'"),
11359 operand_string);
11360 return 0;
11361 }
11362 }
11363 else if (*base_string == REGISTER_PREFIX)
11364 {
11365 end_op = strchr (base_string, ',');
11366 if (end_op)
11367 *end_op = '\0';
11368 as_bad (_("bad register name `%s'"), base_string);
11369 return 0;
11370 }
11371 }
11372
11373 /* If there's an expression beginning the operand, parse it,
11374 assuming displacement_string_start and
11375 displacement_string_end are meaningful. */
11376 if (displacement_string_start != displacement_string_end)
11377 {
11378 if (!i386_displacement (displacement_string_start,
11379 displacement_string_end))
11380 return 0;
11381 }
11382
11383 /* Special case for (%dx) while doing input/output op. */
11384 if (i.base_reg
11385 && i.base_reg->reg_type.bitfield.instance == RegD
11386 && i.base_reg->reg_type.bitfield.word
11387 && i.index_reg == 0
11388 && i.log2_scale_factor == 0
11389 && i.seg[i.mem_operands] == 0
11390 && !operand_type_check (i.types[this_operand], disp))
11391 {
11392 i.types[this_operand] = i.base_reg->reg_type;
11393 return 1;
11394 }
11395
11396 if (i386_index_check (operand_string) == 0)
11397 return 0;
11398 i.flags[this_operand] |= Operand_Mem;
11399 if (i.mem_operands == 0)
11400 i.memop1_string = xstrdup (operand_string);
11401 i.mem_operands++;
11402 }
11403 else
11404 {
11405 /* It's not a memory operand; argh! */
11406 as_bad (_("invalid char %s beginning operand %d `%s'"),
11407 output_invalid (*op_string),
11408 this_operand + 1,
11409 op_string);
11410 return 0;
11411 }
11412 return 1; /* Normal return. */
11413 }
11414 \f
11415 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11416 that an rs_machine_dependent frag may reach. */
11417
11418 unsigned int
11419 i386_frag_max_var (fragS *frag)
11420 {
11421 /* The only relaxable frags are for jumps.
11422 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11423 gas_assert (frag->fr_type == rs_machine_dependent);
11424 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11425 }
11426
11427 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11428 static int
11429 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11430 {
11431 /* STT_GNU_IFUNC symbol must go through PLT. */
11432 if ((symbol_get_bfdsym (fr_symbol)->flags
11433 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11434 return 0;
11435
11436 if (!S_IS_EXTERNAL (fr_symbol))
11437 /* Symbol may be weak or local. */
11438 return !S_IS_WEAK (fr_symbol);
11439
11440 /* Global symbols with non-default visibility can't be preempted. */
11441 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11442 return 1;
11443
11444 if (fr_var != NO_RELOC)
11445 switch ((enum bfd_reloc_code_real) fr_var)
11446 {
11447 case BFD_RELOC_386_PLT32:
11448 case BFD_RELOC_X86_64_PLT32:
11449 /* Symbol with PLT relocation may be preempted. */
11450 return 0;
11451 default:
11452 abort ();
11453 }
11454
11455 /* Global symbols with default visibility in a shared library may be
11456 preempted by another definition. */
11457 return !shared;
11458 }
11459 #endif
11460
11461 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11462    Note: this also works for Skylake and Cascadelake.
11463 ---------------------------------------------------------------------
11464 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11465 | ------ | ----------- | ------- | -------- |
11466 | Jo | N | N | Y |
11467 | Jno | N | N | Y |
11468 | Jc/Jb | Y | N | Y |
11469 | Jae/Jnb | Y | N | Y |
11470 | Je/Jz | Y | Y | Y |
11471 | Jne/Jnz | Y | Y | Y |
11472 | Jna/Jbe | Y | N | Y |
11473 | Ja/Jnbe | Y | N | Y |
11474 | Js | N | N | Y |
11475 | Jns | N | N | Y |
11476 | Jp/Jpe | N | N | Y |
11477 | Jnp/Jpo | N | N | Y |
11478 | Jl/Jnge | Y | Y | Y |
11479 | Jge/Jnl | Y | Y | Y |
11480 | Jle/Jng | Y | Y | Y |
11481 | Jg/Jnle | Y | Y | Y |
11482 --------------------------------------------------------------------- */
11483 static int
11484 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11485 {
11486 if (mf_cmp == mf_cmp_alu_cmp)
11487 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11488 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11489 if (mf_cmp == mf_cmp_incdec)
11490 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11491 || mf_jcc == mf_jcc_jle);
11492 if (mf_cmp == mf_cmp_test_and)
11493 return 1;
11494 return 0;
11495 }
11496
11497 /* Return the next non-empty frag. */
11498
11499 static fragS *
11500 i386_next_non_empty_frag (fragS *fragP)
11501 {
11502 /* There may be a frag with a ".fill 0" when there is no room in
11503 the current frag for frag_grow in output_insn. */
11504 for (fragP = fragP->fr_next;
11505 (fragP != NULL
11506 && fragP->fr_type == rs_fill
11507 && fragP->fr_fix == 0);
11508 fragP = fragP->fr_next)
11509 ;
11510 return fragP;
11511 }
11512
11513 /* Return the next jcc frag after BRANCH_PADDING. */
11514
11515 static fragS *
11516 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11517 {
11518 fragS *branch_fragP;
11519 if (!pad_fragP)
11520 return NULL;
11521
11522 if (pad_fragP->fr_type == rs_machine_dependent
11523 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11524 == BRANCH_PADDING))
11525 {
11526 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11527 if (branch_fragP->fr_type != rs_machine_dependent)
11528 return NULL;
11529 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11530 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11531 pad_fragP->tc_frag_data.mf_type))
11532 return branch_fragP;
11533 }
11534
11535 return NULL;
11536 }
11537
11538 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11539
11540 static void
11541 i386_classify_machine_dependent_frag (fragS *fragP)
11542 {
11543 fragS *cmp_fragP;
11544 fragS *pad_fragP;
11545 fragS *branch_fragP;
11546 fragS *next_fragP;
11547 unsigned int max_prefix_length;
11548
11549 if (fragP->tc_frag_data.classified)
11550 return;
11551
11552 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11553 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11554 for (next_fragP = fragP;
11555 next_fragP != NULL;
11556 next_fragP = next_fragP->fr_next)
11557 {
11558 next_fragP->tc_frag_data.classified = 1;
11559 if (next_fragP->fr_type == rs_machine_dependent)
11560 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11561 {
11562 case BRANCH_PADDING:
11563 /* The BRANCH_PADDING frag must be followed by a branch
11564 frag. */
11565 branch_fragP = i386_next_non_empty_frag (next_fragP);
11566 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11567 break;
11568 case FUSED_JCC_PADDING:
11569 /* Check if this is a fused jcc:
11570 FUSED_JCC_PADDING
11571 CMP like instruction
11572 BRANCH_PADDING
11573 COND_JUMP
11574 */
11575 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11576 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11577 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11578 if (branch_fragP)
11579 {
11580 /* The BRANCH_PADDING frag is merged with the
11581 FUSED_JCC_PADDING frag. */
11582 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11583 /* CMP like instruction size. */
11584 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11585 frag_wane (pad_fragP);
11586 /* Skip to branch_fragP. */
11587 next_fragP = branch_fragP;
11588 }
11589 else if (next_fragP->tc_frag_data.max_prefix_length)
11590 {
11591 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11592 a fused jcc. */
11593 next_fragP->fr_subtype
11594 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11595 next_fragP->tc_frag_data.max_bytes
11596 = next_fragP->tc_frag_data.max_prefix_length;
11597 /* This will be updated in the BRANCH_PREFIX scan. */
11598 next_fragP->tc_frag_data.max_prefix_length = 0;
11599 }
11600 else
11601 frag_wane (next_fragP);
11602 break;
11603 }
11604 }
11605
11606 /* Stop if there is no BRANCH_PREFIX. */
11607 if (!align_branch_prefix_size)
11608 return;
11609
11610 /* Scan for BRANCH_PREFIX. */
11611 for (; fragP != NULL; fragP = fragP->fr_next)
11612 {
11613 if (fragP->fr_type != rs_machine_dependent
11614 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11615 != BRANCH_PREFIX))
11616 continue;
11617
11618 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11619 FUSED_JCC_PADDING. */
11620 max_prefix_length = 0;
11621 for (next_fragP = fragP;
11622 next_fragP != NULL;
11623 next_fragP = next_fragP->fr_next)
11624 {
11625 if (next_fragP->fr_type == rs_fill)
11626 /* Skip rs_fill frags. */
11627 continue;
11628 else if (next_fragP->fr_type != rs_machine_dependent)
11629 /* Stop for all other frags. */
11630 break;
11631
11632 /* rs_machine_dependent frags. */
11633 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11634 == BRANCH_PREFIX)
11635 {
11636 /* Count BRANCH_PREFIX frags. */
11637 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11638 {
11639 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11640 frag_wane (next_fragP);
11641 }
11642 else
11643 max_prefix_length
11644 += next_fragP->tc_frag_data.max_bytes;
11645 }
11646 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11647 == BRANCH_PADDING)
11648 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11649 == FUSED_JCC_PADDING))
11650 {
11651 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11652 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11653 break;
11654 }
11655 else
11656 /* Stop for other rs_machine_dependent frags. */
11657 break;
11658 }
11659
11660 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11661
11662 /* Skip to the next frag. */
11663 fragP = next_fragP;
11664 }
11665 }
11666
11667 /* Compute padding size for
11668
11669 FUSED_JCC_PADDING
11670 CMP like instruction
11671 BRANCH_PADDING
11672 COND_JUMP/UNCOND_JUMP
11673
11674 or
11675
11676 BRANCH_PADDING
11677 COND_JUMP/UNCOND_JUMP
11678 */
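/* A worked example (illustrative): with align_branch_power == 5
   (a 32-byte boundary), a branch at offset 28 within the boundary
   with size 6 would end at offset 34 and cross the boundary, so
   padding_size is 32 - 28 == 4.  Note the ">=" below: a branch
   ending exactly at the last byte of the window is padded too.  */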
11679
11680 static int
11681 i386_branch_padding_size (fragS *fragP, offsetT address)
11682 {
11683 unsigned int offset, size, padding_size;
11684 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11685
11686 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11687 if (!address)
11688 address = fragP->fr_address;
11689 address += fragP->fr_fix;
11690
11691 /* CMP like instruction size. */
11692 size = fragP->tc_frag_data.cmp_size;
11693
11694 /* The base size of the branch frag. */
11695 size += branch_fragP->fr_fix;
11696
11697 /* Add opcode and displacement bytes for the rs_machine_dependent
11698 branch frag. */
11699 if (branch_fragP->fr_type == rs_machine_dependent)
11700 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11701
11702 /* Check if branch is within boundary and doesn't end at the last
11703 byte. */
11704 offset = address & ((1U << align_branch_power) - 1);
11705 if ((offset + size) >= (1U << align_branch_power))
11706 /* Padding needed to avoid crossing boundary. */
11707 padding_size = (1U << align_branch_power) - offset;
11708 else
11709 /* No padding needed. */
11710 padding_size = 0;
11711
11712 /* The return value may be saved in tc_frag_data.length which is
11713 an unsigned byte. */
11714 if (!fits_in_unsigned_byte (padding_size))
11715 abort ();
11716
11717 return padding_size;
11718 }
11719
11720 /* i386_generic_table_relax_frag()
11721
11722 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11723 grow/shrink padding to align branch frags. Hand others to
11724 relax_frag(). */
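/* Prefix distribution sketch (hypothetical sizes): if padding_size
   is 3 and the BRANCH_PREFIX frags in front of the padding frag
   allow max_bytes of 2 and 4, the first frag receives 2 prefix
   bytes and the second the remaining 1, via the loops below.  */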
11725
11726 long
11727 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11728 {
11729 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11730 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11731 {
11732 long padding_size = i386_branch_padding_size (fragP, 0);
11733 long grow = padding_size - fragP->tc_frag_data.length;
11734
11735 /* When the BRANCH_PREFIX frag is used, the computed address
11736 must match the actual address and there should be no padding. */
11737 if (fragP->tc_frag_data.padding_address
11738 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11739 || padding_size))
11740 abort ();
11741
11742 /* Update the padding size. */
11743 if (grow)
11744 fragP->tc_frag_data.length = padding_size;
11745
11746 return grow;
11747 }
11748 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11749 {
11750 fragS *padding_fragP, *next_fragP;
11751 long padding_size, left_size, last_size;
11752
11753 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11754 if (!padding_fragP)
11755 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11756 return (fragP->tc_frag_data.length
11757 - fragP->tc_frag_data.last_length);
11758
11759 /* Compute the relative address of the padding frag the very
11760 first time, when the BRANCH_PREFIX frag sizes are still zero. */
11761 if (!fragP->tc_frag_data.padding_address)
11762 fragP->tc_frag_data.padding_address
11763 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11764
11765 /* First update the last length from the previous iteration. */
11766 left_size = fragP->tc_frag_data.prefix_length;
11767 for (next_fragP = fragP;
11768 next_fragP != padding_fragP;
11769 next_fragP = next_fragP->fr_next)
11770 if (next_fragP->fr_type == rs_machine_dependent
11771 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11772 == BRANCH_PREFIX))
11773 {
11774 if (left_size)
11775 {
11776 int max = next_fragP->tc_frag_data.max_bytes;
11777 if (max)
11778 {
11779 int size;
11780 if (max > left_size)
11781 size = left_size;
11782 else
11783 size = max;
11784 left_size -= size;
11785 next_fragP->tc_frag_data.last_length = size;
11786 }
11787 }
11788 else
11789 next_fragP->tc_frag_data.last_length = 0;
11790 }
11791
11792 /* Check the padding size for the padding frag. */
11793 padding_size = i386_branch_padding_size
11794 (padding_fragP, (fragP->fr_address
11795 + fragP->tc_frag_data.padding_address));
11796
11797 last_size = fragP->tc_frag_data.prefix_length;
11798 /* Check if there is any change from the last iteration. */
11799 if (padding_size == last_size)
11800 {
11801 /* Update the expected address of the padding frag. */
11802 padding_fragP->tc_frag_data.padding_address
11803 = (fragP->fr_address + padding_size
11804 + fragP->tc_frag_data.padding_address);
11805 return 0;
11806 }
11807
11808 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11809 {
11810 /* No padding if there is insufficient room. Clear the
11811 expected address of the padding frag. */
11812 padding_fragP->tc_frag_data.padding_address = 0;
11813 padding_size = 0;
11814 }
11815 else
11816 /* Store the expected address of the padding frag. */
11817 padding_fragP->tc_frag_data.padding_address
11818 = (fragP->fr_address + padding_size
11819 + fragP->tc_frag_data.padding_address);
11820
11821 fragP->tc_frag_data.prefix_length = padding_size;
11822
11823 /* Update the length for the current iteration. */
11824 left_size = padding_size;
11825 for (next_fragP = fragP;
11826 next_fragP != padding_fragP;
11827 next_fragP = next_fragP->fr_next)
11828 if (next_fragP->fr_type == rs_machine_dependent
11829 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11830 == BRANCH_PREFIX))
11831 {
11832 if (left_size)
11833 {
11834 int max = next_fragP->tc_frag_data.max_bytes;
11835 if (max)
11836 {
11837 int size;
11838 if (max > left_size)
11839 size = left_size;
11840 else
11841 size = max;
11842 left_size -= size;
11843 next_fragP->tc_frag_data.length = size;
11844 }
11845 }
11846 else
11847 next_fragP->tc_frag_data.length = 0;
11848 }
11849
11850 return (fragP->tc_frag_data.length
11851 - fragP->tc_frag_data.last_length);
11852 }
11853 return relax_frag (segment, fragP, stretch);
11854 }
11855
11856 /* md_estimate_size_before_relax()
11857
11858 Called just before relax() for rs_machine_dependent frags. The x86
11859 assembler uses these frags to handle variable size jump
11860 instructions.
11861
11862 Any symbol that is now undefined will not become defined.
11863 Return the correct fr_subtype in the frag.
11864 Return the initial "guess for variable size of frag" to caller.
11865 The guess is actually the growth beyond the fixed part. Whatever
11866 we do to grow the fixed or variable part contributes to our
11867 returned value. */
11868
11869 int
11870 md_estimate_size_before_relax (fragS *fragP, segT segment)
11871 {
11872 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11873 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11874 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11875 {
11876 i386_classify_machine_dependent_frag (fragP);
11877 return fragP->tc_frag_data.length;
11878 }
11879
11880 /* We've already got fragP->fr_subtype right; all we have to do is
11881 check for un-relaxable symbols. On an ELF system, we can't relax
11882 an externally visible symbol, because it may be overridden by a
11883 shared library. */
11884 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11885 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11886 || (IS_ELF
11887 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11888 fragP->fr_var))
11889 #endif
11890 #if defined (OBJ_COFF) && defined (TE_PE)
11891 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11892 && S_IS_WEAK (fragP->fr_symbol))
11893 #endif
11894 )
11895 {
11896 /* Symbol is undefined in this segment, or we need to keep a
11897 reloc so that weak symbols can be overridden. */
11898 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11899 enum bfd_reloc_code_real reloc_type;
11900 unsigned char *opcode;
11901 int old_fr_fix;
11902
11903 if (fragP->fr_var != NO_RELOC)
11904 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11905 else if (size == 2)
11906 reloc_type = BFD_RELOC_16_PCREL;
11907 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11908 else if (need_plt32_p (fragP->fr_symbol))
11909 reloc_type = BFD_RELOC_X86_64_PLT32;
11910 #endif
11911 else
11912 reloc_type = BFD_RELOC_32_PCREL;
11913
11914 old_fr_fix = fragP->fr_fix;
11915 opcode = (unsigned char *) fragP->fr_opcode;
11916
11917 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11918 {
11919 case UNCOND_JUMP:
11920 /* Make jmp (0xeb) a (d)word displacement jump. */
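/* E.g. "jmp label" assembled as EB XX becomes E9 XX XX XX XX
   (E9 XX XX in 16-bit code) - illustrative encodings.  */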
11921 opcode[0] = 0xe9;
11922 fragP->fr_fix += size;
11923 fix_new (fragP, old_fr_fix, size,
11924 fragP->fr_symbol,
11925 fragP->fr_offset, 1,
11926 reloc_type);
11927 break;
11928
11929 case COND_JUMP86:
11930 if (size == 2
11931 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11932 {
11933 /* Negate the condition, and branch past an
11934 unconditional jump. */
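/* E.g. "je target" (74 XX) becomes "jne .+3" (75 03) followed
   by "jmp target" (E9 XX XX) - an illustrative 16-bit encoding
   of the rewrite below.  */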
11935 opcode[0] ^= 1;
11936 opcode[1] = 3;
11937 /* Insert an unconditional jump. */
11938 opcode[2] = 0xe9;
11939 /* We added two extra opcode bytes, and have a two byte
11940 offset. */
11941 fragP->fr_fix += 2 + 2;
11942 fix_new (fragP, old_fr_fix + 2, 2,
11943 fragP->fr_symbol,
11944 fragP->fr_offset, 1,
11945 reloc_type);
11946 break;
11947 }
11948 /* Fall through. */
11949
11950 case COND_JUMP:
11951 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11952 {
11953 fixS *fixP;
11954
11955 fragP->fr_fix += 1;
11956 fixP = fix_new (fragP, old_fr_fix, 1,
11957 fragP->fr_symbol,
11958 fragP->fr_offset, 1,
11959 BFD_RELOC_8_PCREL);
11960 fixP->fx_signed = 1;
11961 break;
11962 }
11963
11964 /* This changes the byte-displacement jump 0x7N
11965 to the (d)word-displacement jump 0x0f,0x8N. */
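/* E.g. "je" 74 XX becomes 0F 84 XX XX XX XX (illustrative).  */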
11966 opcode[1] = opcode[0] + 0x10;
11967 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11968 /* We've added an opcode byte. */
11969 fragP->fr_fix += 1 + size;
11970 fix_new (fragP, old_fr_fix + 1, size,
11971 fragP->fr_symbol,
11972 fragP->fr_offset, 1,
11973 reloc_type);
11974 break;
11975
11976 default:
11977 BAD_CASE (fragP->fr_subtype);
11978 break;
11979 }
11980 frag_wane (fragP);
11981 return fragP->fr_fix - old_fr_fix;
11982 }
11983
11984 /* Guess size depending on current relax state. Initially the relax
11985 state will correspond to a short jump and we return 1, because
11986 the variable part of the frag (the branch offset) is one byte
11987 long. However, we can relax a section more than once and in that
11988 case we must either set fr_subtype back to the unrelaxed state,
11989 or return the value for the appropriate branch. */
11990 return md_relax_table[fragP->fr_subtype].rlx_length;
11991 }
11992
11993 /* Called after relax() is finished.
11994
11995 In: Address of frag.
11996 fr_type == rs_machine_dependent.
11997 fr_subtype is what the address relaxed to.
11998
11999 Out: Any fixSs and constants are set up.
12000 Caller will turn frag into a ".space 0". */
12001
12002 void
12003 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12004 fragS *fragP)
12005 {
12006 unsigned char *opcode;
12007 unsigned char *where_to_put_displacement = NULL;
12008 offsetT target_address;
12009 offsetT opcode_address;
12010 unsigned int extension = 0;
12011 offsetT displacement_from_opcode_start;
12012
12013 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12014 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12015 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12016 {
12017 /* Generate nop padding. */
12018 unsigned int size = fragP->tc_frag_data.length;
12019 if (size)
12020 {
12021 if (size > fragP->tc_frag_data.max_bytes)
12022 abort ();
12023
12024 if (flag_debug)
12025 {
12026 const char *msg;
12027 const char *branch = "branch";
12028 const char *prefix = "";
12029 fragS *padding_fragP;
12030 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12031 == BRANCH_PREFIX)
12032 {
12033 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12034 switch (fragP->tc_frag_data.default_prefix)
12035 {
12036 default:
12037 abort ();
12038 break;
12039 case CS_PREFIX_OPCODE:
12040 prefix = " cs";
12041 break;
12042 case DS_PREFIX_OPCODE:
12043 prefix = " ds";
12044 break;
12045 case ES_PREFIX_OPCODE:
12046 prefix = " es";
12047 break;
12048 case FS_PREFIX_OPCODE:
12049 prefix = " fs";
12050 break;
12051 case GS_PREFIX_OPCODE:
12052 prefix = " gs";
12053 break;
12054 case SS_PREFIX_OPCODE:
12055 prefix = " ss";
12056 break;
12057 }
12058 if (padding_fragP)
12059 msg = _("%s:%u: add %d%s at 0x%llx to align "
12060 "%s within %d-byte boundary\n");
12061 else
12062 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12063 "align %s within %d-byte boundary\n");
12064 }
12065 else
12066 {
12067 padding_fragP = fragP;
12068 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12069 "%s within %d-byte boundary\n");
12070 }
12071
12072 if (padding_fragP)
12073 switch (padding_fragP->tc_frag_data.branch_type)
12074 {
12075 case align_branch_jcc:
12076 branch = "jcc";
12077 break;
12078 case align_branch_fused:
12079 branch = "fused jcc";
12080 break;
12081 case align_branch_jmp:
12082 branch = "jmp";
12083 break;
12084 case align_branch_call:
12085 branch = "call";
12086 break;
12087 case align_branch_indirect:
12088 branch = "indirect branch";
12089 break;
12090 case align_branch_ret:
12091 branch = "ret";
12092 break;
12093 default:
12094 break;
12095 }
12096
12097 fprintf (stdout, msg,
12098 fragP->fr_file, fragP->fr_line, size, prefix,
12099 (long long) fragP->fr_address, branch,
12100 1 << align_branch_power);
12101 }
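/* BRANCH_PREFIX padding is emitted as repeated segment prefixes,
   e.g. 2E 2E 2E for three bytes of CS prefix (illustrative);
   other padding becomes NOPs.  */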
12102 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12103 memset (fragP->fr_opcode,
12104 fragP->tc_frag_data.default_prefix, size);
12105 else
12106 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12107 size, 0);
12108 fragP->fr_fix += size;
12109 }
12110 return;
12111 }
12112
12113 opcode = (unsigned char *) fragP->fr_opcode;
12114
12115 /* Address we want to reach in file space. */
12116 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12117
12118 /* Address opcode resides at in file space. */
12119 opcode_address = fragP->fr_address + fragP->fr_fix;
12120
12121 /* Displacement from opcode start to fill into instruction. */
12122 displacement_from_opcode_start = target_address - opcode_address;
12123
12124 if ((fragP->fr_subtype & BIG) == 0)
12125 {
12126 /* Don't have to change opcode. */
12127 extension = 1; /* 1 opcode + 1 displacement */
12128 where_to_put_displacement = &opcode[1];
12129 }
12130 else
12131 {
12132 if (no_cond_jump_promotion
12133 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12134 as_warn_where (fragP->fr_file, fragP->fr_line,
12135 _("long jump required"));
12136
12137 switch (fragP->fr_subtype)
12138 {
12139 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12140 extension = 4; /* 1 opcode + 4 displacement */
12141 opcode[0] = 0xe9;
12142 where_to_put_displacement = &opcode[1];
12143 break;
12144
12145 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12146 extension = 2; /* 1 opcode + 2 displacement */
12147 opcode[0] = 0xe9;
12148 where_to_put_displacement = &opcode[1];
12149 break;
12150
12151 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12152 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12153 extension = 5; /* 2 opcode + 4 displacement */
12154 opcode[1] = opcode[0] + 0x10;
12155 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12156 where_to_put_displacement = &opcode[2];
12157 break;
12158
12159 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12160 extension = 3; /* 2 opcode + 2 displacement */
12161 opcode[1] = opcode[0] + 0x10;
12162 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12163 where_to_put_displacement = &opcode[2];
12164 break;
12165
12166 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12167 extension = 4;
12168 opcode[0] ^= 1;
12169 opcode[1] = 3;
12170 opcode[2] = 0xe9;
12171 where_to_put_displacement = &opcode[3];
12172 break;
12173
12174 default:
12175 BAD_CASE (fragP->fr_subtype);
12176 break;
12177 }
12178 }
12179
12180 /* If the size is less than four we are sure that the operand fits,
12181 but if it's 4, then it could be that the displacement is larger
12182 than +/- 2GB. */
12183 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12184 && object_64bit
12185 && ((addressT) (displacement_from_opcode_start - extension
12186 + ((addressT) 1 << 31))
12187 > (((addressT) 2 << 31) - 1)))
12188 {
12189 as_bad_where (fragP->fr_file, fragP->fr_line,
12190 _("jump target out of range"));
12191 /* Make us emit 0. */
12192 displacement_from_opcode_start = extension;
12193 }
12194 /* Now put displacement after opcode. */
12195 md_number_to_chars ((char *) where_to_put_displacement,
12196 (valueT) (displacement_from_opcode_start - extension),
12197 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12198 fragP->fr_fix += extension;
12199 }
12200 \f
12201 /* Apply a fixup (fixP) to segment data, once it has been determined
12202 by our caller that we have all the info we need to fix it up.
12203
12204 Parameter valP is the pointer to the value of the bits.
12205
12206 On the 386, immediates, displacements, and data pointers are all in
12207 the same (little-endian) format, so we don't need to care about which
12208 we are handling. */
12209
12210 void
12211 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12212 {
12213 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12214 valueT value = *valP;
12215
12216 #if !defined (TE_Mach)
12217 if (fixP->fx_pcrel)
12218 {
12219 switch (fixP->fx_r_type)
12220 {
12221 default:
12222 break;
12223
12224 case BFD_RELOC_64:
12225 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12226 break;
12227 case BFD_RELOC_32:
12228 case BFD_RELOC_X86_64_32S:
12229 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12230 break;
12231 case BFD_RELOC_16:
12232 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12233 break;
12234 case BFD_RELOC_8:
12235 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12236 break;
12237 }
12238 }
12239
12240 if (fixP->fx_addsy != NULL
12241 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12242 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12243 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12244 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12245 && !use_rela_relocations)
12246 {
12247 /* This is a hack. There should be a better way to handle this.
12248 This covers for the fact that bfd_install_relocation will
12249 subtract the current location (for partial_inplace, PC relative
12250 relocations); see more below. */
12251 #ifndef OBJ_AOUT
12252 if (IS_ELF
12253 #ifdef TE_PE
12254 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12255 #endif
12256 )
12257 value += fixP->fx_where + fixP->fx_frag->fr_address;
12258 #endif
12259 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12260 if (IS_ELF)
12261 {
12262 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12263
12264 if ((sym_seg == seg
12265 || (symbol_section_p (fixP->fx_addsy)
12266 && sym_seg != absolute_section))
12267 && !generic_force_reloc (fixP))
12268 {
12269 /* Yes, we add the values in twice. This is because
12270 bfd_install_relocation subtracts them out again. I think
12271 bfd_install_relocation is broken, but I don't dare change
12272 it. FIXME. */
12273 value += fixP->fx_where + fixP->fx_frag->fr_address;
12274 }
12275 }
12276 #endif
12277 #if defined (OBJ_COFF) && defined (TE_PE)
12278 /* For some reason, the PE format does not store a
12279 section address offset for a PC relative symbol. */
12280 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12281 || S_IS_WEAK (fixP->fx_addsy))
12282 value += md_pcrel_from (fixP);
12283 #endif
12284 }
12285 #if defined (OBJ_COFF) && defined (TE_PE)
12286 if (fixP->fx_addsy != NULL
12287 && S_IS_WEAK (fixP->fx_addsy)
12288 /* PR 16858: Do not modify weak function references. */
12289 && ! fixP->fx_pcrel)
12290 {
12291 #if !defined (TE_PEP)
12292 /* For x86 PE weak function symbols are neither PC-relative
12293 nor do they set S_IS_FUNCTION. So the only reliable way
12294 to detect them is to check the flags of their containing
12295 section. */
12296 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12297 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12298 ;
12299 else
12300 #endif
12301 value -= S_GET_VALUE (fixP->fx_addsy);
12302 }
12303 #endif
12304
12305 /* Fix a few things - the dynamic linker expects certain values here,
12306 and we must not disappoint it. */
12307 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12308 if (IS_ELF && fixP->fx_addsy)
12309 switch (fixP->fx_r_type)
12310 {
12311 case BFD_RELOC_386_PLT32:
12312 case BFD_RELOC_X86_64_PLT32:
12313 /* Make the jump instruction point to the address of the operand.
12314 At runtime we merely add the offset to the actual PLT entry.
12315 NB: Subtract the offset size only for jump instructions. */
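/* E.g. on x86-64 ELF, "call foo@PLT" is emitted as E8 00 00 00 00
   with an R_X86_64_PLT32 addend of -4 (illustrative), compensating
   for the PC pointing past the 4-byte displacement.  */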
12316 if (fixP->fx_pcrel)
12317 value = -4;
12318 break;
12319
12320 case BFD_RELOC_386_TLS_GD:
12321 case BFD_RELOC_386_TLS_LDM:
12322 case BFD_RELOC_386_TLS_IE_32:
12323 case BFD_RELOC_386_TLS_IE:
12324 case BFD_RELOC_386_TLS_GOTIE:
12325 case BFD_RELOC_386_TLS_GOTDESC:
12326 case BFD_RELOC_X86_64_TLSGD:
12327 case BFD_RELOC_X86_64_TLSLD:
12328 case BFD_RELOC_X86_64_GOTTPOFF:
12329 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12330 value = 0; /* Fully resolved at runtime. No addend. */
12331 /* Fallthrough */
12332 case BFD_RELOC_386_TLS_LE:
12333 case BFD_RELOC_386_TLS_LDO_32:
12334 case BFD_RELOC_386_TLS_LE_32:
12335 case BFD_RELOC_X86_64_DTPOFF32:
12336 case BFD_RELOC_X86_64_DTPOFF64:
12337 case BFD_RELOC_X86_64_TPOFF32:
12338 case BFD_RELOC_X86_64_TPOFF64:
12339 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12340 break;
12341
12342 case BFD_RELOC_386_TLS_DESC_CALL:
12343 case BFD_RELOC_X86_64_TLSDESC_CALL:
12344 value = 0; /* Fully resolved at runtime. No addend. */
12345 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12346 fixP->fx_done = 0;
12347 return;
12348
12349 case BFD_RELOC_VTABLE_INHERIT:
12350 case BFD_RELOC_VTABLE_ENTRY:
12351 fixP->fx_done = 0;
12352 return;
12353
12354 default:
12355 break;
12356 }
12357 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12358 *valP = value;
12359 #endif /* !defined (TE_Mach) */
12360
12361 /* Are we finished with this relocation now? */
12362 if (fixP->fx_addsy == NULL)
12363 fixP->fx_done = 1;
12364 #if defined (OBJ_COFF) && defined (TE_PE)
12365 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12366 {
12367 fixP->fx_done = 0;
12368 /* Remember value for tc_gen_reloc. */
12369 fixP->fx_addnumber = value;
12370 /* Clear out the frag for now. */
12371 value = 0;
12372 }
12373 #endif
12374 else if (use_rela_relocations)
12375 {
12376 fixP->fx_no_overflow = 1;
12377 /* Remember value for tc_gen_reloc. */
12378 fixP->fx_addnumber = value;
12379 value = 0;
12380 }
12381
12382 md_number_to_chars (p, value, fixP->fx_size);
12383 }
12384 \f
12385 const char *
12386 md_atof (int type, char *litP, int *sizeP)
12387 {
12388 /* This outputs the LITTLENUMs in REVERSE order;
12389 in accord with the little-endian 386. */
12390 return ieee_md_atof (type, litP, sizeP, FALSE);
12391 }
12392 \f
12393 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12394
12395 static char *
12396 output_invalid (int c)
12397 {
12398 if (ISPRINT (c))
12399 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12400 "'%c'", c);
12401 else
12402 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12403 "(0x%x)", (unsigned char) c);
12404 return output_invalid_buf;
12405 }
12406
12407 /* Verify that @r can be used in the current context. */
12408
12409 static bfd_boolean check_register (const reg_entry *r)
12410 {
12411 if (allow_pseudo_reg)
12412 return TRUE;
12413
12414 if (operand_type_all_zero (&r->reg_type))
12415 return FALSE;
12416
12417 if ((r->reg_type.bitfield.dword
12418 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12419 || r->reg_type.bitfield.class == RegCR
12420 || r->reg_type.bitfield.class == RegDR)
12421 && !cpu_arch_flags.bitfield.cpui386)
12422 return FALSE;
12423
12424 if (r->reg_type.bitfield.class == RegTR
12425 && (flag_code == CODE_64BIT
12426 || !cpu_arch_flags.bitfield.cpui386
12427 || cpu_arch_isa_flags.bitfield.cpui586
12428 || cpu_arch_isa_flags.bitfield.cpui686))
12429 return FALSE;
12430
12431 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12432 return FALSE;
12433
12434 if (!cpu_arch_flags.bitfield.cpuavx512f)
12435 {
12436 if (r->reg_type.bitfield.zmmword
12437 || r->reg_type.bitfield.class == RegMask)
12438 return FALSE;
12439
12440 if (!cpu_arch_flags.bitfield.cpuavx)
12441 {
12442 if (r->reg_type.bitfield.ymmword)
12443 return FALSE;
12444
12445 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12446 return FALSE;
12447 }
12448 }
12449
12450 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12451 return FALSE;
12452
12453 /* Don't allow the fake index register unless allow_index_reg is nonzero. */
12454 if (!allow_index_reg && r->reg_num == RegIZ)
12455 return FALSE;
12456
12457 /* Upper 16 vector registers are only available with VREX in 64bit
12458 mode, and require EVEX encoding. */
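/* E.g. "%xmm16" is only usable with AVX512F in 64-bit mode and
   forces EVEX encoding (illustrative).  */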
12459 if (r->reg_flags & RegVRex)
12460 {
12461 if (!cpu_arch_flags.bitfield.cpuavx512f
12462 || flag_code != CODE_64BIT)
12463 return FALSE;
12464
12465 if (i.vec_encoding == vex_encoding_default)
12466 i.vec_encoding = vex_encoding_evex;
12467 else if (i.vec_encoding != vex_encoding_evex)
12468 i.vec_encoding = vex_encoding_error;
12469 }
12470
12471 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12472 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12473 && flag_code != CODE_64BIT)
12474 return FALSE;
12475
12476 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12477 && !intel_syntax)
12478 return FALSE;
12479
12480 return TRUE;
12481 }
12482
12483 /* REG_STRING starts *before* REGISTER_PREFIX. */
12484
12485 static const reg_entry *
12486 parse_real_register (char *reg_string, char **end_op)
12487 {
12488 char *s = reg_string;
12489 char *p;
12490 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12491 const reg_entry *r;
12492
12493 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12494 if (*s == REGISTER_PREFIX)
12495 ++s;
12496
12497 if (is_space_char (*s))
12498 ++s;
12499
12500 p = reg_name_given;
12501 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12502 {
12503 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12504 return (const reg_entry *) NULL;
12505 s++;
12506 }
12507
12508 /* For naked regs, make sure that we are not dealing with an identifier.
12509 This prevents confusing an identifier like `eax_var' with register
12510 `eax'. */
12511 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12512 return (const reg_entry *) NULL;
12513
12514 *end_op = s;
12515
12516 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
12517
12518 /* Handle floating point regs, allowing spaces in the (i) part. */
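/* E.g. both "%st(3)" and "%st ( 3 )" resolve to st(3)
   (illustrative).  */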
12519 if (r == i386_regtab /* %st is first entry of table */)
12520 {
12521 if (!cpu_arch_flags.bitfield.cpu8087
12522 && !cpu_arch_flags.bitfield.cpu287
12523 && !cpu_arch_flags.bitfield.cpu387
12524 && !allow_pseudo_reg)
12525 return (const reg_entry *) NULL;
12526
12527 if (is_space_char (*s))
12528 ++s;
12529 if (*s == '(')
12530 {
12531 ++s;
12532 if (is_space_char (*s))
12533 ++s;
12534 if (*s >= '0' && *s <= '7')
12535 {
12536 int fpr = *s - '0';
12537 ++s;
12538 if (is_space_char (*s))
12539 ++s;
12540 if (*s == ')')
12541 {
12542 *end_op = s + 1;
12543 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
12544 know (r);
12545 return r + fpr;
12546 }
12547 }
12548 /* We have "%st(" then garbage. */
12549 return (const reg_entry *) NULL;
12550 }
12551 }
12552
12553 return r && check_register (r) ? r : NULL;
12554 }
12555
12556 /* REG_STRING starts *before* REGISTER_PREFIX. */
12557
12558 static const reg_entry *
12559 parse_register (char *reg_string, char **end_op)
12560 {
12561 const reg_entry *r;
12562
12563 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12564 r = parse_real_register (reg_string, end_op);
12565 else
12566 r = NULL;
12567 if (!r)
12568 {
12569 char *save = input_line_pointer;
12570 char c;
12571 symbolS *symbolP;
12572
12573 input_line_pointer = reg_string;
12574 c = get_symbol_name (&reg_string);
12575 symbolP = symbol_find (reg_string);
12576 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12577 {
12578 const expressionS *e = symbol_get_value_expression (symbolP);
12579
12580 know (e->X_op == O_register);
12581 know (e->X_add_number >= 0
12582 && (valueT) e->X_add_number < i386_regtab_size);
12583 r = i386_regtab + e->X_add_number;
12584 if (!check_register (r))
12585 {
12586 as_bad (_("register '%s%s' cannot be used here"),
12587 register_prefix, r->reg_name);
12588 r = &bad_reg;
12589 }
12590 *end_op = input_line_pointer;
12591 }
12592 *input_line_pointer = c;
12593 input_line_pointer = save;
12594 }
12595 return r;
12596 }
12597
12598 int
12599 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12600 {
12601 const reg_entry *r;
12602 char *end = input_line_pointer;
12603
12604 *end = *nextcharP;
12605 r = parse_register (name, &input_line_pointer);
12606 if (r && end <= input_line_pointer)
12607 {
12608 *nextcharP = *input_line_pointer;
12609 *input_line_pointer = 0;
12610 if (r != &bad_reg)
12611 {
12612 e->X_op = O_register;
12613 e->X_add_number = r - i386_regtab;
12614 }
12615 else
12616 e->X_op = O_illegal;
12617 return 1;
12618 }
12619 input_line_pointer = end;
12620 *end = 0;
12621 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12622 }
12623
12624 void
12625 md_operand (expressionS *e)
12626 {
12627 char *end;
12628 const reg_entry *r;
12629
12630 switch (*input_line_pointer)
12631 {
12632 case REGISTER_PREFIX:
12633 r = parse_real_register (input_line_pointer, &end);
12634 if (r)
12635 {
12636 e->X_op = O_register;
12637 e->X_add_number = r - i386_regtab;
12638 input_line_pointer = end;
12639 }
12640 break;
12641
12642 case '[':
12643 gas_assert (intel_syntax);
12644 end = input_line_pointer++;
12645 expression (e);
12646 if (*input_line_pointer == ']')
12647 {
12648 ++input_line_pointer;
12649 e->X_op_symbol = make_expr_symbol (e);
12650 e->X_add_symbol = NULL;
12651 e->X_add_number = 0;
12652 e->X_op = O_index;
12653 }
12654 else
12655 {
12656 e->X_op = O_absent;
12657 input_line_pointer = end;
12658 }
12659 break;
12660 }
12661 }
12662
12663 \f
12664 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12665 const char *md_shortopts = "kVQ:sqnO::";
12666 #else
12667 const char *md_shortopts = "qnO::";
12668 #endif
12669
12670 #define OPTION_32 (OPTION_MD_BASE + 0)
12671 #define OPTION_64 (OPTION_MD_BASE + 1)
12672 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12673 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12674 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12675 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12676 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12677 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12678 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12679 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12680 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12681 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12682 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12683 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12684 #define OPTION_X32 (OPTION_MD_BASE + 14)
12685 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12686 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12687 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12688 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12689 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12690 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12691 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12692 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12693 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12694 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12695 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12696 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12697 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12698 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12699 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12700 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12701 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12702 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12703 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12704
12705 struct option md_longopts[] =
12706 {
12707 {"32", no_argument, NULL, OPTION_32},
12708 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12709 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12710 {"64", no_argument, NULL, OPTION_64},
12711 #endif
12712 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12713 {"x32", no_argument, NULL, OPTION_X32},
12714 {"mshared", no_argument, NULL, OPTION_MSHARED},
12715 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12716 #endif
12717 {"divide", no_argument, NULL, OPTION_DIVIDE},
12718 {"march", required_argument, NULL, OPTION_MARCH},
12719 {"mtune", required_argument, NULL, OPTION_MTUNE},
12720 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12721 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12722 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12723 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12724 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12725 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12726 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12727 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12728 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12729 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12730 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12731 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12732 # if defined (TE_PE) || defined (TE_PEP)
12733 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12734 #endif
12735 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12736 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12737 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12738 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12739 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12740 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12741 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12742 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12743 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12744 {"mlfence-before-indirect-branch", required_argument, NULL,
12745 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12746 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12747 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12748 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12749 {NULL, no_argument, NULL, 0}
12750 };
12751 size_t md_longopts_size = sizeof (md_longopts);
12752
12753 int
12754 md_parse_option (int c, const char *arg)
12755 {
12756 unsigned int j;
12757 char *arch, *next, *saved, *type;
12758
12759 switch (c)
12760 {
12761 case 'n':
12762 optimize_align_code = 0;
12763 break;
12764
12765 case 'q':
12766 quiet_warnings = 1;
12767 break;
12768
12769 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12770 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12771 should be emitted or not. FIXME: Not implemented. */
12772 case 'Q':
12773 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12774 return 0;
12775 break;
12776
12777 /* -V: SVR4 argument to print version ID. */
12778 case 'V':
12779 print_version_id ();
12780 break;
12781
12782 /* -k: Ignore for FreeBSD compatibility. */
12783 case 'k':
12784 break;
12785
12786 case 's':
12787 /* -s: On i386 Solaris, this tells the native assembler to use
12788 .stab instead of .stab.excl. We always use .stab anyhow. */
12789 break;
12790
12791 case OPTION_MSHARED:
12792 shared = 1;
12793 break;
12794
12795 case OPTION_X86_USED_NOTE:
12796 if (strcasecmp (arg, "yes") == 0)
12797 x86_used_note = 1;
12798 else if (strcasecmp (arg, "no") == 0)
12799 x86_used_note = 0;
12800 else
12801 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12802 break;
12803
12804
12805 #endif
12806 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12807 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12808 case OPTION_64:
12809 {
12810 const char **list, **l;
12811
12812 list = bfd_target_list ();
12813 for (l = list; *l != NULL; l++)
12814 if (CONST_STRNEQ (*l, "elf64-x86-64")
12815 || strcmp (*l, "coff-x86-64") == 0
12816 || strcmp (*l, "pe-x86-64") == 0
12817 || strcmp (*l, "pei-x86-64") == 0
12818 || strcmp (*l, "mach-o-x86-64") == 0)
12819 {
12820 default_arch = "x86_64";
12821 break;
12822 }
12823 if (*l == NULL)
12824 as_fatal (_("no compiled in support for x86_64"));
12825 free (list);
12826 }
12827 break;
12828 #endif
12829
12830 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12831 case OPTION_X32:
12832 if (IS_ELF)
12833 {
12834 const char **list, **l;
12835
12836 list = bfd_target_list ();
12837 for (l = list; *l != NULL; l++)
12838 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12839 {
12840 default_arch = "x86_64:32";
12841 break;
12842 }
12843 if (*l == NULL)
12844 as_fatal (_("no compiled in support for 32bit x86_64"));
12845 free (list);
12846 }
12847 else
12848 as_fatal (_("32bit x86_64 is only supported for ELF"));
12849 break;
12850 #endif
12851
12852 case OPTION_32:
12853 default_arch = "i386";
12854 break;
12855
12856 case OPTION_DIVIDE:
12857 #ifdef SVR4_COMMENT_CHARS
12858 {
12859 char *n, *t;
12860 const char *s;
12861
12862 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12863 t = n;
12864 for (s = i386_comment_chars; *s != '\0'; s++)
12865 if (*s != '/')
12866 *t++ = *s;
12867 *t = '\0';
12868 i386_comment_chars = n;
12869 }
12870 #endif
12871 break;
12872
12873 case OPTION_MARCH:
12874 saved = xstrdup (arg);
12875 arch = saved;
12876 /* Allow -march=+nosse. */
12877 if (*arch == '+')
12878 arch++;
12879 do
12880 {
12881 if (*arch == '.')
12882 as_fatal (_("invalid -march= option: `%s'"), arg);
12883 next = strchr (arch, '+');
12884 if (next)
12885 *next++ = '\0';
12886 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12887 {
12888 if (strcmp (arch, cpu_arch [j].name) == 0)
12889 {
12890 /* Processor. */
12891 if (! cpu_arch[j].flags.bitfield.cpui386)
12892 continue;
12893
12894 cpu_arch_name = cpu_arch[j].name;
12895 cpu_sub_arch_name = NULL;
12896 cpu_arch_flags = cpu_arch[j].flags;
12897 cpu_arch_isa = cpu_arch[j].type;
12898 cpu_arch_isa_flags = cpu_arch[j].flags;
12899 if (!cpu_arch_tune_set)
12900 {
12901 cpu_arch_tune = cpu_arch_isa;
12902 cpu_arch_tune_flags = cpu_arch_isa_flags;
12903 }
12904 break;
12905 }
12906 else if (*cpu_arch [j].name == '.'
12907 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12908 {
12909 /* ISA extension. */
12910 i386_cpu_flags flags;
12911
12912 flags = cpu_flags_or (cpu_arch_flags,
12913 cpu_arch[j].flags);
12914
12915 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12916 {
12917 if (cpu_sub_arch_name)
12918 {
12919 char *name = cpu_sub_arch_name;
12920 cpu_sub_arch_name = concat (name,
12921 cpu_arch[j].name,
12922 (const char *) NULL);
12923 free (name);
12924 }
12925 else
12926 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12927 cpu_arch_flags = flags;
12928 cpu_arch_isa_flags = flags;
12929 }
12930 else
12931 cpu_arch_isa_flags
12932 = cpu_flags_or (cpu_arch_isa_flags,
12933 cpu_arch[j].flags);
12934 break;
12935 }
12936 }
12937
12938 if (j >= ARRAY_SIZE (cpu_arch))
12939 {
12940 /* Disable an ISA extension. */
12941 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12942 if (strcmp (arch, cpu_noarch [j].name) == 0)
12943 {
12944 i386_cpu_flags flags;
12945
12946 flags = cpu_flags_and_not (cpu_arch_flags,
12947 cpu_noarch[j].flags);
12948 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12949 {
12950 if (cpu_sub_arch_name)
12951 {
12952 char *name = cpu_sub_arch_name;
12953 cpu_sub_arch_name = concat (arch,
12954 (const char *) NULL);
12955 free (name);
12956 }
12957 else
12958 cpu_sub_arch_name = xstrdup (arch);
12959 cpu_arch_flags = flags;
12960 cpu_arch_isa_flags = flags;
12961 }
12962 break;
12963 }
12964
12965 if (j >= ARRAY_SIZE (cpu_noarch))
12966 j = ARRAY_SIZE (cpu_arch);
12967 }
12968
12969 if (j >= ARRAY_SIZE (cpu_arch))
12970 as_fatal (_("invalid -march= option: `%s'"), arg);
12971
12972 arch = next;
12973 }
12974 while (next != NULL);
12975 free (saved);
12976 break;
12977
12978 case OPTION_MTUNE:
12979 if (*arg == '.')
12980 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12981 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12982 {
12983 if (strcmp (arg, cpu_arch [j].name) == 0)
12984 {
12985 cpu_arch_tune_set = 1;
12986 cpu_arch_tune = cpu_arch [j].type;
12987 cpu_arch_tune_flags = cpu_arch[j].flags;
12988 break;
12989 }
12990 }
12991 if (j >= ARRAY_SIZE (cpu_arch))
12992 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12993 break;
12994
12995 case OPTION_MMNEMONIC:
12996 if (strcasecmp (arg, "att") == 0)
12997 intel_mnemonic = 0;
12998 else if (strcasecmp (arg, "intel") == 0)
12999 intel_mnemonic = 1;
13000 else
13001 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13002 break;
13003
13004 case OPTION_MSYNTAX:
13005 if (strcasecmp (arg, "att") == 0)
13006 intel_syntax = 0;
13007 else if (strcasecmp (arg, "intel") == 0)
13008 intel_syntax = 1;
13009 else
13010 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13011 break;
13012
13013 case OPTION_MINDEX_REG:
13014 allow_index_reg = 1;
13015 break;
13016
13017 case OPTION_MNAKED_REG:
13018 allow_naked_reg = 1;
13019 break;
13020
13021 case OPTION_MSSE2AVX:
13022 sse2avx = 1;
13023 break;
13024
13025 case OPTION_MSSE_CHECK:
13026 if (strcasecmp (arg, "error") == 0)
13027 sse_check = check_error;
13028 else if (strcasecmp (arg, "warning") == 0)
13029 sse_check = check_warning;
13030 else if (strcasecmp (arg, "none") == 0)
13031 sse_check = check_none;
13032 else
13033 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13034 break;
13035
13036 case OPTION_MOPERAND_CHECK:
13037 if (strcasecmp (arg, "error") == 0)
13038 operand_check = check_error;
13039 else if (strcasecmp (arg, "warning") == 0)
13040 operand_check = check_warning;
13041 else if (strcasecmp (arg, "none") == 0)
13042 operand_check = check_none;
13043 else
13044 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13045 break;
13046
13047 case OPTION_MAVXSCALAR:
13048 if (strcasecmp (arg, "128") == 0)
13049 avxscalar = vex128;
13050 else if (strcasecmp (arg, "256") == 0)
13051 avxscalar = vex256;
13052 else
13053 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13054 break;
13055
13056 case OPTION_MVEXWIG:
13057 if (strcmp (arg, "0") == 0)
13058 vexwig = vexw0;
13059 else if (strcmp (arg, "1") == 0)
13060 vexwig = vexw1;
13061 else
13062 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13063 break;
13064
13065 case OPTION_MADD_BND_PREFIX:
13066 add_bnd_prefix = 1;
13067 break;
13068
13069 case OPTION_MEVEXLIG:
13070 if (strcmp (arg, "128") == 0)
13071 evexlig = evexl128;
13072 else if (strcmp (arg, "256") == 0)
13073 evexlig = evexl256;
13074 else if (strcmp (arg, "512") == 0)
13075 evexlig = evexl512;
13076 else
13077 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13078 break;
13079
13080 case OPTION_MEVEXRCIG:
13081 if (strcmp (arg, "rne") == 0)
13082 evexrcig = rne;
13083 else if (strcmp (arg, "rd") == 0)
13084 evexrcig = rd;
13085 else if (strcmp (arg, "ru") == 0)
13086 evexrcig = ru;
13087 else if (strcmp (arg, "rz") == 0)
13088 evexrcig = rz;
13089 else
13090 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13091 break;
13092
13093 case OPTION_MEVEXWIG:
13094 if (strcmp (arg, "0") == 0)
13095 evexwig = evexw0;
13096 else if (strcmp (arg, "1") == 0)
13097 evexwig = evexw1;
13098 else
13099 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13100 break;
13101
13102 # if defined (TE_PE) || defined (TE_PEP)
13103 case OPTION_MBIG_OBJ:
13104 use_big_obj = 1;
13105 break;
13106 #endif
13107
13108 case OPTION_MOMIT_LOCK_PREFIX:
13109 if (strcasecmp (arg, "yes") == 0)
13110 omit_lock_prefix = 1;
13111 else if (strcasecmp (arg, "no") == 0)
13112 omit_lock_prefix = 0;
13113 else
13114 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13115 break;
13116
13117 case OPTION_MFENCE_AS_LOCK_ADD:
13118 if (strcasecmp (arg, "yes") == 0)
13119 avoid_fence = 1;
13120 else if (strcasecmp (arg, "no") == 0)
13121 avoid_fence = 0;
13122 else
13123 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13124 break;
13125
13126 case OPTION_MLFENCE_AFTER_LOAD:
13127 if (strcasecmp (arg, "yes") == 0)
13128 lfence_after_load = 1;
13129 else if (strcasecmp (arg, "no") == 0)
13130 lfence_after_load = 0;
13131 else
13132 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13133 break;
13134
13135 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13136 if (strcasecmp (arg, "all") == 0)
13137 {
13138 lfence_before_indirect_branch = lfence_branch_all;
13139 if (lfence_before_ret == lfence_before_ret_none)
13140 lfence_before_ret = lfence_before_ret_shl;
13141 }
13142 else if (strcasecmp (arg, "memory") == 0)
13143 lfence_before_indirect_branch = lfence_branch_memory;
13144 else if (strcasecmp (arg, "register") == 0)
13145 lfence_before_indirect_branch = lfence_branch_register;
13146 else if (strcasecmp (arg, "none") == 0)
13147 lfence_before_indirect_branch = lfence_branch_none;
13148 else
13149 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13150 arg);
13151 break;
13152
13153 case OPTION_MLFENCE_BEFORE_RET:
13154 if (strcasecmp (arg, "or") == 0)
13155 lfence_before_ret = lfence_before_ret_or;
13156 else if (strcasecmp (arg, "not") == 0)
13157 lfence_before_ret = lfence_before_ret_not;
13158 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13159 lfence_before_ret = lfence_before_ret_shl;
13160 else if (strcasecmp (arg, "none") == 0)
13161 lfence_before_ret = lfence_before_ret_none;
13162 else
13163 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13164 arg);
13165 break;
13166
13167 case OPTION_MRELAX_RELOCATIONS:
13168 if (strcasecmp (arg, "yes") == 0)
13169 generate_relax_relocations = 1;
13170 else if (strcasecmp (arg, "no") == 0)
13171 generate_relax_relocations = 0;
13172 else
13173 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13174 break;
13175
13176 case OPTION_MALIGN_BRANCH_BOUNDARY:
13177 {
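/* E.g. -malign-branch-boundary=32 accepts the power of two 32
   and sets align_branch_power to 5 (illustrative).  */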
13178 char *end;
13179 long int align = strtoul (arg, &end, 0);
13180 if (*end == '\0')
13181 {
13182 if (align == 0)
13183 {
13184 align_branch_power = 0;
13185 break;
13186 }
13187 else if (align >= 16)
13188 {
13189 int align_power;
13190 for (align_power = 0;
13191 (align & 1) == 0;
13192 align >>= 1, align_power++)
13193 continue;
13194 /* Limit alignment power to 31. */
13195 if (align == 1 && align_power < 32)
13196 {
13197 align_branch_power = align_power;
13198 break;
13199 }
13200 }
13201 }
13202 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13203 }
13204 break;
13205
13206 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13207 {
13208 char *end;
13209 int align = strtoul (arg, &end, 0);
13210 /* Some processors only support 5 prefixes. */
13211 if (*end == '\0' && align >= 0 && align < 6)
13212 {
13213 align_branch_prefix_size = align;
13214 break;
13215 }
13216 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13217 arg);
13218 }
13219 break;
13220
13221 case OPTION_MALIGN_BRANCH:
13222 align_branch = 0;
13223 saved = xstrdup (arg);
13224 type = saved;
13225 do
13226 {
13227 next = strchr (type, '+');
13228 if (next)
13229 *next++ = '\0';
13230 if (strcasecmp (type, "jcc") == 0)
13231 align_branch |= align_branch_jcc_bit;
13232 else if (strcasecmp (type, "fused") == 0)
13233 align_branch |= align_branch_fused_bit;
13234 else if (strcasecmp (type, "jmp") == 0)
13235 align_branch |= align_branch_jmp_bit;
13236 else if (strcasecmp (type, "call") == 0)
13237 align_branch |= align_branch_call_bit;
13238 else if (strcasecmp (type, "ret") == 0)
13239 align_branch |= align_branch_ret_bit;
13240 else if (strcasecmp (type, "indirect") == 0)
13241 align_branch |= align_branch_indirect_bit;
13242 else
13243 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13244 type = next;
13245 }
13246 while (next != NULL);
13247 free (saved);
13248 break;
13249
13250 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13251 align_branch_power = 5;
13252 align_branch_prefix_size = 5;
13253 align_branch = (align_branch_jcc_bit
13254 | align_branch_fused_bit
13255 | align_branch_jmp_bit);
13256 break;
13257
13258 case OPTION_MAMD64:
13259 isa64 = amd64;
13260 break;
13261
13262 case OPTION_MINTEL64:
13263 isa64 = intel64;
13264 break;
13265
13266 case 'O':
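/* E.g. plain -O enables the default optimization, -O2 sets
   optimize to 2, and -Os optimizes for code size (illustrative).  */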
13267 if (arg == NULL)
13268 {
13269 optimize = 1;
13270 /* Turn off -Os. */
13271 optimize_for_space = 0;
13272 }
13273 else if (*arg == 's')
13274 {
13275 optimize_for_space = 1;
13276 /* Turn on all encoding optimizations. */
13277 optimize = INT_MAX;
13278 }
13279 else
13280 {
13281 optimize = atoi (arg);
13282 /* Turn off -Os. */
13283 optimize_for_space = 0;
13284 }
13285 break;
13286
13287 default:
13288 return 0;
13289 }
13290 return 1;
13291 }
13292
13293 #define MESSAGE_TEMPLATE \
13294 " "
13295
13296 static char *
13297 output_message (FILE *stream, char *p, char *message, char *start,
13298 int *left_p, const char *name, int len)
13299 {
13300 int size = sizeof (MESSAGE_TEMPLATE);
13301 int left = *left_p;
13302
13303 /* Reserve 2 spaces for ", " or ",\0" */
13304 left -= len + 2;
13305
13306 /* Check if there is any room. */
13307 if (left >= 0)
13308 {
13309 if (p != start)
13310 {
13311 *p++ = ',';
13312 *p++ = ' ';
13313 }
13314 p = mempcpy (p, name, len);
13315 }
13316 else
13317 {
13318 /* Output the current message now and start a new one. */
13319 *p++ = ',';
13320 *p = '\0';
13321 fprintf (stream, "%s\n", message);
13322 p = start;
13323 left = size - (start - message) - len - 2;
13324
13325 gas_assert (left >= 0);
13326
13327 p = mempcpy (p, name, len);
13328 }
13329
13330 *left_p = left;
13331 return p;
13332 }
13333
13334 static void
13335 show_arch (FILE *stream, int ext, int check)
13336 {
13337 static char message[] = MESSAGE_TEMPLATE;
13338 char *start = message + 27;
13339 char *p;
13340 int size = sizeof (MESSAGE_TEMPLATE);
13341 int left;
13342 const char *name;
13343 int len;
13344 unsigned int j;
13345
13346 p = start;
13347 left = size - (start - message);
13348 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13349 {
13350 /* Should it be skipped? */
13351 if (cpu_arch [j].skip)
13352 continue;
13353
13354 name = cpu_arch [j].name;
13355 len = cpu_arch [j].len;
13356 if (*name == '.')
13357 {
13358 /* It is an extension. Skip if we aren't asked to show it. */
13359 if (ext)
13360 {
13361 name++;
13362 len--;
13363 }
13364 else
13365 continue;
13366 }
13367 else if (ext)
13368 {
13369 /* It is a processor. Skip if we only show extensions. */
13370 continue;
13371 }
13372 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13373 {
13374 /* It is an impossible processor; skip it. */
13375 continue;
13376 }
13377
13378 p = output_message (stream, p, message, start, &left, name, len);
13379 }
13380
13381 /* Display disabled extensions. */
13382 if (ext)
13383 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13384 {
13385 name = cpu_noarch [j].name;
13386 len = cpu_noarch [j].len;
13387 p = output_message (stream, p, message, start, &left, name,
13388 len);
13389 }
13390
13391 *p = '\0';
13392 fprintf (stream, "%s\n", message);
13393 }
13394
13395 void
13396 md_show_usage (FILE *stream)
13397 {
13398 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13399 fprintf (stream, _("\
13400 -Qy, -Qn ignored\n\
13401 -V print assembler version number\n\
13402 -k ignored\n"));
13403 #endif
13404 fprintf (stream, _("\
13405 -n Do not optimize code alignment\n\
13406 -q quieten some warnings\n"));
13407 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13408 fprintf (stream, _("\
13409 -s ignored\n"));
13410 #endif
13411 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13412 || defined (TE_PE) || defined (TE_PEP))
13413 fprintf (stream, _("\
13414 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13415 #endif
13416 #ifdef SVR4_COMMENT_CHARS
13417 fprintf (stream, _("\
13418 --divide do not treat `/' as a comment character\n"));
13419 #else
13420 fprintf (stream, _("\
13421 --divide ignored\n"));
13422 #endif
13423 fprintf (stream, _("\
13424 -march=CPU[,+EXTENSION...]\n\
13425 generate code for CPU and EXTENSION, CPU is one of:\n"));
13426 show_arch (stream, 0, 1);
13427 fprintf (stream, _("\
13428 EXTENSION is combination of:\n"));
13429 show_arch (stream, 1, 0);
13430 fprintf (stream, _("\
13431 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13432 show_arch (stream, 0, 0);
13433 fprintf (stream, _("\
13434 -msse2avx encode SSE instructions with VEX prefix\n"));
13435 fprintf (stream, _("\
13436 -msse-check=[none|error|warning] (default: warning)\n\
13437 check SSE instructions\n"));
13438 fprintf (stream, _("\
13439 -moperand-check=[none|error|warning] (default: warning)\n\
13440 check operand combinations for validity\n"));
13441 fprintf (stream, _("\
13442 -mavxscalar=[128|256] (default: 128)\n\
13443 encode scalar AVX instructions with specific vector\n\
13444 length\n"));
13445 fprintf (stream, _("\
13446 -mvexwig=[0|1] (default: 0)\n\
13447 encode VEX instructions with specific VEX.W value\n\
13448 for VEX.W bit ignored instructions\n"));
13449 fprintf (stream, _("\
13450 -mevexlig=[128|256|512] (default: 128)\n\
13451 encode scalar EVEX instructions with specific vector\n\
13452 length\n"));
13453 fprintf (stream, _("\
13454 -mevexwig=[0|1] (default: 0)\n\
13455 encode EVEX instructions with specific EVEX.W value\n\
13456 for EVEX.W bit ignored instructions\n"));
13457 fprintf (stream, _("\
13458 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13459 encode EVEX instructions with specific EVEX.RC value\n\
13460 for SAE-only ignored instructions\n"));
13461 fprintf (stream, _("\
13462 -mmnemonic=[att|intel] "));
13463 if (SYSV386_COMPAT)
13464 fprintf (stream, _("(default: att)\n"));
13465 else
13466 fprintf (stream, _("(default: intel)\n"));
13467 fprintf (stream, _("\
13468 use AT&T/Intel mnemonic\n"));
13469 fprintf (stream, _("\
13470 -msyntax=[att|intel] (default: att)\n\
13471 use AT&T/Intel syntax\n"));
13472 fprintf (stream, _("\
13473 -mindex-reg support pseudo index registers\n"));
13474 fprintf (stream, _("\
13475 -mnaked-reg don't require `%%' prefix for registers\n"));
13476 fprintf (stream, _("\
13477 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13478 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13479 fprintf (stream, _("\
13480 -mshared disable branch optimization for shared code\n"));
13481 fprintf (stream, _("\
13482 -mx86-used-note=[no|yes] "));
13483 if (DEFAULT_X86_USED_NOTE)
13484 fprintf (stream, _("(default: yes)\n"));
13485 else
13486 fprintf (stream, _("(default: no)\n"));
13487 fprintf (stream, _("\
13488 generate x86 used ISA and feature properties\n"));
13489 #endif
13490 #if defined (TE_PE) || defined (TE_PEP)
13491 fprintf (stream, _("\
13492 -mbig-obj generate big object files\n"));
13493 #endif
13494 fprintf (stream, _("\
13495 -momit-lock-prefix=[no|yes] (default: no)\n\
13496 strip all lock prefixes\n"));
13497 fprintf (stream, _("\
13498 -mfence-as-lock-add=[no|yes] (default: no)\n\
13499 encode lfence, mfence and sfence as\n\
13500 lock addl $0x0, (%%{re}sp)\n"));
13501 fprintf (stream, _("\
13502 -mrelax-relocations=[no|yes] "));
13503 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13504 fprintf (stream, _("(default: yes)\n"));
13505 else
13506 fprintf (stream, _("(default: no)\n"));
13507 fprintf (stream, _("\
13508 generate relax relocations\n"));
13509 fprintf (stream, _("\
13510 -malign-branch-boundary=NUM (default: 0)\n\
13511 align branches within a NUM-byte boundary\n"));
13512 fprintf (stream, _("\
13513 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13514 TYPE is a combination of jcc, fused, jmp, call, ret,\
13515 indirect\n\
13516 specify types of branches to align\n"));
13517 fprintf (stream, _("\
13518 -malign-branch-prefix-size=NUM (default: 5)\n\
13519 align branches with NUM prefixes per instruction\n"));
13520 fprintf (stream, _("\
13521 -mbranches-within-32B-boundaries\n\
13522 align branches within a 32-byte boundary\n"));
13523 fprintf (stream, _("\
13524 -mlfence-after-load=[no|yes] (default: no)\n\
13525 generate lfence after load\n"));
13526 fprintf (stream, _("\
13527 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13528 generate lfence before indirect near branch\n"));
13529 fprintf (stream, _("\
13530 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13531 generate lfence before ret\n"));
13532 fprintf (stream, _("\
13533 -mamd64 accept only AMD64 ISA [default]\n"));
13534 fprintf (stream, _("\
13535 -mintel64 accept only Intel64 ISA\n"));
13536 }
13537
13538 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13539 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13540 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13541
13542 /* Pick the target format to use. */
13543
13544 const char *
13545 i386_target_format (void)
13546 {
13547 if (!strncmp (default_arch, "x86_64", 6))
13548 {
13549 update_code_flag (CODE_64BIT, 1);
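      /* Anything longer than the matched "x86_64" prefix (presumably the
	 spelling installed for --x32) selects the ILP32 variant of the
	 64-bit ABI below.  */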
13550 if (default_arch[6] == '\0')
13551 x86_elf_abi = X86_64_ABI;
13552 else
13553 x86_elf_abi = X86_64_X32_ABI;
13554 }
13555 else if (!strcmp (default_arch, "i386"))
13556 update_code_flag (CODE_32BIT, 1);
13557 else if (!strcmp (default_arch, "iamcu"))
13558 {
13559 update_code_flag (CODE_32BIT, 1);
13560 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13561 {
13562 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13563 cpu_arch_name = "iamcu";
13564 cpu_sub_arch_name = NULL;
13565 cpu_arch_flags = iamcu_flags;
13566 cpu_arch_isa = PROCESSOR_IAMCU;
13567 cpu_arch_isa_flags = iamcu_flags;
13568 if (!cpu_arch_tune_set)
13569 {
13570 cpu_arch_tune = cpu_arch_isa;
13571 cpu_arch_tune_flags = cpu_arch_isa_flags;
13572 }
13573 }
13574 else if (cpu_arch_isa != PROCESSOR_IAMCU)
13575 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13576 cpu_arch_name);
13577 }
13578 else
13579 as_fatal (_("unknown architecture"));
13580
13581 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13582 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13583 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13584 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13585
13586 switch (OUTPUT_FLAVOR)
13587 {
13588 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13589 case bfd_target_aout_flavour:
13590 return AOUT_TARGET_FORMAT;
13591 #endif
13592 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13593 # if defined (TE_PE) || defined (TE_PEP)
13594 case bfd_target_coff_flavour:
13595 if (flag_code == CODE_64BIT)
13596 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13597 else
13598 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13599 # elif defined (TE_GO32)
13600 case bfd_target_coff_flavour:
13601 return "coff-go32";
13602 # else
13603 case bfd_target_coff_flavour:
13604 return "coff-i386";
13605 # endif
13606 #endif
13607 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13608 case bfd_target_elf_flavour:
13609 {
13610 const char *format;
13611
13612 switch (x86_elf_abi)
13613 {
13614 default:
13615 format = ELF_TARGET_FORMAT;
13616 #ifndef TE_SOLARIS
13617 tls_get_addr = "___tls_get_addr";
13618 #endif
13619 break;
13620 case X86_64_ABI:
13621 use_rela_relocations = 1;
13622 object_64bit = 1;
13623 #ifndef TE_SOLARIS
13624 tls_get_addr = "__tls_get_addr";
13625 #endif
13626 format = ELF_TARGET_FORMAT64;
13627 break;
13628 case X86_64_X32_ABI:
13629 use_rela_relocations = 1;
13630 object_64bit = 1;
13631 #ifndef TE_SOLARIS
13632 tls_get_addr = "__tls_get_addr";
13633 #endif
13634 disallow_64bit_reloc = 1;
13635 format = ELF_TARGET_FORMAT32;
13636 break;
13637 }
13638 if (cpu_arch_isa == PROCESSOR_L1OM)
13639 {
13640 if (x86_elf_abi != X86_64_ABI)
13641 as_fatal (_("Intel L1OM is 64bit only"));
13642 return ELF_TARGET_L1OM_FORMAT;
13643 }
13644 else if (cpu_arch_isa == PROCESSOR_K1OM)
13645 {
13646 if (x86_elf_abi != X86_64_ABI)
13647 as_fatal (_("Intel K1OM is 64bit only"));
13648 return ELF_TARGET_K1OM_FORMAT;
13649 }
13650 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13651 {
13652 if (x86_elf_abi != I386_ABI)
13653 as_fatal (_("Intel MCU is 32bit only"));
13654 return ELF_TARGET_IAMCU_FORMAT;
13655 }
13656 else
13657 return format;
13658 }
13659 #endif
13660 #if defined (OBJ_MACH_O)
13661 case bfd_target_mach_o_flavour:
13662 if (flag_code == CODE_64BIT)
13663 {
13664 use_rela_relocations = 1;
13665 object_64bit = 1;
13666 return "mach-o-x86-64";
13667 }
13668 else
13669 return "mach-o-i386";
13670 #endif
13671 default:
13672 abort ();
13673 return NULL;
13674 }
13675 }
13676
13677 #endif /* OBJ_MAYBE_ more than one */
13678 \f
13679 symbolS *
13680 md_undefined_symbol (char *name)
13681 {
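  /* Fast path: compare the first three characters by hand before paying
     for a full strcmp against GLOBAL_OFFSET_TABLE_NAME.  */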
13682 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13683 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13684 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13685 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13686 {
13687 if (!GOT_symbol)
13688 {
13689 if (symbol_find (name))
13690 as_bad (_("GOT already in symbol table"));
13691 GOT_symbol = symbol_new (name, undefined_section,
13692 (valueT) 0, &zero_address_frag);
13693 }
13694 return GOT_symbol;
13695 }
13696 return 0;
13697 }
13698
13699 /* Round up a section size to the appropriate boundary. */
13700
13701 valueT
13702 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13703 {
13704 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13705 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13706 {
13707 /* For a.out, force the section size to be aligned. If we don't do
13708 this, BFD will align it for us, but it will not write out the
13709 final bytes of the section. This may be a bug in BFD, but it is
13710 easier to fix it here since that is how the other a.out targets
13711 work. */
13712 int align;
13713
13714 align = bfd_section_alignment (segment);
13715 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
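      /* Illustrative example: with align == 4, i.e. a 16-byte boundary,
	 a size of 0x123 becomes (0x123 + 15) & ~15 == 0x130.  */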
13716 }
13717 #endif
13718
13719 return size;
13720 }
13721
13722 /* On the i386, PC-relative offsets are relative to the start of the
13723 next instruction. That is, the address of the offset, plus its
13724 size, since the offset is always the last part of the insn. */
13725
13726 long
13727 md_pcrel_from (fixS *fixP)
13728 {
13729 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13730 }
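/* Illustrative example (not from the original source): for a 5-byte
   "call rel32" (e8 xx xx xx xx) whose opcode byte starts the frag at
   0x1000, the rel32 field sits at fr_address + fx_where == 0x1001 and
   fx_size is 4, so md_pcrel_from returns 0x1005 -- the address of the
   next instruction, which is the base the CPU adds rel32 to.  */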
13731
13732 #ifndef I386COFF
13733
13734 static void
13735 s_bss (int ignore ATTRIBUTE_UNUSED)
13736 {
13737 int temp;
13738
13739 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13740 if (IS_ELF)
13741 obj_elf_section_change_hook ();
13742 #endif
13743 temp = get_absolute_expression ();
13744 subseg_set (bss_section, (subsegT) temp);
13745 demand_empty_rest_of_line ();
13746 }
13747
13748 #endif
13749
13750 /* Remember constant directive. */
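/* A constant directive in a code section is recorded in last_insn so the
   branch-alignment and lfence passes can see that the emitted bytes are
   data rather than an instruction; as the warnings below note, the
   -mlfence-before-ret and -mlfence-before-indirect-branch mitigations
   are not applied across such a directive.  */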
13751
13752 void
13753 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13754 {
13755 if (last_insn.kind != last_insn_directive
13756 && (bfd_section_flags (now_seg) & SEC_CODE))
13757 {
13758 last_insn.seg = now_seg;
13759 last_insn.kind = last_insn_directive;
13760 last_insn.name = "constant directive";
13761 last_insn.file = as_where (&last_insn.line);
13762 if (lfence_before_ret != lfence_before_ret_none)
13763 {
13764 if (lfence_before_indirect_branch != lfence_branch_none)
13765 as_warn (_("constant directive skips -mlfence-before-ret "
13766 "and -mlfence-before-indirect-branch"));
13767 else
13768 as_warn (_("constant directive skips -mlfence-before-ret"));
13769 }
13770 else if (lfence_before_indirect_branch != lfence_branch_none)
13771 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13772 }
13773 }
13774
13775 void
13776 i386_validate_fix (fixS *fixp)
13777 {
13778 if (fixp->fx_subsy)
13779 {
13780 if (fixp->fx_subsy == GOT_symbol)
13781 {
13782 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13783 {
13784 if (!object_64bit)
13785 abort ();
13786 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13787 if (fixp->fx_tcbit2)
13788 fixp->fx_r_type = (fixp->fx_tcbit
13789 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13790 : BFD_RELOC_X86_64_GOTPCRELX);
13791 else
13792 #endif
13793 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13794 }
13795 else
13796 {
13797 if (!object_64bit)
13798 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13799 else
13800 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13801 }
13802 fixp->fx_subsy = 0;
13803 }
13804 }
13805 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13806 else if (!object_64bit)
13807 {
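      /* Assumption (fx_tcbit2 is set elsewhere during encoding): it marks
	 GOT loads that the linker may relax, which GOT32X advertises.  */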
13808 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13809 && fixp->fx_tcbit2)
13810 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13811 }
13812 #endif
13813 }
13814
13815 arelent *
13816 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13817 {
13818 arelent *rel;
13819 bfd_reloc_code_real_type code;
13820
13821 switch (fixp->fx_r_type)
13822 {
13823 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13824 case BFD_RELOC_SIZE32:
13825 case BFD_RELOC_SIZE64:
13826 if (S_IS_DEFINED (fixp->fx_addsy)
13827 && !S_IS_EXTERNAL (fixp->fx_addsy))
13828 {
13829 /* Resolve size relocation against local symbol to size of
13830 the symbol plus addend. */
13831 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13832 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13833 && !fits_in_unsigned_long (value))
13834 as_bad_where (fixp->fx_file, fixp->fx_line,
13835 _("symbol size computation overflow"));
13836 fixp->fx_addsy = NULL;
13837 fixp->fx_subsy = NULL;
13838 md_apply_fix (fixp, (valueT *) &value, NULL);
13839 return NULL;
13840 }
13841 #endif
13842 /* Fall through. */
13843
13844 case BFD_RELOC_X86_64_PLT32:
13845 case BFD_RELOC_X86_64_GOT32:
13846 case BFD_RELOC_X86_64_GOTPCREL:
13847 case BFD_RELOC_X86_64_GOTPCRELX:
13848 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13849 case BFD_RELOC_386_PLT32:
13850 case BFD_RELOC_386_GOT32:
13851 case BFD_RELOC_386_GOT32X:
13852 case BFD_RELOC_386_GOTOFF:
13853 case BFD_RELOC_386_GOTPC:
13854 case BFD_RELOC_386_TLS_GD:
13855 case BFD_RELOC_386_TLS_LDM:
13856 case BFD_RELOC_386_TLS_LDO_32:
13857 case BFD_RELOC_386_TLS_IE_32:
13858 case BFD_RELOC_386_TLS_IE:
13859 case BFD_RELOC_386_TLS_GOTIE:
13860 case BFD_RELOC_386_TLS_LE_32:
13861 case BFD_RELOC_386_TLS_LE:
13862 case BFD_RELOC_386_TLS_GOTDESC:
13863 case BFD_RELOC_386_TLS_DESC_CALL:
13864 case BFD_RELOC_X86_64_TLSGD:
13865 case BFD_RELOC_X86_64_TLSLD:
13866 case BFD_RELOC_X86_64_DTPOFF32:
13867 case BFD_RELOC_X86_64_DTPOFF64:
13868 case BFD_RELOC_X86_64_GOTTPOFF:
13869 case BFD_RELOC_X86_64_TPOFF32:
13870 case BFD_RELOC_X86_64_TPOFF64:
13871 case BFD_RELOC_X86_64_GOTOFF64:
13872 case BFD_RELOC_X86_64_GOTPC32:
13873 case BFD_RELOC_X86_64_GOT64:
13874 case BFD_RELOC_X86_64_GOTPCREL64:
13875 case BFD_RELOC_X86_64_GOTPC64:
13876 case BFD_RELOC_X86_64_GOTPLT64:
13877 case BFD_RELOC_X86_64_PLTOFF64:
13878 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13879 case BFD_RELOC_X86_64_TLSDESC_CALL:
13880 case BFD_RELOC_RVA:
13881 case BFD_RELOC_VTABLE_ENTRY:
13882 case BFD_RELOC_VTABLE_INHERIT:
13883 #ifdef TE_PE
13884 case BFD_RELOC_32_SECREL:
13885 #endif
13886 code = fixp->fx_r_type;
13887 break;
13888 case BFD_RELOC_X86_64_32S:
13889 if (!fixp->fx_pcrel)
13890 {
13891 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13892 code = fixp->fx_r_type;
13893 break;
13894 }
13895 /* Fall through. */
13896 default:
13897 if (fixp->fx_pcrel)
13898 {
13899 switch (fixp->fx_size)
13900 {
13901 default:
13902 as_bad_where (fixp->fx_file, fixp->fx_line,
13903 _("can not do %d byte pc-relative relocation"),
13904 fixp->fx_size);
13905 code = BFD_RELOC_32_PCREL;
13906 break;
13907 case 1: code = BFD_RELOC_8_PCREL; break;
13908 case 2: code = BFD_RELOC_16_PCREL; break;
13909 case 4: code = BFD_RELOC_32_PCREL; break;
13910 #ifdef BFD64
13911 case 8: code = BFD_RELOC_64_PCREL; break;
13912 #endif
13913 }
13914 }
13915 else
13916 {
13917 switch (fixp->fx_size)
13918 {
13919 default:
13920 as_bad_where (fixp->fx_file, fixp->fx_line,
13921 _("can not do %d byte relocation"),
13922 fixp->fx_size);
13923 code = BFD_RELOC_32;
13924 break;
13925 case 1: code = BFD_RELOC_8; break;
13926 case 2: code = BFD_RELOC_16; break;
13927 case 4: code = BFD_RELOC_32; break;
13928 #ifdef BFD64
13929 case 8: code = BFD_RELOC_64; break;
13930 #endif
13931 }
13932 }
13933 break;
13934 }
13935
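  /* A plain 32- or 64-bit reference to _GLOBAL_OFFSET_TABLE_ itself is
     really a request for the displacement of the GOT, so rewrite it as
     the matching GOTPC relocation.  */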
13936 if ((code == BFD_RELOC_32
13937 || code == BFD_RELOC_32_PCREL
13938 || code == BFD_RELOC_X86_64_32S)
13939 && GOT_symbol
13940 && fixp->fx_addsy == GOT_symbol)
13941 {
13942 if (!object_64bit)
13943 code = BFD_RELOC_386_GOTPC;
13944 else
13945 code = BFD_RELOC_X86_64_GOTPC32;
13946 }
13947 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13948 && GOT_symbol
13949 && fixp->fx_addsy == GOT_symbol)
13950 {
13951 code = BFD_RELOC_X86_64_GOTPC64;
13952 }
13953
13954 rel = XNEW (arelent);
13955 rel->sym_ptr_ptr = XNEW (asymbol *);
13956 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13957
13958 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13959
13960 if (!use_rela_relocations)
13961 {
13962 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13963 vtable entry to be used in the relocation's section offset. */
13964 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13965 rel->address = fixp->fx_offset;
13966 #if defined (OBJ_COFF) && defined (TE_PE)
13967 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13968 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13969 else
13970 #endif
13971 rel->addend = 0;
13972 }
13973 /* Use the rela in 64bit mode. */
13974 else
13975 {
13976 if (disallow_64bit_reloc)
13977 switch (code)
13978 {
13979 case BFD_RELOC_X86_64_DTPOFF64:
13980 case BFD_RELOC_X86_64_TPOFF64:
13981 case BFD_RELOC_64_PCREL:
13982 case BFD_RELOC_X86_64_GOTOFF64:
13983 case BFD_RELOC_X86_64_GOT64:
13984 case BFD_RELOC_X86_64_GOTPCREL64:
13985 case BFD_RELOC_X86_64_GOTPC64:
13986 case BFD_RELOC_X86_64_GOTPLT64:
13987 case BFD_RELOC_X86_64_PLTOFF64:
13988 as_bad_where (fixp->fx_file, fixp->fx_line,
13989 _("cannot represent relocation type %s in x32 mode"),
13990 bfd_get_reloc_code_name (code));
13991 break;
13992 default:
13993 break;
13994 }
13995
13996 if (!fixp->fx_pcrel)
13997 rel->addend = fixp->fx_offset;
13998 else
13999 switch (code)
14000 {
14001 case BFD_RELOC_X86_64_PLT32:
14002 case BFD_RELOC_X86_64_GOT32:
14003 case BFD_RELOC_X86_64_GOTPCREL:
14004 case BFD_RELOC_X86_64_GOTPCRELX:
14005 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14006 case BFD_RELOC_X86_64_TLSGD:
14007 case BFD_RELOC_X86_64_TLSLD:
14008 case BFD_RELOC_X86_64_GOTTPOFF:
14009 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14010 case BFD_RELOC_X86_64_TLSDESC_CALL:
14011 rel->addend = fixp->fx_offset - fixp->fx_size;
14012 break;
14013 default:
14014 rel->addend = (section->vma
14015 - fixp->fx_size
14016 + fixp->fx_addnumber
14017 + md_pcrel_from (fixp));
14018 break;
14019 }
14020 }
14021
14022 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14023 if (rel->howto == NULL)
14024 {
14025 as_bad_where (fixp->fx_file, fixp->fx_line,
14026 _("cannot represent relocation type %s"),
14027 bfd_get_reloc_code_name (code));
14028 /* Set howto to a garbage value so that we can keep going. */
14029 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14030 gas_assert (rel->howto != NULL);
14031 }
14032
14033 return rel;
14034 }
14035
14036 #include "tc-i386-intel.c"
14037
14038 void
14039 tc_x86_parse_to_dw2regnum (expressionS *exp)
14040 {
14041 int saved_naked_reg;
14042 char saved_register_dot;
14043
14044 saved_naked_reg = allow_naked_reg;
14045 allow_naked_reg = 1;
14046 saved_register_dot = register_chars['.'];
14047 register_chars['.'] = '.';
14048 allow_pseudo_reg = 1;
14049 expression_and_evaluate (exp);
14050 allow_pseudo_reg = 0;
14051 register_chars['.'] = saved_register_dot;
14052 allow_naked_reg = saved_naked_reg;
14053
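  /* dw2_regnum is indexed by flag_code >> 1; assuming the flag_code enum
     order used earlier in this file (CODE_32BIT, CODE_16BIT, CODE_64BIT),
     16- and 32-bit code share slot 0 and 64-bit code uses slot 1.  */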
14054 if (exp->X_op == O_register && exp->X_add_number >= 0)
14055 {
14056 if ((addressT) exp->X_add_number < i386_regtab_size)
14057 {
14058 exp->X_op = O_constant;
14059 exp->X_add_number = i386_regtab[exp->X_add_number]
14060 .dw2_regnum[flag_code >> 1];
14061 }
14062 else
14063 exp->X_op = O_illegal;
14064 }
14065 }
14066
14067 void
14068 tc_x86_frame_initial_instructions (void)
14069 {
14070 static unsigned int sp_regno[2];
14071
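  /* Determine the DWARF register number of the stack pointer once per
     code model by running the literal register name through the
     dw2regnum parser above.  */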
14072 if (!sp_regno[flag_code >> 1])
14073 {
14074 char *saved_input = input_line_pointer;
14075 char sp[][4] = {"esp", "rsp"};
14076 expressionS exp;
14077
14078 input_line_pointer = sp[flag_code >> 1];
14079 tc_x86_parse_to_dw2regnum (&exp);
14080 gas_assert (exp.X_op == O_constant);
14081 sp_regno[flag_code >> 1] = exp.X_add_number;
14082 input_line_pointer = saved_input;
14083 }
14084
14085 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14086 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14087 }
14088
14089 int
14090 x86_dwarf2_addr_size (void)
14091 {
14092 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14093 if (x86_elf_abi == X86_64_X32_ABI)
14094 return 4;
14095 #endif
14096 return bfd_arch_bits_per_address (stdoutput) / 8;
14097 }
14098
14099 int
14100 i386_elf_section_type (const char *str, size_t len)
14101 {
14102 if (flag_code == CODE_64BIT
14103 && len == sizeof ("unwind") - 1
14104 && strncmp (str, "unwind", 6) == 0)
14105 return SHT_X86_64_UNWIND;
14106
14107 return -1;
14108 }
14109
14110 #ifdef TE_SOLARIS
14111 void
14112 i386_solaris_fix_up_eh_frame (segT sec)
14113 {
14114 if (flag_code == CODE_64BIT)
14115 elf_section_type (sec) = SHT_X86_64_UNWIND;
14116 }
14117 #endif
14118
14119 #ifdef TE_PE
14120 void
14121 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14122 {
14123 expressionS exp;
14124
14125 exp.X_op = O_secrel;
14126 exp.X_add_symbol = symbol;
14127 exp.X_add_number = 0;
14128 emit_expr (&exp, size);
14129 }
14130 #endif
14131
14132 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14133 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14134
14135 bfd_vma
14136 x86_64_section_letter (int letter, const char **ptr_msg)
14137 {
14138 if (flag_code == CODE_64BIT)
14139 {
14140 if (letter == 'l')
14141 return SHF_X86_64_LARGE;
14142
14143 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14144 }
14145 else
14146 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14147 return -1;
14148 }
14149
14150 bfd_vma
14151 x86_64_section_word (char *str, size_t len)
14152 {
14153 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
14154 return SHF_X86_64_LARGE;
14155
14156 return -1;
14157 }
14158
14159 static void
14160 handle_large_common (int small ATTRIBUTE_UNUSED)
14161 {
14162 if (flag_code != CODE_64BIT)
14163 {
14164 s_comm_internal (0, elf_common_parse);
14165 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14166 }
14167 else
14168 {
14169 static segT lbss_section;
14170 asection *saved_com_section_ptr = elf_com_section_ptr;
14171 asection *saved_bss_section = bss_section;
14172
14173 if (lbss_section == NULL)
14174 {
14175 flagword applicable;
14176 segT seg = now_seg;
14177 subsegT subseg = now_subseg;
14178
14179 /* The .lbss section is for local .largecomm symbols. */
14180 lbss_section = subseg_new (".lbss", 0);
14181 applicable = bfd_applicable_section_flags (stdoutput);
14182 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14183 seg_info (lbss_section)->bss = 1;
14184
14185 subseg_set (seg, subseg);
14186 }
14187
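      /* Temporarily swap in the ELF large-common section and .lbss so
	 that s_comm_internal parses .largecomm exactly like .comm while
	 placing symbols in the large-model sections instead.  */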
14188 elf_com_section_ptr = &_bfd_elf_large_com_section;
14189 bss_section = lbss_section;
14190
14191 s_comm_internal (0, elf_common_parse);
14192
14193 elf_com_section_ptr = saved_com_section_ptr;
14194 bss_section = saved_bss_section;
14195 }
14196 }
14197 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */