x86: Remove CpuABM and add CpuPOPCNT
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64    WAIT_PREFIX must be the first prefix since FWAIT really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
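/* Illustrative note (editor's sketch, not from the original source):
   for "lock addw %ax,(%bx)" assembled in 32-bit mode, the 0x66
   operand-size prefix would land in the DATA_PREFIX slot and 0xf0 in
   the LOCK_PREFIX slot, so the two are emitted in the slot order
   defined above.  */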
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax.  Use a non-ASCII letter since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* This struct describes rounding control and SAE in the instruction. */
214 struct RC_Operation
215 {
216 enum rc_type
217 {
218 rne = 0,
219 rd,
220 ru,
221 rz,
222 saeonly
223 } type;
224 int operand;
225 };
226
227 static struct RC_Operation rc_op;
228
229 /* The struct describes masking, applied to OPERAND in the instruction.
230 MASK is a pointer to the corresponding mask register. ZEROING tells
231    whether a merging or a zeroing mask is used.  */
232 struct Mask_Operation
233 {
234 const reg_entry *mask;
235 unsigned int zeroing;
236   /* The operand this operation is applied to.  */
237 int operand;
238 };
239
240 static struct Mask_Operation mask_op;
241
242 /* The struct describes broadcasting, applied to OPERAND.  TYPE is the
243    broadcast factor.  */
244 struct Broadcast_Operation
245 {
246 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
247 int type;
248
249 /* Index of broadcasted operand. */
250 int operand;
251
252 /* Number of bytes to broadcast. */
253 int bytes;
254 };
255
256 static struct Broadcast_Operation broadcast_op;
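/* Illustrative note (editor's sketch; the exact field values are an
   assumption, for illustration only): for an AT&T operand such as
   "(%rax){1to8}" on an instruction with dword elements, the broadcast
   factor is 8 and BYTES would be 4 (one 32-bit element replicated
   eight times).  */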
257
258 /* VEX prefix. */
259 typedef struct
260 {
261 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
262 unsigned char bytes[4];
263 unsigned int length;
264 /* Destination or source register specifier. */
265 const reg_entry *register_specifier;
266 } vex_prefix;
267
268 /* 'md_assemble ()' gathers together information and puts it into an
269 i386_insn. */
270
271 union i386_op
272 {
273 expressionS *disps;
274 expressionS *imms;
275 const reg_entry *regs;
276 };
277
278 enum i386_error
279 {
280 operand_size_mismatch,
281 operand_type_mismatch,
282 register_type_mismatch,
283 number_of_operands_mismatch,
284 invalid_instruction_suffix,
285 bad_imm4,
286 unsupported_with_intel_mnemonic,
287 unsupported_syntax,
288 unsupported,
289 invalid_vsib_address,
290 invalid_vector_register_set,
291 unsupported_vector_index_register,
292 unsupported_broadcast,
293 broadcast_needed,
294 unsupported_masking,
295 mask_not_on_destination,
296 no_default_mask,
297 unsupported_rc_sae,
298 rc_sae_operand_not_last_imm,
299 invalid_register_operand,
300 };
301
302 struct _i386_insn
303 {
304   /* TM holds the template for the insn we're currently assembling.  */
305 insn_template tm;
306
307 /* SUFFIX holds the instruction size suffix for byte, word, dword
308 or qword, if given. */
309 char suffix;
310
311 /* OPERANDS gives the number of given operands. */
312 unsigned int operands;
313
314 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
315 of given register, displacement, memory operands and immediate
316 operands. */
317 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
318
319 /* TYPES [i] is the type (see above #defines) which tells us how to
320 use OP[i] for the corresponding operand. */
321 i386_operand_type types[MAX_OPERANDS];
322
323 /* Displacement expression, immediate expression, or register for each
324 operand. */
325 union i386_op op[MAX_OPERANDS];
326
327 /* Flags for operands. */
328 unsigned int flags[MAX_OPERANDS];
329 #define Operand_PCrel 1
330 #define Operand_Mem 2
331
332 /* Relocation type for operand */
333 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
334
335 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
336 the base index byte below. */
337 const reg_entry *base_reg;
338 const reg_entry *index_reg;
339 unsigned int log2_scale_factor;
340
341 /* SEG gives the seg_entries of this insn. They are zero unless
342 explicit segment overrides are given. */
343 const seg_entry *seg[2];
344
345 /* Copied first memory operand string, for re-checking. */
346 char *memop1_string;
347
348 /* PREFIX holds all the given prefix opcodes (usually null).
349 PREFIXES is the number of prefix opcodes. */
350 unsigned int prefixes;
351 unsigned char prefix[MAX_PREFIXES];
352
353 /* Register is in low 3 bits of opcode. */
354 bfd_boolean short_form;
355
356 /* The operand to a branch insn indicates an absolute branch. */
357 bfd_boolean jumpabsolute;
358
359 /* Has MMX register operands. */
360 bfd_boolean has_regmmx;
361
362 /* Has XMM register operands. */
363 bfd_boolean has_regxmm;
364
365 /* Has YMM register operands. */
366 bfd_boolean has_regymm;
367
368 /* Has ZMM register operands. */
369 bfd_boolean has_regzmm;
370
371 /* Has GOTPC or TLS relocation. */
372 bfd_boolean has_gotpc_tls_reloc;
373
374 /* RM and SIB are the modrm byte and the sib byte where the
375 addressing modes of this insn are encoded. */
376 modrm_byte rm;
377 rex_byte rex;
378 rex_byte vrex;
379 sib_byte sib;
380 vex_prefix vex;
381
382 /* Masking attributes. */
383 struct Mask_Operation *mask;
384
385 /* Rounding control and SAE attributes. */
386 struct RC_Operation *rounding;
387
388 /* Broadcasting attributes. */
389 struct Broadcast_Operation *broadcast;
390
391 /* Compressed disp8*N attribute. */
392 unsigned int memshift;
393
394 /* Prefer load or store in encoding. */
395 enum
396 {
397 dir_encoding_default = 0,
398 dir_encoding_load,
399 dir_encoding_store,
400 dir_encoding_swap
401 } dir_encoding;
402
403 /* Prefer 8bit or 32bit displacement in encoding. */
404 enum
405 {
406 disp_encoding_default = 0,
407 disp_encoding_8bit,
408 disp_encoding_32bit
409 } disp_encoding;
410
411 /* Prefer the REX byte in encoding. */
412 bfd_boolean rex_encoding;
413
414 /* Disable instruction size optimization. */
415 bfd_boolean no_optimize;
416
417 /* How to encode vector instructions. */
418 enum
419 {
420 vex_encoding_default = 0,
421 vex_encoding_vex,
422 vex_encoding_vex3,
423 vex_encoding_evex
424 } vec_encoding;
425
426 /* REP prefix. */
427 const char *rep_prefix;
428
429 /* HLE prefix. */
430 const char *hle_prefix;
431
432 /* Have BND prefix. */
433 const char *bnd_prefix;
434
435 /* Have NOTRACK prefix. */
436 const char *notrack_prefix;
437
438 /* Error message. */
439 enum i386_error error;
440 };
441
442 typedef struct _i386_insn i386_insn;
443
444 /* Link each RC type with its corresponding string, which will be looked
445    for in the assembly input.  */
446 struct RC_name
447 {
448 enum rc_type type;
449 const char *name;
450 unsigned int len;
451 };
452
453 static const struct RC_name RC_NamesTable[] =
454 {
455 { rne, STRING_COMMA_LEN ("rn-sae") },
456 { rd, STRING_COMMA_LEN ("rd-sae") },
457 { ru, STRING_COMMA_LEN ("ru-sae") },
458 { rz, STRING_COMMA_LEN ("rz-sae") },
459 { saeonly, STRING_COMMA_LEN ("sae") },
460 };
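/* Illustrative usage (editor's sketch): for AT&T input such as
   "vaddpd {rn-sae}, %zmm0, %zmm1, %zmm2", the parser looks the
   "rn-sae" text up in this table and records rne as the rounding
   type to encode in the EVEX prefix.  */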
461
462 /* List of chars besides those in app.c:symbol_chars that can start an
463 operand. Used to prevent the scrubber eating vital white-space. */
464 const char extra_symbol_chars[] = "*%-([{}"
465 #ifdef LEX_AT
466 "@"
467 #endif
468 #ifdef LEX_QM
469 "?"
470 #endif
471 ;
472
473 #if (defined (TE_I386AIX) \
474 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
475 && !defined (TE_GNU) \
476 && !defined (TE_LINUX) \
477 && !defined (TE_NACL) \
478 && !defined (TE_FreeBSD) \
479 && !defined (TE_DragonFly) \
480 && !defined (TE_NetBSD)))
481 /* This array holds the chars that always start a comment. If the
482 pre-processor is disabled, these aren't very useful. The option
483 --divide will remove '/' from this list. */
484 const char *i386_comment_chars = "#/";
485 #define SVR4_COMMENT_CHARS 1
486 #define PREFIX_SEPARATOR '\\'
487
488 #else
489 const char *i386_comment_chars = "#";
490 #define PREFIX_SEPARATOR '/'
491 #endif
492
493 /* This array holds the chars that only start a comment at the beginning of
494 a line. If the line seems to have the form '# 123 filename'
495 .line and .file directives will appear in the pre-processed output.
496 Note that input_file.c hand checks for '#' at the beginning of the
497 first line of the input file. This is because the compiler outputs
498 #NO_APP at the beginning of its output.
499 Also note that comments started like this one will always work if
500 '/' isn't otherwise defined. */
501 const char line_comment_chars[] = "#/";
502
503 const char line_separator_chars[] = ";";
504
505 /* Chars that can be used to separate the mantissa from the exponent in
506    floating point numbers.  */
507 const char EXP_CHARS[] = "eE";
508
509 /* Chars that mean this number is a floating point constant
510 As in 0f12.456
511 or 0d1.2345e12. */
512 const char FLT_CHARS[] = "fFdDxX";
513
514 /* Tables for lexical analysis. */
515 static char mnemonic_chars[256];
516 static char register_chars[256];
517 static char operand_chars[256];
518 static char identifier_chars[256];
519 static char digit_chars[256];
520
521 /* Lexical macros. */
522 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
523 #define is_operand_char(x) (operand_chars[(unsigned char) x])
524 #define is_register_char(x) (register_chars[(unsigned char) x])
525 #define is_space_char(x) ((x) == ' ')
526 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
527 #define is_digit_char(x) (digit_chars[(unsigned char) x])
528
529 /* All non-digit non-letter characters that may occur in an operand. */
530 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
531
532 /* md_assemble() always leaves the strings it's passed unaltered. To
533 effect this we maintain a stack of saved characters that we've smashed
534 with '\0's (indicating end of strings for various sub-fields of the
535 assembler instruction). */
536 static char save_stack[32];
537 static char *save_stack_p;
538 #define END_STRING_AND_SAVE(s) \
539 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
540 #define RESTORE_END_STRING(s) \
541 do { *(s) = *--save_stack_p; } while (0)
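/* Editor's sketch (illustration only, not part of the original source):
   the typical pairing of the two macros above, temporarily
   NUL-terminating a sub-field so it can be handled as a C string.  */
#if 0
static void
example_parse_subfield (char *field_end)
{
  END_STRING_AND_SAVE (field_end);	/* Save *field_end, write '\0'.  */
  /* ... treat the characters before FIELD_END as a C string ...  */
  RESTORE_END_STRING (field_end);	/* Put the saved character back.  */
}
#endif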
542
543 /* The instruction we're assembling. */
544 static i386_insn i;
545
546 /* Possible templates for current insn. */
547 static const templates *current_templates;
548
549 /* Per instruction expressionS buffers: max displacements & immediates. */
550 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
551 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
552
553 /* Current operand we are working on. */
554 static int this_operand = -1;
555
556 /* We support four different modes (16-bit, "16-bit gcc", 32-bit and
557    64-bit); the FLAG_CODE variable distinguishes the three encodings below.  */
558
559 enum flag_code {
560 CODE_32BIT,
561 CODE_16BIT,
562 CODE_64BIT };
563
564 static enum flag_code flag_code;
565 static unsigned int object_64bit;
566 static unsigned int disallow_64bit_reloc;
567 static int use_rela_relocations = 0;
568 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
569 static const char *tls_get_addr;
570
571 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
572 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
573 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
574
575 /* The ELF ABI to use. */
576 enum x86_elf_abi
577 {
578 I386_ABI,
579 X86_64_ABI,
580 X86_64_X32_ABI
581 };
582
583 static enum x86_elf_abi x86_elf_abi = I386_ABI;
584 #endif
585
586 #if defined (TE_PE) || defined (TE_PEP)
587 /* Use big object file format. */
588 static int use_big_obj = 0;
589 #endif
590
591 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
592 /* 1 if generating code for a shared library. */
593 static int shared = 0;
594 #endif
595
596 /* 1 for intel syntax,
597 0 if att syntax. */
598 static int intel_syntax = 0;
599
600 static enum x86_64_isa
601 {
602 amd64 = 1, /* AMD64 ISA. */
603 intel64 /* Intel64 ISA. */
604 } isa64;
605
606 /* 1 for intel mnemonic,
607 0 if att mnemonic. */
608 static int intel_mnemonic = !SYSV386_COMPAT;
609
610 /* 1 if pseudo registers are permitted. */
611 static int allow_pseudo_reg = 0;
612
613 /* 1 if register prefix % not required. */
614 static int allow_naked_reg = 0;
615
616 /* 1 if the assembler should add BND prefix for all control-transferring
617 instructions supporting it, even if this prefix wasn't specified
618 explicitly. */
619 static int add_bnd_prefix = 0;
620
621 /* 1 if pseudo index register, eiz/riz, is allowed.  */
622 static int allow_index_reg = 0;
623
624 /* 1 if the assembler should ignore LOCK prefix, even if it was
625 specified explicitly. */
626 static int omit_lock_prefix = 0;
627
628 /* 1 if the assembler should encode lfence, mfence, and sfence as
629 "lock addl $0, (%{re}sp)". */
630 static int avoid_fence = 0;
631
632 /* Type of the previous instruction. */
633 static struct
634 {
635 segT seg;
636 const char *file;
637 const char *name;
638 unsigned int line;
639 enum last_insn_kind
640 {
641 last_insn_other = 0,
642 last_insn_directive,
643 last_insn_prefix
644 } kind;
645 } last_insn;
646
647 /* 1 if the assembler should generate relax relocations. */
648
649 static int generate_relax_relocations
650 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
651
652 static enum check_kind
653 {
654 check_none = 0,
655 check_warning,
656 check_error
657 }
658 sse_check, operand_check = check_warning;
659
660 /* Non-zero if branches should be aligned within power of 2 boundary. */
661 static int align_branch_power = 0;
662
663 /* Types of branches to align. */
664 enum align_branch_kind
665 {
666 align_branch_none = 0,
667 align_branch_jcc = 1,
668 align_branch_fused = 2,
669 align_branch_jmp = 3,
670 align_branch_call = 4,
671 align_branch_indirect = 5,
672 align_branch_ret = 6
673 };
674
675 /* Type bits of branches to align. */
676 enum align_branch_bit
677 {
678 align_branch_jcc_bit = 1 << align_branch_jcc,
679 align_branch_fused_bit = 1 << align_branch_fused,
680 align_branch_jmp_bit = 1 << align_branch_jmp,
681 align_branch_call_bit = 1 << align_branch_call,
682 align_branch_indirect_bit = 1 << align_branch_indirect,
683 align_branch_ret_bit = 1 << align_branch_ret
684 };
685
686 static unsigned int align_branch = (align_branch_jcc_bit
687 | align_branch_fused_bit
688 | align_branch_jmp_bit);
689
690 /* The maximum padding size for fused jcc.  A CMP-like instruction can
691    be 9 bytes and a jcc can be 6 bytes.  Leave room for prefixes just
692    in case.  */
693 #define MAX_FUSED_JCC_PADDING_SIZE 20
694
695 /* The maximum number of prefixes added for an instruction. */
696 static unsigned int align_branch_prefix_size = 5;
697
698 /* Optimization:
699 1. Clear the REX_W bit with register operand if possible.
700 2. Above plus use 128bit vector instruction to clear the full vector
701 register.
702 */
703 static int optimize = 0;
704
705 /* Optimization:
706 1. Clear the REX_W bit with register operand if possible.
707 2. Above plus use 128bit vector instruction to clear the full vector
708 register.
709 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
710 "testb $imm7,%r8".
711 */
712 static int optimize_for_space = 0;
713
714 /* Register prefix used for error message. */
715 static const char *register_prefix = "%";
716
717 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
718 leave, push, and pop instructions so that gcc has the same stack
719 frame as in 32 bit mode. */
720 static char stackop_size = '\0';
721
722 /* Non-zero to optimize code alignment. */
723 int optimize_align_code = 1;
724
725 /* Non-zero to quieten some warnings. */
726 static int quiet_warnings = 0;
727
728 /* CPU name. */
729 static const char *cpu_arch_name = NULL;
730 static char *cpu_sub_arch_name = NULL;
731
732 /* CPU feature flags. */
733 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
734
735 /* If we have selected a cpu we are generating instructions for. */
736 static int cpu_arch_tune_set = 0;
737
738 /* Cpu we are generating instructions for. */
739 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
740
741 /* CPU feature flags of cpu we are generating instructions for. */
742 static i386_cpu_flags cpu_arch_tune_flags;
743
744 /* CPU instruction set architecture used. */
745 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
746
747 /* CPU feature flags of instruction set architecture used. */
748 i386_cpu_flags cpu_arch_isa_flags;
749
750 /* If set, conditional jumps are not automatically promoted to handle
751    offsets larger than a byte.  */
752 static unsigned int no_cond_jump_promotion = 0;
753
754 /* Encode SSE instructions with VEX prefix. */
755 static unsigned int sse2avx;
756
757 /* Encode scalar AVX instructions with specific vector length. */
758 static enum
759 {
760 vex128 = 0,
761 vex256
762 } avxscalar;
763
764 /* Encode VEX WIG instructions with specific vex.w. */
765 static enum
766 {
767 vexw0 = 0,
768 vexw1
769 } vexwig;
770
771 /* Encode scalar EVEX LIG instructions with specific vector length. */
772 static enum
773 {
774 evexl128 = 0,
775 evexl256,
776 evexl512
777 } evexlig;
778
779 /* Encode EVEX WIG instructions with specific evex.w. */
780 static enum
781 {
782 evexw0 = 0,
783 evexw1
784 } evexwig;
785
786 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
787 static enum rc_type evexrcig = rne;
788
789 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
790 static symbolS *GOT_symbol;
791
792 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
793 unsigned int x86_dwarf2_return_column;
794
795 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
796 int x86_cie_data_alignment;
797
798 /* Interface to relax_segment.
799 There are 3 major relax states for 386 jump insns because the
800 different types of jumps add different sizes to frags when we're
801 figuring out what sort of jump to choose to reach a given label.
802
803 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
804 branches which are handled by md_estimate_size_before_relax() and
805 i386_generic_table_relax_frag(). */
806
807 /* Types. */
808 #define UNCOND_JUMP 0
809 #define COND_JUMP 1
810 #define COND_JUMP86 2
811 #define BRANCH_PADDING 3
812 #define BRANCH_PREFIX 4
813 #define FUSED_JCC_PADDING 5
814
815 /* Sizes. */
816 #define CODE16 1
817 #define SMALL 0
818 #define SMALL16 (SMALL | CODE16)
819 #define BIG 2
820 #define BIG16 (BIG | CODE16)
821
822 #ifndef INLINE
823 #ifdef __GNUC__
824 #define INLINE __inline__
825 #else
826 #define INLINE
827 #endif
828 #endif
829
830 #define ENCODE_RELAX_STATE(type, size) \
831 ((relax_substateT) (((type) << 2) | (size)))
832 #define TYPE_FROM_RELAX_STATE(s) \
833 ((s) >> 2)
834 #define DISP_SIZE_FROM_RELAX_STATE(s) \
835 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
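/* Worked example (editor's note): ENCODE_RELAX_STATE (COND_JUMP, BIG)
   == (1 << 2) | 2 == 6; TYPE_FROM_RELAX_STATE (6) then recovers
   COND_JUMP, and DISP_SIZE_FROM_RELAX_STATE (6) gives the 4-byte
   displacement size.  */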
836
837 /* This table is used by relax_frag to promote short jumps to long
838 ones where necessary. SMALL (short) jumps may be promoted to BIG
839 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
840 don't allow a short jump in a 32 bit code segment to be promoted to
841 a 16 bit offset jump because it's slower (requires data size
842 prefix), and doesn't work, unless the destination is in the bottom
843 64k of the code segment (The top 16 bits of eip are zeroed). */
844
845 const relax_typeS md_relax_table[] =
846 {
847 /* The fields are:
848 1) most positive reach of this state,
849 2) most negative reach of this state,
850 3) how many bytes this mode will have in the variable part of the frag
851 4) which index into the table to try if we can't fit into this one. */
852
853 /* UNCOND_JUMP states. */
854 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
855 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
856 /* dword jmp adds 4 bytes to frag:
857 0 extra opcode bytes, 4 displacement bytes. */
858 {0, 0, 4, 0},
859   /* word jmp adds 2 bytes to frag:
860 0 extra opcode bytes, 2 displacement bytes. */
861 {0, 0, 2, 0},
862
863 /* COND_JUMP states. */
864 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
865 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
866   /* dword conditionals add 5 bytes to frag:
867 1 extra opcode byte, 4 displacement bytes. */
868 {0, 0, 5, 0},
869 /* word conditionals add 3 bytes to frag:
870 1 extra opcode byte, 2 displacement bytes. */
871 {0, 0, 3, 0},
872
873 /* COND_JUMP86 states. */
874 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
875 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
876   /* dword conditionals add 5 bytes to frag:
877 1 extra opcode byte, 4 displacement bytes. */
878 {0, 0, 5, 0},
879 /* word conditionals add 4 bytes to frag:
880 1 displacement byte and a 3 byte long branch insn. */
881 {0, 0, 4, 0}
882 };
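/* Editor's note: md_relax_table is indexed by ENCODE_RELAX_STATE
   values.  Entry 0 (UNCOND_JUMP, SMALL) describes a jmp with a 1-byte
   displacement; when the target is out of its reach, relaxation moves
   to entry 2 (UNCOND_JUMP, BIG), which adds 4 displacement bytes to
   the frag.  */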
883
884 static const arch_entry cpu_arch[] =
885 {
886 /* Do not replace the first two entries - i386_target_format()
887 relies on them being there in this order. */
888 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
889 CPU_GENERIC32_FLAGS, 0 },
890 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
891 CPU_GENERIC64_FLAGS, 0 },
892 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
893 CPU_NONE_FLAGS, 0 },
894 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
895 CPU_I186_FLAGS, 0 },
896 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
897 CPU_I286_FLAGS, 0 },
898 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
899 CPU_I386_FLAGS, 0 },
900 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
901 CPU_I486_FLAGS, 0 },
902 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
903 CPU_I586_FLAGS, 0 },
904 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
905 CPU_I686_FLAGS, 0 },
906 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
907 CPU_I586_FLAGS, 0 },
908 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
909 CPU_PENTIUMPRO_FLAGS, 0 },
910 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
911 CPU_P2_FLAGS, 0 },
912 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
913 CPU_P3_FLAGS, 0 },
914 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
915 CPU_P4_FLAGS, 0 },
916 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
917 CPU_CORE_FLAGS, 0 },
918 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
919 CPU_NOCONA_FLAGS, 0 },
920 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
921 CPU_CORE_FLAGS, 1 },
922 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
923 CPU_CORE_FLAGS, 0 },
924 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
925 CPU_CORE2_FLAGS, 1 },
926 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
927 CPU_CORE2_FLAGS, 0 },
928 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
929 CPU_COREI7_FLAGS, 0 },
930 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
931 CPU_L1OM_FLAGS, 0 },
932 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
933 CPU_K1OM_FLAGS, 0 },
934 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
935 CPU_IAMCU_FLAGS, 0 },
936 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
937 CPU_K6_FLAGS, 0 },
938 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
939 CPU_K6_2_FLAGS, 0 },
940 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
941 CPU_ATHLON_FLAGS, 0 },
942 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
943 CPU_K8_FLAGS, 1 },
944 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
945 CPU_K8_FLAGS, 0 },
946 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
947 CPU_K8_FLAGS, 0 },
948 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
949 CPU_AMDFAM10_FLAGS, 0 },
950 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
951 CPU_BDVER1_FLAGS, 0 },
952 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
953 CPU_BDVER2_FLAGS, 0 },
954 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
955 CPU_BDVER3_FLAGS, 0 },
956 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
957 CPU_BDVER4_FLAGS, 0 },
958 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
959 CPU_ZNVER1_FLAGS, 0 },
960 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
961 CPU_ZNVER2_FLAGS, 0 },
962 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
963 CPU_BTVER1_FLAGS, 0 },
964 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
965 CPU_BTVER2_FLAGS, 0 },
966 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
967 CPU_8087_FLAGS, 0 },
968 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
969 CPU_287_FLAGS, 0 },
970 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
971 CPU_387_FLAGS, 0 },
972 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
973 CPU_687_FLAGS, 0 },
974 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
975 CPU_CMOV_FLAGS, 0 },
976 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
977 CPU_FXSR_FLAGS, 0 },
978 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
979 CPU_MMX_FLAGS, 0 },
980 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
981 CPU_SSE_FLAGS, 0 },
982 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
983 CPU_SSE2_FLAGS, 0 },
984 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
985 CPU_SSE3_FLAGS, 0 },
986 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
987 CPU_SSE4A_FLAGS, 0 },
988 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
989 CPU_SSSE3_FLAGS, 0 },
990 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
991 CPU_SSE4_1_FLAGS, 0 },
992 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
993 CPU_SSE4_2_FLAGS, 0 },
994 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
995 CPU_SSE4_2_FLAGS, 0 },
996 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
997 CPU_AVX_FLAGS, 0 },
998 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
999 CPU_AVX2_FLAGS, 0 },
1000 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1001 CPU_AVX512F_FLAGS, 0 },
1002 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1003 CPU_AVX512CD_FLAGS, 0 },
1004 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1005 CPU_AVX512ER_FLAGS, 0 },
1006 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1007 CPU_AVX512PF_FLAGS, 0 },
1008 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1009 CPU_AVX512DQ_FLAGS, 0 },
1010 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1011 CPU_AVX512BW_FLAGS, 0 },
1012 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1013 CPU_AVX512VL_FLAGS, 0 },
1014 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1015 CPU_VMX_FLAGS, 0 },
1016 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1017 CPU_VMFUNC_FLAGS, 0 },
1018 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1019 CPU_SMX_FLAGS, 0 },
1020 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1021 CPU_XSAVE_FLAGS, 0 },
1022 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1023 CPU_XSAVEOPT_FLAGS, 0 },
1024 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1025 CPU_XSAVEC_FLAGS, 0 },
1026 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1027 CPU_XSAVES_FLAGS, 0 },
1028 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1029 CPU_AES_FLAGS, 0 },
1030 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1031 CPU_PCLMUL_FLAGS, 0 },
1032 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1033 CPU_PCLMUL_FLAGS, 1 },
1034 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1035 CPU_FSGSBASE_FLAGS, 0 },
1036 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1037 CPU_RDRND_FLAGS, 0 },
1038 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1039 CPU_F16C_FLAGS, 0 },
1040 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1041 CPU_BMI2_FLAGS, 0 },
1042 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1043 CPU_FMA_FLAGS, 0 },
1044 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1045 CPU_FMA4_FLAGS, 0 },
1046 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1047 CPU_XOP_FLAGS, 0 },
1048 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1049 CPU_LWP_FLAGS, 0 },
1050 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1051 CPU_MOVBE_FLAGS, 0 },
1052 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1053 CPU_CX16_FLAGS, 0 },
1054 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1055 CPU_EPT_FLAGS, 0 },
1056 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1057 CPU_LZCNT_FLAGS, 0 },
1058 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1059 CPU_POPCNT_FLAGS, 0 },
1060 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1061 CPU_HLE_FLAGS, 0 },
1062 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1063 CPU_RTM_FLAGS, 0 },
1064 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1065 CPU_INVPCID_FLAGS, 0 },
1066 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1067 CPU_CLFLUSH_FLAGS, 0 },
1068 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1069 CPU_NOP_FLAGS, 0 },
1070 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1071 CPU_SYSCALL_FLAGS, 0 },
1072 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1073 CPU_RDTSCP_FLAGS, 0 },
1074 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1075 CPU_3DNOW_FLAGS, 0 },
1076 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1077 CPU_3DNOWA_FLAGS, 0 },
1078 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1079 CPU_PADLOCK_FLAGS, 0 },
1080 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1081 CPU_SVME_FLAGS, 1 },
1082 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1083 CPU_SVME_FLAGS, 0 },
1084 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1085 CPU_SSE4A_FLAGS, 0 },
1086 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1087 CPU_ABM_FLAGS, 0 },
1088 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1089 CPU_BMI_FLAGS, 0 },
1090 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1091 CPU_TBM_FLAGS, 0 },
1092 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1093 CPU_ADX_FLAGS, 0 },
1094 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1095 CPU_RDSEED_FLAGS, 0 },
1096 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1097 CPU_PRFCHW_FLAGS, 0 },
1098 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1099 CPU_SMAP_FLAGS, 0 },
1100 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1101 CPU_MPX_FLAGS, 0 },
1102 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1103 CPU_SHA_FLAGS, 0 },
1104 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1105 CPU_CLFLUSHOPT_FLAGS, 0 },
1106 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1107 CPU_PREFETCHWT1_FLAGS, 0 },
1108 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1109 CPU_SE1_FLAGS, 0 },
1110 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1111 CPU_CLWB_FLAGS, 0 },
1112 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1113 CPU_AVX512IFMA_FLAGS, 0 },
1114 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1115 CPU_AVX512VBMI_FLAGS, 0 },
1116 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1117 CPU_AVX512_4FMAPS_FLAGS, 0 },
1118 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1119 CPU_AVX512_4VNNIW_FLAGS, 0 },
1120 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1121 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1122 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1123 CPU_AVX512_VBMI2_FLAGS, 0 },
1124 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1125 CPU_AVX512_VNNI_FLAGS, 0 },
1126 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1127 CPU_AVX512_BITALG_FLAGS, 0 },
1128 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1129 CPU_CLZERO_FLAGS, 0 },
1130 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1131 CPU_MWAITX_FLAGS, 0 },
1132 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1133 CPU_OSPKE_FLAGS, 0 },
1134 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1135 CPU_RDPID_FLAGS, 0 },
1136 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1137 CPU_PTWRITE_FLAGS, 0 },
1138 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1139 CPU_IBT_FLAGS, 0 },
1140 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1141 CPU_SHSTK_FLAGS, 0 },
1142 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1143 CPU_GFNI_FLAGS, 0 },
1144 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1145 CPU_VAES_FLAGS, 0 },
1146 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1147 CPU_VPCLMULQDQ_FLAGS, 0 },
1148 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1149 CPU_WBNOINVD_FLAGS, 0 },
1150 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1151 CPU_PCONFIG_FLAGS, 0 },
1152 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1153 CPU_WAITPKG_FLAGS, 0 },
1154 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1155 CPU_CLDEMOTE_FLAGS, 0 },
1156 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1157 CPU_MOVDIRI_FLAGS, 0 },
1158 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1159 CPU_MOVDIR64B_FLAGS, 0 },
1160 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1161 CPU_AVX512_BF16_FLAGS, 0 },
1162 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1163 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1164 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1165 CPU_ENQCMD_FLAGS, 0 },
1166 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1167 CPU_RDPRU_FLAGS, 0 },
1168 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1169 CPU_MCOMMIT_FLAGS, 0 },
1170 };
1171
1172 static const noarch_entry cpu_noarch[] =
1173 {
1174 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1175 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1176 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1177 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1178 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1179 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1180 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1181 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1182 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1183 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1184 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1185 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1186 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1187 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1188 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1189 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1190 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1191 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1192 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1193 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1194 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1195 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1196 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1197 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1198 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1199 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1200 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1201 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1202 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1203 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1204 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1205 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1206 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1207 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1208 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1209 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1210 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1211 { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1212 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1213 };
1214
1215 #ifdef I386COFF
1216 /* Like s_lcomm_internal in gas/read.c but the alignment string
1217 is allowed to be optional. */
1218
1219 static symbolS *
1220 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1221 {
1222 addressT align = 0;
1223
1224 SKIP_WHITESPACE ();
1225
1226 if (needs_align
1227 && *input_line_pointer == ',')
1228 {
1229 align = parse_align (needs_align - 1);
1230
1231 if (align == (addressT) -1)
1232 return NULL;
1233 }
1234 else
1235 {
1236 if (size >= 8)
1237 align = 3;
1238 else if (size >= 4)
1239 align = 2;
1240 else if (size >= 2)
1241 align = 1;
1242 else
1243 align = 0;
1244 }
1245
1246 bss_alloc (symbolP, size, align);
1247 return symbolP;
1248 }
1249
1250 static void
1251 pe_lcomm (int needs_align)
1252 {
1253 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1254 }
1255 #endif
1256
1257 const pseudo_typeS md_pseudo_table[] =
1258 {
1259 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1260 {"align", s_align_bytes, 0},
1261 #else
1262 {"align", s_align_ptwo, 0},
1263 #endif
1264 {"arch", set_cpu_arch, 0},
1265 #ifndef I386COFF
1266 {"bss", s_bss, 0},
1267 #else
1268 {"lcomm", pe_lcomm, 1},
1269 #endif
1270 {"ffloat", float_cons, 'f'},
1271 {"dfloat", float_cons, 'd'},
1272 {"tfloat", float_cons, 'x'},
1273 {"value", cons, 2},
1274 {"slong", signed_cons, 4},
1275 {"noopt", s_ignore, 0},
1276 {"optim", s_ignore, 0},
1277 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1278 {"code16", set_code_flag, CODE_16BIT},
1279 {"code32", set_code_flag, CODE_32BIT},
1280 #ifdef BFD64
1281 {"code64", set_code_flag, CODE_64BIT},
1282 #endif
1283 {"intel_syntax", set_intel_syntax, 1},
1284 {"att_syntax", set_intel_syntax, 0},
1285 {"intel_mnemonic", set_intel_mnemonic, 1},
1286 {"att_mnemonic", set_intel_mnemonic, 0},
1287 {"allow_index_reg", set_allow_index_reg, 1},
1288 {"disallow_index_reg", set_allow_index_reg, 0},
1289 {"sse_check", set_check, 0},
1290 {"operand_check", set_check, 1},
1291 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1292 {"largecomm", handle_large_common, 0},
1293 #else
1294 {"file", dwarf2_directive_file, 0},
1295 {"loc", dwarf2_directive_loc, 0},
1296 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1297 #endif
1298 #ifdef TE_PE
1299 {"secrel32", pe_directive_secrel, 0},
1300 #endif
1301 {0, 0, 0}
1302 };
1303
1304 /* For interface with expression (). */
1305 extern char *input_line_pointer;
1306
1307 /* Hash table for instruction mnemonic lookup. */
1308 static struct hash_control *op_hash;
1309
1310 /* Hash table for register lookup. */
1311 static struct hash_control *reg_hash;
1312 \f
1313 /* Various efficient no-op patterns for aligning code labels.
1314 Note: Don't try to assemble the instructions in the comments.
1315 0L and 0w are not legal. */
1316 static const unsigned char f32_1[] =
1317 {0x90}; /* nop */
1318 static const unsigned char f32_2[] =
1319 {0x66,0x90}; /* xchg %ax,%ax */
1320 static const unsigned char f32_3[] =
1321 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1322 static const unsigned char f32_4[] =
1323 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1324 static const unsigned char f32_6[] =
1325 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1326 static const unsigned char f32_7[] =
1327 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1328 static const unsigned char f16_3[] =
1329 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1330 static const unsigned char f16_4[] =
1331 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1332 static const unsigned char jump_disp8[] =
1333 {0xeb}; /* jmp disp8 */
1334 static const unsigned char jump32_disp32[] =
1335 {0xe9}; /* jmp disp32 */
1336 static const unsigned char jump16_disp32[] =
1337 {0x66,0xe9}; /* jmp disp32 */
1338 /* 32-bit NOP patterns.  */
1339 static const unsigned char *const f32_patt[] = {
1340 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1341 };
1342 /* 16-bit NOP patterns.  */
1343 static const unsigned char *const f16_patt[] = {
1344 f32_1, f32_2, f16_3, f16_4
1345 };
1346 /* nopl (%[re]ax) */
1347 static const unsigned char alt_3[] =
1348 {0x0f,0x1f,0x00};
1349 /* nopl 0(%[re]ax) */
1350 static const unsigned char alt_4[] =
1351 {0x0f,0x1f,0x40,0x00};
1352 /* nopl 0(%[re]ax,%[re]ax,1) */
1353 static const unsigned char alt_5[] =
1354 {0x0f,0x1f,0x44,0x00,0x00};
1355 /* nopw 0(%[re]ax,%[re]ax,1) */
1356 static const unsigned char alt_6[] =
1357 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1358 /* nopl 0L(%[re]ax) */
1359 static const unsigned char alt_7[] =
1360 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1361 /* nopl 0L(%[re]ax,%[re]ax,1) */
1362 static const unsigned char alt_8[] =
1363 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1364 /* nopw 0L(%[re]ax,%[re]ax,1) */
1365 static const unsigned char alt_9[] =
1366 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1367 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1368 static const unsigned char alt_10[] =
1369 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1370 /* data16 nopw %cs:0L(%eax,%eax,1) */
1371 static const unsigned char alt_11[] =
1372 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1373 /* 32-bit and 64-bit NOP patterns.  */
1374 static const unsigned char *const alt_patt[] = {
1375 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1376 alt_9, alt_10, alt_11
1377 };
1378
1379 /* Generate COUNT bytes of NOPs to WHERE from PATT with the maximum
1380    size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */
1381
1382 static void
1383 i386_output_nops (char *where, const unsigned char *const *patt,
1384 int count, int max_single_nop_size)
1385
1386 {
1387 /* Place the longer NOP first. */
1388 int last;
1389 int offset;
1390 const unsigned char *nops;
1391
1392 if (max_single_nop_size < 1)
1393 {
1394 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1395 max_single_nop_size);
1396 return;
1397 }
1398
1399 nops = patt[max_single_nop_size - 1];
1400
1401   /* Use the smaller one if the requested one isn't available.  */
1402 if (nops == NULL)
1403 {
1404 max_single_nop_size--;
1405 nops = patt[max_single_nop_size - 1];
1406 }
1407
1408 last = count % max_single_nop_size;
1409
1410 count -= last;
1411 for (offset = 0; offset < count; offset += max_single_nop_size)
1412 memcpy (where + offset, nops, max_single_nop_size);
1413
1414 if (last)
1415 {
1416 nops = patt[last - 1];
1417 if (nops == NULL)
1418 {
1419 /* Use the smaller one plus one-byte NOP if the needed one
1420 isn't available. */
1421 last--;
1422 nops = patt[last - 1];
1423 memcpy (where + offset, nops, last);
1424 where[offset + last] = *patt[0];
1425 }
1426 else
1427 memcpy (where + offset, nops, last);
1428 }
1429 }
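/* Worked example (editor's note): with PATT == alt_patt, COUNT == 7
   and MAX_SINGLE_NOP_SIZE == 4, LAST == 7 % 4 == 3, so the loop above
   emits one 4-byte "nopl 0(%[re]ax)" followed by one 3-byte
   "nopl (%[re]ax)".  */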
1430
1431 static INLINE int
1432 fits_in_imm7 (offsetT num)
1433 {
1434 return (num & 0x7f) == num;
1435 }
1436
1437 static INLINE int
1438 fits_in_imm31 (offsetT num)
1439 {
1440 return (num & 0x7fffffff) == num;
1441 }
1442
1443 /* Generate COUNT bytes of NOPs to WHERE with the maximum size of a
1444    single NOP instruction LIMIT.  */
1445
1446 void
1447 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1448 {
1449 const unsigned char *const *patt = NULL;
1450 int max_single_nop_size;
1451 /* Maximum number of NOPs before switching to jump over NOPs. */
1452 int max_number_of_nops;
1453
1454 switch (fragP->fr_type)
1455 {
1456 case rs_fill_nop:
1457 case rs_align_code:
1458 break;
1459 case rs_machine_dependent:
1460 /* Allow NOP padding for jumps and calls. */
1461 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1462 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1463 break;
1464 /* Fall through. */
1465 default:
1466 return;
1467 }
1468
1469 /* We need to decide which NOP sequence to use for 32bit and
1470 64bit. When -mtune= is used:
1471
1472 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1473 PROCESSOR_GENERIC32, f32_patt will be used.
1474 2. For the rest, alt_patt will be used.
1475
1476 When -mtune= isn't used, alt_patt will be used if
1477 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1478 be used.
1479
1480 When -march= or .arch is used, we can't use anything beyond
1481 cpu_arch_isa_flags. */
1482
1483 if (flag_code == CODE_16BIT)
1484 {
1485 patt = f16_patt;
1486 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1487 /* Limit number of NOPs to 2 in 16-bit mode. */
1488 max_number_of_nops = 2;
1489 }
1490 else
1491 {
1492 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1493 {
1494 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1495 switch (cpu_arch_tune)
1496 {
1497 case PROCESSOR_UNKNOWN:
1498 /* We use cpu_arch_isa_flags to check if we SHOULD
1499 optimize with nops. */
1500 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1501 patt = alt_patt;
1502 else
1503 patt = f32_patt;
1504 break;
1505 case PROCESSOR_PENTIUM4:
1506 case PROCESSOR_NOCONA:
1507 case PROCESSOR_CORE:
1508 case PROCESSOR_CORE2:
1509 case PROCESSOR_COREI7:
1510 case PROCESSOR_L1OM:
1511 case PROCESSOR_K1OM:
1512 case PROCESSOR_GENERIC64:
1513 case PROCESSOR_K6:
1514 case PROCESSOR_ATHLON:
1515 case PROCESSOR_K8:
1516 case PROCESSOR_AMDFAM10:
1517 case PROCESSOR_BD:
1518 case PROCESSOR_ZNVER:
1519 case PROCESSOR_BT:
1520 patt = alt_patt;
1521 break;
1522 case PROCESSOR_I386:
1523 case PROCESSOR_I486:
1524 case PROCESSOR_PENTIUM:
1525 case PROCESSOR_PENTIUMPRO:
1526 case PROCESSOR_IAMCU:
1527 case PROCESSOR_GENERIC32:
1528 patt = f32_patt;
1529 break;
1530 }
1531 }
1532 else
1533 {
1534 switch (fragP->tc_frag_data.tune)
1535 {
1536 case PROCESSOR_UNKNOWN:
1537 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1538 PROCESSOR_UNKNOWN. */
1539 abort ();
1540 break;
1541
1542 case PROCESSOR_I386:
1543 case PROCESSOR_I486:
1544 case PROCESSOR_PENTIUM:
1545 case PROCESSOR_IAMCU:
1546 case PROCESSOR_K6:
1547 case PROCESSOR_ATHLON:
1548 case PROCESSOR_K8:
1549 case PROCESSOR_AMDFAM10:
1550 case PROCESSOR_BD:
1551 case PROCESSOR_ZNVER:
1552 case PROCESSOR_BT:
1553 case PROCESSOR_GENERIC32:
1554 /* We use cpu_arch_isa_flags to check if we CAN optimize
1555 with nops. */
1556 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1557 patt = alt_patt;
1558 else
1559 patt = f32_patt;
1560 break;
1561 case PROCESSOR_PENTIUMPRO:
1562 case PROCESSOR_PENTIUM4:
1563 case PROCESSOR_NOCONA:
1564 case PROCESSOR_CORE:
1565 case PROCESSOR_CORE2:
1566 case PROCESSOR_COREI7:
1567 case PROCESSOR_L1OM:
1568 case PROCESSOR_K1OM:
1569 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1570 patt = alt_patt;
1571 else
1572 patt = f32_patt;
1573 break;
1574 case PROCESSOR_GENERIC64:
1575 patt = alt_patt;
1576 break;
1577 }
1578 }
1579
1580 if (patt == f32_patt)
1581 {
1582 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1583 /* Limit number of NOPs to 2 for older processors. */
1584 max_number_of_nops = 2;
1585 }
1586 else
1587 {
1588 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1589 /* Limit number of NOPs to 7 for newer processors. */
1590 max_number_of_nops = 7;
1591 }
1592 }
1593
1594 if (limit == 0)
1595 limit = max_single_nop_size;
1596
1597 if (fragP->fr_type == rs_fill_nop)
1598 {
1599 /* Output NOPs for .nop directive. */
1600 if (limit > max_single_nop_size)
1601 {
1602 as_bad_where (fragP->fr_file, fragP->fr_line,
1603 _("invalid single nop size: %d "
1604 "(expect within [0, %d])"),
1605 limit, max_single_nop_size);
1606 return;
1607 }
1608 }
1609 else if (fragP->fr_type != rs_machine_dependent)
1610 fragP->fr_var = count;
1611
1612 if ((count / max_single_nop_size) > max_number_of_nops)
1613 {
1614 /* Generate jump over NOPs. */
1615 offsetT disp = count - 2;
1616 if (fits_in_imm7 (disp))
1617 {
1618 /* Use "jmp disp8" if possible. */
1619 count = disp;
1620 where[0] = jump_disp8[0];
1621 where[1] = count;
1622 where += 2;
1623 }
1624 else
1625 {
1626 unsigned int size_of_jump;
1627
1628 if (flag_code == CODE_16BIT)
1629 {
1630 where[0] = jump16_disp32[0];
1631 where[1] = jump16_disp32[1];
1632 size_of_jump = 2;
1633 }
1634 else
1635 {
1636 where[0] = jump32_disp32[0];
1637 size_of_jump = 1;
1638 }
1639
1640 count -= size_of_jump + 4;
1641 if (!fits_in_imm31 (count))
1642 {
1643 as_bad_where (fragP->fr_file, fragP->fr_line,
1644 _("jump over nop padding out of range"));
1645 return;
1646 }
1647
1648 md_number_to_chars (where + size_of_jump, count, 4);
1649 where += size_of_jump + 4;
1650 }
1651 }
1652
1653 /* Generate multiple NOPs. */
1654 i386_output_nops (where, patt, count, limit);
1655 }
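/* Worked example (editor's note): assuming alt_patt is in effect
   (max_single_nop_size == 11, max_number_of_nops == 7), a COUNT of
   100 bytes would need more than 7 NOPs, so a jump over the padding
   is generated instead: disp == 98 fits in imm7, giving 0xeb 0x62
   followed by 98 bytes of NOPs.  */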
1656
1657 static INLINE int
1658 operand_type_all_zero (const union i386_operand_type *x)
1659 {
1660 switch (ARRAY_SIZE(x->array))
1661 {
1662 case 3:
1663 if (x->array[2])
1664 return 0;
1665 /* Fall through. */
1666 case 2:
1667 if (x->array[1])
1668 return 0;
1669 /* Fall through. */
1670 case 1:
1671 return !x->array[0];
1672 default:
1673 abort ();
1674 }
1675 }
1676
1677 static INLINE void
1678 operand_type_set (union i386_operand_type *x, unsigned int v)
1679 {
1680 switch (ARRAY_SIZE(x->array))
1681 {
1682 case 3:
1683 x->array[2] = v;
1684 /* Fall through. */
1685 case 2:
1686 x->array[1] = v;
1687 /* Fall through. */
1688 case 1:
1689 x->array[0] = v;
1691 break;
1692 default:
1693 abort ();
1694 }
1695
1696 x->bitfield.class = ClassNone;
1697 x->bitfield.instance = InstanceNone;
1698 }
1699
1700 static INLINE int
1701 operand_type_equal (const union i386_operand_type *x,
1702 const union i386_operand_type *y)
1703 {
1704 switch (ARRAY_SIZE(x->array))
1705 {
1706 case 3:
1707 if (x->array[2] != y->array[2])
1708 return 0;
1709 /* Fall through. */
1710 case 2:
1711 if (x->array[1] != y->array[1])
1712 return 0;
1713 /* Fall through. */
1714 case 1:
1715 return x->array[0] == y->array[0];
1716 break;
1717 default:
1718 abort ();
1719 }
1720 }
1721
1722 static INLINE int
1723 cpu_flags_all_zero (const union i386_cpu_flags *x)
1724 {
1725 switch (ARRAY_SIZE(x->array))
1726 {
1727 case 4:
1728 if (x->array[3])
1729 return 0;
1730 /* Fall through. */
1731 case 3:
1732 if (x->array[2])
1733 return 0;
1734 /* Fall through. */
1735 case 2:
1736 if (x->array[1])
1737 return 0;
1738 /* Fall through. */
1739 case 1:
1740 return !x->array[0];
1741 default:
1742 abort ();
1743 }
1744 }
1745
1746 static INLINE int
1747 cpu_flags_equal (const union i386_cpu_flags *x,
1748 const union i386_cpu_flags *y)
1749 {
1750 switch (ARRAY_SIZE(x->array))
1751 {
1752 case 4:
1753 if (x->array[3] != y->array[3])
1754 return 0;
1755 /* Fall through. */
1756 case 3:
1757 if (x->array[2] != y->array[2])
1758 return 0;
1759 /* Fall through. */
1760 case 2:
1761 if (x->array[1] != y->array[1])
1762 return 0;
1763 /* Fall through. */
1764 case 1:
1765 return x->array[0] == y->array[0];
1766 break;
1767 default:
1768 abort ();
1769 }
1770 }
1771
1772 static INLINE int
1773 cpu_flags_check_cpu64 (i386_cpu_flags f)
1774 {
1775 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1776 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1777 }
1778
1779 static INLINE i386_cpu_flags
1780 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1781 {
1782 switch (ARRAY_SIZE (x.array))
1783 {
1784 case 4:
1785 x.array [3] &= y.array [3];
1786 /* Fall through. */
1787 case 3:
1788 x.array [2] &= y.array [2];
1789 /* Fall through. */
1790 case 2:
1791 x.array [1] &= y.array [1];
1792 /* Fall through. */
1793 case 1:
1794 x.array [0] &= y.array [0];
1795 break;
1796 default:
1797 abort ();
1798 }
1799 return x;
1800 }
1801
1802 static INLINE i386_cpu_flags
1803 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1804 {
1805 switch (ARRAY_SIZE (x.array))
1806 {
1807 case 4:
1808 x.array [3] |= y.array [3];
1809 /* Fall through. */
1810 case 3:
1811 x.array [2] |= y.array [2];
1812 /* Fall through. */
1813 case 2:
1814 x.array [1] |= y.array [1];
1815 /* Fall through. */
1816 case 1:
1817 x.array [0] |= y.array [0];
1818 break;
1819 default:
1820 abort ();
1821 }
1822 return x;
1823 }
1824
1825 static INLINE i386_cpu_flags
1826 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1827 {
1828 switch (ARRAY_SIZE (x.array))
1829 {
1830 case 4:
1831 x.array [3] &= ~y.array [3];
1832 /* Fall through. */
1833 case 3:
1834 x.array [2] &= ~y.array [2];
1835 /* Fall through. */
1836 case 2:
1837 x.array [1] &= ~y.array [1];
1838 /* Fall through. */
1839 case 1:
1840 x.array [0] &= ~y.array [0];
1841 break;
1842 default:
1843 abort ();
1844 }
1845 return x;
1846 }
1847
1848 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1849
1850 #define CPU_FLAGS_ARCH_MATCH 0x1
1851 #define CPU_FLAGS_64BIT_MATCH 0x2
1852
1853 #define CPU_FLAGS_PERFECT_MATCH \
1854 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1855
1856 /* Return CPU flags match bits. */
1857
1858 static int
1859 cpu_flags_match (const insn_template *t)
1860 {
1861 i386_cpu_flags x = t->cpu_flags;
1862 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1863
1864 x.bitfield.cpu64 = 0;
1865 x.bitfield.cpuno64 = 0;
1866
1867 if (cpu_flags_all_zero (&x))
1868 {
1869 /* This instruction is available on all archs. */
1870 match |= CPU_FLAGS_ARCH_MATCH;
1871 }
1872 else
1873 {
1874 /* This instruction is available only on some archs. */
1875 i386_cpu_flags cpu = cpu_arch_flags;
1876
1877 	  /* AVX512VL is not a standalone feature - match it and then strip it.  */
1878 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1879 return match;
1880 x.bitfield.cpuavx512vl = 0;
1881
1882 cpu = cpu_flags_and (x, cpu);
1883 if (!cpu_flags_all_zero (&cpu))
1884 {
1885 if (x.bitfield.cpuavx)
1886 {
1887 /* We need to check a few extra flags with AVX. */
1888 if (cpu.bitfield.cpuavx
1889 && (!t->opcode_modifier.sse2avx || sse2avx)
1890 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1891 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1892 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1893 match |= CPU_FLAGS_ARCH_MATCH;
1894 }
1895 else if (x.bitfield.cpuavx512f)
1896 {
1897 /* We need to check a few extra flags with AVX512F. */
1898 if (cpu.bitfield.cpuavx512f
1899 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1900 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1901 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1902 match |= CPU_FLAGS_ARCH_MATCH;
1903 }
1904 else
1905 match |= CPU_FLAGS_ARCH_MATCH;
1906 }
1907 }
1908 return match;
1909 }
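/* Worked example (illustrative): under `.arch i686' a template whose
   cpu_flags require CpuAVX2 leaves cpu_flags_and (x, cpu) all zero,
   so at most CPU_FLAGS_64BIT_MATCH is returned and the template is
   rejected; once `.arch .avx2' is in effect the AND is non-zero and
   CPU_FLAGS_ARCH_MATCH is added, giving CPU_FLAGS_PERFECT_MATCH.  */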
1910
1911 static INLINE i386_operand_type
1912 operand_type_and (i386_operand_type x, i386_operand_type y)
1913 {
1914 if (x.bitfield.class != y.bitfield.class)
1915 x.bitfield.class = ClassNone;
1916 if (x.bitfield.instance != y.bitfield.instance)
1917 x.bitfield.instance = InstanceNone;
1918
1919 switch (ARRAY_SIZE (x.array))
1920 {
1921 case 3:
1922 x.array [2] &= y.array [2];
1923 /* Fall through. */
1924 case 2:
1925 x.array [1] &= y.array [1];
1926 /* Fall through. */
1927 case 1:
1928 x.array [0] &= y.array [0];
1929 break;
1930 default:
1931 abort ();
1932 }
1933 return x;
1934 }
1935
1936 static INLINE i386_operand_type
1937 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1938 {
1939 gas_assert (y.bitfield.class == ClassNone);
1940 gas_assert (y.bitfield.instance == InstanceNone);
1941
1942 switch (ARRAY_SIZE (x.array))
1943 {
1944 case 3:
1945 x.array [2] &= ~y.array [2];
1946 /* Fall through. */
1947 case 2:
1948 x.array [1] &= ~y.array [1];
1949 /* Fall through. */
1950 case 1:
1951 x.array [0] &= ~y.array [0];
1952 break;
1953 default:
1954 abort ();
1955 }
1956 return x;
1957 }
1958
1959 static INLINE i386_operand_type
1960 operand_type_or (i386_operand_type x, i386_operand_type y)
1961 {
1962 gas_assert (x.bitfield.class == ClassNone ||
1963 y.bitfield.class == ClassNone ||
1964 x.bitfield.class == y.bitfield.class);
1965 gas_assert (x.bitfield.instance == InstanceNone ||
1966 y.bitfield.instance == InstanceNone ||
1967 x.bitfield.instance == y.bitfield.instance);
1968
1969 switch (ARRAY_SIZE (x.array))
1970 {
1971 case 3:
1972 x.array [2] |= y.array [2];
1973 /* Fall through. */
1974 case 2:
1975 x.array [1] |= y.array [1];
1976 /* Fall through. */
1977 case 1:
1978 x.array [0] |= y.array [0];
1979 break;
1980 default:
1981 abort ();
1982 }
1983 return x;
1984 }
1985
1986 static INLINE i386_operand_type
1987 operand_type_xor (i386_operand_type x, i386_operand_type y)
1988 {
1989 gas_assert (y.bitfield.class == ClassNone);
1990 gas_assert (y.bitfield.instance == InstanceNone);
1991
1992 switch (ARRAY_SIZE (x.array))
1993 {
1994 case 3:
1995 x.array [2] ^= y.array [2];
1996 /* Fall through. */
1997 case 2:
1998 x.array [1] ^= y.array [1];
1999 /* Fall through. */
2000 case 1:
2001 x.array [0] ^= y.array [0];
2002 break;
2003 default:
2004 abort ();
2005 }
2006 return x;
2007 }
2008
2009 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2010 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2011 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2012 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2013 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2014 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2015 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2016 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2017 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2018 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2019 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2020 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2021 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2022 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2023 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2024 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2025 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2026
2027 enum operand_type
2028 {
2029 reg,
2030 imm,
2031 disp,
2032 anymem
2033 };
2034
2035 static INLINE int
2036 operand_type_check (i386_operand_type t, enum operand_type c)
2037 {
2038 switch (c)
2039 {
2040 case reg:
2041 return t.bitfield.class == Reg;
2042
2043 case imm:
2044 return (t.bitfield.imm8
2045 || t.bitfield.imm8s
2046 || t.bitfield.imm16
2047 || t.bitfield.imm32
2048 || t.bitfield.imm32s
2049 || t.bitfield.imm64);
2050
2051 case disp:
2052 return (t.bitfield.disp8
2053 || t.bitfield.disp16
2054 || t.bitfield.disp32
2055 || t.bitfield.disp32s
2056 || t.bitfield.disp64);
2057
2058 case anymem:
2059 return (t.bitfield.disp8
2060 || t.bitfield.disp16
2061 || t.bitfield.disp32
2062 || t.bitfield.disp32s
2063 || t.bitfield.disp64
2064 || t.bitfield.baseindex);
2065
2066 default:
2067 abort ();
2068 }
2069
2070 return 0;
2071 }
2072
2073 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2074    between operand GIVEN and operand WANTED for instruction template T. */
2075
2076 static INLINE int
2077 match_operand_size (const insn_template *t, unsigned int wanted,
2078 unsigned int given)
2079 {
2080 return !((i.types[given].bitfield.byte
2081 && !t->operand_types[wanted].bitfield.byte)
2082 || (i.types[given].bitfield.word
2083 && !t->operand_types[wanted].bitfield.word)
2084 || (i.types[given].bitfield.dword
2085 && !t->operand_types[wanted].bitfield.dword)
2086 || (i.types[given].bitfield.qword
2087 && !t->operand_types[wanted].bitfield.qword)
2088 || (i.types[given].bitfield.tbyte
2089 && !t->operand_types[wanted].bitfield.tbyte));
2090 }
2091
2092 /* Return 1 if there is no conflict in SIMD register between operand
2093    GIVEN and operand WANTED for instruction template T. */
2094
2095 static INLINE int
2096 match_simd_size (const insn_template *t, unsigned int wanted,
2097 unsigned int given)
2098 {
2099 return !((i.types[given].bitfield.xmmword
2100 && !t->operand_types[wanted].bitfield.xmmword)
2101 || (i.types[given].bitfield.ymmword
2102 && !t->operand_types[wanted].bitfield.ymmword)
2103 || (i.types[given].bitfield.zmmword
2104 && !t->operand_types[wanted].bitfield.zmmword));
2105 }
2106
2107 /* Return 1 if there is no conflict in any size between operand GIVEN
2108    and operand WANTED for instruction template T. */
2109
2110 static INLINE int
2111 match_mem_size (const insn_template *t, unsigned int wanted,
2112 unsigned int given)
2113 {
2114 return (match_operand_size (t, wanted, given)
2115 && !((i.types[given].bitfield.unspecified
2116 && !i.broadcast
2117 && !t->operand_types[wanted].bitfield.unspecified)
2118 || (i.types[given].bitfield.fword
2119 && !t->operand_types[wanted].bitfield.fword)
2120 /* For scalar opcode templates to allow register and memory
2121 operands at the same time, some special casing is needed
2122 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2123 down-conversion vpmov*. */
2124 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2125 && !t->opcode_modifier.broadcast
2126 && (t->operand_types[wanted].bitfield.byte
2127 || t->operand_types[wanted].bitfield.word
2128 || t->operand_types[wanted].bitfield.dword
2129 || t->operand_types[wanted].bitfield.qword))
2130 ? (i.types[given].bitfield.xmmword
2131 || i.types[given].bitfield.ymmword
2132 || i.types[given].bitfield.zmmword)
2133 		 : !match_simd_size (t, wanted, given))));
2134 }
2135
2136 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2137 operands for instruction template T, and it has MATCH_REVERSE set if there
2138 is no size conflict on any operands for the template with operands reversed
2139 (and the template allows for reversing in the first place). */
2140
2141 #define MATCH_STRAIGHT 1
2142 #define MATCH_REVERSE 2
2143
2144 static INLINE unsigned int
2145 operand_size_match (const insn_template *t)
2146 {
2147 unsigned int j, match = MATCH_STRAIGHT;
2148
2149 /* Don't check non-absolute jump instructions. */
2150 if (t->opcode_modifier.jump
2151 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2152 return match;
2153
2154 /* Check memory and accumulator operand size. */
2155 for (j = 0; j < i.operands; j++)
2156 {
2157 if (i.types[j].bitfield.class != Reg
2158 && i.types[j].bitfield.class != RegSIMD
2159 && t->opcode_modifier.anysize)
2160 continue;
2161
2162 if (t->operand_types[j].bitfield.class == Reg
2163 && !match_operand_size (t, j, j))
2164 {
2165 match = 0;
2166 break;
2167 }
2168
2169 if (t->operand_types[j].bitfield.class == RegSIMD
2170 && !match_simd_size (t, j, j))
2171 {
2172 match = 0;
2173 break;
2174 }
2175
2176 if (t->operand_types[j].bitfield.instance == Accum
2177 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2178 {
2179 match = 0;
2180 break;
2181 }
2182
2183 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2184 {
2185 match = 0;
2186 break;
2187 }
2188 }
2189
2190 if (!t->opcode_modifier.d)
2191 {
2192 mismatch:
2193 if (!match)
2194 i.error = operand_size_mismatch;
2195 return match;
2196 }
2197
2198 /* Check reverse. */
2199 gas_assert (i.operands >= 2 && i.operands <= 3);
2200
2201 for (j = 0; j < i.operands; j++)
2202 {
2203 unsigned int given = i.operands - j - 1;
2204
2205 if (t->operand_types[j].bitfield.class == Reg
2206 && !match_operand_size (t, j, given))
2207 goto mismatch;
2208
2209 if (t->operand_types[j].bitfield.class == RegSIMD
2210 && !match_simd_size (t, j, given))
2211 goto mismatch;
2212
2213 if (t->operand_types[j].bitfield.instance == Accum
2214 && (!match_operand_size (t, j, given)
2215 || !match_simd_size (t, j, given)))
2216 goto mismatch;
2217
2218 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2219 goto mismatch;
2220 }
2221
2222 return match | MATCH_REVERSE;
2223 }
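/* Added note: opcode_modifier.d marks templates whose encoding has a
   direction bit, so even when the straight order fails the caller can
   still use the template with source and destination swapped whenever
   MATCH_REVERSE is set in the value returned above.  */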
2224
2225 static INLINE int
2226 operand_type_match (i386_operand_type overlap,
2227 i386_operand_type given)
2228 {
2229 i386_operand_type temp = overlap;
2230
2231 temp.bitfield.unspecified = 0;
2232 temp.bitfield.byte = 0;
2233 temp.bitfield.word = 0;
2234 temp.bitfield.dword = 0;
2235 temp.bitfield.fword = 0;
2236 temp.bitfield.qword = 0;
2237 temp.bitfield.tbyte = 0;
2238 temp.bitfield.xmmword = 0;
2239 temp.bitfield.ymmword = 0;
2240 temp.bitfield.zmmword = 0;
2241 if (operand_type_all_zero (&temp))
2242 goto mismatch;
2243
2244 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2245 return 1;
2246
2247 mismatch:
2248 i.error = operand_type_mismatch;
2249 return 0;
2250 }
2251
2252 /* If given types g0 and g1 are registers, they must be of the same type
2253 unless the expected operand type register overlap is null.
2254 Some Intel syntax memory operand size checking also happens here. */
2255
2256 static INLINE int
2257 operand_type_register_match (i386_operand_type g0,
2258 i386_operand_type t0,
2259 i386_operand_type g1,
2260 i386_operand_type t1)
2261 {
2262 if (g0.bitfield.class != Reg
2263 && g0.bitfield.class != RegSIMD
2264 && (!operand_type_check (g0, anymem)
2265 || g0.bitfield.unspecified
2266 || (t0.bitfield.class != Reg
2267 && t0.bitfield.class != RegSIMD)))
2268 return 1;
2269
2270 if (g1.bitfield.class != Reg
2271 && g1.bitfield.class != RegSIMD
2272 && (!operand_type_check (g1, anymem)
2273 || g1.bitfield.unspecified
2274 || (t1.bitfield.class != Reg
2275 && t1.bitfield.class != RegSIMD)))
2276 return 1;
2277
2278 if (g0.bitfield.byte == g1.bitfield.byte
2279 && g0.bitfield.word == g1.bitfield.word
2280 && g0.bitfield.dword == g1.bitfield.dword
2281 && g0.bitfield.qword == g1.bitfield.qword
2282 && g0.bitfield.xmmword == g1.bitfield.xmmword
2283 && g0.bitfield.ymmword == g1.bitfield.ymmword
2284 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2285 return 1;
2286
2287 if (!(t0.bitfield.byte & t1.bitfield.byte)
2288 && !(t0.bitfield.word & t1.bitfield.word)
2289 && !(t0.bitfield.dword & t1.bitfield.dword)
2290 && !(t0.bitfield.qword & t1.bitfield.qword)
2291 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2292 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2293 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2294 return 1;
2295
2296 i.error = register_type_mismatch;
2297
2298 return 0;
2299 }
2300
2301 static INLINE unsigned int
2302 register_number (const reg_entry *r)
2303 {
2304 unsigned int nr = r->reg_num;
2305
2306 if (r->reg_flags & RegRex)
2307 nr += 8;
2308
2309 if (r->reg_flags & RegVRex)
2310 nr += 16;
2311
2312 return nr;
2313 }
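/* Examples (illustrative): %r9 is stored as reg_num 1 with RegRex
   set, so register_number returns 9; an upper-bank SIMD register such
   as %xmm20 (reg_num 4 with RegVRex) yields 20.  */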
2314
2315 static INLINE unsigned int
2316 mode_from_disp_size (i386_operand_type t)
2317 {
2318 if (t.bitfield.disp8)
2319 return 1;
2320 else if (t.bitfield.disp16
2321 || t.bitfield.disp32
2322 || t.bitfield.disp32s)
2323 return 2;
2324 else
2325 return 0;
2326 }
2327
2328 static INLINE int
2329 fits_in_signed_byte (addressT num)
2330 {
2331 return num + 0x80 <= 0xff;
2332 }
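/* Added note: the addition above exploits unsigned wraparound to map
   the signed range [-0x80, 0x7f] onto [0, 0xff] with one compare;
   fits_in_signed_word below plays the same trick with 0x8000.  */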
2333
2334 static INLINE int
2335 fits_in_unsigned_byte (addressT num)
2336 {
2337 return num <= 0xff;
2338 }
2339
2340 static INLINE int
2341 fits_in_unsigned_word (addressT num)
2342 {
2343 return num <= 0xffff;
2344 }
2345
2346 static INLINE int
2347 fits_in_signed_word (addressT num)
2348 {
2349 return num + 0x8000 <= 0xffff;
2350 }
2351
2352 static INLINE int
2353 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2354 {
2355 #ifndef BFD64
2356 return 1;
2357 #else
2358 return num + 0x80000000 <= 0xffffffff;
2359 #endif
2360 } /* fits_in_signed_long() */
2361
2362 static INLINE int
2363 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2364 {
2365 #ifndef BFD64
2366 return 1;
2367 #else
2368 return num <= 0xffffffff;
2369 #endif
2370 } /* fits_in_unsigned_long() */
2371
2372 static INLINE int
2373 fits_in_disp8 (offsetT num)
2374 {
2375 int shift = i.memshift;
2376 unsigned int mask;
2377
2378 if (shift == -1)
2379 abort ();
2380
2381 mask = (1 << shift) - 1;
2382
2383 /* Return 0 if NUM isn't properly aligned. */
2384 if ((num & mask))
2385 return 0;
2386
2387 /* Check if NUM will fit in 8bit after shift. */
2388 return fits_in_signed_byte (num >> shift);
2389 }
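/* Example (illustrative): with i.memshift == 4 (disp8 scaled by a
   16-byte element size under EVEX), a displacement of 0x40 is aligned
   and 0x40 >> 4 == 4 fits in a signed byte, so it can be emitted as
   the compressed disp8 value 4.  */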
2390
2391 static INLINE int
2392 fits_in_imm4 (offsetT num)
2393 {
2394 return (num & 0xf) == num;
2395 }
2396
2397 static i386_operand_type
2398 smallest_imm_type (offsetT num)
2399 {
2400 i386_operand_type t;
2401
2402 operand_type_set (&t, 0);
2403 t.bitfield.imm64 = 1;
2404
2405 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2406 {
2407 /* This code is disabled on the 486 because all the Imm1 forms
2408 in the opcode table are slower on the i486. They're the
2409 versions with the implicitly specified single-position
2410 displacement, which has another syntax if you really want to
2411 use that form. */
2412 t.bitfield.imm1 = 1;
2413 t.bitfield.imm8 = 1;
2414 t.bitfield.imm8s = 1;
2415 t.bitfield.imm16 = 1;
2416 t.bitfield.imm32 = 1;
2417 t.bitfield.imm32s = 1;
2418 }
2419 else if (fits_in_signed_byte (num))
2420 {
2421 t.bitfield.imm8 = 1;
2422 t.bitfield.imm8s = 1;
2423 t.bitfield.imm16 = 1;
2424 t.bitfield.imm32 = 1;
2425 t.bitfield.imm32s = 1;
2426 }
2427 else if (fits_in_unsigned_byte (num))
2428 {
2429 t.bitfield.imm8 = 1;
2430 t.bitfield.imm16 = 1;
2431 t.bitfield.imm32 = 1;
2432 t.bitfield.imm32s = 1;
2433 }
2434 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2435 {
2436 t.bitfield.imm16 = 1;
2437 t.bitfield.imm32 = 1;
2438 t.bitfield.imm32s = 1;
2439 }
2440 else if (fits_in_signed_long (num))
2441 {
2442 t.bitfield.imm32 = 1;
2443 t.bitfield.imm32s = 1;
2444 }
2445 else if (fits_in_unsigned_long (num))
2446 t.bitfield.imm32 = 1;
2447
2448 return t;
2449 }
2450
2451 static offsetT
2452 offset_in_range (offsetT val, int size)
2453 {
2454 addressT mask;
2455
2456 switch (size)
2457 {
2458 case 1: mask = ((addressT) 1 << 8) - 1; break;
2459 case 2: mask = ((addressT) 1 << 16) - 1; break;
2460 case 4: mask = ((addressT) 2 << 31) - 1; break;
2461 #ifdef BFD64
2462 case 8: mask = ((addressT) 2 << 63) - 1; break;
2463 #endif
2464 default: abort ();
2465 }
2466
2467 #ifdef BFD64
2468 /* If BFD64, sign extend val for 32bit address mode. */
2469 if (flag_code != CODE_64BIT
2470 || i.prefix[ADDR_PREFIX])
2471 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2472 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2473 #endif
2474
2475 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2476 {
2477 char buf1[40], buf2[40];
2478
2479 sprint_value (buf1, val);
2480 sprint_value (buf2, val & mask);
2481 as_warn (_("%s shortened to %s"), buf1, buf2);
2482 }
2483 return val & mask;
2484 }
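/* Example (illustrative): offset_in_range (0x12345, 2) masks the
   value down to 0x2345 and issues the "shortened to" warning above,
   since 0x12345 fits in neither the signed nor the unsigned 16-bit
   range.  */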
2485
2486 enum PREFIX_GROUP
2487 {
2488 PREFIX_EXIST = 0,
2489 PREFIX_LOCK,
2490 PREFIX_REP,
2491 PREFIX_DS,
2492 PREFIX_OTHER
2493 };
2494
2495 /* Returns
2496 a. PREFIX_EXIST if attempting to add a prefix where one from the
2497 same class already exists.
2498 b. PREFIX_LOCK if lock prefix is added.
2499 c. PREFIX_REP if rep/repne prefix is added.
2500 d. PREFIX_DS if ds prefix is added.
2501 e. PREFIX_OTHER if other prefix is added.
2502 */
2503
2504 static enum PREFIX_GROUP
2505 add_prefix (unsigned int prefix)
2506 {
2507 enum PREFIX_GROUP ret = PREFIX_OTHER;
2508 unsigned int q;
2509
2510 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2511 && flag_code == CODE_64BIT)
2512 {
2513 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2514 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2515 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2516 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2517 ret = PREFIX_EXIST;
2518 q = REX_PREFIX;
2519 }
2520 else
2521 {
2522 switch (prefix)
2523 {
2524 default:
2525 abort ();
2526
2527 case DS_PREFIX_OPCODE:
2528 ret = PREFIX_DS;
2529 /* Fall through. */
2530 case CS_PREFIX_OPCODE:
2531 case ES_PREFIX_OPCODE:
2532 case FS_PREFIX_OPCODE:
2533 case GS_PREFIX_OPCODE:
2534 case SS_PREFIX_OPCODE:
2535 q = SEG_PREFIX;
2536 break;
2537
2538 case REPNE_PREFIX_OPCODE:
2539 case REPE_PREFIX_OPCODE:
2540 q = REP_PREFIX;
2541 ret = PREFIX_REP;
2542 break;
2543
2544 case LOCK_PREFIX_OPCODE:
2545 q = LOCK_PREFIX;
2546 ret = PREFIX_LOCK;
2547 break;
2548
2549 case FWAIT_OPCODE:
2550 q = WAIT_PREFIX;
2551 break;
2552
2553 case ADDR_PREFIX_OPCODE:
2554 q = ADDR_PREFIX;
2555 break;
2556
2557 case DATA_PREFIX_OPCODE:
2558 q = DATA_PREFIX;
2559 break;
2560 }
2561 if (i.prefix[q] != 0)
2562 ret = PREFIX_EXIST;
2563 }
2564
2565 if (ret)
2566 {
2567 if (!i.prefix[q])
2568 ++i.prefixes;
2569 i.prefix[q] |= prefix;
2570 }
2571 else
2572 as_bad (_("same type of prefix used twice"));
2573
2574 return ret;
2575 }
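/* Example (illustrative): a second add_prefix (LOCK_PREFIX_OPCODE)
   for the same insn finds i.prefix[LOCK_PREFIX] already set, so RET
   becomes PREFIX_EXIST (0), the "same type of prefix used twice"
   diagnostic fires, and the duplicate is not recorded.  */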
2576
2577 static void
2578 update_code_flag (int value, int check)
2579 {
2580 PRINTF_LIKE ((*as_error));
2581
2582 flag_code = (enum flag_code) value;
2583 if (flag_code == CODE_64BIT)
2584 {
2585 cpu_arch_flags.bitfield.cpu64 = 1;
2586 cpu_arch_flags.bitfield.cpuno64 = 0;
2587 }
2588 else
2589 {
2590 cpu_arch_flags.bitfield.cpu64 = 0;
2591 cpu_arch_flags.bitfield.cpuno64 = 1;
2592 }
2593   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2594 {
2595 if (check)
2596 as_error = as_fatal;
2597 else
2598 as_error = as_bad;
2599 (*as_error) (_("64bit mode not supported on `%s'."),
2600 cpu_arch_name ? cpu_arch_name : default_arch);
2601 }
2602 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2603 {
2604 if (check)
2605 as_error = as_fatal;
2606 else
2607 as_error = as_bad;
2608 (*as_error) (_("32bit mode not supported on `%s'."),
2609 cpu_arch_name ? cpu_arch_name : default_arch);
2610 }
2611 stackop_size = '\0';
2612 }
2613
2614 static void
2615 set_code_flag (int value)
2616 {
2617 update_code_flag (value, 0);
2618 }
2619
2620 static void
2621 set_16bit_gcc_code_flag (int new_code_flag)
2622 {
2623 flag_code = (enum flag_code) new_code_flag;
2624 if (flag_code != CODE_16BIT)
2625 abort ();
2626 cpu_arch_flags.bitfield.cpu64 = 0;
2627 cpu_arch_flags.bitfield.cpuno64 = 1;
2628 stackop_size = LONG_MNEM_SUFFIX;
2629 }
2630
2631 static void
2632 set_intel_syntax (int syntax_flag)
2633 {
2634 /* Find out if register prefixing is specified. */
2635 int ask_naked_reg = 0;
2636
2637 SKIP_WHITESPACE ();
2638 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2639 {
2640 char *string;
2641 int e = get_symbol_name (&string);
2642
2643 if (strcmp (string, "prefix") == 0)
2644 ask_naked_reg = 1;
2645 else if (strcmp (string, "noprefix") == 0)
2646 ask_naked_reg = -1;
2647 else
2648 as_bad (_("bad argument to syntax directive."));
2649 (void) restore_line_pointer (e);
2650 }
2651 demand_empty_rest_of_line ();
2652
2653 intel_syntax = syntax_flag;
2654
2655 if (ask_naked_reg == 0)
2656 allow_naked_reg = (intel_syntax
2657 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2658 else
2659 allow_naked_reg = (ask_naked_reg < 0);
2660
2661 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2662
2663 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2664 identifier_chars['$'] = intel_syntax ? '$' : 0;
2665 register_prefix = allow_naked_reg ? "" : "%";
2666 }
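/* Example (illustrative): `.intel_syntax noprefix' reaches this point
   with ask_naked_reg == -1, so allow_naked_reg becomes non-zero and
   register_prefix is set to "", letting operands name registers as
   plain eax rather than %eax.  */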
2667
2668 static void
2669 set_intel_mnemonic (int mnemonic_flag)
2670 {
2671 intel_mnemonic = mnemonic_flag;
2672 }
2673
2674 static void
2675 set_allow_index_reg (int flag)
2676 {
2677 allow_index_reg = flag;
2678 }
2679
2680 static void
2681 set_check (int what)
2682 {
2683 enum check_kind *kind;
2684 const char *str;
2685
2686 if (what)
2687 {
2688 kind = &operand_check;
2689 str = "operand";
2690 }
2691 else
2692 {
2693 kind = &sse_check;
2694 str = "sse";
2695 }
2696
2697 SKIP_WHITESPACE ();
2698
2699 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2700 {
2701 char *string;
2702 int e = get_symbol_name (&string);
2703
2704 if (strcmp (string, "none") == 0)
2705 *kind = check_none;
2706 else if (strcmp (string, "warning") == 0)
2707 *kind = check_warning;
2708 else if (strcmp (string, "error") == 0)
2709 *kind = check_error;
2710 else
2711 as_bad (_("bad argument to %s_check directive."), str);
2712 (void) restore_line_pointer (e);
2713 }
2714 else
2715 as_bad (_("missing argument for %s_check directive"), str);
2716
2717 demand_empty_rest_of_line ();
2718 }
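/* Example (illustrative): `.sse_check warning' is handled here with
   WHAT == 0, setting sse_check to check_warning; the same routine
   services `.operand_check' when WHAT is non-zero.  */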
2719
2720 static void
2721 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2722 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2723 {
2724 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2725 static const char *arch;
2726
2727   /* Intel MCU, L1OM and K1OM are only supported on ELF.  */
2728 if (!IS_ELF)
2729 return;
2730
2731 if (!arch)
2732 {
2733 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2734 use default_arch. */
2735 arch = cpu_arch_name;
2736 if (!arch)
2737 arch = default_arch;
2738 }
2739
2740 /* If we are targeting Intel MCU, we must enable it. */
2741 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2742 || new_flag.bitfield.cpuiamcu)
2743 return;
2744
2745 /* If we are targeting Intel L1OM, we must enable it. */
2746 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2747 || new_flag.bitfield.cpul1om)
2748 return;
2749
2750 /* If we are targeting Intel K1OM, we must enable it. */
2751 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2752 || new_flag.bitfield.cpuk1om)
2753 return;
2754
2755 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2756 #endif
2757 }
2758
2759 static void
2760 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2761 {
2762 SKIP_WHITESPACE ();
2763
2764 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2765 {
2766 char *string;
2767 int e = get_symbol_name (&string);
2768 unsigned int j;
2769 i386_cpu_flags flags;
2770
2771 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2772 {
2773 if (strcmp (string, cpu_arch[j].name) == 0)
2774 {
2775 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2776
2777 if (*string != '.')
2778 {
2779 cpu_arch_name = cpu_arch[j].name;
2780 cpu_sub_arch_name = NULL;
2781 cpu_arch_flags = cpu_arch[j].flags;
2782 if (flag_code == CODE_64BIT)
2783 {
2784 cpu_arch_flags.bitfield.cpu64 = 1;
2785 cpu_arch_flags.bitfield.cpuno64 = 0;
2786 }
2787 else
2788 {
2789 cpu_arch_flags.bitfield.cpu64 = 0;
2790 cpu_arch_flags.bitfield.cpuno64 = 1;
2791 }
2792 cpu_arch_isa = cpu_arch[j].type;
2793 cpu_arch_isa_flags = cpu_arch[j].flags;
2794 if (!cpu_arch_tune_set)
2795 {
2796 cpu_arch_tune = cpu_arch_isa;
2797 cpu_arch_tune_flags = cpu_arch_isa_flags;
2798 }
2799 break;
2800 }
2801
2802 flags = cpu_flags_or (cpu_arch_flags,
2803 cpu_arch[j].flags);
2804
2805 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2806 {
2807 if (cpu_sub_arch_name)
2808 {
2809 char *name = cpu_sub_arch_name;
2810 cpu_sub_arch_name = concat (name,
2811 cpu_arch[j].name,
2812 (const char *) NULL);
2813 free (name);
2814 }
2815 else
2816 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2817 cpu_arch_flags = flags;
2818 cpu_arch_isa_flags = flags;
2819 }
2820 else
2821 cpu_arch_isa_flags
2822 = cpu_flags_or (cpu_arch_isa_flags,
2823 cpu_arch[j].flags);
2824 (void) restore_line_pointer (e);
2825 demand_empty_rest_of_line ();
2826 return;
2827 }
2828 }
2829
2830 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2831 {
2832 /* Disable an ISA extension. */
2833 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2834 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2835 {
2836 flags = cpu_flags_and_not (cpu_arch_flags,
2837 cpu_noarch[j].flags);
2838 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2839 {
2840 if (cpu_sub_arch_name)
2841 {
2842 char *name = cpu_sub_arch_name;
2843 cpu_sub_arch_name = concat (name, string,
2844 (const char *) NULL);
2845 free (name);
2846 }
2847 else
2848 cpu_sub_arch_name = xstrdup (string);
2849 cpu_arch_flags = flags;
2850 cpu_arch_isa_flags = flags;
2851 }
2852 (void) restore_line_pointer (e);
2853 demand_empty_rest_of_line ();
2854 return;
2855 }
2856
2857 j = ARRAY_SIZE (cpu_arch);
2858 }
2859
2860 if (j >= ARRAY_SIZE (cpu_arch))
2861 as_bad (_("no such architecture: `%s'"), string);
2862
2863 *input_line_pointer = e;
2864 }
2865 else
2866 as_bad (_("missing cpu architecture"));
2867
2868 no_cond_jump_promotion = 0;
2869 if (*input_line_pointer == ','
2870 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2871 {
2872 char *string;
2873 char e;
2874
2875 ++input_line_pointer;
2876 e = get_symbol_name (&string);
2877
2878 if (strcmp (string, "nojumps") == 0)
2879 no_cond_jump_promotion = 1;
2880 else if (strcmp (string, "jumps") == 0)
2881 ;
2882 else
2883 as_bad (_("no such architecture modifier: `%s'"), string);
2884
2885 (void) restore_line_pointer (e);
2886 }
2887
2888 demand_empty_rest_of_line ();
2889 }
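/* Examples (illustrative): `.arch i686' replaces the base
   architecture; `.arch .avx2' (an extension entry, whose name starts
   with a dot) ORs the extension flags in; `.arch .noavx2' strips them
   via cpu_flags_and_not; and a trailing `,nojumps' suppresses
   conditional jump promotion as parsed above.  */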
2890
2891 enum bfd_architecture
2892 i386_arch (void)
2893 {
2894 if (cpu_arch_isa == PROCESSOR_L1OM)
2895 {
2896 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2897 || flag_code != CODE_64BIT)
2898 as_fatal (_("Intel L1OM is 64bit ELF only"));
2899 return bfd_arch_l1om;
2900 }
2901 else if (cpu_arch_isa == PROCESSOR_K1OM)
2902 {
2903 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2904 || flag_code != CODE_64BIT)
2905 as_fatal (_("Intel K1OM is 64bit ELF only"));
2906 return bfd_arch_k1om;
2907 }
2908 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2909 {
2910 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2911 || flag_code == CODE_64BIT)
2912 as_fatal (_("Intel MCU is 32bit ELF only"));
2913 return bfd_arch_iamcu;
2914 }
2915 else
2916 return bfd_arch_i386;
2917 }
2918
2919 unsigned long
2920 i386_mach (void)
2921 {
2922 if (!strncmp (default_arch, "x86_64", 6))
2923 {
2924 if (cpu_arch_isa == PROCESSOR_L1OM)
2925 {
2926 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2927 || default_arch[6] != '\0')
2928 as_fatal (_("Intel L1OM is 64bit ELF only"));
2929 return bfd_mach_l1om;
2930 }
2931 else if (cpu_arch_isa == PROCESSOR_K1OM)
2932 {
2933 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2934 || default_arch[6] != '\0')
2935 as_fatal (_("Intel K1OM is 64bit ELF only"));
2936 return bfd_mach_k1om;
2937 }
2938 else if (default_arch[6] == '\0')
2939 return bfd_mach_x86_64;
2940 else
2941 return bfd_mach_x64_32;
2942 }
2943 else if (!strcmp (default_arch, "i386")
2944 || !strcmp (default_arch, "iamcu"))
2945 {
2946 if (cpu_arch_isa == PROCESSOR_IAMCU)
2947 {
2948 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2949 as_fatal (_("Intel MCU is 32bit ELF only"));
2950 return bfd_mach_i386_iamcu;
2951 }
2952 else
2953 return bfd_mach_i386_i386;
2954 }
2955 else
2956 as_fatal (_("unknown architecture"));
2957 }
2958 \f
2959 void
2960 md_begin (void)
2961 {
2962 const char *hash_err;
2963
2964 /* Support pseudo prefixes like {disp32}. */
2965 lex_type ['{'] = LEX_BEGIN_NAME;
2966
2967 /* Initialize op_hash hash table. */
2968 op_hash = hash_new ();
2969
2970 {
2971 const insn_template *optab;
2972 templates *core_optab;
2973
2974 /* Setup for loop. */
2975 optab = i386_optab;
2976 core_optab = XNEW (templates);
2977 core_optab->start = optab;
2978
2979 while (1)
2980 {
2981 ++optab;
2982 if (optab->name == NULL
2983 || strcmp (optab->name, (optab - 1)->name) != 0)
2984 {
2985 	    /* different name --> finish the current template list,
2986 	       add it to the hash table, and begin a new one.  */
2987 core_optab->end = optab;
2988 hash_err = hash_insert (op_hash,
2989 (optab - 1)->name,
2990 (void *) core_optab);
2991 if (hash_err)
2992 {
2993 as_fatal (_("can't hash %s: %s"),
2994 (optab - 1)->name,
2995 hash_err);
2996 }
2997 if (optab->name == NULL)
2998 break;
2999 core_optab = XNEW (templates);
3000 core_optab->start = optab;
3001 }
3002 }
3003 }
3004
3005 /* Initialize reg_hash hash table. */
3006 reg_hash = hash_new ();
3007 {
3008 const reg_entry *regtab;
3009 unsigned int regtab_size = i386_regtab_size;
3010
3011 for (regtab = i386_regtab; regtab_size--; regtab++)
3012 {
3013 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3014 if (hash_err)
3015 as_fatal (_("can't hash %s: %s"),
3016 regtab->reg_name,
3017 hash_err);
3018 }
3019 }
3020
3021 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3022 {
3023 int c;
3024 char *p;
3025
3026 for (c = 0; c < 256; c++)
3027 {
3028 if (ISDIGIT (c))
3029 {
3030 digit_chars[c] = c;
3031 mnemonic_chars[c] = c;
3032 register_chars[c] = c;
3033 operand_chars[c] = c;
3034 }
3035 else if (ISLOWER (c))
3036 {
3037 mnemonic_chars[c] = c;
3038 register_chars[c] = c;
3039 operand_chars[c] = c;
3040 }
3041 else if (ISUPPER (c))
3042 {
3043 mnemonic_chars[c] = TOLOWER (c);
3044 register_chars[c] = mnemonic_chars[c];
3045 operand_chars[c] = c;
3046 }
3047 else if (c == '{' || c == '}')
3048 {
3049 mnemonic_chars[c] = c;
3050 operand_chars[c] = c;
3051 }
3052
3053 if (ISALPHA (c) || ISDIGIT (c))
3054 identifier_chars[c] = c;
3055 else if (c >= 128)
3056 {
3057 identifier_chars[c] = c;
3058 operand_chars[c] = c;
3059 }
3060 }
3061
3062 #ifdef LEX_AT
3063 identifier_chars['@'] = '@';
3064 #endif
3065 #ifdef LEX_QM
3066 identifier_chars['?'] = '?';
3067 operand_chars['?'] = '?';
3068 #endif
3069 digit_chars['-'] = '-';
3070 mnemonic_chars['_'] = '_';
3071 mnemonic_chars['-'] = '-';
3072 mnemonic_chars['.'] = '.';
3073 identifier_chars['_'] = '_';
3074 identifier_chars['.'] = '.';
3075
3076 for (p = operand_special_chars; *p != '\0'; p++)
3077 operand_chars[(unsigned char) *p] = *p;
3078 }
3079
3080 if (flag_code == CODE_64BIT)
3081 {
3082 #if defined (OBJ_COFF) && defined (TE_PE)
3083 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3084 ? 32 : 16);
3085 #else
3086 x86_dwarf2_return_column = 16;
3087 #endif
3088 x86_cie_data_alignment = -8;
3089 }
3090 else
3091 {
3092 x86_dwarf2_return_column = 8;
3093 x86_cie_data_alignment = -4;
3094 }
3095
3096 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3097      can be turned into a BRANCH_PREFIX frag.  */
3098 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3099 abort ();
3100 }
3101
3102 void
3103 i386_print_statistics (FILE *file)
3104 {
3105 hash_print_statistics (file, "i386 opcode", op_hash);
3106 hash_print_statistics (file, "i386 register", reg_hash);
3107 }
3108 \f
3109 #ifdef DEBUG386
3110
3111 /* Debugging routines for md_assemble. */
3112 static void pte (insn_template *);
3113 static void pt (i386_operand_type);
3114 static void pe (expressionS *);
3115 static void ps (symbolS *);
3116
3117 static void
3118 pi (const char *line, i386_insn *x)
3119 {
3120 unsigned int j;
3121
3122 fprintf (stdout, "%s: template ", line);
3123 pte (&x->tm);
3124 fprintf (stdout, " address: base %s index %s scale %x\n",
3125 x->base_reg ? x->base_reg->reg_name : "none",
3126 x->index_reg ? x->index_reg->reg_name : "none",
3127 x->log2_scale_factor);
3128 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3129 x->rm.mode, x->rm.reg, x->rm.regmem);
3130 fprintf (stdout, " sib: base %x index %x scale %x\n",
3131 x->sib.base, x->sib.index, x->sib.scale);
3132 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3133 (x->rex & REX_W) != 0,
3134 (x->rex & REX_R) != 0,
3135 (x->rex & REX_X) != 0,
3136 (x->rex & REX_B) != 0);
3137 for (j = 0; j < x->operands; j++)
3138 {
3139 fprintf (stdout, " #%d: ", j + 1);
3140 pt (x->types[j]);
3141 fprintf (stdout, "\n");
3142 if (x->types[j].bitfield.class == Reg
3143 || x->types[j].bitfield.class == RegMMX
3144 || x->types[j].bitfield.class == RegSIMD
3145 || x->types[j].bitfield.class == SReg
3146 || x->types[j].bitfield.class == RegCR
3147 || x->types[j].bitfield.class == RegDR
3148 || x->types[j].bitfield.class == RegTR)
3149 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3150 if (operand_type_check (x->types[j], imm))
3151 pe (x->op[j].imms);
3152 if (operand_type_check (x->types[j], disp))
3153 pe (x->op[j].disps);
3154 }
3155 }
3156
3157 static void
3158 pte (insn_template *t)
3159 {
3160 unsigned int j;
3161 fprintf (stdout, " %d operands ", t->operands);
3162 fprintf (stdout, "opcode %x ", t->base_opcode);
3163 if (t->extension_opcode != None)
3164 fprintf (stdout, "ext %x ", t->extension_opcode);
3165 if (t->opcode_modifier.d)
3166 fprintf (stdout, "D");
3167 if (t->opcode_modifier.w)
3168 fprintf (stdout, "W");
3169 fprintf (stdout, "\n");
3170 for (j = 0; j < t->operands; j++)
3171 {
3172 fprintf (stdout, " #%d type ", j + 1);
3173 pt (t->operand_types[j]);
3174 fprintf (stdout, "\n");
3175 }
3176 }
3177
3178 static void
3179 pe (expressionS *e)
3180 {
3181 fprintf (stdout, " operation %d\n", e->X_op);
3182 fprintf (stdout, " add_number %ld (%lx)\n",
3183 (long) e->X_add_number, (long) e->X_add_number);
3184 if (e->X_add_symbol)
3185 {
3186 fprintf (stdout, " add_symbol ");
3187 ps (e->X_add_symbol);
3188 fprintf (stdout, "\n");
3189 }
3190 if (e->X_op_symbol)
3191 {
3192 fprintf (stdout, " op_symbol ");
3193 ps (e->X_op_symbol);
3194 fprintf (stdout, "\n");
3195 }
3196 }
3197
3198 static void
3199 ps (symbolS *s)
3200 {
3201 fprintf (stdout, "%s type %s%s",
3202 S_GET_NAME (s),
3203 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3204 segment_name (S_GET_SEGMENT (s)));
3205 }
3206
3207 static struct type_name
3208 {
3209 i386_operand_type mask;
3210 const char *name;
3211 }
3212 const type_names[] =
3213 {
3214 { OPERAND_TYPE_REG8, "r8" },
3215 { OPERAND_TYPE_REG16, "r16" },
3216 { OPERAND_TYPE_REG32, "r32" },
3217 { OPERAND_TYPE_REG64, "r64" },
3218 { OPERAND_TYPE_ACC8, "acc8" },
3219 { OPERAND_TYPE_ACC16, "acc16" },
3220 { OPERAND_TYPE_ACC32, "acc32" },
3221 { OPERAND_TYPE_ACC64, "acc64" },
3222 { OPERAND_TYPE_IMM8, "i8" },
3223 { OPERAND_TYPE_IMM8, "i8s" },
3224 { OPERAND_TYPE_IMM16, "i16" },
3225 { OPERAND_TYPE_IMM32, "i32" },
3226 { OPERAND_TYPE_IMM32S, "i32s" },
3227 { OPERAND_TYPE_IMM64, "i64" },
3228 { OPERAND_TYPE_IMM1, "i1" },
3229 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3230 { OPERAND_TYPE_DISP8, "d8" },
3231 { OPERAND_TYPE_DISP16, "d16" },
3232 { OPERAND_TYPE_DISP32, "d32" },
3233 { OPERAND_TYPE_DISP32S, "d32s" },
3234 { OPERAND_TYPE_DISP64, "d64" },
3235 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3236 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3237 { OPERAND_TYPE_CONTROL, "control reg" },
3238 { OPERAND_TYPE_TEST, "test reg" },
3239 { OPERAND_TYPE_DEBUG, "debug reg" },
3240 { OPERAND_TYPE_FLOATREG, "FReg" },
3241 { OPERAND_TYPE_FLOATACC, "FAcc" },
3242 { OPERAND_TYPE_SREG, "SReg" },
3243 { OPERAND_TYPE_REGMMX, "rMMX" },
3244 { OPERAND_TYPE_REGXMM, "rXMM" },
3245 { OPERAND_TYPE_REGYMM, "rYMM" },
3246 { OPERAND_TYPE_REGZMM, "rZMM" },
3247 { OPERAND_TYPE_REGMASK, "Mask reg" },
3248 };
3249
3250 static void
3251 pt (i386_operand_type t)
3252 {
3253 unsigned int j;
3254 i386_operand_type a;
3255
3256 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3257 {
3258 a = operand_type_and (t, type_names[j].mask);
3259 if (operand_type_equal (&a, &type_names[j].mask))
3260 fprintf (stdout, "%s, ", type_names[j].name);
3261 }
3262 fflush (stdout);
3263 }
3264
3265 #endif /* DEBUG386 */
3266 \f
3267 static bfd_reloc_code_real_type
3268 reloc (unsigned int size,
3269 int pcrel,
3270 int sign,
3271 bfd_reloc_code_real_type other)
3272 {
3273 if (other != NO_RELOC)
3274 {
3275 reloc_howto_type *rel;
3276
3277 if (size == 8)
3278 switch (other)
3279 {
3280 case BFD_RELOC_X86_64_GOT32:
3281 return BFD_RELOC_X86_64_GOT64;
3282 break;
3283 case BFD_RELOC_X86_64_GOTPLT64:
3284 return BFD_RELOC_X86_64_GOTPLT64;
3285 break;
3286 case BFD_RELOC_X86_64_PLTOFF64:
3287 return BFD_RELOC_X86_64_PLTOFF64;
3288 break;
3289 case BFD_RELOC_X86_64_GOTPC32:
3290 other = BFD_RELOC_X86_64_GOTPC64;
3291 break;
3292 case BFD_RELOC_X86_64_GOTPCREL:
3293 other = BFD_RELOC_X86_64_GOTPCREL64;
3294 break;
3295 case BFD_RELOC_X86_64_TPOFF32:
3296 other = BFD_RELOC_X86_64_TPOFF64;
3297 break;
3298 case BFD_RELOC_X86_64_DTPOFF32:
3299 other = BFD_RELOC_X86_64_DTPOFF64;
3300 break;
3301 default:
3302 break;
3303 }
3304
3305 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3306 if (other == BFD_RELOC_SIZE32)
3307 {
3308 if (size == 8)
3309 other = BFD_RELOC_SIZE64;
3310 if (pcrel)
3311 {
3312 as_bad (_("there are no pc-relative size relocations"));
3313 return NO_RELOC;
3314 }
3315 }
3316 #endif
3317
3318 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3319 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3320 sign = -1;
3321
3322 rel = bfd_reloc_type_lookup (stdoutput, other);
3323 if (!rel)
3324 as_bad (_("unknown relocation (%u)"), other);
3325 else if (size != bfd_get_reloc_size (rel))
3326 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3327 bfd_get_reloc_size (rel),
3328 size);
3329 else if (pcrel && !rel->pc_relative)
3330 as_bad (_("non-pc-relative relocation for pc-relative field"));
3331 else if ((rel->complain_on_overflow == complain_overflow_signed
3332 && !sign)
3333 || (rel->complain_on_overflow == complain_overflow_unsigned
3334 && sign > 0))
3335 as_bad (_("relocated field and relocation type differ in signedness"));
3336 else
3337 return other;
3338 return NO_RELOC;
3339 }
3340
3341 if (pcrel)
3342 {
3343 if (!sign)
3344 as_bad (_("there are no unsigned pc-relative relocations"));
3345 switch (size)
3346 {
3347 case 1: return BFD_RELOC_8_PCREL;
3348 case 2: return BFD_RELOC_16_PCREL;
3349 case 4: return BFD_RELOC_32_PCREL;
3350 case 8: return BFD_RELOC_64_PCREL;
3351 }
3352 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3353 }
3354 else
3355 {
3356 if (sign > 0)
3357 switch (size)
3358 {
3359 case 4: return BFD_RELOC_X86_64_32S;
3360 }
3361 else
3362 switch (size)
3363 {
3364 case 1: return BFD_RELOC_8;
3365 case 2: return BFD_RELOC_16;
3366 case 4: return BFD_RELOC_32;
3367 case 8: return BFD_RELOC_64;
3368 }
3369 as_bad (_("cannot do %s %u byte relocation"),
3370 sign > 0 ? "signed" : "unsigned", size);
3371 }
3372
3373 return NO_RELOC;
3374 }
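/* Examples (illustrative): reloc (4, 1, 1, NO_RELOC) yields
   BFD_RELOC_32_PCREL and reloc (4, 0, 1, NO_RELOC) yields
   BFD_RELOC_X86_64_32S, while an unsigned pc-relative request such as
   reloc (4, 1, 0, NO_RELOC) is diagnosed above before falling back to
   BFD_RELOC_32_PCREL.  */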
3375
3376 /* Here we decide which fixups can be adjusted to make them relative to
3377 the beginning of the section instead of the symbol. Basically we need
3378 to make sure that the dynamic relocations are done correctly, so in
3379 some cases we force the original symbol to be used. */
3380
3381 int
3382 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3383 {
3384 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3385 if (!IS_ELF)
3386 return 1;
3387
3388 /* Don't adjust pc-relative references to merge sections in 64-bit
3389 mode. */
3390 if (use_rela_relocations
3391 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3392 && fixP->fx_pcrel)
3393 return 0;
3394
3395 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3396 and changed later by validate_fix. */
3397 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3398 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3399 return 0;
3400
3401 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3402 for size relocations. */
3403 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3404 || fixP->fx_r_type == BFD_RELOC_SIZE64
3405 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3406 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3407 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3408 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3409 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3410 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3411 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3412 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3413 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3414 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3415 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3416 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3417 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3418 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3419 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3420 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3421 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3422 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3423 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3424 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3425 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3426 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3427 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3428 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3429 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3430 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3431 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3432 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3433 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3434 return 0;
3435 #endif
3436 return 1;
3437 }
3438
3439 static int
3440 intel_float_operand (const char *mnemonic)
3441 {
3442 /* Note that the value returned is meaningful only for opcodes with (memory)
3443 operands, hence the code here is free to improperly handle opcodes that
3444 have no operands (for better performance and smaller code). */
3445
3446 if (mnemonic[0] != 'f')
3447 return 0; /* non-math */
3448
3449 switch (mnemonic[1])
3450 {
3451 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3452        the fs segment override prefix are not currently handled, because no
3453 call path can make opcodes without operands get here */
3454 case 'i':
3455 return 2 /* integer op */;
3456 case 'l':
3457 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3458 return 3; /* fldcw/fldenv */
3459 break;
3460 case 'n':
3461 if (mnemonic[2] != 'o' /* fnop */)
3462 return 3; /* non-waiting control op */
3463 break;
3464 case 'r':
3465 if (mnemonic[2] == 's')
3466 return 3; /* frstor/frstpm */
3467 break;
3468 case 's':
3469 if (mnemonic[2] == 'a')
3470 return 3; /* fsave */
3471 if (mnemonic[2] == 't')
3472 {
3473 switch (mnemonic[3])
3474 {
3475 case 'c': /* fstcw */
3476 case 'd': /* fstdw */
3477 case 'e': /* fstenv */
3478 case 's': /* fsts[gw] */
3479 return 3;
3480 }
3481 }
3482 break;
3483 case 'x':
3484 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3485 return 0; /* fxsave/fxrstor are not really math ops */
3486 break;
3487 }
3488
3489 return 1;
3490 }
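/* Examples (illustrative): "fiadd" returns 2 (integer op), "fldcw"
   and "fnsave" return 3 (control ops), "fxsave" returns 0, and a
   plain "fadd" falls through to the final return 1.  */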
3491
3492 /* Build the VEX prefix. */
3493
3494 static void
3495 build_vex_prefix (const insn_template *t)
3496 {
3497 unsigned int register_specifier;
3498 unsigned int implied_prefix;
3499 unsigned int vector_length;
3500 unsigned int w;
3501
3502 /* Check register specifier. */
3503 if (i.vex.register_specifier)
3504 {
3505 register_specifier =
3506 ~register_number (i.vex.register_specifier) & 0xf;
3507 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3508 }
3509 else
3510 register_specifier = 0xf;
3511
3512 /* Use 2-byte VEX prefix by swapping destination and source operand
3513      if there is more than one register operand.  */
3514 if (i.reg_operands > 1
3515 && i.vec_encoding != vex_encoding_vex3
3516 && i.dir_encoding == dir_encoding_default
3517 && i.operands == i.reg_operands
3518 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3519 && i.tm.opcode_modifier.vexopcode == VEX0F
3520 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3521 && i.rex == REX_B)
3522 {
3523 unsigned int xchg = i.operands - 1;
3524 union i386_op temp_op;
3525 i386_operand_type temp_type;
3526
3527 temp_type = i.types[xchg];
3528 i.types[xchg] = i.types[0];
3529 i.types[0] = temp_type;
3530 temp_op = i.op[xchg];
3531 i.op[xchg] = i.op[0];
3532 i.op[0] = temp_op;
3533
3534 gas_assert (i.rm.mode == 3);
3535
3536 i.rex = REX_R;
3537 xchg = i.rm.regmem;
3538 i.rm.regmem = i.rm.reg;
3539 i.rm.reg = xchg;
3540
3541 if (i.tm.opcode_modifier.d)
3542 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3543 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3544 else /* Use the next insn. */
3545 i.tm = t[1];
3546 }
3547
3548 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3549 are no memory operands and at least 3 register ones. */
3550 if (i.reg_operands >= 3
3551 && i.vec_encoding != vex_encoding_vex3
3552 && i.reg_operands == i.operands - i.imm_operands
3553 && i.tm.opcode_modifier.vex
3554 && i.tm.opcode_modifier.commutative
3555 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3556 && i.rex == REX_B
3557 && i.vex.register_specifier
3558 && !(i.vex.register_specifier->reg_flags & RegRex))
3559 {
3560 unsigned int xchg = i.operands - i.reg_operands;
3561 union i386_op temp_op;
3562 i386_operand_type temp_type;
3563
3564 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3565 gas_assert (!i.tm.opcode_modifier.sae);
3566 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3567 &i.types[i.operands - 3]));
3568 gas_assert (i.rm.mode == 3);
3569
3570 temp_type = i.types[xchg];
3571 i.types[xchg] = i.types[xchg + 1];
3572 i.types[xchg + 1] = temp_type;
3573 temp_op = i.op[xchg];
3574 i.op[xchg] = i.op[xchg + 1];
3575 i.op[xchg + 1] = temp_op;
3576
3577 i.rex = 0;
3578 xchg = i.rm.regmem | 8;
3579 i.rm.regmem = ~register_specifier & 0xf;
3580 gas_assert (!(i.rm.regmem & 8));
3581 i.vex.register_specifier += xchg - i.rm.regmem;
3582 register_specifier = ~xchg & 0xf;
3583 }
3584
3585 if (i.tm.opcode_modifier.vex == VEXScalar)
3586 vector_length = avxscalar;
3587 else if (i.tm.opcode_modifier.vex == VEX256)
3588 vector_length = 1;
3589 else
3590 {
3591 unsigned int op;
3592
3593 /* Determine vector length from the last multi-length vector
3594 operand. */
3595 vector_length = 0;
3596 for (op = t->operands; op--;)
3597 if (t->operand_types[op].bitfield.xmmword
3598 && t->operand_types[op].bitfield.ymmword
3599 && i.types[op].bitfield.ymmword)
3600 {
3601 vector_length = 1;
3602 break;
3603 }
3604 }
3605
3606 switch ((i.tm.base_opcode >> 8) & 0xff)
3607 {
3608 case 0:
3609 implied_prefix = 0;
3610 break;
3611 case DATA_PREFIX_OPCODE:
3612 implied_prefix = 1;
3613 break;
3614 case REPE_PREFIX_OPCODE:
3615 implied_prefix = 2;
3616 break;
3617 case REPNE_PREFIX_OPCODE:
3618 implied_prefix = 3;
3619 break;
3620 default:
3621 abort ();
3622 }
3623
3624 /* Check the REX.W bit and VEXW. */
3625 if (i.tm.opcode_modifier.vexw == VEXWIG)
3626 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3627 else if (i.tm.opcode_modifier.vexw)
3628 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3629 else
3630 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3631
3632 /* Use 2-byte VEX prefix if possible. */
3633 if (w == 0
3634 && i.vec_encoding != vex_encoding_vex3
3635 && i.tm.opcode_modifier.vexopcode == VEX0F
3636 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3637 {
3638 /* 2-byte VEX prefix. */
3639 unsigned int r;
3640
3641 i.vex.length = 2;
3642 i.vex.bytes[0] = 0xc5;
3643
3644 /* Check the REX.R bit. */
3645 r = (i.rex & REX_R) ? 0 : 1;
3646 i.vex.bytes[1] = (r << 7
3647 | register_specifier << 3
3648 | vector_length << 2
3649 | implied_prefix);
3650 }
3651 else
3652 {
3653 /* 3-byte VEX prefix. */
3654 unsigned int m;
3655
3656 i.vex.length = 3;
3657
3658 switch (i.tm.opcode_modifier.vexopcode)
3659 {
3660 case VEX0F:
3661 m = 0x1;
3662 i.vex.bytes[0] = 0xc4;
3663 break;
3664 case VEX0F38:
3665 m = 0x2;
3666 i.vex.bytes[0] = 0xc4;
3667 break;
3668 case VEX0F3A:
3669 m = 0x3;
3670 i.vex.bytes[0] = 0xc4;
3671 break;
3672 case XOP08:
3673 m = 0x8;
3674 i.vex.bytes[0] = 0x8f;
3675 break;
3676 case XOP09:
3677 m = 0x9;
3678 i.vex.bytes[0] = 0x8f;
3679 break;
3680 case XOP0A:
3681 m = 0xa;
3682 i.vex.bytes[0] = 0x8f;
3683 break;
3684 default:
3685 abort ();
3686 }
3687
3688       /* The high 3 bits of the second VEX byte are 1's complement
3689 of RXB bits from REX. */
3690 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3691
3692 i.vex.bytes[2] = (w << 7
3693 | register_specifier << 3
3694 | vector_length << 2
3695 | implied_prefix);
3696 }
3697 }
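/* Added note: the two layouts built above are the 0xC5 two-byte VEX
   form (R, vvvv, L and pp packed into a single byte) and the 0xC4
   three-byte form (RXB plus the map-select field m in byte 1, then
   W, vvvv, L and pp in byte 2); XOP reuses the three-byte layout
   behind an 0x8F escape byte.  */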
3698
3699 static INLINE bfd_boolean
3700 is_evex_encoding (const insn_template *t)
3701 {
3702 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3703 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3704 || t->opcode_modifier.sae;
3705 }
3706
3707 static INLINE bfd_boolean
3708 is_any_vex_encoding (const insn_template *t)
3709 {
3710 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3711 || is_evex_encoding (t);
3712 }
3713
3714 /* Build the EVEX prefix. */
3715
3716 static void
3717 build_evex_prefix (void)
3718 {
3719 unsigned int register_specifier;
3720 unsigned int implied_prefix;
3721 unsigned int m, w;
3722 rex_byte vrex_used = 0;
3723
3724 /* Check register specifier. */
3725 if (i.vex.register_specifier)
3726 {
3727 gas_assert ((i.vrex & REX_X) == 0);
3728
3729 register_specifier = i.vex.register_specifier->reg_num;
3730 if ((i.vex.register_specifier->reg_flags & RegRex))
3731 register_specifier += 8;
3732 /* The upper 16 registers are encoded in the fourth byte of the
3733 EVEX prefix. */
3734 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3735 i.vex.bytes[3] = 0x8;
3736 register_specifier = ~register_specifier & 0xf;
3737 }
3738 else
3739 {
3740 register_specifier = 0xf;
3741
3742 /* Encode upper 16 vector index register in the fourth byte of
3743 the EVEX prefix. */
3744 if (!(i.vrex & REX_X))
3745 i.vex.bytes[3] = 0x8;
3746 else
3747 vrex_used |= REX_X;
3748 }
3749
3750 switch ((i.tm.base_opcode >> 8) & 0xff)
3751 {
3752 case 0:
3753 implied_prefix = 0;
3754 break;
3755 case DATA_PREFIX_OPCODE:
3756 implied_prefix = 1;
3757 break;
3758 case REPE_PREFIX_OPCODE:
3759 implied_prefix = 2;
3760 break;
3761 case REPNE_PREFIX_OPCODE:
3762 implied_prefix = 3;
3763 break;
3764 default:
3765 abort ();
3766 }
3767
3768 /* 4 byte EVEX prefix. */
3769 i.vex.length = 4;
3770 i.vex.bytes[0] = 0x62;
3771
3772 /* mmmm bits. */
3773 switch (i.tm.opcode_modifier.vexopcode)
3774 {
3775 case VEX0F:
3776 m = 1;
3777 break;
3778 case VEX0F38:
3779 m = 2;
3780 break;
3781 case VEX0F3A:
3782 m = 3;
3783 break;
3784 default:
3785 abort ();
3786 break;
3787 }
3788
3789   /* The high 3 bits of the second EVEX byte are 1's complement of RXB
3790 bits from REX. */
3791 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3792
3793   /* The fifth bit of the second EVEX byte is 1's complement of the
3794 REX_R bit in VREX. */
3795 if (!(i.vrex & REX_R))
3796 i.vex.bytes[1] |= 0x10;
3797 else
3798 vrex_used |= REX_R;
3799
3800 if ((i.reg_operands + i.imm_operands) == i.operands)
3801 {
3802 /* When all operands are registers, the REX_X bit in REX is not
3803 used. We reuse it to encode the upper 16 registers, which is
3804 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3805 	 as 1's complement.  */
3806 if ((i.vrex & REX_B))
3807 {
3808 vrex_used |= REX_B;
3809 i.vex.bytes[1] &= ~0x40;
3810 }
3811 }
3812
3813 /* EVEX instructions shouldn't need the REX prefix. */
3814 i.vrex &= ~vrex_used;
3815 gas_assert (i.vrex == 0);
3816
3817 /* Check the REX.W bit and VEXW. */
3818 if (i.tm.opcode_modifier.vexw == VEXWIG)
3819 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3820 else if (i.tm.opcode_modifier.vexw)
3821 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3822 else
3823 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3824
3825 /* Encode the U bit. */
3826 implied_prefix |= 0x4;
3827
3828 /* The third byte of the EVEX prefix. */
3829 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3830
3831 /* The fourth byte of the EVEX prefix. */
3832 /* The zeroing-masking bit. */
3833 if (i.mask && i.mask->zeroing)
3834 i.vex.bytes[3] |= 0x80;
3835
3836   /* EVEX.b is the broadcast bit only when there is no RC; with RC it enables embedded rounding/SAE.  */
3837 if (!i.rounding)
3838 {
3839 /* Encode the vector length. */
3840 unsigned int vec_length;
3841
3842 if (!i.tm.opcode_modifier.evex
3843 || i.tm.opcode_modifier.evex == EVEXDYN)
3844 {
3845 unsigned int op;
3846
3847 /* Determine vector length from the last multi-length vector
3848 operand. */
3849 vec_length = 0;
3850 for (op = i.operands; op--;)
3851 if (i.tm.operand_types[op].bitfield.xmmword
3852 + i.tm.operand_types[op].bitfield.ymmword
3853 + i.tm.operand_types[op].bitfield.zmmword > 1)
3854 {
3855 if (i.types[op].bitfield.zmmword)
3856 {
3857 i.tm.opcode_modifier.evex = EVEX512;
3858 break;
3859 }
3860 else if (i.types[op].bitfield.ymmword)
3861 {
3862 i.tm.opcode_modifier.evex = EVEX256;
3863 break;
3864 }
3865 else if (i.types[op].bitfield.xmmword)
3866 {
3867 i.tm.opcode_modifier.evex = EVEX128;
3868 break;
3869 }
3870 else if (i.broadcast && (int) op == i.broadcast->operand)
3871 {
3872 switch (i.broadcast->bytes)
3873 {
3874 case 64:
3875 i.tm.opcode_modifier.evex = EVEX512;
3876 break;
3877 case 32:
3878 i.tm.opcode_modifier.evex = EVEX256;
3879 break;
3880 case 16:
3881 i.tm.opcode_modifier.evex = EVEX128;
3882 break;
3883 default:
3884 abort ();
3885 }
3886 break;
3887 }
3888 }
3889
3890 if (op >= MAX_OPERANDS)
3891 abort ();
3892 }
3893
3894 switch (i.tm.opcode_modifier.evex)
3895 {
3896 case EVEXLIG: /* LL' is ignored */
3897 vec_length = evexlig << 5;
3898 break;
3899 case EVEX128:
3900 vec_length = 0 << 5;
3901 break;
3902 case EVEX256:
3903 vec_length = 1 << 5;
3904 break;
3905 case EVEX512:
3906 vec_length = 2 << 5;
3907 break;
3908 default:
3909 abort ();
3910 break;
3911 }
3912 i.vex.bytes[3] |= vec_length;
3913 /* Encode the broadcast bit. */
3914 if (i.broadcast)
3915 i.vex.bytes[3] |= 0x10;
3916 }
3917 else
3918 {
3919 if (i.rounding->type != saeonly)
3920 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3921 else
3922 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3923 }
3924
3925 if (i.mask && i.mask->mask)
3926 i.vex.bytes[3] |= i.mask->mask->reg_num;
3927 }
3928
3929 static void
3930 process_immext (void)
3931 {
3932 expressionS *exp;
3933
3934 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3935 which is coded in the same place as an 8-bit immediate field
3936 would be. Here we fake an 8-bit immediate operand from the
3937 opcode suffix stored in tm.extension_opcode.
3938
3939 AVX instructions also use this encoding for some
3940 3-argument instructions. */
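/* For illustration: the 3DNow! insn "pfadd %mm1, %mm0" is 0f 0f /r with
opcode suffix 0x9e; the code below synthesizes that suffix as a fake
imm8 operand so it is emitted where an immediate would go. */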
3941
3942 gas_assert (i.imm_operands <= 1
3943 && (i.operands <= 2
3944 || (is_any_vex_encoding (&i.tm)
3945 && i.operands <= 4)));
3946
3947 exp = &im_expressions[i.imm_operands++];
3948 i.op[i.operands].imms = exp;
3949 i.types[i.operands] = imm8;
3950 i.operands++;
3951 exp->X_op = O_constant;
3952 exp->X_add_number = i.tm.extension_opcode;
3953 i.tm.extension_opcode = None;
3954 }
3955
3956
3957 static int
3958 check_hle (void)
3959 {
3960 switch (i.tm.opcode_modifier.hleprefixok)
3961 {
3962 default:
3963 abort ();
3964 case HLEPrefixNone:
3965 as_bad (_("invalid instruction `%s' after `%s'"),
3966 i.tm.name, i.hle_prefix);
3967 return 0;
3968 case HLEPrefixLock:
3969 if (i.prefix[LOCK_PREFIX])
3970 return 1;
3971 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3972 return 0;
3973 case HLEPrefixAny:
3974 return 1;
3975 case HLEPrefixRelease:
3976 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3977 {
3978 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3979 i.tm.name);
3980 return 0;
3981 }
3982 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3983 {
3984 as_bad (_("memory destination needed for instruction `%s'"
3985 " after `xrelease'"), i.tm.name);
3986 return 0;
3987 }
3988 return 1;
3989 }
3990 }
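/* A few illustrative cases for the checks above (AT&T syntax):
xacquire lock incl (%rax) # ok: HLEPrefixLock with `lock'
xacquire incl (%rax) # error: missing `lock'
xrelease movl %eax, (%rcx) # ok: HLEPrefixRelease, memory destination
xacquire movl %eax, (%rcx) # error: not allowed after `xacquire' */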
3991
3992 /* Try the shortest encoding by shortening operand size. */
3993
3994 static void
3995 optimize_encoding (void)
3996 {
3997 unsigned int j;
3998
3999 if (optimize_for_space
4000 && !is_any_vex_encoding (&i.tm)
4001 && i.reg_operands == 1
4002 && i.imm_operands == 1
4003 && !i.types[1].bitfield.byte
4004 && i.op[0].imms->X_op == O_constant
4005 && fits_in_imm7 (i.op[0].imms->X_add_number)
4006 && (i.tm.base_opcode == 0xa8
4007 || (i.tm.base_opcode == 0xf6
4008 && i.tm.extension_opcode == 0x0)))
4009 {
4010 /* Optimize: -Os:
4011 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4012 */
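/* E.g. "testl $0x7f, %eax" (a9 7f 00 00 00, 5 bytes) becomes
"testb $0x7f, %al" (a8 7f, 2 bytes); with an imm7 the flag results
are unaffected by the narrowing. */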
4013 unsigned int base_regnum = i.op[1].regs->reg_num;
4014 if (flag_code == CODE_64BIT || base_regnum < 4)
4015 {
4016 i.types[1].bitfield.byte = 1;
4017 /* Ignore the suffix. */
4018 i.suffix = 0;
4019 /* Convert to byte registers. */
4020 if (i.types[1].bitfield.word)
4021 j = 16;
4022 else if (i.types[1].bitfield.dword)
4023 j = 32;
4024 else
4025 j = 48;
4026 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4027 j += 8;
4028 i.op[1].regs -= j;
4029 }
4030 }
4031 else if (flag_code == CODE_64BIT
4032 && !is_any_vex_encoding (&i.tm)
4033 && ((i.types[1].bitfield.qword
4034 && i.reg_operands == 1
4035 && i.imm_operands == 1
4036 && i.op[0].imms->X_op == O_constant
4037 && ((i.tm.base_opcode == 0xb8
4038 && i.tm.extension_opcode == None
4039 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4040 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4041 && ((i.tm.base_opcode == 0x24
4042 || i.tm.base_opcode == 0xa8)
4043 || (i.tm.base_opcode == 0x80
4044 && i.tm.extension_opcode == 0x4)
4045 || ((i.tm.base_opcode == 0xf6
4046 || (i.tm.base_opcode | 1) == 0xc7)
4047 && i.tm.extension_opcode == 0x0)))
4048 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4049 && i.tm.base_opcode == 0x83
4050 && i.tm.extension_opcode == 0x4)))
4051 || (i.types[0].bitfield.qword
4052 && ((i.reg_operands == 2
4053 && i.op[0].regs == i.op[1].regs
4054 && (i.tm.base_opcode == 0x30
4055 || i.tm.base_opcode == 0x28))
4056 || (i.reg_operands == 1
4057 && i.operands == 1
4058 && i.tm.base_opcode == 0x30)))))
4059 {
4060 /* Optimize: -O:
4061 andq $imm31, %r64 -> andl $imm31, %r32
4062 andq $imm7, %r64 -> andl $imm7, %r32
4063 testq $imm31, %r64 -> testl $imm31, %r32
4064 xorq %r64, %r64 -> xorl %r32, %r32
4065 subq %r64, %r64 -> subl %r32, %r32
4066 movq $imm31, %r64 -> movl $imm31, %r32
4067 movq $imm32, %r64 -> movl $imm32, %r32
4068 */
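/* E.g. "movq $1, %rax" (48 c7 c0 01 00 00 00, 7 bytes) becomes
"movl $1, %eax" (b8 01 00 00 00, 5 bytes); the two are equivalent
because writes to 32-bit registers zero-extend to 64 bits. */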
4069 i.tm.opcode_modifier.norex64 = 1;
4070 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4071 {
4072 /* Handle
4073 movq $imm31, %r64 -> movl $imm31, %r32
4074 movq $imm32, %r64 -> movl $imm32, %r32
4075 */
4076 i.tm.operand_types[0].bitfield.imm32 = 1;
4077 i.tm.operand_types[0].bitfield.imm32s = 0;
4078 i.tm.operand_types[0].bitfield.imm64 = 0;
4079 i.types[0].bitfield.imm32 = 1;
4080 i.types[0].bitfield.imm32s = 0;
4081 i.types[0].bitfield.imm64 = 0;
4082 i.types[1].bitfield.dword = 1;
4083 i.types[1].bitfield.qword = 0;
4084 if ((i.tm.base_opcode | 1) == 0xc7)
4085 {
4086 /* Handle
4087 movq $imm31, %r64 -> movl $imm31, %r32
4088 */
4089 i.tm.base_opcode = 0xb8;
4090 i.tm.extension_opcode = None;
4091 i.tm.opcode_modifier.w = 0;
4092 i.tm.opcode_modifier.modrm = 0;
4093 }
4094 }
4095 }
4096 else if (optimize > 1
4097 && !optimize_for_space
4098 && !is_any_vex_encoding (&i.tm)
4099 && i.reg_operands == 2
4100 && i.op[0].regs == i.op[1].regs
4101 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4102 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4103 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4104 {
4105 /* Optimize: -O2:
4106 andb %rN, %rN -> testb %rN, %rN
4107 andw %rN, %rN -> testw %rN, %rN
4108 andq %rN, %rN -> testq %rN, %rN
4109 orb %rN, %rN -> testb %rN, %rN
4110 orw %rN, %rN -> testw %rN, %rN
4111 orq %rN, %rN -> testq %rN, %rN
4112
4113 and outside of 64-bit mode
4114
4115 andl %rN, %rN -> testl %rN, %rN
4116 orl %rN, %rN -> testl %rN, %rN
4117 */
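/* E.g. "orl %eax, %eax" (09 c0) becomes "testl %eax, %eax" (85 c0);
the flag results are identical, but TEST does not write its
destination and so avoids a register output dependency. */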
4118 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4119 }
4120 else if (i.reg_operands == 3
4121 && i.op[0].regs == i.op[1].regs
4122 && !i.types[2].bitfield.xmmword
4123 && (i.tm.opcode_modifier.vex
4124 || ((!i.mask || i.mask->zeroing)
4125 && !i.rounding
4126 && is_evex_encoding (&i.tm)
4127 && (i.vec_encoding != vex_encoding_evex
4128 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4129 || i.tm.cpu_flags.bitfield.cpuavx512vl
4130 || (i.tm.operand_types[2].bitfield.zmmword
4131 && i.types[2].bitfield.ymmword))))
4132 && ((i.tm.base_opcode == 0x55
4133 || i.tm.base_opcode == 0x6655
4134 || i.tm.base_opcode == 0x66df
4135 || i.tm.base_opcode == 0x57
4136 || i.tm.base_opcode == 0x6657
4137 || i.tm.base_opcode == 0x66ef
4138 || i.tm.base_opcode == 0x66f8
4139 || i.tm.base_opcode == 0x66f9
4140 || i.tm.base_opcode == 0x66fa
4141 || i.tm.base_opcode == 0x66fb
4142 || i.tm.base_opcode == 0x42
4143 || i.tm.base_opcode == 0x6642
4144 || i.tm.base_opcode == 0x47
4145 || i.tm.base_opcode == 0x6647)
4146 && i.tm.extension_opcode == None))
4147 {
4148 /* Optimize: -O1:
4149 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4150 vpsubq and vpsubw:
4151 EVEX VOP %zmmM, %zmmM, %zmmN
4152 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4153 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4154 EVEX VOP %ymmM, %ymmM, %ymmN
4155 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4156 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4157 VEX VOP %ymmM, %ymmM, %ymmN
4158 -> VEX VOP %xmmM, %xmmM, %xmmN
4159 VOP, one of vpandn and vpxor:
4160 VEX VOP %ymmM, %ymmM, %ymmN
4161 -> VEX VOP %xmmM, %xmmM, %xmmN
4162 VOP, one of vpandnd and vpandnq:
4163 EVEX VOP %zmmM, %zmmM, %zmmN
4164 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4165 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4166 EVEX VOP %ymmM, %ymmM, %ymmN
4167 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4168 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4169 VOP, one of vpxord and vpxorq:
4170 EVEX VOP %zmmM, %zmmM, %zmmN
4171 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4172 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4173 EVEX VOP %ymmM, %ymmM, %ymmN
4174 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4175 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4176 VOP, one of kxord and kxorq:
4177 VEX VOP %kM, %kM, %kN
4178 -> VEX kxorw %kM, %kM, %kN
4179 VOP, one of kandnd and kandnq:
4180 VEX VOP %kM, %kM, %kN
4181 -> VEX kandnw %kM, %kM, %kN
4182 */
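/* E.g. "vpxord %zmm1, %zmm1, %zmm1" can be encoded as the VEX128
"vpxor %xmm1, %xmm1, %xmm1" (c5 f1 ef c9): VEX-encoded writes zero
the destination bits above 127, so zeroing %xmm1 zeroes all of %zmm1. */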
4183 if (is_evex_encoding (&i.tm))
4184 {
4185 if (i.vec_encoding != vex_encoding_evex)
4186 {
4187 i.tm.opcode_modifier.vex = VEX128;
4188 i.tm.opcode_modifier.vexw = VEXW0;
4189 i.tm.opcode_modifier.evex = 0;
4190 }
4191 else if (optimize > 1)
4192 i.tm.opcode_modifier.evex = EVEX128;
4193 else
4194 return;
4195 }
4196 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4197 {
4198 i.tm.base_opcode &= 0xff;
4199 i.tm.opcode_modifier.vexw = VEXW0;
4200 }
4201 else
4202 i.tm.opcode_modifier.vex = VEX128;
4203
4204 if (i.tm.opcode_modifier.vex)
4205 for (j = 0; j < 3; j++)
4206 {
4207 i.types[j].bitfield.xmmword = 1;
4208 i.types[j].bitfield.ymmword = 0;
4209 }
4210 }
4211 else if (i.vec_encoding != vex_encoding_evex
4212 && !i.types[0].bitfield.zmmword
4213 && !i.types[1].bitfield.zmmword
4214 && !i.mask
4215 && !i.broadcast
4216 && is_evex_encoding (&i.tm)
4217 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4218 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4219 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4220 || (i.tm.base_opcode & ~4) == 0x66db
4221 || (i.tm.base_opcode & ~4) == 0x66eb)
4222 && i.tm.extension_opcode == None)
4223 {
4224 /* Optimize: -O1:
4225 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4226 vmovdqu32 and vmovdqu64:
4227 EVEX VOP %xmmM, %xmmN
4228 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4229 EVEX VOP %ymmM, %ymmN
4230 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4231 EVEX VOP %xmmM, mem
4232 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4233 EVEX VOP %ymmM, mem
4234 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4235 EVEX VOP mem, %xmmN
4236 -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4237 EVEX VOP mem, %ymmN
4238 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4239 VOP, one of vpand, vpandn, vpor, vpxor:
4240 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4241 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4242 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4243 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4244 EVEX VOP{d,q} mem, %xmmM, %xmmN
4245 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4246 EVEX VOP{d,q} mem, %ymmM, %ymmN
4247 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4248 */
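/* E.g. "vmovdqu64 %ymm1, %ymm2" without masking becomes the VEX
"vmovdqu %ymm1, %ymm2", saving two prefix bytes; the f2-prefixed
vmovdqu8/16 forms are mapped to the f3 vmovdqu opcode just below. */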
4249 for (j = 0; j < i.operands; j++)
4250 if (operand_type_check (i.types[j], disp)
4251 && i.op[j].disps->X_op == O_constant)
4252 {
4253 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4254 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4255 bytes, we choose EVEX Disp8 over VEX Disp32. */
4256 int evex_disp8, vex_disp8;
4257 unsigned int memshift = i.memshift;
4258 offsetT n = i.op[j].disps->X_add_number;
4259
4260 evex_disp8 = fits_in_disp8 (n);
4261 i.memshift = 0;
4262 vex_disp8 = fits_in_disp8 (n);
4263 if (evex_disp8 != vex_disp8)
4264 {
4265 i.memshift = memshift;
4266 return;
4267 }
4268
4269 i.types[j].bitfield.disp8 = vex_disp8;
4270 break;
4271 }
4272 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4273 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4274 i.tm.opcode_modifier.vex
4275 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4276 i.tm.opcode_modifier.vexw = VEXW0;
4277 /* VPAND, VPOR, and VPXOR are commutative. */
4278 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4279 i.tm.opcode_modifier.commutative = 1;
4280 i.tm.opcode_modifier.evex = 0;
4281 i.tm.opcode_modifier.masking = 0;
4282 i.tm.opcode_modifier.broadcast = 0;
4283 i.tm.opcode_modifier.disp8memshift = 0;
4284 i.memshift = 0;
4285 if (j < i.operands)
4286 i.types[j].bitfield.disp8
4287 = fits_in_disp8 (i.op[j].disps->X_add_number);
4288 }
4289 }
4290
4291 /* This is the guts of the machine-dependent assembler. LINE points to a
4292 machine dependent instruction. This function is supposed to emit
4293 the frags/bytes it assembles to. */
4294
4295 void
4296 md_assemble (char *line)
4297 {
4298 unsigned int j;
4299 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4300 const insn_template *t;
4301
4302 /* Initialize globals. */
4303 memset (&i, '\0', sizeof (i));
4304 for (j = 0; j < MAX_OPERANDS; j++)
4305 i.reloc[j] = NO_RELOC;
4306 memset (disp_expressions, '\0', sizeof (disp_expressions));
4307 memset (im_expressions, '\0', sizeof (im_expressions));
4308 save_stack_p = save_stack;
4309
4310 /* First parse an instruction mnemonic & call i386_operand for the operands.
4311 We assume that the scrubber has arranged it so that line[0] is the valid
4312 start of a (possibly prefixed) mnemonic. */
4313
4314 line = parse_insn (line, mnemonic);
4315 if (line == NULL)
4316 return;
4317 mnem_suffix = i.suffix;
4318
4319 line = parse_operands (line, mnemonic);
4320 this_operand = -1;
4321 xfree (i.memop1_string);
4322 i.memop1_string = NULL;
4323 if (line == NULL)
4324 return;
4325
4326 /* Now we've parsed the mnemonic into a set of templates, and have the
4327 operands at hand. */
4328
4329 /* All Intel opcodes have reversed operands except for "bound", "enter",
4330 "invlpga", "monitor*", and "mwait*". We also don't reverse intersegment
4331 "jmp" and "call" instructions with 2 immediate operands so that the
4332 immediate segment precedes the offset, as it does in AT&T mode. */
4333 if (intel_syntax
4334 && i.operands > 1
4335 && (strcmp (mnemonic, "bound") != 0)
4336 && (strcmp (mnemonic, "invlpga") != 0)
4337 && (strncmp (mnemonic, "monitor", 7) != 0)
4338 && (strncmp (mnemonic, "mwait", 5) != 0)
4339 && !(operand_type_check (i.types[0], imm)
4340 && operand_type_check (i.types[1], imm)))
4341 swap_operands ();
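/* E.g. Intel "add eax, ebx" is stored internally in AT&T operand order,
as if "addl %ebx, %eax" had been written, while "bound" and the other
exceptions above keep their source order. */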
4342
4343 /* The order of the immediates should be reversed for the 2-immediate
4344 forms of the extrq and insertq instructions. */
4345 if (i.imm_operands == 2
4346 && (strcmp (mnemonic, "extrq") == 0
4347 || strcmp (mnemonic, "insertq") == 0))
4348 swap_2_operands (0, 1);
4349
4350 if (i.imm_operands)
4351 optimize_imm ();
4352
4353 /* Don't optimize displacement for movabs since it only takes 64bit
4354 displacement. */
4355 if (i.disp_operands
4356 && i.disp_encoding != disp_encoding_32bit
4357 && (flag_code != CODE_64BIT
4358 || strcmp (mnemonic, "movabs") != 0))
4359 optimize_disp ();
4360
4361 /* Next, we find a template that matches the given insn,
4362 making sure the overlap of the given operands types is consistent
4363 with the template operand types. */
4364
4365 if (!(t = match_template (mnem_suffix)))
4366 return;
4367
4368 if (sse_check != check_none
4369 && !i.tm.opcode_modifier.noavx
4370 && !i.tm.cpu_flags.bitfield.cpuavx
4371 && !i.tm.cpu_flags.bitfield.cpuavx512f
4372 && (i.tm.cpu_flags.bitfield.cpusse
4373 || i.tm.cpu_flags.bitfield.cpusse2
4374 || i.tm.cpu_flags.bitfield.cpusse3
4375 || i.tm.cpu_flags.bitfield.cpussse3
4376 || i.tm.cpu_flags.bitfield.cpusse4_1
4377 || i.tm.cpu_flags.bitfield.cpusse4_2
4378 || i.tm.cpu_flags.bitfield.cpusse4a
4379 || i.tm.cpu_flags.bitfield.cpupclmul
4380 || i.tm.cpu_flags.bitfield.cpuaes
4381 || i.tm.cpu_flags.bitfield.cpusha
4382 || i.tm.cpu_flags.bitfield.cpugfni))
4383 {
4384 (sse_check == check_warning
4385 ? as_warn
4386 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4387 }
4388
4389 if (i.tm.opcode_modifier.fwait)
4390 if (!add_prefix (FWAIT_OPCODE))
4391 return;
4392
4393 /* Check if REP prefix is OK. */
4394 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4395 {
4396 as_bad (_("invalid instruction `%s' after `%s'"),
4397 i.tm.name, i.rep_prefix);
4398 return;
4399 }
4400
4401 /* Check for lock without a lockable instruction. Destination operand
4402 must be memory unless it is xchg (0x86). */
4403 if (i.prefix[LOCK_PREFIX]
4404 && (!i.tm.opcode_modifier.islockable
4405 || i.mem_operands == 0
4406 || (i.tm.base_opcode != 0x86
4407 && !(i.flags[i.operands - 1] & Operand_Mem))))
4408 {
4409 as_bad (_("expecting lockable instruction after `lock'"));
4410 return;
4411 }
4412
4413 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4414 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4415 {
4416 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4417 return;
4418 }
4419
4420 /* Check if HLE prefix is OK. */
4421 if (i.hle_prefix && !check_hle ())
4422 return;
4423
4424 /* Check BND prefix. */
4425 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4426 as_bad (_("expecting valid branch instruction after `bnd'"));
4427
4428 /* Check NOTRACK prefix. */
4429 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4430 as_bad (_("expecting indirect branch instruction after `notrack'"));
4431
4432 if (i.tm.cpu_flags.bitfield.cpumpx)
4433 {
4434 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4435 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4436 else if (flag_code != CODE_16BIT
4437 ? i.prefix[ADDR_PREFIX]
4438 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4439 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4440 }
4441
4442 /* Insert BND prefix. */
4443 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4444 {
4445 if (!i.prefix[BND_PREFIX])
4446 add_prefix (BND_PREFIX_OPCODE);
4447 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4448 {
4449 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4450 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4451 }
4452 }
4453
4454 /* Check string instruction segment overrides. */
4455 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4456 {
4457 gas_assert (i.mem_operands);
4458 if (!check_string ())
4459 return;
4460 i.disp_operands = 0;
4461 }
4462
4463 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4464 optimize_encoding ();
4465
4466 if (!process_suffix ())
4467 return;
4468
4469 /* Update operand types. */
4470 for (j = 0; j < i.operands; j++)
4471 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4472
4473 /* Make still unresolved immediate matches conform to size of immediate
4474 given in i.suffix. */
4475 if (!finalize_imm ())
4476 return;
4477
4478 if (i.types[0].bitfield.imm1)
4479 i.imm_operands = 0; /* kludge for shift insns. */
4480
4481 /* We only need to check those implicit registers for instructions
4482 with 3 operands or less. */
4483 if (i.operands <= 3)
4484 for (j = 0; j < i.operands; j++)
4485 if (i.types[j].bitfield.instance != InstanceNone
4486 && !i.types[j].bitfield.xmmword)
4487 i.reg_operands--;
4488
4489 /* ImmExt should be processed after SSE2AVX. */
4490 if (!i.tm.opcode_modifier.sse2avx
4491 && i.tm.opcode_modifier.immext)
4492 process_immext ();
4493
4494 /* For insns with operands there are more diddles to do to the opcode. */
4495 if (i.operands)
4496 {
4497 if (!process_operands ())
4498 return;
4499 }
4500 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4501 {
4502 /* UnixWare fsub with no args is an alias for fsubp; likewise fadd -> faddp, etc. */
4503 as_warn (_("translating to `%sp'"), i.tm.name);
4504 }
4505
4506 if (is_any_vex_encoding (&i.tm))
4507 {
4508 if (!cpu_arch_flags.bitfield.cpui286)
4509 {
4510 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4511 i.tm.name);
4512 return;
4513 }
4514
4515 if (i.tm.opcode_modifier.vex)
4516 build_vex_prefix (t);
4517 else
4518 build_evex_prefix ();
4519 }
4520
4521 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4522 instructions may define INT_OPCODE as well, so avoid this corner
4523 case for those instructions that use MODRM. */
4524 if (i.tm.base_opcode == INT_OPCODE
4525 && !i.tm.opcode_modifier.modrm
4526 && i.op[0].imms->X_add_number == 3)
4527 {
4528 i.tm.base_opcode = INT3_OPCODE;
4529 i.imm_operands = 0;
4530 }
4531
4532 if ((i.tm.opcode_modifier.jump == JUMP
4533 || i.tm.opcode_modifier.jump == JUMP_BYTE
4534 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4535 && i.op[0].disps->X_op == O_constant)
4536 {
4537 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4538 the absolute address given by the constant. Since ix86 jumps and
4539 calls are pc relative, we need to generate a reloc. */
4540 i.op[0].disps->X_add_symbol = &abs_symbol;
4541 i.op[0].disps->X_op = O_symbol;
4542 }
4543
4544 if (i.tm.opcode_modifier.rex64)
4545 i.rex |= REX_W;
4546
4547 /* For 8-bit registers we need an empty REX prefix. Also, if the
4548 instruction already has a REX prefix, we need to convert old
4549 registers to new ones. */
4550
4551 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4552 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4553 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4554 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4555 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4556 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4557 && i.rex != 0))
4558 {
4559 int x;
4560
4561 i.rex |= REX_OPCODE;
4562 for (x = 0; x < 2; x++)
4563 {
4564 /* Look for 8 bit operand that uses old registers. */
4565 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4566 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4567 {
4568 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4569 /* If it is a "high byte" register (%ah .. %bh), give up. */
4570 if (i.op[x].regs->reg_num > 3)
4571 as_bad (_("can't encode register '%s%s' in an "
4572 "instruction requiring REX prefix."),
4573 register_prefix, i.op[x].regs->reg_name);
4574
4575 /* Otherwise it is equivalent to the extended register.
4576 Since the encoding doesn't change this is merely
4577 cosmetic cleanup for debug output. */
4578
4579 i.op[x].regs = i.op[x].regs + 8;
4580 }
4581 }
4582 }
4583
4584 if (i.rex == 0 && i.rex_encoding)
4585 {
4586 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4587 that uses legacy register. If it is "hi" register, don't add
4588 the REX_OPCODE byte. */
4589 int x;
4590 for (x = 0; x < 2; x++)
4591 if (i.types[x].bitfield.class == Reg
4592 && i.types[x].bitfield.byte
4593 && (i.op[x].regs->reg_flags & RegRex64) == 0
4594 && i.op[x].regs->reg_num > 3)
4595 {
4596 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4597 i.rex_encoding = FALSE;
4598 break;
4599 }
4600
4601 if (i.rex_encoding)
4602 i.rex = REX_OPCODE;
4603 }
4604
4605 if (i.rex != 0)
4606 add_prefix (REX_OPCODE | i.rex);
4607
4608 /* We are ready to output the insn. */
4609 output_insn ();
4610
4611 last_insn.seg = now_seg;
4612
4613 if (i.tm.opcode_modifier.isprefix)
4614 {
4615 last_insn.kind = last_insn_prefix;
4616 last_insn.name = i.tm.name;
4617 last_insn.file = as_where (&last_insn.line);
4618 }
4619 else
4620 last_insn.kind = last_insn_other;
4621 }
4622
4623 static char *
4624 parse_insn (char *line, char *mnemonic)
4625 {
4626 char *l = line;
4627 char *token_start = l;
4628 char *mnem_p;
4629 int supported;
4630 const insn_template *t;
4631 char *dot_p = NULL;
4632
4633 while (1)
4634 {
4635 mnem_p = mnemonic;
4636 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4637 {
4638 if (*mnem_p == '.')
4639 dot_p = mnem_p;
4640 mnem_p++;
4641 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4642 {
4643 as_bad (_("no such instruction: `%s'"), token_start);
4644 return NULL;
4645 }
4646 l++;
4647 }
4648 if (!is_space_char (*l)
4649 && *l != END_OF_INSN
4650 && (intel_syntax
4651 || (*l != PREFIX_SEPARATOR
4652 && *l != ',')))
4653 {
4654 as_bad (_("invalid character %s in mnemonic"),
4655 output_invalid (*l));
4656 return NULL;
4657 }
4658 if (token_start == l)
4659 {
4660 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4661 as_bad (_("expecting prefix; got nothing"));
4662 else
4663 as_bad (_("expecting mnemonic; got nothing"));
4664 return NULL;
4665 }
4666
4667 /* Look up instruction (or prefix) via hash table. */
4668 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4669
4670 if (*l != END_OF_INSN
4671 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4672 && current_templates
4673 && current_templates->start->opcode_modifier.isprefix)
4674 {
4675 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4676 {
4677 as_bad ((flag_code != CODE_64BIT
4678 ? _("`%s' is only supported in 64-bit mode")
4679 : _("`%s' is not supported in 64-bit mode")),
4680 current_templates->start->name);
4681 return NULL;
4682 }
4683 /* If we are in 16-bit mode, do not allow addr16 or data16.
4684 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4685 if ((current_templates->start->opcode_modifier.size == SIZE16
4686 || current_templates->start->opcode_modifier.size == SIZE32)
4687 && flag_code != CODE_64BIT
4688 && ((current_templates->start->opcode_modifier.size == SIZE32)
4689 ^ (flag_code == CODE_16BIT)))
4690 {
4691 as_bad (_("redundant %s prefix"),
4692 current_templates->start->name);
4693 return NULL;
4694 }
4695 if (current_templates->start->opcode_length == 0)
4696 {
4697 /* Handle pseudo prefixes. */
4698 switch (current_templates->start->base_opcode)
4699 {
4700 case 0x0:
4701 /* {disp8} */
4702 i.disp_encoding = disp_encoding_8bit;
4703 break;
4704 case 0x1:
4705 /* {disp32} */
4706 i.disp_encoding = disp_encoding_32bit;
4707 break;
4708 case 0x2:
4709 /* {load} */
4710 i.dir_encoding = dir_encoding_load;
4711 break;
4712 case 0x3:
4713 /* {store} */
4714 i.dir_encoding = dir_encoding_store;
4715 break;
4716 case 0x4:
4717 /* {vex} */
4718 i.vec_encoding = vex_encoding_vex;
4719 break;
4720 case 0x5:
4721 /* {vex3} */
4722 i.vec_encoding = vex_encoding_vex3;
4723 break;
4724 case 0x6:
4725 /* {evex} */
4726 i.vec_encoding = vex_encoding_evex;
4727 break;
4728 case 0x7:
4729 /* {rex} */
4730 i.rex_encoding = TRUE;
4731 break;
4732 case 0x8:
4733 /* {nooptimize} */
4734 i.no_optimize = TRUE;
4735 break;
4736 default:
4737 abort ();
4738 }
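/* Typical uses of these pseudo prefixes (illustrative):
{vex3} vpaddd %xmm1, %xmm2, %xmm3 # force a 3-byte VEX prefix
{evex} vpaddd %xmm1, %xmm2, %xmm3 # force EVEX encoding
{disp32} movl 4(%ebp), %eax # force a 32-bit displacement
{nooptimize} xorq %rax, %rax # suppress optimize_encoding () */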
4739 }
4740 else
4741 {
4742 /* Add prefix, checking for repeated prefixes. */
4743 switch (add_prefix (current_templates->start->base_opcode))
4744 {
4745 case PREFIX_EXIST:
4746 return NULL;
4747 case PREFIX_DS:
4748 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4749 i.notrack_prefix = current_templates->start->name;
4750 break;
4751 case PREFIX_REP:
4752 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4753 i.hle_prefix = current_templates->start->name;
4754 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4755 i.bnd_prefix = current_templates->start->name;
4756 else
4757 i.rep_prefix = current_templates->start->name;
4758 break;
4759 default:
4760 break;
4761 }
4762 }
4763 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4764 token_start = ++l;
4765 }
4766 else
4767 break;
4768 }
4769
4770 if (!current_templates)
4771 {
4772 /* Deprecated functionality (new code should use pseudo-prefixes instead):
4773 Check if we should swap operands or force a 32-bit displacement in
4774 encoding. */
4775 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4776 i.dir_encoding = dir_encoding_swap;
4777 else if (mnem_p - 3 == dot_p
4778 && dot_p[1] == 'd'
4779 && dot_p[2] == '8')
4780 i.disp_encoding = disp_encoding_8bit;
4781 else if (mnem_p - 4 == dot_p
4782 && dot_p[1] == 'd'
4783 && dot_p[2] == '3'
4784 && dot_p[3] == '2')
4785 i.disp_encoding = disp_encoding_32bit;
4786 else
4787 goto check_suffix;
4788 mnem_p = dot_p;
4789 *dot_p = '\0';
4790 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4791 }
4792
4793 if (!current_templates)
4794 {
4795 check_suffix:
4796 if (mnem_p > mnemonic)
4797 {
4798 /* See if we can get a match by trimming off a suffix. */
4799 switch (mnem_p[-1])
4800 {
4801 case WORD_MNEM_SUFFIX:
4802 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4803 i.suffix = SHORT_MNEM_SUFFIX;
4804 else
4805 /* Fall through. */
4806 case BYTE_MNEM_SUFFIX:
4807 case QWORD_MNEM_SUFFIX:
4808 i.suffix = mnem_p[-1];
4809 mnem_p[-1] = '\0';
4810 current_templates = (const templates *) hash_find (op_hash,
4811 mnemonic);
4812 break;
4813 case SHORT_MNEM_SUFFIX:
4814 case LONG_MNEM_SUFFIX:
4815 if (!intel_syntax)
4816 {
4817 i.suffix = mnem_p[-1];
4818 mnem_p[-1] = '\0';
4819 current_templates = (const templates *) hash_find (op_hash,
4820 mnemonic);
4821 }
4822 break;
4823
4824 /* Intel Syntax. */
4825 case 'd':
4826 if (intel_syntax)
4827 {
4828 if (intel_float_operand (mnemonic) == 1)
4829 i.suffix = SHORT_MNEM_SUFFIX;
4830 else
4831 i.suffix = LONG_MNEM_SUFFIX;
4832 mnem_p[-1] = '\0';
4833 current_templates = (const templates *) hash_find (op_hash,
4834 mnemonic);
4835 }
4836 break;
4837 }
4838 }
4839
4840 if (!current_templates)
4841 {
4842 as_bad (_("no such instruction: `%s'"), token_start);
4843 return NULL;
4844 }
4845 }
4846
4847 if (current_templates->start->opcode_modifier.jump == JUMP
4848 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
4849 {
4850 /* Check for a branch hint. We allow ",pt" and ",pn" for
4851 predict taken and predict not taken respectively.
4852 I'm not sure that branch hints actually do anything on loop
4853 and jcxz insns (JumpByte) for current Pentium4 chips. They
4854 may work in the future and it doesn't hurt to accept them
4855 now. */
4856 if (l[0] == ',' && l[1] == 'p')
4857 {
4858 if (l[2] == 't')
4859 {
4860 if (!add_prefix (DS_PREFIX_OPCODE))
4861 return NULL;
4862 l += 3;
4863 }
4864 else if (l[2] == 'n')
4865 {
4866 if (!add_prefix (CS_PREFIX_OPCODE))
4867 return NULL;
4868 l += 3;
4869 }
4870 }
4871 }
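/* E.g. "jne,pt .Ltarget" emits a 0x3e (ds) prefix byte before the
branch, and "jne,pn .Ltarget" a 0x2e (cs) prefix byte. */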
4872 /* Any other comma loses. */
4873 if (*l == ',')
4874 {
4875 as_bad (_("invalid character %s in mnemonic"),
4876 output_invalid (*l));
4877 return NULL;
4878 }
4879
4880 /* Check if instruction is supported on specified architecture. */
4881 supported = 0;
4882 for (t = current_templates->start; t < current_templates->end; ++t)
4883 {
4884 supported |= cpu_flags_match (t);
4885 if (supported == CPU_FLAGS_PERFECT_MATCH)
4886 {
4887 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4888 as_warn (_("use .code16 to ensure correct addressing mode"));
4889
4890 return l;
4891 }
4892 }
4893
4894 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4895 as_bad (flag_code == CODE_64BIT
4896 ? _("`%s' is not supported in 64-bit mode")
4897 : _("`%s' is only supported in 64-bit mode"),
4898 current_templates->start->name);
4899 else
4900 as_bad (_("`%s' is not supported on `%s%s'"),
4901 current_templates->start->name,
4902 cpu_arch_name ? cpu_arch_name : default_arch,
4903 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4904
4905 return NULL;
4906 }
4907
4908 static char *
4909 parse_operands (char *l, const char *mnemonic)
4910 {
4911 char *token_start;
4912
4913 /* 1 if operand is pending after ','. */
4914 unsigned int expecting_operand = 0;
4915
4916 /* Non-zero if operand parens not balanced. */
4917 unsigned int paren_not_balanced;
4918
4919 while (*l != END_OF_INSN)
4920 {
4921 /* Skip optional white space before operand. */
4922 if (is_space_char (*l))
4923 ++l;
4924 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4925 {
4926 as_bad (_("invalid character %s before operand %d"),
4927 output_invalid (*l),
4928 i.operands + 1);
4929 return NULL;
4930 }
4931 token_start = l; /* After white space. */
4932 paren_not_balanced = 0;
4933 while (paren_not_balanced || *l != ',')
4934 {
4935 if (*l == END_OF_INSN)
4936 {
4937 if (paren_not_balanced)
4938 {
4939 if (!intel_syntax)
4940 as_bad (_("unbalanced parenthesis in operand %d."),
4941 i.operands + 1);
4942 else
4943 as_bad (_("unbalanced brackets in operand %d."),
4944 i.operands + 1);
4945 return NULL;
4946 }
4947 else
4948 break; /* we are done */
4949 }
4950 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4951 {
4952 as_bad (_("invalid character %s in operand %d"),
4953 output_invalid (*l),
4954 i.operands + 1);
4955 return NULL;
4956 }
4957 if (!intel_syntax)
4958 {
4959 if (*l == '(')
4960 ++paren_not_balanced;
4961 if (*l == ')')
4962 --paren_not_balanced;
4963 }
4964 else
4965 {
4966 if (*l == '[')
4967 ++paren_not_balanced;
4968 if (*l == ']')
4969 --paren_not_balanced;
4970 }
4971 l++;
4972 }
4973 if (l != token_start)
4974 { /* Yes, we've read in another operand. */
4975 unsigned int operand_ok;
4976 this_operand = i.operands++;
4977 if (i.operands > MAX_OPERANDS)
4978 {
4979 as_bad (_("spurious operands; (%d operands/instruction max)"),
4980 MAX_OPERANDS);
4981 return NULL;
4982 }
4983 i.types[this_operand].bitfield.unspecified = 1;
4984 /* Now parse operand adding info to 'i' as we go along. */
4985 END_STRING_AND_SAVE (l);
4986
4987 if (i.mem_operands > 1)
4988 {
4989 as_bad (_("too many memory references for `%s'"),
4990 mnemonic);
4991 return 0;
4992 }
4993
4994 if (intel_syntax)
4995 operand_ok =
4996 i386_intel_operand (token_start,
4997 intel_float_operand (mnemonic));
4998 else
4999 operand_ok = i386_att_operand (token_start);
5000
5001 RESTORE_END_STRING (l);
5002 if (!operand_ok)
5003 return NULL;
5004 }
5005 else
5006 {
5007 if (expecting_operand)
5008 {
5009 expecting_operand_after_comma:
5010 as_bad (_("expecting operand after ','; got nothing"));
5011 return NULL;
5012 }
5013 if (*l == ',')
5014 {
5015 as_bad (_("expecting operand before ','; got nothing"));
5016 return NULL;
5017 }
5018 }
5019
5020 /* Now *l must be either ',' or END_OF_INSN. */
5021 if (*l == ',')
5022 {
5023 if (*++l == END_OF_INSN)
5024 {
5025 /* Skip the comma; if it is followed by end of line, complain. */
5026 goto expecting_operand_after_comma;
5027 }
5028 expecting_operand = 1;
5029 }
5030 }
5031 return l;
5032 }
5033
5034 static void
5035 swap_2_operands (int xchg1, int xchg2)
5036 {
5037 union i386_op temp_op;
5038 i386_operand_type temp_type;
5039 unsigned int temp_flags;
5040 enum bfd_reloc_code_real temp_reloc;
5041
5042 temp_type = i.types[xchg2];
5043 i.types[xchg2] = i.types[xchg1];
5044 i.types[xchg1] = temp_type;
5045
5046 temp_flags = i.flags[xchg2];
5047 i.flags[xchg2] = i.flags[xchg1];
5048 i.flags[xchg1] = temp_flags;
5049
5050 temp_op = i.op[xchg2];
5051 i.op[xchg2] = i.op[xchg1];
5052 i.op[xchg1] = temp_op;
5053
5054 temp_reloc = i.reloc[xchg2];
5055 i.reloc[xchg2] = i.reloc[xchg1];
5056 i.reloc[xchg1] = temp_reloc;
5057
5058 if (i.mask)
5059 {
5060 if (i.mask->operand == xchg1)
5061 i.mask->operand = xchg2;
5062 else if (i.mask->operand == xchg2)
5063 i.mask->operand = xchg1;
5064 }
5065 if (i.broadcast)
5066 {
5067 if (i.broadcast->operand == xchg1)
5068 i.broadcast->operand = xchg2;
5069 else if (i.broadcast->operand == xchg2)
5070 i.broadcast->operand = xchg1;
5071 }
5072 if (i.rounding)
5073 {
5074 if (i.rounding->operand == xchg1)
5075 i.rounding->operand = xchg2;
5076 else if (i.rounding->operand == xchg2)
5077 i.rounding->operand = xchg1;
5078 }
5079 }
5080
5081 static void
5082 swap_operands (void)
5083 {
5084 switch (i.operands)
5085 {
5086 case 5:
5087 case 4:
5088 swap_2_operands (1, i.operands - 2);
5089 /* Fall through. */
5090 case 3:
5091 case 2:
5092 swap_2_operands (0, i.operands - 1);
5093 break;
5094 default:
5095 abort ();
5096 }
5097
5098 if (i.mem_operands == 2)
5099 {
5100 const seg_entry *temp_seg;
5101 temp_seg = i.seg[0];
5102 i.seg[0] = i.seg[1];
5103 i.seg[1] = temp_seg;
5104 }
5105 }
5106
5107 /* Try to ensure constant immediates are represented in the smallest
5108 opcode possible. */
5109 static void
5110 optimize_imm (void)
5111 {
5112 char guess_suffix = 0;
5113 int op;
5114
5115 if (i.suffix)
5116 guess_suffix = i.suffix;
5117 else if (i.reg_operands)
5118 {
5119 /* Figure out a suffix from the last register operand specified.
5120 We can't do this properly yet, i.e. excluding special register
5121 instances, but the following works for instructions with
5122 immediates. In any case, we can't set i.suffix yet. */
5123 for (op = i.operands; --op >= 0;)
5124 if (i.types[op].bitfield.class != Reg)
5125 continue;
5126 else if (i.types[op].bitfield.byte)
5127 {
5128 guess_suffix = BYTE_MNEM_SUFFIX;
5129 break;
5130 }
5131 else if (i.types[op].bitfield.word)
5132 {
5133 guess_suffix = WORD_MNEM_SUFFIX;
5134 break;
5135 }
5136 else if (i.types[op].bitfield.dword)
5137 {
5138 guess_suffix = LONG_MNEM_SUFFIX;
5139 break;
5140 }
5141 else if (i.types[op].bitfield.qword)
5142 {
5143 guess_suffix = QWORD_MNEM_SUFFIX;
5144 break;
5145 }
5146 }
5147 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5148 guess_suffix = WORD_MNEM_SUFFIX;
5149
5150 for (op = i.operands; --op >= 0;)
5151 if (operand_type_check (i.types[op], imm))
5152 {
5153 switch (i.op[op].imms->X_op)
5154 {
5155 case O_constant:
5156 /* If a suffix is given, this operand may be shortened. */
5157 switch (guess_suffix)
5158 {
5159 case LONG_MNEM_SUFFIX:
5160 i.types[op].bitfield.imm32 = 1;
5161 i.types[op].bitfield.imm64 = 1;
5162 break;
5163 case WORD_MNEM_SUFFIX:
5164 i.types[op].bitfield.imm16 = 1;
5165 i.types[op].bitfield.imm32 = 1;
5166 i.types[op].bitfield.imm32s = 1;
5167 i.types[op].bitfield.imm64 = 1;
5168 break;
5169 case BYTE_MNEM_SUFFIX:
5170 i.types[op].bitfield.imm8 = 1;
5171 i.types[op].bitfield.imm8s = 1;
5172 i.types[op].bitfield.imm16 = 1;
5173 i.types[op].bitfield.imm32 = 1;
5174 i.types[op].bitfield.imm32s = 1;
5175 i.types[op].bitfield.imm64 = 1;
5176 break;
5177 }
5178
5179 /* If this operand is at most 16 bits, convert it
5180 to a signed 16 bit number before trying to see
5181 whether it will fit in an even smaller size.
5182 This allows a 16-bit operand such as $0xffe0 to
5183 be recognised as within Imm8S range. */
5184 if ((i.types[op].bitfield.imm16)
5185 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5186 {
5187 i.op[op].imms->X_add_number =
5188 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5189 }
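/* Worked example: a 'w'-suffixed insn with $0xffe0 yields
((0xffe0 ^ 0x8000) - 0x8000) == -0x20, so the operand is treated as
-32 and also qualifies as Imm8S below. */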
5190 #ifdef BFD64
5191 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5192 if ((i.types[op].bitfield.imm32)
5193 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5194 == 0))
5195 {
5196 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5197 ^ ((offsetT) 1 << 31))
5198 - ((offsetT) 1 << 31));
5199 }
5200 #endif
5201 i.types[op]
5202 = operand_type_or (i.types[op],
5203 smallest_imm_type (i.op[op].imms->X_add_number));
5204
5205 /* We must avoid matching Imm32 templates when only a 64-bit
5206 immediate is available. */
5207 if (guess_suffix == QWORD_MNEM_SUFFIX)
5208 i.types[op].bitfield.imm32 = 0;
5209 break;
5210
5211 case O_absent:
5212 case O_register:
5213 abort ();
5214
5215 /* Symbols and expressions. */
5216 default:
5217 /* Convert symbolic operand to proper sizes for matching, but don't
5218 prevent matching a set of insns that only supports sizes other
5219 than those matching the insn suffix. */
5220 {
5221 i386_operand_type mask, allowed;
5222 const insn_template *t;
5223
5224 operand_type_set (&mask, 0);
5225 operand_type_set (&allowed, 0);
5226
5227 for (t = current_templates->start;
5228 t < current_templates->end;
5229 ++t)
5230 {
5231 allowed = operand_type_or (allowed, t->operand_types[op]);
5232 allowed = operand_type_and (allowed, anyimm);
5233 }
5234 switch (guess_suffix)
5235 {
5236 case QWORD_MNEM_SUFFIX:
5237 mask.bitfield.imm64 = 1;
5238 mask.bitfield.imm32s = 1;
5239 break;
5240 case LONG_MNEM_SUFFIX:
5241 mask.bitfield.imm32 = 1;
5242 break;
5243 case WORD_MNEM_SUFFIX:
5244 mask.bitfield.imm16 = 1;
5245 break;
5246 case BYTE_MNEM_SUFFIX:
5247 mask.bitfield.imm8 = 1;
5248 break;
5249 default:
5250 break;
5251 }
5252 allowed = operand_type_and (mask, allowed);
5253 if (!operand_type_all_zero (&allowed))
5254 i.types[op] = operand_type_and (i.types[op], mask);
5255 }
5256 break;
5257 }
5258 }
5259 }
5260
5261 /* Try to use the smallest displacement type too. */
5262 static void
5263 optimize_disp (void)
5264 {
5265 int op;
5266
5267 for (op = i.operands; --op >= 0;)
5268 if (operand_type_check (i.types[op], disp))
5269 {
5270 if (i.op[op].disps->X_op == O_constant)
5271 {
5272 offsetT op_disp = i.op[op].disps->X_add_number;
5273
5274 if (i.types[op].bitfield.disp16
5275 && (op_disp & ~(offsetT) 0xffff) == 0)
5276 {
5277 /* If this operand is at most 16 bits, convert
5278 to a signed 16 bit number and don't use 64bit
5279 displacement. */
5280 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5281 i.types[op].bitfield.disp64 = 0;
5282 }
5283 #ifdef BFD64
5284 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5285 if (i.types[op].bitfield.disp32
5286 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5287 {
5288 /* If this operand is at most 32 bits, convert
5289 to a signed 32 bit number and don't use 64bit
5290 displacement. */
5291 op_disp &= (((offsetT) 2 << 31) - 1);
5292 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5293 i.types[op].bitfield.disp64 = 0;
5294 }
5295 #endif
5296 if (!op_disp && i.types[op].bitfield.baseindex)
5297 {
5298 i.types[op].bitfield.disp8 = 0;
5299 i.types[op].bitfield.disp16 = 0;
5300 i.types[op].bitfield.disp32 = 0;
5301 i.types[op].bitfield.disp32s = 0;
5302 i.types[op].bitfield.disp64 = 0;
5303 i.op[op].disps = 0;
5304 i.disp_operands--;
5305 }
5306 else if (flag_code == CODE_64BIT)
5307 {
5308 if (fits_in_signed_long (op_disp))
5309 {
5310 i.types[op].bitfield.disp64 = 0;
5311 i.types[op].bitfield.disp32s = 1;
5312 }
5313 if (i.prefix[ADDR_PREFIX]
5314 && fits_in_unsigned_long (op_disp))
5315 i.types[op].bitfield.disp32 = 1;
5316 }
5317 if ((i.types[op].bitfield.disp32
5318 || i.types[op].bitfield.disp32s
5319 || i.types[op].bitfield.disp16)
5320 && fits_in_disp8 (op_disp))
5321 i.types[op].bitfield.disp8 = 1;
5322 }
5323 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5324 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5325 {
5326 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5327 i.op[op].disps, 0, i.reloc[op]);
5328 i.types[op].bitfield.disp8 = 0;
5329 i.types[op].bitfield.disp16 = 0;
5330 i.types[op].bitfield.disp32 = 0;
5331 i.types[op].bitfield.disp32s = 0;
5332 i.types[op].bitfield.disp64 = 0;
5333 }
5334 else
5335 /* We only support 64-bit displacements on constants. */
5336 i.types[op].bitfield.disp64 = 0;
5337 }
5338 }
5339
5340 /* Return 1 if there is a match in broadcast bytes between operand
5341 GIVEN and instruction template T. */
5342
5343 static INLINE int
5344 match_broadcast_size (const insn_template *t, unsigned int given)
5345 {
5346 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5347 && i.types[given].bitfield.byte)
5348 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5349 && i.types[given].bitfield.word)
5350 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5351 && i.types[given].bitfield.dword)
5352 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5353 && i.types[given].bitfield.qword));
5354 }
5355
5356 /* Check if operands are valid for the instruction. */
5357
5358 static int
5359 check_VecOperands (const insn_template *t)
5360 {
5361 unsigned int op;
5362 i386_cpu_flags cpu;
5363
5364 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5365 any one operand are implicitly requiring AVX512VL support if the actual
5366 operand size is YMMword or XMMword. Since this function runs after
5367 template matching, there's no need to check for YMMword/XMMword in
5368 the template. */
5369 cpu = cpu_flags_and (t->cpu_flags, avx512);
5370 if (!cpu_flags_all_zero (&cpu)
5371 && !t->cpu_flags.bitfield.cpuavx512vl
5372 && !cpu_arch_flags.bitfield.cpuavx512vl)
5373 {
5374 for (op = 0; op < t->operands; ++op)
5375 {
5376 if (t->operand_types[op].bitfield.zmmword
5377 && (i.types[op].bitfield.ymmword
5378 || i.types[op].bitfield.xmmword))
5379 {
5380 i.error = unsupported;
5381 return 1;
5382 }
5383 }
5384 }
5385
5386 /* Without VSIB byte, we can't have a vector register for index. */
5387 if (!t->opcode_modifier.vecsib
5388 && i.index_reg
5389 && (i.index_reg->reg_type.bitfield.xmmword
5390 || i.index_reg->reg_type.bitfield.ymmword
5391 || i.index_reg->reg_type.bitfield.zmmword))
5392 {
5393 i.error = unsupported_vector_index_register;
5394 return 1;
5395 }
5396
5397 /* Check if default mask is allowed. */
5398 if (t->opcode_modifier.nodefmask
5399 && (!i.mask || i.mask->mask->reg_num == 0))
5400 {
5401 i.error = no_default_mask;
5402 return 1;
5403 }
5404
5405 /* For VSIB byte, we need a vector register for index, and all vector
5406 registers must be distinct. */
5407 if (t->opcode_modifier.vecsib)
5408 {
5409 if (!i.index_reg
5410 || !((t->opcode_modifier.vecsib == VecSIB128
5411 && i.index_reg->reg_type.bitfield.xmmword)
5412 || (t->opcode_modifier.vecsib == VecSIB256
5413 && i.index_reg->reg_type.bitfield.ymmword)
5414 || (t->opcode_modifier.vecsib == VecSIB512
5415 && i.index_reg->reg_type.bitfield.zmmword)))
5416 {
5417 i.error = invalid_vsib_address;
5418 return 1;
5419 }
5420
5421 gas_assert (i.reg_operands == 2 || i.mask);
5422 if (i.reg_operands == 2 && !i.mask)
5423 {
5424 gas_assert (i.types[0].bitfield.class == RegSIMD);
5425 gas_assert (i.types[0].bitfield.xmmword
5426 || i.types[0].bitfield.ymmword);
5427 gas_assert (i.types[2].bitfield.class == RegSIMD);
5428 gas_assert (i.types[2].bitfield.xmmword
5429 || i.types[2].bitfield.ymmword);
5430 if (operand_check == check_none)
5431 return 0;
5432 if (register_number (i.op[0].regs)
5433 != register_number (i.index_reg)
5434 && register_number (i.op[2].regs)
5435 != register_number (i.index_reg)
5436 && register_number (i.op[0].regs)
5437 != register_number (i.op[2].regs))
5438 return 0;
5439 if (operand_check == check_error)
5440 {
5441 i.error = invalid_vector_register_set;
5442 return 1;
5443 }
5444 as_warn (_("mask, index, and destination registers should be distinct"));
5445 }
5446 else if (i.reg_operands == 1 && i.mask)
5447 {
5448 if (i.types[1].bitfield.class == RegSIMD
5449 && (i.types[1].bitfield.xmmword
5450 || i.types[1].bitfield.ymmword
5451 || i.types[1].bitfield.zmmword)
5452 && (register_number (i.op[1].regs)
5453 == register_number (i.index_reg)))
5454 {
5455 if (operand_check == check_error)
5456 {
5457 i.error = invalid_vector_register_set;
5458 return 1;
5459 }
5460 if (operand_check != check_none)
5461 as_warn (_("index and destination registers should be distinct"));
5462 }
5463 }
5464 }
5465
5466 /* Check if broadcast is supported by the instruction and is applied
5467 to the memory operand. */
5468 if (i.broadcast)
5469 {
5470 i386_operand_type type, overlap;
5471
5472 /* Check if specified broadcast is supported in this instruction,
5473 and its broadcast bytes match the memory operand. */
5474 op = i.broadcast->operand;
5475 if (!t->opcode_modifier.broadcast
5476 || !(i.flags[op] & Operand_Mem)
5477 || (!i.types[op].bitfield.unspecified
5478 && !match_broadcast_size (t, op)))
5479 {
5480 bad_broadcast:
5481 i.error = unsupported_broadcast;
5482 return 1;
5483 }
5484
5485 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5486 * i.broadcast->type);
5487 operand_type_set (&type, 0);
5488 switch (i.broadcast->bytes)
5489 {
5490 case 2:
5491 type.bitfield.word = 1;
5492 break;
5493 case 4:
5494 type.bitfield.dword = 1;
5495 break;
5496 case 8:
5497 type.bitfield.qword = 1;
5498 break;
5499 case 16:
5500 type.bitfield.xmmword = 1;
5501 break;
5502 case 32:
5503 type.bitfield.ymmword = 1;
5504 break;
5505 case 64:
5506 type.bitfield.zmmword = 1;
5507 break;
5508 default:
5509 goto bad_broadcast;
5510 }
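/* E.g. for "vaddps (%rax){1to16}, %zmm1, %zmm2" the template uses
DWORD_BROADCAST, giving a 4-byte element; 4 * 16 == 64 bytes, so
"type" is set to zmmword and matches the template's ZMM operand. */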
5511
5512 overlap = operand_type_and (type, t->operand_types[op]);
5513 if (operand_type_all_zero (&overlap))
5514 goto bad_broadcast;
5515
5516 if (t->opcode_modifier.checkregsize)
5517 {
5518 unsigned int j;
5519
5520 type.bitfield.baseindex = 1;
5521 for (j = 0; j < i.operands; ++j)
5522 {
5523 if (j != op
5524 && !operand_type_register_match(i.types[j],
5525 t->operand_types[j],
5526 type,
5527 t->operand_types[op]))
5528 goto bad_broadcast;
5529 }
5530 }
5531 }
5532 /* If broadcast is supported in this instruction, we need to check
5533 that an operand of one-element size isn't specified without broadcast. */
5534 else if (t->opcode_modifier.broadcast && i.mem_operands)
5535 {
5536 /* Find memory operand. */
5537 for (op = 0; op < i.operands; op++)
5538 if (i.flags[op] & Operand_Mem)
5539 break;
5540 gas_assert (op < i.operands);
5541 /* Check size of the memory operand. */
5542 if (match_broadcast_size (t, op))
5543 {
5544 i.error = broadcast_needed;
5545 return 1;
5546 }
5547 }
5548 else
5549 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5550
5551 /* Check if requested masking is supported. */
5552 if (i.mask)
5553 {
5554 switch (t->opcode_modifier.masking)
5555 {
5556 case BOTH_MASKING:
5557 break;
5558 case MERGING_MASKING:
5559 if (i.mask->zeroing)
5560 {
5561 case 0:
5562 i.error = unsupported_masking;
5563 return 1;
5564 }
5565 break;
5566 case DYNAMIC_MASKING:
5567 /* Memory destinations allow only merging masking. */
5568 if (i.mask->zeroing && i.mem_operands)
5569 {
5570 /* Find memory operand. */
5571 for (op = 0; op < i.operands; op++)
5572 if (i.flags[op] & Operand_Mem)
5573 break;
5574 gas_assert (op < i.operands);
5575 if (op == i.operands - 1)
5576 {
5577 i.error = unsupported_masking;
5578 return 1;
5579 }
5580 }
5581 break;
5582 default:
5583 abort ();
5584 }
5585 }
5586
5587 /* Check if masking is applied to dest operand. */
5588 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5589 {
5590 i.error = mask_not_on_destination;
5591 return 1;
5592 }
5593
5594 /* Check RC/SAE. */
5595 if (i.rounding)
5596 {
5597 if (!t->opcode_modifier.sae
5598 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5599 {
5600 i.error = unsupported_rc_sae;
5601 return 1;
5602 }
5603 /* If the instruction has several immediate operands and one of
5604 them is rounding, the rounding operand should be the last
5605 immediate operand. */
5606 if (i.imm_operands > 1
5607 && i.rounding->operand != (int) (i.imm_operands - 1))
5608 {
5609 i.error = rc_sae_operand_not_last_imm;
5610 return 1;
5611 }
5612 }
5613
5614 /* Check vector Disp8 operand. */
5615 if (t->opcode_modifier.disp8memshift
5616 && i.disp_encoding != disp_encoding_32bit)
5617 {
5618 if (i.broadcast)
5619 i.memshift = t->opcode_modifier.broadcast - 1;
5620 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5621 i.memshift = t->opcode_modifier.disp8memshift;
5622 else
5623 {
5624 const i386_operand_type *type = NULL;
5625
5626 i.memshift = 0;
5627 for (op = 0; op < i.operands; op++)
5628 if (i.flags[op] & Operand_Mem)
5629 {
5630 if (t->opcode_modifier.evex == EVEXLIG)
5631 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5632 else if (t->operand_types[op].bitfield.xmmword
5633 + t->operand_types[op].bitfield.ymmword
5634 + t->operand_types[op].bitfield.zmmword <= 1)
5635 type = &t->operand_types[op];
5636 else if (!i.types[op].bitfield.unspecified)
5637 type = &i.types[op];
5638 }
5639 else if (i.types[op].bitfield.class == RegSIMD
5640 && t->opcode_modifier.evex != EVEXLIG)
5641 {
5642 if (i.types[op].bitfield.zmmword)
5643 i.memshift = 6;
5644 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5645 i.memshift = 5;
5646 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5647 i.memshift = 4;
5648 }
5649
5650 if (type)
5651 {
5652 if (type->bitfield.zmmword)
5653 i.memshift = 6;
5654 else if (type->bitfield.ymmword)
5655 i.memshift = 5;
5656 else if (type->bitfield.xmmword)
5657 i.memshift = 4;
5658 }
5659
5660 /* For the check in fits_in_disp8(). */
5661 if (i.memshift == 0)
5662 i.memshift = -1;
5663 }
5664
5665 for (op = 0; op < i.operands; op++)
5666 if (operand_type_check (i.types[op], disp)
5667 && i.op[op].disps->X_op == O_constant)
5668 {
5669 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5670 {
5671 i.types[op].bitfield.disp8 = 1;
5672 return 0;
5673 }
5674 i.types[op].bitfield.disp8 = 0;
5675 }
5676 }
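/* E.g. with i.memshift == 6 (a full ZMM memory operand) a displacement
of 256 is a multiple of 64 with 256 >> 6 == 4 fitting in a signed byte,
so it is encoded as EVEX Disp8; a displacement of 68 is not a multiple
of 64 and must remain Disp32. */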
5677
5678 i.memshift = 0;
5679
5680 return 0;
5681 }
5682
5683 /* Check if operands are valid for the instruction. Update VEX
5684 operand types. */
5685
5686 static int
5687 VEX_check_operands (const insn_template *t)
5688 {
5689 if (i.vec_encoding == vex_encoding_evex)
5690 {
5691 /* This instruction must be encoded with EVEX prefix. */
5692 if (!is_evex_encoding (t))
5693 {
5694 i.error = unsupported;
5695 return 1;
5696 }
5697 return 0;
5698 }
5699
5700 if (!t->opcode_modifier.vex)
5701 {
5702 /* This instruction template doesn't have VEX prefix. */
5703 if (i.vec_encoding != vex_encoding_default)
5704 {
5705 i.error = unsupported;
5706 return 1;
5707 }
5708 return 0;
5709 }
5710
5711 /* Check the special Imm4 cases; must be the first operand. */
5712 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5713 {
5714 if (i.op[0].imms->X_op != O_constant
5715 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5716 {
5717 i.error = bad_imm4;
5718 return 1;
5719 }
5720
5721 /* Turn off Imm<N> so that update_imm won't complain. */
5722 operand_type_set (&i.types[0], 0);
5723 }
5724
5725 return 0;
5726 }
5727
5728 static const insn_template *
5729 match_template (char mnem_suffix)
5730 {
5731 /* Points to template once we've found it. */
5732 const insn_template *t;
5733 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5734 i386_operand_type overlap4;
5735 unsigned int found_reverse_match;
5736 i386_opcode_modifier suffix_check;
5737 i386_operand_type operand_types [MAX_OPERANDS];
5738 int addr_prefix_disp;
5739 unsigned int j, size_match, check_register;
5740 enum i386_error specific_error = 0;
5741
5742 #if MAX_OPERANDS != 5
5743 # error "MAX_OPERANDS must be 5."
5744 #endif
5745
5746 found_reverse_match = 0;
5747 addr_prefix_disp = -1;
5748
5749 /* Prepare for mnemonic suffix check. */
5750 memset (&suffix_check, 0, sizeof (suffix_check));
5751 switch (mnem_suffix)
5752 {
5753 case BYTE_MNEM_SUFFIX:
5754 suffix_check.no_bsuf = 1;
5755 break;
5756 case WORD_MNEM_SUFFIX:
5757 suffix_check.no_wsuf = 1;
5758 break;
5759 case SHORT_MNEM_SUFFIX:
5760 suffix_check.no_ssuf = 1;
5761 break;
5762 case LONG_MNEM_SUFFIX:
5763 suffix_check.no_lsuf = 1;
5764 break;
5765 case QWORD_MNEM_SUFFIX:
5766 suffix_check.no_qsuf = 1;
5767 break;
5768 default:
5769 /* NB: In Intel syntax, normally we can check for memory operand
5770 size when there is no mnemonic suffix. But jmp and call have
5771 2 different encodings with Dword memory operand size, one with
5772 No_ldSuf and the other without. i.suffix is set to
5773 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
5774 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5775 suffix_check.no_ldsuf = 1;
5776 }
5777
5778 /* Must have right number of operands. */
5779 i.error = number_of_operands_mismatch;
5780
5781 for (t = current_templates->start; t < current_templates->end; t++)
5782 {
5783 addr_prefix_disp = -1;
5784 found_reverse_match = 0;
5785
5786 if (i.operands != t->operands)
5787 continue;
5788
5789 /* Check processor support. */
5790 i.error = unsupported;
5791 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
5792 continue;
5793
5794 /* Check AT&T mnemonic. */
5795 i.error = unsupported_with_intel_mnemonic;
5796 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5797 continue;
5798
5799 /* Check AT&T/Intel syntax. */
5800 i.error = unsupported_syntax;
5801 if ((intel_syntax && t->opcode_modifier.attsyntax)
5802 || (!intel_syntax && t->opcode_modifier.intelsyntax))
5803 continue;
5804
5805 /* Check Intel64/AMD64 ISA. */
5806 switch (isa64)
5807 {
5808 default:
5809 /* Default: Don't accept Intel64. */
5810 if (t->opcode_modifier.isa64 == INTEL64)
5811 continue;
5812 break;
5813 case amd64:
5814 /* -mamd64: Don't accept Intel64 and Intel64 only. */
5815 if (t->opcode_modifier.isa64 >= INTEL64)
5816 continue;
5817 break;
5818 case intel64:
5819 /* -mintel64: Don't accept AMD64. */
5820 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
5821 continue;
5822 break;
5823 }
5824
5825 /* Check the suffix. */
5826 i.error = invalid_instruction_suffix;
5827 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5828 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5829 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5830 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5831 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5832 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5833 continue;
5834
5835 size_match = operand_size_match (t);
5836 if (!size_match)
5837 continue;
5838
5839 /* This is intentionally not
5840
5841 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
5842
5843 as the case of a missing * on the operand is accepted (perhaps with
5844 a warning, issued further down). */
5845 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5846 {
5847 i.error = operand_type_mismatch;
5848 continue;
5849 }
5850
5851 for (j = 0; j < MAX_OPERANDS; j++)
5852 operand_types[j] = t->operand_types[j];
5853
5854 /* In general, don't allow 64-bit operands in 32-bit mode. */
5855 if (i.suffix == QWORD_MNEM_SUFFIX
5856 && flag_code != CODE_64BIT
5857 && (intel_syntax
5858 ? (!t->opcode_modifier.ignoresize
5859 && !t->opcode_modifier.broadcast
5860 && !intel_float_operand (t->name))
5861 : intel_float_operand (t->name) != 2)
5862 && ((operand_types[0].bitfield.class != RegMMX
5863 && operand_types[0].bitfield.class != RegSIMD)
5864 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5865 && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5866 && (t->base_opcode != 0x0fc7
5867 || t->extension_opcode != 1 /* cmpxchg8b */))
5868 continue;
5869
5870 /* In general, don't allow 32-bit operands on pre-386. */
5871 else if (i.suffix == LONG_MNEM_SUFFIX
5872 && !cpu_arch_flags.bitfield.cpui386
5873 && (intel_syntax
5874 ? (!t->opcode_modifier.ignoresize
5875 && !intel_float_operand (t->name))
5876 : intel_float_operand (t->name) != 2)
5877 && ((operand_types[0].bitfield.class != RegMMX
5878 && operand_types[0].bitfield.class != RegSIMD)
5879 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5880 && operand_types[t->operands > 1].bitfield.class
5881 != RegSIMD)))
5882 continue;
5883
5884 /* Do not verify operands when there are none. */
5885 else
5886 {
5887 if (!t->operands)
5888 /* We've found a match; break out of loop. */
5889 break;
5890 }
5891
5892 if (!t->opcode_modifier.jump
5893 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
5894 {
5895 /* There should be only one Disp operand. */
5896 for (j = 0; j < MAX_OPERANDS; j++)
5897 if (operand_type_check (operand_types[j], disp))
5898 break;
5899 if (j < MAX_OPERANDS)
5900 {
5901 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
5902
5903 addr_prefix_disp = j;
5904
5905 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
5906 operand into Disp32/Disp32/Disp16/Disp32 operand. */
5907 switch (flag_code)
5908 {
5909 case CODE_16BIT:
5910 override = !override;
5911 /* Fall through. */
5912 case CODE_32BIT:
5913 if (operand_types[j].bitfield.disp32
5914 && operand_types[j].bitfield.disp16)
5915 {
5916 operand_types[j].bitfield.disp16 = override;
5917 operand_types[j].bitfield.disp32 = !override;
5918 }
5919 operand_types[j].bitfield.disp32s = 0;
5920 operand_types[j].bitfield.disp64 = 0;
5921 break;
5922
5923 case CODE_64BIT:
5924 if (operand_types[j].bitfield.disp32s
5925 || operand_types[j].bitfield.disp64)
5926 {
5927 operand_types[j].bitfield.disp64 &= !override;
5928 operand_types[j].bitfield.disp32s &= !override;
5929 operand_types[j].bitfield.disp32 = override;
5930 }
5931 operand_types[j].bitfield.disp16 = 0;
5932 break;
5933 }
5934 }
5935 }
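/* Illustration: in 32-bit mode, "mov foo(%bx), %ax" carries an 0x67
   address size prefix, so the template's Disp32 is flipped to Disp16
   above; in 64-bit mode the same prefix turns Disp32S/Disp64 into
   Disp32.  */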
5936
5937 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5938 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5939 continue;
5940
5941 /* We check register size if needed. */
5942 if (t->opcode_modifier.checkregsize)
5943 {
5944 check_register = (1 << t->operands) - 1;
5945 if (i.broadcast)
5946 check_register &= ~(1 << i.broadcast->operand);
5947 }
5948 else
5949 check_register = 0;
5950
5951 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5952 switch (t->operands)
5953 {
5954 case 1:
5955 if (!operand_type_match (overlap0, i.types[0]))
5956 continue;
5957 break;
5958 case 2:
5959 /* xchg %eax, %eax is a special case. It is an alias for nop
5960 only in 32bit mode and we can use opcode 0x90. In 64bit
5961 mode, we can't use 0x90 for xchg %eax, %eax since it should
5962 zero-extend %eax to %rax. */
5963 if (flag_code == CODE_64BIT
5964 && t->base_opcode == 0x90
5965 && i.types[0].bitfield.instance == Accum
5966 && i.types[0].bitfield.dword
5967 && i.types[1].bitfield.instance == Accum
5968 && i.types[1].bitfield.dword)
5969 continue;
5970 /* xrelease mov %eax, <disp> is another special case. It must not
5971 match the accumulator-only encoding of mov. */
5972 if (flag_code != CODE_64BIT
5973 && i.hle_prefix
5974 && t->base_opcode == 0xa0
5975 && i.types[0].bitfield.instance == Accum
5976 && (i.flags[1] & Operand_Mem))
5977 continue;
5978 /* Fall through. */
5979
5980 case 3:
5981 if (!(size_match & MATCH_STRAIGHT))
5982 goto check_reverse;
5983 /* Reverse direction of operands if swapping is possible in the first
5984 place (operands need to be symmetric) and
5985 - the load form is requested, and the template is a store form,
5986 - the store form is requested, and the template is a load form,
5987 - the non-default (swapped) form is requested. */
5988 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5989 if (t->opcode_modifier.d && i.reg_operands == i.operands
5990 && !operand_type_all_zero (&overlap1))
5991 switch (i.dir_encoding)
5992 {
5993 case dir_encoding_load:
5994 if (operand_type_check (operand_types[i.operands - 1], anymem)
5995 || t->opcode_modifier.regmem)
5996 goto check_reverse;
5997 break;
5998
5999 case dir_encoding_store:
6000 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6001 && !t->opcode_modifier.regmem)
6002 goto check_reverse;
6003 break;
6004
6005 case dir_encoding_swap:
6006 goto check_reverse;
6007
6008 case dir_encoding_default:
6009 break;
6010 }
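/* i.dir_encoding is set from the {load} and {store} pseudo prefixes,
   or to dir_encoding_swap by the deprecated ".s" mnemonic suffix.
   E.g. "{store} movaps %xmm0, %xmm1" (illustrative) forces the form
   with %xmm1 in ModRM.rm via the check_reverse path above.  */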
6011 /* If we want store form, we skip the current load. */
6012 if ((i.dir_encoding == dir_encoding_store
6013 || i.dir_encoding == dir_encoding_swap)
6014 && i.mem_operands == 0
6015 && t->opcode_modifier.load)
6016 continue;
6017 /* Fall through. */
6018 case 4:
6019 case 5:
6020 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6021 if (!operand_type_match (overlap0, i.types[0])
6022 || !operand_type_match (overlap1, i.types[1])
6023 || ((check_register & 3) == 3
6024 && !operand_type_register_match (i.types[0],
6025 operand_types[0],
6026 i.types[1],
6027 operand_types[1])))
6028 {
6029 /* Check if other direction is valid ... */
6030 if (!t->opcode_modifier.d)
6031 continue;
6032
6033 check_reverse:
6034 if (!(size_match & MATCH_REVERSE))
6035 continue;
6036 /* Try reversing direction of operands. */
6037 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6038 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6039 if (!operand_type_match (overlap0, i.types[0])
6040 || !operand_type_match (overlap1, i.types[i.operands - 1])
6041 || (check_register
6042 && !operand_type_register_match (i.types[0],
6043 operand_types[i.operands - 1],
6044 i.types[i.operands - 1],
6045 operand_types[0])))
6046 {
6047 /* Does not match either direction. */
6048 continue;
6049 }
6050 /* found_reverse_match holds which of D or FloatR
6051 we've found. */
6052 if (!t->opcode_modifier.d)
6053 found_reverse_match = 0;
6054 else if (operand_types[0].bitfield.tbyte)
6055 found_reverse_match = Opcode_FloatD;
6056 else if (operand_types[0].bitfield.xmmword
6057 || operand_types[i.operands - 1].bitfield.xmmword
6058 || operand_types[0].bitfield.class == RegMMX
6059 || operand_types[i.operands - 1].bitfield.class == RegMMX
6060 || is_any_vex_encoding (t))
6061 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6062 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6063 else
6064 found_reverse_match = Opcode_D;
6065 if (t->opcode_modifier.floatr)
6066 found_reverse_match |= Opcode_FloatR;
6067 }
6068 else
6069 {
6070 /* Found a forward 2 operand match here. */
6071 switch (t->operands)
6072 {
6073 case 5:
6074 overlap4 = operand_type_and (i.types[4],
6075 operand_types[4]);
6076 /* Fall through. */
6077 case 4:
6078 overlap3 = operand_type_and (i.types[3],
6079 operand_types[3]);
6080 /* Fall through. */
6081 case 3:
6082 overlap2 = operand_type_and (i.types[2],
6083 operand_types[2]);
6084 break;
6085 }
6086
6087 switch (t->operands)
6088 {
6089 case 5:
6090 if (!operand_type_match (overlap4, i.types[4])
6091 || !operand_type_register_match (i.types[3],
6092 operand_types[3],
6093 i.types[4],
6094 operand_types[4]))
6095 continue;
6096 /* Fall through. */
6097 case 4:
6098 if (!operand_type_match (overlap3, i.types[3])
6099 || ((check_register & 0xa) == 0xa
6100 && !operand_type_register_match (i.types[1],
6101 operand_types[1],
6102 i.types[3],
6103 operand_types[3]))
6104 || ((check_register & 0xc) == 0xc
6105 && !operand_type_register_match (i.types[2],
6106 operand_types[2],
6107 i.types[3],
6108 operand_types[3])))
6109 continue;
6110 /* Fall through. */
6111 case 3:
6112 /* Here we make use of the fact that there are no
6113 reverse match 3 operand instructions. */
6114 if (!operand_type_match (overlap2, i.types[2])
6115 || ((check_register & 5) == 5
6116 && !operand_type_register_match (i.types[0],
6117 operand_types[0],
6118 i.types[2],
6119 operand_types[2]))
6120 || ((check_register & 6) == 6
6121 && !operand_type_register_match (i.types[1],
6122 operand_types[1],
6123 i.types[2],
6124 operand_types[2])))
6125 continue;
6126 break;
6127 }
6128 }
6129 /* Found either a forward or reverse 2-, 3-, 4- or 5-operand match here:
6130 slip through to break. */
6131 }
6132
6133 /* Check if vector and VEX operands are valid. */
6134 if (check_VecOperands (t) || VEX_check_operands (t))
6135 {
6136 specific_error = i.error;
6137 continue;
6138 }
6139
6140 /* We've found a match; break out of loop. */
6141 break;
6142 }
6143
6144 if (t == current_templates->end)
6145 {
6146 /* We found no match. */
6147 const char *err_msg;
6148 switch (specific_error ? specific_error : i.error)
6149 {
6150 default:
6151 abort ();
6152 case operand_size_mismatch:
6153 err_msg = _("operand size mismatch");
6154 break;
6155 case operand_type_mismatch:
6156 err_msg = _("operand type mismatch");
6157 break;
6158 case register_type_mismatch:
6159 err_msg = _("register type mismatch");
6160 break;
6161 case number_of_operands_mismatch:
6162 err_msg = _("number of operands mismatch");
6163 break;
6164 case invalid_instruction_suffix:
6165 err_msg = _("invalid instruction suffix");
6166 break;
6167 case bad_imm4:
6168 err_msg = _("constant doesn't fit in 4 bits");
6169 break;
6170 case unsupported_with_intel_mnemonic:
6171 err_msg = _("unsupported with Intel mnemonic");
6172 break;
6173 case unsupported_syntax:
6174 err_msg = _("unsupported syntax");
6175 break;
6176 case unsupported:
6177 as_bad (_("unsupported instruction `%s'"),
6178 current_templates->start->name);
6179 return NULL;
6180 case invalid_vsib_address:
6181 err_msg = _("invalid VSIB address");
6182 break;
6183 case invalid_vector_register_set:
6184 err_msg = _("mask, index, and destination registers must be distinct");
6185 break;
6186 case unsupported_vector_index_register:
6187 err_msg = _("unsupported vector index register");
6188 break;
6189 case unsupported_broadcast:
6190 err_msg = _("unsupported broadcast");
6191 break;
6192 case broadcast_needed:
6193 err_msg = _("broadcast is needed for operand of such type");
6194 break;
6195 case unsupported_masking:
6196 err_msg = _("unsupported masking");
6197 break;
6198 case mask_not_on_destination:
6199 err_msg = _("mask not on destination operand");
6200 break;
6201 case no_default_mask:
6202 err_msg = _("default mask isn't allowed");
6203 break;
6204 case unsupported_rc_sae:
6205 err_msg = _("unsupported static rounding/sae");
6206 break;
6207 case rc_sae_operand_not_last_imm:
6208 if (intel_syntax)
6209 err_msg = _("RC/SAE operand must precede immediate operands");
6210 else
6211 err_msg = _("RC/SAE operand must follow immediate operands");
6212 break;
6213 case invalid_register_operand:
6214 err_msg = _("invalid register operand");
6215 break;
6216 }
6217 as_bad (_("%s for `%s'"), err_msg,
6218 current_templates->start->name);
6219 return NULL;
6220 }
6221
6222 if (!quiet_warnings)
6223 {
6224 if (!intel_syntax
6225 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6226 as_warn (_("indirect %s without `*'"), t->name);
6227
6228 if (t->opcode_modifier.isprefix
6229 && t->opcode_modifier.ignoresize)
6230 {
6231 /* Warn them that a data or address size prefix doesn't
6232 affect assembly of the next line of code. */
6233 as_warn (_("stand-alone `%s' prefix"), t->name);
6234 }
6235 }
6236
6237 /* Copy the template we found. */
6238 i.tm = *t;
6239
6240 if (addr_prefix_disp != -1)
6241 i.tm.operand_types[addr_prefix_disp]
6242 = operand_types[addr_prefix_disp];
6243
6244 if (found_reverse_match)
6245 {
6246 /* If we found a reverse match we must alter the opcode direction
6247 bit and clear/flip the regmem modifier one. found_reverse_match
6248 holds bits to change (different for int & float insns). */
6249
6250 i.tm.base_opcode ^= found_reverse_match;
6251
6252 i.tm.operand_types[0] = operand_types[i.operands - 1];
6253 i.tm.operand_types[i.operands - 1] = operand_types[0];
6254
6255 /* Certain SIMD insns have their load forms specified in the opcode
6256 table, and hence we need to _set_ RegMem instead of clearing it.
6257 We need to avoid setting the bit though on insns like KMOVW. */
6258 i.tm.opcode_modifier.regmem
6259 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6260 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6261 && !i.tm.opcode_modifier.regmem;
6262 }
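/* Illustration: for "mov.s %eax, %ebx" the matching template's base
   opcode 0x89 is XORed with Opcode_D (0x2) to yield the swapped form
   0x8b, with the two operand types exchanged just above.  */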
6263
6264 return t;
6265 }
6266
6267 static int
6268 check_string (void)
6269 {
6270 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6271 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6272
6273 if (i.seg[op] != NULL && i.seg[op] != &es)
6274 {
6275 as_bad (_("`%s' operand %u must use `%ses' segment"),
6276 i.tm.name,
6277 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6278 register_prefix);
6279 return 0;
6280 }
6281
6282 /* There's only ever one segment override allowed per instruction.
6283 This instruction possibly has a legal segment override on the
6284 second operand, so copy the segment to where non-string
6285 instructions store it, allowing common code. */
6286 i.seg[op] = i.seg[1];
6287
6288 return 1;
6289 }
6290
6291 static int
6292 process_suffix (void)
6293 {
6294 /* If matched instruction specifies an explicit instruction mnemonic
6295 suffix, use it. */
6296 if (i.tm.opcode_modifier.size == SIZE16)
6297 i.suffix = WORD_MNEM_SUFFIX;
6298 else if (i.tm.opcode_modifier.size == SIZE32)
6299 i.suffix = LONG_MNEM_SUFFIX;
6300 else if (i.tm.opcode_modifier.size == SIZE64)
6301 i.suffix = QWORD_MNEM_SUFFIX;
6302 else if (i.reg_operands
6303 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6304 && !i.tm.opcode_modifier.addrprefixopreg)
6305 {
6306 unsigned int numop = i.operands;
6307
6308 /* movsx/movzx want only their source operand considered here, for the
6309 ambiguity checking below. The suffix will be replaced afterwards
6310 to represent the destination (register). */
6311 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6312 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6313 --i.operands;
6314
6315 /* If there's no instruction mnemonic suffix we try to invent one
6316 based on GPR operands. */
6317 if (!i.suffix)
6318 {
6319 /* We take i.suffix from the last register operand specified.
6320 The destination register type is more significant than the
6321 source register type; crc32 in SSE4.2 prefers the source
6322 register type. */
6323 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6324
6325 while (op--)
6326 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6327 || i.tm.operand_types[op].bitfield.instance == Accum)
6328 {
6329 if (i.types[op].bitfield.class != Reg)
6330 continue;
6331 if (i.types[op].bitfield.byte)
6332 i.suffix = BYTE_MNEM_SUFFIX;
6333 else if (i.types[op].bitfield.word)
6334 i.suffix = WORD_MNEM_SUFFIX;
6335 else if (i.types[op].bitfield.dword)
6336 i.suffix = LONG_MNEM_SUFFIX;
6337 else if (i.types[op].bitfield.qword)
6338 i.suffix = QWORD_MNEM_SUFFIX;
6339 else
6340 continue;
6341 break;
6342 }
6343
6344 /* As an exception, movsx/movzx silently default to a byte source
6345 in AT&T mode. */
6346 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6347 && !i.suffix && !intel_syntax)
6348 i.suffix = BYTE_MNEM_SUFFIX;
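/* Illustration: plain "mov %eax, (%ebx)" derives an 'l' suffix from
   %eax in the loop above, while an unsuffixed AT&T "movzx %al, %ecx"
   just defaulted to a byte source here.  */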
6349 }
6350 else if (i.suffix == BYTE_MNEM_SUFFIX)
6351 {
6352 if (intel_syntax
6353 && i.tm.opcode_modifier.ignoresize
6354 && i.tm.opcode_modifier.no_bsuf)
6355 i.suffix = 0;
6356 else if (!check_byte_reg ())
6357 return 0;
6358 }
6359 else if (i.suffix == LONG_MNEM_SUFFIX)
6360 {
6361 if (intel_syntax
6362 && i.tm.opcode_modifier.ignoresize
6363 && i.tm.opcode_modifier.no_lsuf
6364 && !i.tm.opcode_modifier.todword
6365 && !i.tm.opcode_modifier.toqword)
6366 i.suffix = 0;
6367 else if (!check_long_reg ())
6368 return 0;
6369 }
6370 else if (i.suffix == QWORD_MNEM_SUFFIX)
6371 {
6372 if (intel_syntax
6373 && i.tm.opcode_modifier.ignoresize
6374 && i.tm.opcode_modifier.no_qsuf
6375 && !i.tm.opcode_modifier.todword
6376 && !i.tm.opcode_modifier.toqword)
6377 i.suffix = 0;
6378 else if (!check_qword_reg ())
6379 return 0;
6380 }
6381 else if (i.suffix == WORD_MNEM_SUFFIX)
6382 {
6383 if (intel_syntax
6384 && i.tm.opcode_modifier.ignoresize
6385 && i.tm.opcode_modifier.no_wsuf)
6386 i.suffix = 0;
6387 else if (!check_word_reg ())
6388 return 0;
6389 }
6390 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6391 /* Do nothing if the instruction is going to ignore the prefix. */
6392 ;
6393 else
6394 abort ();
6395
6396 /* Undo the movsx/movzx change done above. */
6397 i.operands = numop;
6398 }
6399 else if (i.tm.opcode_modifier.defaultsize && !i.suffix)
6400 {
6401 i.suffix = stackop_size;
6402 if (stackop_size == LONG_MNEM_SUFFIX)
6403 {
6404 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6405 .code16gcc directive to support 16-bit mode with
6406 32-bit address. For IRET without a suffix, generate
6407 16-bit IRET (opcode 0xcf) to return from an interrupt
6408 handler. */
6409 if (i.tm.base_opcode == 0xcf)
6410 {
6411 i.suffix = WORD_MNEM_SUFFIX;
6412 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6413 }
6414 /* Warn about changed behavior for segment register push/pop. */
6415 else if ((i.tm.base_opcode | 1) == 0x07)
6416 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6417 i.tm.name);
6418 }
6419 }
6420 else if (!i.suffix
6421 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6422 || i.tm.opcode_modifier.jump == JUMP_BYTE
6423 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6424 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6425 && i.tm.extension_opcode <= 3)))
6426 {
6427 switch (flag_code)
6428 {
6429 case CODE_64BIT:
6430 if (!i.tm.opcode_modifier.no_qsuf)
6431 {
6432 i.suffix = QWORD_MNEM_SUFFIX;
6433 break;
6434 }
6435 /* Fall through. */
6436 case CODE_32BIT:
6437 if (!i.tm.opcode_modifier.no_lsuf)
6438 i.suffix = LONG_MNEM_SUFFIX;
6439 break;
6440 case CODE_16BIT:
6441 if (!i.tm.opcode_modifier.no_wsuf)
6442 i.suffix = WORD_MNEM_SUFFIX;
6443 break;
6444 }
6445 }
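/* E.g. an indirect "jmp *(%rax)" with no suffix defaults to 'q' here
   in 64-bit mode; the same insn in 32-/16-bit mode would default to
   'l'/'w' respectively.  */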
6446
6447 if (!i.suffix
6448 && (!i.tm.opcode_modifier.defaultsize
6449 /* Also cover lret/retf/iret in 64-bit mode. */
6450 || (flag_code == CODE_64BIT
6451 && !i.tm.opcode_modifier.no_lsuf
6452 && !i.tm.opcode_modifier.no_qsuf))
6453 && !i.tm.opcode_modifier.ignoresize
6454 /* Accept FLDENV et al without suffix. */
6455 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6456 {
6457 unsigned int suffixes, evex = 0;
6458
6459 suffixes = !i.tm.opcode_modifier.no_bsuf;
6460 if (!i.tm.opcode_modifier.no_wsuf)
6461 suffixes |= 1 << 1;
6462 if (!i.tm.opcode_modifier.no_lsuf)
6463 suffixes |= 1 << 2;
6464 if (!i.tm.opcode_modifier.no_ldsuf)
6465 suffixes |= 1 << 3;
6466 if (!i.tm.opcode_modifier.no_ssuf)
6467 suffixes |= 1 << 4;
6468 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6469 suffixes |= 1 << 5;
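/* The low bits of "suffixes" now mirror the permitted mnemonic
   suffixes: bit 0 = 'b', 1 = 'w', 2 = 'l', 3 = long double, 4 = 's',
   5 = 'q'; bits 6-8 are set below for XMMWORD/YMMWORD/ZMMWORD memory
   operands.  */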
6470
6471 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6472 also suitable for AT&T syntax mode, it was requested that this be
6473 restricted to just Intel syntax. */
6474 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6475 {
6476 unsigned int op;
6477
6478 for (op = 0; op < i.tm.operands; ++op)
6479 {
6480 if (is_evex_encoding (&i.tm)
6481 && !cpu_arch_flags.bitfield.cpuavx512vl)
6482 {
6483 if (i.tm.operand_types[op].bitfield.ymmword)
6484 i.tm.operand_types[op].bitfield.xmmword = 0;
6485 if (i.tm.operand_types[op].bitfield.zmmword)
6486 i.tm.operand_types[op].bitfield.ymmword = 0;
6487 if (!i.tm.opcode_modifier.evex
6488 || i.tm.opcode_modifier.evex == EVEXDYN)
6489 i.tm.opcode_modifier.evex = EVEX512;
6490 }
6491
6492 if (i.tm.operand_types[op].bitfield.xmmword
6493 + i.tm.operand_types[op].bitfield.ymmword
6494 + i.tm.operand_types[op].bitfield.zmmword < 2)
6495 continue;
6496
6497 /* Any properly sized operand disambiguates the insn. */
6498 if (i.types[op].bitfield.xmmword
6499 || i.types[op].bitfield.ymmword
6500 || i.types[op].bitfield.zmmword)
6501 {
6502 suffixes &= ~(7 << 6);
6503 evex = 0;
6504 break;
6505 }
6506
6507 if ((i.flags[op] & Operand_Mem)
6508 && i.tm.operand_types[op].bitfield.unspecified)
6509 {
6510 if (i.tm.operand_types[op].bitfield.xmmword)
6511 suffixes |= 1 << 6;
6512 if (i.tm.operand_types[op].bitfield.ymmword)
6513 suffixes |= 1 << 7;
6514 if (i.tm.operand_types[op].bitfield.zmmword)
6515 suffixes |= 1 << 8;
6516 if (is_evex_encoding (&i.tm))
6517 evex = EVEX512;
6518 }
6519 }
6520 }
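/* Illustration: Intel syntax "vcvtpd2dq xmm0, [rax]" is ambiguous
   since the memory operand may be XMMWORD or YMMWORD PTR; bits 6 and
   7 get set above and the ambiguity is diagnosed below.  */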
6521
6522 /* Are multiple suffixes / operand sizes allowed? */
6523 if (suffixes & (suffixes - 1))
6524 {
6525 if (intel_syntax
6526 && (!i.tm.opcode_modifier.defaultsize
6527 || operand_check == check_error))
6528 {
6529 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6530 return 0;
6531 }
6532 if (operand_check == check_error)
6533 {
6534 as_bad (_("no instruction mnemonic suffix given and "
6535 "no register operands; can't size `%s'"), i.tm.name);
6536 return 0;
6537 }
6538 if (operand_check == check_warning)
6539 as_warn (_("%s; using default for `%s'"),
6540 intel_syntax
6541 ? _("ambiguous operand size")
6542 : _("no instruction mnemonic suffix given and "
6543 "no register operands"),
6544 i.tm.name);
6545
6546 if (i.tm.opcode_modifier.floatmf)
6547 i.suffix = SHORT_MNEM_SUFFIX;
6548 else if ((i.tm.base_opcode | 8) == 0xfbe
6549 || (i.tm.base_opcode == 0x63
6550 && i.tm.cpu_flags.bitfield.cpu64))
6551 /* handled below */;
6552 else if (evex)
6553 i.tm.opcode_modifier.evex = evex;
6554 else if (flag_code == CODE_16BIT)
6555 i.suffix = WORD_MNEM_SUFFIX;
6556 else if (!i.tm.opcode_modifier.no_lsuf)
6557 i.suffix = LONG_MNEM_SUFFIX;
6558 else
6559 i.suffix = QWORD_MNEM_SUFFIX;
6560 }
6561 }
6562
6563 if ((i.tm.base_opcode | 8) == 0xfbe
6564 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6565 {
6566 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6567 In AT&T syntax, if there is no suffix (warned about above), the default
6568 will be byte extension. */
6569 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6570 i.tm.base_opcode |= 1;
6571
6572 /* For further processing, the suffix should represent the destination
6573 (register). This is already the case when one was used with
6574 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6575 no suffix to begin with. */
6576 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
6577 {
6578 if (i.types[1].bitfield.word)
6579 i.suffix = WORD_MNEM_SUFFIX;
6580 else if (i.types[1].bitfield.qword)
6581 i.suffix = QWORD_MNEM_SUFFIX;
6582 else
6583 i.suffix = LONG_MNEM_SUFFIX;
6584
6585 i.tm.opcode_modifier.w = 0;
6586 }
6587 }
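/* E.g. for unsuffixed AT&T "movzx %al, %cx": the byte source kept the
   byte-source base opcode above, and the suffix now becomes 'w' from
   the %cx destination for the operand-size handling below.  */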
6588
6589 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
6590 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
6591 != (i.tm.operand_types[1].bitfield.class == Reg);
6592
6593 /* Change the opcode based on the operand size given by i.suffix. */
6594 switch (i.suffix)
6595 {
6596 /* Size floating point instruction. */
6597 case LONG_MNEM_SUFFIX:
6598 if (i.tm.opcode_modifier.floatmf)
6599 {
6600 i.tm.base_opcode ^= 4;
6601 break;
6602 }
6603 /* fall through */
6604 case WORD_MNEM_SUFFIX:
6605 case QWORD_MNEM_SUFFIX:
6606 /* It's not a byte, select word/dword operation. */
6607 if (i.tm.opcode_modifier.w)
6608 {
6609 if (i.short_form)
6610 i.tm.base_opcode |= 8;
6611 else
6612 i.tm.base_opcode |= 1;
6613 }
6614 /* fall through */
6615 case SHORT_MNEM_SUFFIX:
6616 /* Now select between word & dword operations via the operand
6617 size prefix, except for instructions that will ignore this
6618 prefix anyway. */
6619 if (i.suffix != QWORD_MNEM_SUFFIX
6620 && !i.tm.opcode_modifier.ignoresize
6621 && !i.tm.opcode_modifier.floatmf
6622 && !is_any_vex_encoding (&i.tm)
6623 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6624 || (flag_code == CODE_64BIT
6625 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
6626 {
6627 unsigned int prefix = DATA_PREFIX_OPCODE;
6628
6629 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
6630 prefix = ADDR_PREFIX_OPCODE;
6631
6632 if (!add_prefix (prefix))
6633 return 0;
6634 }
6635
6636 /* Set mode64 for an operand. */
6637 if (i.suffix == QWORD_MNEM_SUFFIX
6638 && flag_code == CODE_64BIT
6639 && !i.tm.opcode_modifier.norex64
6640 /* Special case for xchg %rax,%rax. It is a NOP and doesn't
6641 need REX.W (rex64). */
6642 && ! (i.operands == 2
6643 && i.tm.base_opcode == 0x90
6644 && i.tm.extension_opcode == None
6645 && i.types[0].bitfield.instance == Accum
6646 && i.types[0].bitfield.qword
6647 && i.types[1].bitfield.instance == Accum
6648 && i.types[1].bitfield.qword))
6649 i.rex |= REX_W;
6650
6651 break;
6652 }
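/* Two common outcomes (illustrative): "incw %ax" in 32-bit mode
   receives an 0x66 operand size prefix above, while "addq %rax, %rbx"
   sets REX_W here; "xchg %rax, %rax" is the documented NOP
   exception.  */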
6653
6654 if (i.tm.opcode_modifier.addrprefixopreg)
6655 {
6656 gas_assert (!i.suffix);
6657 gas_assert (i.reg_operands);
6658
6659 if (i.tm.operand_types[0].bitfield.instance == Accum
6660 || i.operands == 1)
6661 {
6662 /* The address size override prefix changes the size of the
6663 first operand. */
6664 if (flag_code == CODE_64BIT
6665 && i.op[0].regs->reg_type.bitfield.word)
6666 {
6667 as_bad (_("16-bit addressing unavailable for `%s'"),
6668 i.tm.name);
6669 return 0;
6670 }
6671
6672 if ((flag_code == CODE_32BIT
6673 ? i.op[0].regs->reg_type.bitfield.word
6674 : i.op[0].regs->reg_type.bitfield.dword)
6675 && !add_prefix (ADDR_PREFIX_OPCODE))
6676 return 0;
6677 }
6678 else
6679 {
6680 /* Check invalid register operand when the address size override
6681 prefix changes the size of register operands. */
6682 unsigned int op;
6683 enum { need_word, need_dword, need_qword } need;
6684
6685 if (flag_code == CODE_32BIT)
6686 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6687 else if (i.prefix[ADDR_PREFIX])
6688 need = need_dword;
6689 else
6690 need = flag_code == CODE_64BIT ? need_qword : need_word;
6691
6692 for (op = 0; op < i.operands; op++)
6693 {
6694 if (i.types[op].bitfield.class != Reg)
6695 continue;
6696
6697 switch (need)
6698 {
6699 case need_word:
6700 if (i.op[op].regs->reg_type.bitfield.word)
6701 continue;
6702 break;
6703 case need_dword:
6704 if (i.op[op].regs->reg_type.bitfield.dword)
6705 continue;
6706 break;
6707 case need_qword:
6708 if (i.op[op].regs->reg_type.bitfield.qword)
6709 continue;
6710 break;
6711 }
6712
6713 as_bad (_("invalid register operand size for `%s'"),
6714 i.tm.name);
6715 return 0;
6716 }
6717 }
6718 }
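/* AddrPrefixOpReg marks insns such as monitor/mwait whose register
   operands follow the address size rather than the operand size;
   e.g. "monitor %eax, %ecx, %edx" in 64-bit mode is expected to get
   an 0x67 prefix above (a sketch, assuming the current opcode
   table).  */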
6719
6720 return 1;
6721 }
6722
6723 static int
6724 check_byte_reg (void)
6725 {
6726 int op;
6727
6728 for (op = i.operands; --op >= 0;)
6729 {
6730 /* Skip non-register operands. */
6731 if (i.types[op].bitfield.class != Reg)
6732 continue;
6733
6734 /* If this is an eight bit register, it's OK. If it's the 16 or
6735 32 bit version of an eight bit register, we will just use the
6736 low portion, and that's OK too. */
6737 if (i.types[op].bitfield.byte)
6738 continue;
6739
6740 /* I/O port address operands are OK too. */
6741 if (i.tm.operand_types[op].bitfield.instance == RegD
6742 && i.tm.operand_types[op].bitfield.word)
6743 continue;
6744
6745 /* crc32 only wants its source operand checked here. */
6746 if (i.tm.base_opcode == 0xf20f38f0 && op)
6747 continue;
6748
6749 /* Any other register is bad. */
6750 if (i.types[op].bitfield.class == Reg
6751 || i.types[op].bitfield.class == RegMMX
6752 || i.types[op].bitfield.class == RegSIMD
6753 || i.types[op].bitfield.class == SReg
6754 || i.types[op].bitfield.class == RegCR
6755 || i.types[op].bitfield.class == RegDR
6756 || i.types[op].bitfield.class == RegTR)
6757 {
6758 as_bad (_("`%s%s' not allowed with `%s%c'"),
6759 register_prefix,
6760 i.op[op].regs->reg_name,
6761 i.tm.name,
6762 i.suffix);
6763 return 0;
6764 }
6765 }
6766 return 1;
6767 }
6768
6769 static int
6770 check_long_reg (void)
6771 {
6772 int op;
6773
6774 for (op = i.operands; --op >= 0;)
6775 /* Skip non-register operands. */
6776 if (i.types[op].bitfield.class != Reg)
6777 continue;
6778 /* Reject eight bit registers, except where the template requires
6779 them (e.g. movzb). */
6780 else if (i.types[op].bitfield.byte
6781 && (i.tm.operand_types[op].bitfield.class == Reg
6782 || i.tm.operand_types[op].bitfield.instance == Accum)
6783 && (i.tm.operand_types[op].bitfield.word
6784 || i.tm.operand_types[op].bitfield.dword))
6785 {
6786 as_bad (_("`%s%s' not allowed with `%s%c'"),
6787 register_prefix,
6788 i.op[op].regs->reg_name,
6789 i.tm.name,
6790 i.suffix);
6791 return 0;
6792 }
6793 /* Error if the e prefix on a general reg is missing. */
6794 else if (i.types[op].bitfield.word
6795 && (i.tm.operand_types[op].bitfield.class == Reg
6796 || i.tm.operand_types[op].bitfield.instance == Accum)
6797 && i.tm.operand_types[op].bitfield.dword)
6798 {
6799 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6800 register_prefix, i.op[op].regs->reg_name,
6801 i.suffix);
6802 return 0;
6803 }
6804 /* Error if the r prefix on a general reg is present, except for Intel-syntax insns marked ToQword. */
6805 else if (i.types[op].bitfield.qword
6806 && (i.tm.operand_types[op].bitfield.class == Reg
6807 || i.tm.operand_types[op].bitfield.instance == Accum)
6808 && i.tm.operand_types[op].bitfield.dword)
6809 {
6810 if (intel_syntax
6811 && i.tm.opcode_modifier.toqword
6812 && i.types[0].bitfield.class != RegSIMD)
6813 {
6814 /* Convert to QWORD. We want REX byte. */
6815 i.suffix = QWORD_MNEM_SUFFIX;
6816 }
6817 else
6818 {
6819 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6820 register_prefix, i.op[op].regs->reg_name,
6821 i.suffix);
6822 return 0;
6823 }
6824 }
6825 return 1;
6826 }
6827
6828 static int
6829 check_qword_reg (void)
6830 {
6831 int op;
6832
6833 for (op = i.operands; --op >= 0; )
6834 /* Skip non-register operands. */
6835 if (i.types[op].bitfield.class != Reg)
6836 continue;
6837 /* Reject eight bit registers, except where the template requires
6838 them (e.g. movzb). */
6839 else if (i.types[op].bitfield.byte
6840 && (i.tm.operand_types[op].bitfield.class == Reg
6841 || i.tm.operand_types[op].bitfield.instance == Accum)
6842 && (i.tm.operand_types[op].bitfield.word
6843 || i.tm.operand_types[op].bitfield.dword))
6844 {
6845 as_bad (_("`%s%s' not allowed with `%s%c'"),
6846 register_prefix,
6847 i.op[op].regs->reg_name,
6848 i.tm.name,
6849 i.suffix);
6850 return 0;
6851 }
6852 /* Error if the r prefix on a general reg is missing, except for Intel-syntax insns marked ToDword. */
6853 else if ((i.types[op].bitfield.word
6854 || i.types[op].bitfield.dword)
6855 && (i.tm.operand_types[op].bitfield.class == Reg
6856 || i.tm.operand_types[op].bitfield.instance == Accum)
6857 && i.tm.operand_types[op].bitfield.qword)
6858 {
6859 /* Prohibit these changes in the 64bit mode, since the
6860 lowering is more complicated. */
6861 if (intel_syntax
6862 && i.tm.opcode_modifier.todword
6863 && i.types[0].bitfield.class != RegSIMD)
6864 {
6865 /* Convert to DWORD. We don't want REX byte. */
6866 i.suffix = LONG_MNEM_SUFFIX;
6867 }
6868 else
6869 {
6870 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6871 register_prefix, i.op[op].regs->reg_name,
6872 i.suffix);
6873 return 0;
6874 }
6875 }
6876 return 1;
6877 }
6878
6879 static int
6880 check_word_reg (void)
6881 {
6882 int op;
6883 for (op = i.operands; --op >= 0;)
6884 /* Skip non-register operands. */
6885 if (i.types[op].bitfield.class != Reg)
6886 continue;
6887 /* Reject eight bit registers, except where the template requires
6888 them (e.g. movzb). */
6889 else if (i.types[op].bitfield.byte
6890 && (i.tm.operand_types[op].bitfield.class == Reg
6891 || i.tm.operand_types[op].bitfield.instance == Accum)
6892 && (i.tm.operand_types[op].bitfield.word
6893 || i.tm.operand_types[op].bitfield.dword))
6894 {
6895 as_bad (_("`%s%s' not allowed with `%s%c'"),
6896 register_prefix,
6897 i.op[op].regs->reg_name,
6898 i.tm.name,
6899 i.suffix);
6900 return 0;
6901 }
6902 /* Error if the e or r prefix on a general reg is present. */
6903 else if ((i.types[op].bitfield.dword
6904 || i.types[op].bitfield.qword)
6905 && (i.tm.operand_types[op].bitfield.class == Reg
6906 || i.tm.operand_types[op].bitfield.instance == Accum)
6907 && i.tm.operand_types[op].bitfield.word)
6908 {
6909 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6910 register_prefix, i.op[op].regs->reg_name,
6911 i.suffix);
6912 return 0;
6913 }
6914 return 1;
6915 }
6916
6917 static int
6918 update_imm (unsigned int j)
6919 {
6920 i386_operand_type overlap = i.types[j];
6921 if ((overlap.bitfield.imm8
6922 || overlap.bitfield.imm8s
6923 || overlap.bitfield.imm16
6924 || overlap.bitfield.imm32
6925 || overlap.bitfield.imm32s
6926 || overlap.bitfield.imm64)
6927 && !operand_type_equal (&overlap, &imm8)
6928 && !operand_type_equal (&overlap, &imm8s)
6929 && !operand_type_equal (&overlap, &imm16)
6930 && !operand_type_equal (&overlap, &imm32)
6931 && !operand_type_equal (&overlap, &imm32s)
6932 && !operand_type_equal (&overlap, &imm64))
6933 {
6934 if (i.suffix)
6935 {
6936 i386_operand_type temp;
6937
6938 operand_type_set (&temp, 0);
6939 if (i.suffix == BYTE_MNEM_SUFFIX)
6940 {
6941 temp.bitfield.imm8 = overlap.bitfield.imm8;
6942 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6943 }
6944 else if (i.suffix == WORD_MNEM_SUFFIX)
6945 temp.bitfield.imm16 = overlap.bitfield.imm16;
6946 else if (i.suffix == QWORD_MNEM_SUFFIX)
6947 {
6948 temp.bitfield.imm64 = overlap.bitfield.imm64;
6949 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6950 }
6951 else
6952 temp.bitfield.imm32 = overlap.bitfield.imm32;
6953 overlap = temp;
6954 }
6955 else if (operand_type_equal (&overlap, &imm16_32_32s)
6956 || operand_type_equal (&overlap, &imm16_32)
6957 || operand_type_equal (&overlap, &imm16_32s))
6958 {
6959 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6960 overlap = imm16;
6961 else
6962 overlap = imm32s;
6963 }
6964 if (!operand_type_equal (&overlap, &imm8)
6965 && !operand_type_equal (&overlap, &imm8s)
6966 && !operand_type_equal (&overlap, &imm16)
6967 && !operand_type_equal (&overlap, &imm32)
6968 && !operand_type_equal (&overlap, &imm32s)
6969 && !operand_type_equal (&overlap, &imm64))
6970 {
6971 as_bad (_("no instruction mnemonic suffix given; "
6972 "can't determine immediate size"));
6973 return 0;
6974 }
6975 }
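/* Illustration: "pushw $0x1234" narrows the overlap to imm16 via the
   suffix above, while an unsuffixed "push $0x12345" in 32-bit code
   falls into the imm16/imm32s case and resolves to imm32s.  */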
6976 i.types[j] = overlap;
6977
6978 return 1;
6979 }
6980
6981 static int
6982 finalize_imm (void)
6983 {
6984 unsigned int j, n;
6985
6986 /* Update the first 2 immediate operands. */
6987 n = i.operands > 2 ? 2 : i.operands;
6988 if (n)
6989 {
6990 for (j = 0; j < n; j++)
6991 if (update_imm (j) == 0)
6992 return 0;
6993
6994 /* The 3rd operand can't be an immediate operand. */
6995 gas_assert (operand_type_check (i.types[2], imm) == 0);
6996 }
6997
6998 return 1;
6999 }
7000
7001 static int
7002 process_operands (void)
7003 {
7004 /* Default segment register this instruction will use for memory
7005 accesses. 0 means unknown. This is only for optimizing out
7006 unnecessary segment overrides. */
7007 const seg_entry *default_seg = 0;
7008
7009 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7010 {
7011 unsigned int dupl = i.operands;
7012 unsigned int dest = dupl - 1;
7013 unsigned int j;
7014
7015 /* The destination must be an xmm register. */
7016 gas_assert (i.reg_operands
7017 && MAX_OPERANDS > dupl
7018 && operand_type_equal (&i.types[dest], &regxmm));
7019
7020 if (i.tm.operand_types[0].bitfield.instance == Accum
7021 && i.tm.operand_types[0].bitfield.xmmword)
7022 {
7023 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7024 {
7025 /* Keep xmm0 for instructions with VEX prefix and 3
7026 sources. */
7027 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7028 i.tm.operand_types[0].bitfield.class = RegSIMD;
7029 goto duplicate;
7030 }
7031 else
7032 {
7033 /* We remove the first xmm0 and keep the number of
7034 operands unchanged, which in fact duplicates the
7035 destination. */
7036 for (j = 1; j < i.operands; j++)
7037 {
7038 i.op[j - 1] = i.op[j];
7039 i.types[j - 1] = i.types[j];
7040 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7041 i.flags[j - 1] = i.flags[j];
7042 }
7043 }
7044 }
7045 else if (i.tm.opcode_modifier.implicit1stxmm0)
7046 {
7047 gas_assert ((MAX_OPERANDS - 1) > dupl
7048 && (i.tm.opcode_modifier.vexsources
7049 == VEX3SOURCES));
7050
7051 /* Add the implicit xmm0 for instructions with VEX prefix
7052 and 3 sources. */
7053 for (j = i.operands; j > 0; j--)
7054 {
7055 i.op[j] = i.op[j - 1];
7056 i.types[j] = i.types[j - 1];
7057 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7058 i.flags[j] = i.flags[j - 1];
7059 }
7060 i.op[0].regs
7061 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7062 i.types[0] = regxmm;
7063 i.tm.operand_types[0] = regxmm;
7064
7065 i.operands += 2;
7066 i.reg_operands += 2;
7067 i.tm.operands += 2;
7068
7069 dupl++;
7070 dest++;
7071 i.op[dupl] = i.op[dest];
7072 i.types[dupl] = i.types[dest];
7073 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7074 i.flags[dupl] = i.flags[dest];
7075 }
7076 else
7077 {
7078 duplicate:
7079 i.operands++;
7080 i.reg_operands++;
7081 i.tm.operands++;
7082
7083 i.op[dupl] = i.op[dest];
7084 i.types[dupl] = i.types[dest];
7085 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7086 i.flags[dupl] = i.flags[dest];
7087 }
7088
7089 if (i.tm.opcode_modifier.immext)
7090 process_immext ();
7091 }
7092 else if (i.tm.operand_types[0].bitfield.instance == Accum
7093 && i.tm.operand_types[0].bitfield.xmmword)
7094 {
7095 unsigned int j;
7096
7097 for (j = 1; j < i.operands; j++)
7098 {
7099 i.op[j - 1] = i.op[j];
7100 i.types[j - 1] = i.types[j];
7101
7102 /* We need to adjust fields in i.tm since they are used by
7103 build_modrm_byte. */
7104 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7105
7106 i.flags[j - 1] = i.flags[j];
7107 }
7108
7109 i.operands--;
7110 i.reg_operands--;
7111 i.tm.operands--;
7112 }
7113 else if (i.tm.opcode_modifier.implicitquadgroup)
7114 {
7115 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7116
7117 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7118 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7119 regnum = register_number (i.op[1].regs);
7120 first_reg_in_group = regnum & ~3;
7121 last_reg_in_group = first_reg_in_group + 3;
7122 if (regnum != first_reg_in_group)
7123 as_warn (_("source register `%s%s' implicitly denotes"
7124 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7125 register_prefix, i.op[1].regs->reg_name,
7126 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7127 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7128 i.tm.name);
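/* A sketch, assuming the current opcode table: for
   "v4fmaddps (%rcx), %zmm5, %zmm0" this would warn that the source
   group is really %zmm4..%zmm7.  */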
7129 }
7130 else if (i.tm.opcode_modifier.regkludge)
7131 {
7132 /* The imul $imm, %reg instruction is converted into
7133 imul $imm, %reg, %reg, and the clr %reg instruction
7134 is converted into xor %reg, %reg. */
7135
7136 unsigned int first_reg_op;
7137
7138 if (operand_type_check (i.types[0], reg))
7139 first_reg_op = 0;
7140 else
7141 first_reg_op = 1;
7142 /* Pretend we saw the extra register operand. */
7143 gas_assert (i.reg_operands == 1
7144 && i.op[first_reg_op + 1].regs == 0);
7145 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7146 i.types[first_reg_op + 1] = i.types[first_reg_op];
7147 i.operands++;
7148 i.reg_operands++;
7149 }
7150
7151 if (i.tm.opcode_modifier.modrm)
7152 {
7153 /* The opcode is completed (modulo i.tm.extension_opcode which
7154 must be put into the modrm byte). Now, we make the modrm and
7155 index base bytes based on all the info we've collected. */
7156
7157 default_seg = build_modrm_byte ();
7158 }
7159 else if (i.types[0].bitfield.class == SReg)
7160 {
7161 if (flag_code != CODE_64BIT
7162 ? i.tm.base_opcode == POP_SEG_SHORT
7163 && i.op[0].regs->reg_num == 1
7164 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7165 && i.op[0].regs->reg_num < 4)
7166 {
7167 as_bad (_("you can't `%s %s%s'"),
7168 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7169 return 0;
7170 }
7171 if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7172 {
7173 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7174 i.tm.opcode_length = 2;
7175 }
7176 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
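/* E.g. in 32-bit code "push %es" encodes as 0x06 (reg_num 0) and
   "pop %ds" as 0x1f (0x07 | 3 << 3); %fs/%gs were switched to the
   two-byte 0x0f-prefixed form just above, and "pop %cs" was rejected
   earlier.  (Illustrative.)  */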
7177 }
7178 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7179 {
7180 default_seg = &ds;
7181 }
7182 else if (i.tm.opcode_modifier.isstring)
7183 {
7184 /* For the string instructions that allow a segment override
7185 on one of their operands, the default segment is ds. */
7186 default_seg = &ds;
7187 }
7188 else if (i.short_form)
7189 {
7190 /* The register or float register operand is in operand
7191 0 or 1. */
7192 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7193
7194 /* Register goes in low 3 bits of opcode. */
7195 i.tm.base_opcode |= i.op[op].regs->reg_num;
7196 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7197 i.rex |= REX_B;
7198 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7199 {
7200 /* Warn about some common errors, but press on regardless.
7201 The first case can be generated by gcc (<= 2.8.1). */
7202 if (i.operands == 2)
7203 {
7204 /* Reversed arguments on faddp, fsubp, etc. */
7205 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7206 register_prefix, i.op[!intel_syntax].regs->reg_name,
7207 register_prefix, i.op[intel_syntax].regs->reg_name);
7208 }
7209 else
7210 {
7211 /* Extraneous `l' suffix on fp insn. */
7212 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7213 register_prefix, i.op[0].regs->reg_name);
7214 }
7215 }
7216 }
7217
7218 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7219 && i.tm.base_opcode == 0x8d /* lea */
7220 && !is_any_vex_encoding (&i.tm))
7221 {
7222 if (!quiet_warnings)
7223 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7224 if (optimize)
7225 {
7226 i.seg[0] = NULL;
7227 i.prefix[SEG_PREFIX] = 0;
7228 }
7229 }
7230
7231 /* If a segment was explicitly specified, and the specified segment
7232 is neither the default nor the one already recorded from a prefix,
7233 use an opcode prefix to select it. If we never figured out what
7234 the default segment is, then default_seg will be zero at this
7235 point, and the specified segment prefix will always be used. */
7236 if (i.seg[0]
7237 && i.seg[0] != default_seg
7238 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7239 {
7240 if (!add_prefix (i.seg[0]->seg_prefix))
7241 return 0;
7242 }
7243 return 1;
7244 }
7245
7246 static const seg_entry *
7247 build_modrm_byte (void)
7248 {
7249 const seg_entry *default_seg = 0;
7250 unsigned int source, dest;
7251 int vex_3_sources;
7252
7253 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7254 if (vex_3_sources)
7255 {
7256 unsigned int nds, reg_slot;
7257 expressionS *exp;
7258
7259 dest = i.operands - 1;
7260 nds = dest - 1;
7261
7262 /* There are 2 kinds of instructions:
7263 1. 5 operands: 4 register operands or 3 register operands
7264 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7265 VexW0 or VexW1. The destination must be an XMM, YMM or
7266 ZMM register.
7267 2. 4 operands: 4 register operands or 3 register operands
7268 plus 1 memory operand, with VexXDS. */
7269 gas_assert ((i.reg_operands == 4
7270 || (i.reg_operands == 3 && i.mem_operands == 1))
7271 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7272 && i.tm.opcode_modifier.vexw
7273 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7274
7275 /* If VexW1 is set, the first non-immediate operand is the source and
7276 the second non-immediate one is encoded in the immediate operand. */
7277 if (i.tm.opcode_modifier.vexw == VEXW1)
7278 {
7279 source = i.imm_operands;
7280 reg_slot = i.imm_operands + 1;
7281 }
7282 else
7283 {
7284 source = i.imm_operands + 1;
7285 reg_slot = i.imm_operands;
7286 }
7287
7288 if (i.imm_operands == 0)
7289 {
7290 /* When there is no immediate operand, generate an 8bit
7291 immediate operand to encode the first operand. */
7292 exp = &im_expressions[i.imm_operands++];
7293 i.op[i.operands].imms = exp;
7294 i.types[i.operands] = imm8;
7295 i.operands++;
7296
7297 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7298 exp->X_op = O_constant;
7299 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7300 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7301 }
7302 else
7303 {
7304 gas_assert (i.imm_operands == 1);
7305 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7306 gas_assert (!i.tm.opcode_modifier.immext);
7307
7308 /* Turn on Imm8 again so that output_imm will generate it. */
7309 i.types[0].bitfield.imm8 = 1;
7310
7311 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7312 i.op[0].imms->X_add_number
7313 |= register_number (i.op[reg_slot].regs) << 4;
7314 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7315 }
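/* Either way the extra source register number lands in the high
   nibble of the imm8 (e.g. %xmm5 contributes 0x50), leaving the low
   4 bits for a user-supplied Imm4, as in the FMA4/XOP style
   encodings.  (Illustrative.)  */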
7316
7317 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7318 i.vex.register_specifier = i.op[nds].regs;
7319 }
7320 else
7321 source = dest = 0;
7322
7323 /* i.reg_operands MUST be the number of real register operands;
7324 implicit registers do not count. If there are 3 register
7325 operands, it must be an instruction with VexNDS. For an
7326 instruction with VexNDD, the destination register is encoded
7327 in the VEX prefix. If there are 4 register operands, it must
7328 be an instruction with a VEX prefix and 3 sources. */
7329 if (i.mem_operands == 0
7330 && ((i.reg_operands == 2
7331 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7332 || (i.reg_operands == 3
7333 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7334 || (i.reg_operands == 4 && vex_3_sources)))
7335 {
7336 switch (i.operands)
7337 {
7338 case 2:
7339 source = 0;
7340 break;
7341 case 3:
7342 /* When there are 3 operands, one of them may be an immediate,
7343 which may be the first or the last operand. Otherwise,
7344 the first operand must be the shift count register (%cl), or
7345 it is an instruction with VexNDS. */
7346 gas_assert (i.imm_operands == 1
7347 || (i.imm_operands == 0
7348 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7349 || (i.types[0].bitfield.instance == RegC
7350 && i.types[0].bitfield.byte))));
7351 if (operand_type_check (i.types[0], imm)
7352 || (i.types[0].bitfield.instance == RegC
7353 && i.types[0].bitfield.byte))
7354 source = 1;
7355 else
7356 source = 0;
7357 break;
7358 case 4:
7359 /* When there are 4 operands, the first two must be 8bit
7360 immediate operands. The source operand will be the 3rd
7361 one.
7362
7363 For instructions with VexNDS, if the first operand is
7364 an imm8, the source operand is the 2nd one. If the last
7365 operand is an imm8, the source operand is the first one. */
7366 gas_assert ((i.imm_operands == 2
7367 && i.types[0].bitfield.imm8
7368 && i.types[1].bitfield.imm8)
7369 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7370 && i.imm_operands == 1
7371 && (i.types[0].bitfield.imm8
7372 || i.types[i.operands - 1].bitfield.imm8
7373 || i.rounding)));
7374 if (i.imm_operands == 2)
7375 source = 2;
7376 else
7377 {
7378 if (i.types[0].bitfield.imm8)
7379 source = 1;
7380 else
7381 source = 0;
7382 }
7383 break;
7384 case 5:
7385 if (is_evex_encoding (&i.tm))
7386 {
7387 /* For EVEX instructions, when there are 5 operands, the
7388 first one must be an immediate operand. If the second one
7389 is an immediate operand, the source operand is the 3rd
7390 one. If the last one is an immediate operand, the source
7391 operand is the 2nd one. */
7392 gas_assert (i.imm_operands == 2
7393 && i.tm.opcode_modifier.sae
7394 && operand_type_check (i.types[0], imm));
7395 if (operand_type_check (i.types[1], imm))
7396 source = 2;
7397 else if (operand_type_check (i.types[4], imm))
7398 source = 1;
7399 else
7400 abort ();
7401 }
7402 break;
7403 default:
7404 abort ();
7405 }
7406
7407 if (!vex_3_sources)
7408 {
7409 dest = source + 1;
7410
7411 /* The RC/SAE operand could be between DEST and SRC. That happens
7412 when one operand is a GPR and the other one is an XMM/YMM/ZMM
7413 register. */
7414 if (i.rounding && i.rounding->operand == (int) dest)
7415 dest++;
7416
7417 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7418 {
7419 /* For instructions with VexNDS, the register-only source
7420 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7421 register. It is encoded in VEX prefix. */
7422
7423 i386_operand_type op;
7424 unsigned int vvvv;
7425
7426 /* Check register-only source operand when two source
7427 operands are swapped. */
7428 if (!i.tm.operand_types[source].bitfield.baseindex
7429 && i.tm.operand_types[dest].bitfield.baseindex)
7430 {
7431 vvvv = source;
7432 source = dest;
7433 }
7434 else
7435 vvvv = dest;
7436
7437 op = i.tm.operand_types[vvvv];
7438 if ((dest + 1) >= i.operands
7439 || ((op.bitfield.class != Reg
7440 || (!op.bitfield.dword && !op.bitfield.qword))
7441 && op.bitfield.class != RegSIMD
7442 && !operand_type_equal (&op, &regmask)))
7443 abort ();
7444 i.vex.register_specifier = i.op[vvvv].regs;
7445 dest++;
7446 }
7447 }
7448
7449 i.rm.mode = 3;
7450 /* One of the register operands will be encoded in the i.rm.reg
7451 field, the other in the combined i.rm.mode and i.rm.regmem
7452 fields. If no form of this instruction supports a memory
7453 destination operand, then we assume the source operand may
7454 sometimes be a memory operand and so we need to store the
7455 destination in the i.rm.reg field. */
7456 if (!i.tm.opcode_modifier.regmem
7457 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7458 {
7459 i.rm.reg = i.op[dest].regs->reg_num;
7460 i.rm.regmem = i.op[source].regs->reg_num;
7461 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7462 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7463 i.has_regmmx = TRUE;
7464 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7465 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7466 {
7467 if (i.types[dest].bitfield.zmmword
7468 || i.types[source].bitfield.zmmword)
7469 i.has_regzmm = TRUE;
7470 else if (i.types[dest].bitfield.ymmword
7471 || i.types[source].bitfield.ymmword)
7472 i.has_regymm = TRUE;
7473 else
7474 i.has_regxmm = TRUE;
7475 }
7476 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7477 i.rex |= REX_R;
7478 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7479 i.vrex |= REX_R;
7480 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7481 i.rex |= REX_B;
7482 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7483 i.vrex |= REX_B;
7484 }
7485 else
7486 {
7487 i.rm.reg = i.op[source].regs->reg_num;
7488 i.rm.regmem = i.op[dest].regs->reg_num;
7489 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7490 i.rex |= REX_B;
7491 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7492 i.vrex |= REX_B;
7493 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7494 i.rex |= REX_R;
7495 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7496 i.vrex |= REX_R;
7497 }
7498 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7499 {
7500 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7501 abort ();
7502 i.rex &= ~REX_R;
7503 add_prefix (LOCK_PREFIX_OPCODE);
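/* E.g. "mov %cr8, %eax" in 32-bit mode: with no REX.R available, the
   LOCK prefix (an AMD extension) selects control registers 8-15
   instead.  (Illustrative.)  */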
7504 }
7505 }
7506 else
7507 { /* If it's not 2 reg operands... */
7508 unsigned int mem;
7509
7510 if (i.mem_operands)
7511 {
7512 unsigned int fake_zero_displacement = 0;
7513 unsigned int op;
7514
7515 for (op = 0; op < i.operands; op++)
7516 if (i.flags[op] & Operand_Mem)
7517 break;
7518 gas_assert (op < i.operands);
7519
7520 if (i.tm.opcode_modifier.vecsib)
7521 {
7522 if (i.index_reg->reg_num == RegIZ)
7523 abort ();
7524
7525 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7526 if (!i.base_reg)
7527 {
7528 i.sib.base = NO_BASE_REGISTER;
7529 i.sib.scale = i.log2_scale_factor;
7530 i.types[op].bitfield.disp8 = 0;
7531 i.types[op].bitfield.disp16 = 0;
7532 i.types[op].bitfield.disp64 = 0;
7533 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7534 {
7535 /* Must be 32 bit */
7536 i.types[op].bitfield.disp32 = 1;
7537 i.types[op].bitfield.disp32s = 0;
7538 }
7539 else
7540 {
7541 i.types[op].bitfield.disp32 = 0;
7542 i.types[op].bitfield.disp32s = 1;
7543 }
7544 }
7545 i.sib.index = i.index_reg->reg_num;
7546 if ((i.index_reg->reg_flags & RegRex) != 0)
7547 i.rex |= REX_X;
7548 if ((i.index_reg->reg_flags & RegVRex) != 0)
7549 i.vrex |= REX_X;
7550 }
7551
7552 default_seg = &ds;
7553
7554 if (i.base_reg == 0)
7555 {
7556 i.rm.mode = 0;
7557 if (!i.disp_operands)
7558 fake_zero_displacement = 1;
7559 if (i.index_reg == 0)
7560 {
7561 i386_operand_type newdisp;
7562
7563 gas_assert (!i.tm.opcode_modifier.vecsib);
7564 /* Operand is just <disp> */
7565 if (flag_code == CODE_64BIT)
7566 {
7567 /* In 64-bit mode, 32-bit absolute addressing is
7568 replaced by RIP-relative addressing, and plain
7569 absolute addressing has to be encoded via one of
7570 the redundant SIB forms. */
7571 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7572 i.sib.base = NO_BASE_REGISTER;
7573 i.sib.index = NO_INDEX_REGISTER;
7574 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7575 }
7576 else if ((flag_code == CODE_16BIT)
7577 ^ (i.prefix[ADDR_PREFIX] != 0))
7578 {
7579 i.rm.regmem = NO_BASE_REGISTER_16;
7580 newdisp = disp16;
7581 }
7582 else
7583 {
7584 i.rm.regmem = NO_BASE_REGISTER;
7585 newdisp = disp32;
7586 }
7587 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7588 i.types[op] = operand_type_or (i.types[op], newdisp);
7589 }
7590 else if (!i.tm.opcode_modifier.vecsib)
7591 {
7592 /* !i.base_reg && i.index_reg */
7593 if (i.index_reg->reg_num == RegIZ)
7594 i.sib.index = NO_INDEX_REGISTER;
7595 else
7596 i.sib.index = i.index_reg->reg_num;
7597 i.sib.base = NO_BASE_REGISTER;
7598 i.sib.scale = i.log2_scale_factor;
7599 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7600 i.types[op].bitfield.disp8 = 0;
7601 i.types[op].bitfield.disp16 = 0;
7602 i.types[op].bitfield.disp64 = 0;
7603 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7604 {
7605 /* Must be 32 bit */
7606 i.types[op].bitfield.disp32 = 1;
7607 i.types[op].bitfield.disp32s = 0;
7608 }
7609 else
7610 {
7611 i.types[op].bitfield.disp32 = 0;
7612 i.types[op].bitfield.disp32s = 1;
7613 }
7614 if ((i.index_reg->reg_flags & RegRex) != 0)
7615 i.rex |= REX_X;
7616 }
7617 }
7618 /* RIP addressing for 64bit mode. */
7619 else if (i.base_reg->reg_num == RegIP)
7620 {
7621 gas_assert (!i.tm.opcode_modifier.vecsib);
7622 i.rm.regmem = NO_BASE_REGISTER;
7623 i.types[op].bitfield.disp8 = 0;
7624 i.types[op].bitfield.disp16 = 0;
7625 i.types[op].bitfield.disp32 = 0;
7626 i.types[op].bitfield.disp32s = 1;
7627 i.types[op].bitfield.disp64 = 0;
7628 i.flags[op] |= Operand_PCrel;
7629 if (! i.disp_operands)
7630 fake_zero_displacement = 1;
7631 }
7632 else if (i.base_reg->reg_type.bitfield.word)
7633 {
7634 gas_assert (!i.tm.opcode_modifier.vecsib);
7635 switch (i.base_reg->reg_num)
7636 {
7637 case 3: /* (%bx) */
7638 if (i.index_reg == 0)
7639 i.rm.regmem = 7;
7640 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7641 i.rm.regmem = i.index_reg->reg_num - 6;
7642 break;
7643 case 5: /* (%bp) */
7644 default_seg = &ss;
7645 if (i.index_reg == 0)
7646 {
7647 i.rm.regmem = 6;
7648 if (operand_type_check (i.types[op], disp) == 0)
7649 {
7650 /* fake (%bp) into 0(%bp) */
7651 i.types[op].bitfield.disp8 = 1;
7652 fake_zero_displacement = 1;
7653 }
7654 }
7655 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7656 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7657 break;
7658 default: /* (%si) -> 4 or (%di) -> 5 */
7659 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7660 }
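/* The resulting 16-bit r/m values, for reference:
   (%bx,%si)=0 (%bx,%di)=1 (%bp,%si)=2 (%bp,%di)=3
   (%si)=4 (%di)=5 disp16-or-(%bp)=6 (%bx)=7.  */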
7661 i.rm.mode = mode_from_disp_size (i.types[op]);
7662 }
7663 else /* i.base_reg and 32/64 bit mode */
7664 {
7665 if (flag_code == CODE_64BIT
7666 && operand_type_check (i.types[op], disp))
7667 {
7668 i.types[op].bitfield.disp16 = 0;
7669 i.types[op].bitfield.disp64 = 0;
7670 if (i.prefix[ADDR_PREFIX] == 0)
7671 {
7672 i.types[op].bitfield.disp32 = 0;
7673 i.types[op].bitfield.disp32s = 1;
7674 }
7675 else
7676 {
7677 i.types[op].bitfield.disp32 = 1;
7678 i.types[op].bitfield.disp32s = 0;
7679 }
7680 }
7681
7682 if (!i.tm.opcode_modifier.vecsib)
7683 i.rm.regmem = i.base_reg->reg_num;
7684 if ((i.base_reg->reg_flags & RegRex) != 0)
7685 i.rex |= REX_B;
7686 i.sib.base = i.base_reg->reg_num;
7687 /* x86-64 ignores REX prefix bit here to avoid decoder
7688 complications. */
7689 if (!(i.base_reg->reg_flags & RegRex)
7690 && (i.base_reg->reg_num == EBP_REG_NUM
7691 || i.base_reg->reg_num == ESP_REG_NUM))
7692 default_seg = &ss;
7693 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7694 {
7695 fake_zero_displacement = 1;
7696 i.types[op].bitfield.disp8 = 1;
7697 }
7698 i.sib.scale = i.log2_scale_factor;
7699 if (i.index_reg == 0)
7700 {
7701 gas_assert (!i.tm.opcode_modifier.vecsib);
7702 /* <disp>(%esp) becomes a two-byte modrm with no index
7703 register. We've already stored the code for %esp
7704 in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7705 Any base register besides %esp will not use the
7706 extra modrm byte. */
7707 i.sib.index = NO_INDEX_REGISTER;
7708 }
7709 else if (!i.tm.opcode_modifier.vecsib)
7710 {
7711 if (i.index_reg->reg_num == RegIZ)
7712 i.sib.index = NO_INDEX_REGISTER;
7713 else
7714 i.sib.index = i.index_reg->reg_num;
7715 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7716 if ((i.index_reg->reg_flags & RegRex) != 0)
7717 i.rex |= REX_X;
7718 }
7719
7720 if (i.disp_operands
7721 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7722 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7723 i.rm.mode = 0;
7724 else
7725 {
7726 if (!fake_zero_displacement
7727 && !i.disp_operands
7728 && i.disp_encoding)
7729 {
7730 fake_zero_displacement = 1;
7731 if (i.disp_encoding == disp_encoding_8bit)
7732 i.types[op].bitfield.disp8 = 1;
7733 else
7734 i.types[op].bitfield.disp32 = 1;
7735 }
7736 i.rm.mode = mode_from_disp_size (i.types[op]);
7737 }
7738 }
7739
7740 if (fake_zero_displacement)
7741 {
7742 /* Fakes a zero displacement assuming that i.types[op]
7743 holds the correct displacement size. */
7744 expressionS *exp;
7745
7746 gas_assert (i.op[op].disps == 0);
7747 exp = &disp_expressions[i.disp_operands++];
7748 i.op[op].disps = exp;
7749 exp->X_op = O_constant;
7750 exp->X_add_number = 0;
7751 exp->X_add_symbol = (symbolS *) 0;
7752 exp->X_op_symbol = (symbolS *) 0;
7753 }
7754
7755 mem = op;
7756 }
7757 else
7758 mem = ~0;
7759
7760 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7761 {
7762 if (operand_type_check (i.types[0], imm))
7763 i.vex.register_specifier = NULL;
7764 else
7765 {
7766 /* VEX.vvvv encodes one of the sources when the first
7767 operand is not an immediate. */
7768 if (i.tm.opcode_modifier.vexw == VEXW0)
7769 i.vex.register_specifier = i.op[0].regs;
7770 else
7771 i.vex.register_specifier = i.op[1].regs;
7772 }
7773
7774 /* Destination is a XMM register encoded in the ModRM.reg
7775 and VEX.R bit. */
7776 i.rm.reg = i.op[2].regs->reg_num;
7777 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7778 i.rex |= REX_R;
7779
7780 /* ModRM.rm and VEX.B encodes the other source. */
7781 if (!i.mem_operands)
7782 {
7783 i.rm.mode = 3;
7784
7785 if (i.tm.opcode_modifier.vexw == VEXW0)
7786 i.rm.regmem = i.op[1].regs->reg_num;
7787 else
7788 i.rm.regmem = i.op[0].regs->reg_num;
7789
7790 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7791 i.rex |= REX_B;
7792 }
7793 }
7794 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7795 {
7796 i.vex.register_specifier = i.op[2].regs;
7797 if (!i.mem_operands)
7798 {
7799 i.rm.mode = 3;
7800 i.rm.regmem = i.op[1].regs->reg_num;
7801 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7802 i.rex |= REX_B;
7803 }
7804 }
7805 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7806 (if any) based on i.tm.extension_opcode. Again, we must be
7807 careful to make sure that segment/control/debug/test/MMX
7808 registers are coded into the i.rm.reg field. */
7809 else if (i.reg_operands)
7810 {
7811 unsigned int op;
7812 unsigned int vex_reg = ~0;
7813
7814 for (op = 0; op < i.operands; op++)
7815 {
7816 if (i.types[op].bitfield.class == Reg
7817 || i.types[op].bitfield.class == RegBND
7818 || i.types[op].bitfield.class == RegMask
7819 || i.types[op].bitfield.class == SReg
7820 || i.types[op].bitfield.class == RegCR
7821 || i.types[op].bitfield.class == RegDR
7822 || i.types[op].bitfield.class == RegTR)
7823 break;
7824 if (i.types[op].bitfield.class == RegSIMD)
7825 {
7826 if (i.types[op].bitfield.zmmword)
7827 i.has_regzmm = TRUE;
7828 else if (i.types[op].bitfield.ymmword)
7829 i.has_regymm = TRUE;
7830 else
7831 i.has_regxmm = TRUE;
7832 break;
7833 }
7834 if (i.types[op].bitfield.class == RegMMX)
7835 {
7836 i.has_regmmx = TRUE;
7837 break;
7838 }
7839 }
7840
7841 if (vex_3_sources)
7842 op = dest;
7843 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7844 {
7845 /* For instructions with VexNDS, the register-only
7846 source operand is encoded in VEX prefix. */
7847 gas_assert (mem != (unsigned int) ~0);
7848
7849 if (op > mem)
7850 {
7851 vex_reg = op++;
7852 gas_assert (op < i.operands);
7853 }
7854 else
7855 {
7856 /* Check register-only source operand when two source
7857 operands are swapped. */
7858 if (!i.tm.operand_types[op].bitfield.baseindex
7859 && i.tm.operand_types[op + 1].bitfield.baseindex)
7860 {
7861 vex_reg = op;
7862 op += 2;
7863 gas_assert (mem == (vex_reg + 1)
7864 && op < i.operands);
7865 }
7866 else
7867 {
7868 vex_reg = op + 1;
7869 gas_assert (vex_reg < i.operands);
7870 }
7871 }
7872 }
7873 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7874 {
7875 /* For instructions with VexNDD, the register destination
7876 is encoded in VEX prefix. */
7877 if (i.mem_operands == 0)
7878 {
7879 /* There is no memory operand. */
7880 gas_assert ((op + 2) == i.operands);
7881 vex_reg = op + 1;
7882 }
7883 else
7884 {
7885 /* There are only 2 non-immediate operands. */
7886 gas_assert (op < i.imm_operands + 2
7887 && i.operands == i.imm_operands + 2);
7888 vex_reg = i.imm_operands + 1;
7889 }
7890 }
7891 else
7892 gas_assert (op < i.operands);
7893
7894 if (vex_reg != (unsigned int) ~0)
7895 {
7896 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7897
7898 if ((type->bitfield.class != Reg
7899 || (!type->bitfield.dword && !type->bitfield.qword))
7900 && type->bitfield.class != RegSIMD
7901 && !operand_type_equal (type, &regmask))
7902 abort ();
7903
7904 i.vex.register_specifier = i.op[vex_reg].regs;
7905 }
7906
7907 /* Don't set OP operand twice. */
7908 if (vex_reg != op)
7909 {
7910 /* If there is an extension opcode to put here, the
7911 register number must be put into the regmem field. */
7912 if (i.tm.extension_opcode != None)
7913 {
7914 i.rm.regmem = i.op[op].regs->reg_num;
7915 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7916 i.rex |= REX_B;
7917 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7918 i.vrex |= REX_B;
7919 }
7920 else
7921 {
7922 i.rm.reg = i.op[op].regs->reg_num;
7923 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7924 i.rex |= REX_R;
7925 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7926 i.vrex |= REX_R;
7927 }
7928 }
7929
7930 /* If no memory operand has set i.rm.mode to 0, 1 or 2, we must
7931 set it to 3 to indicate that this is a register operand in the
7932 regmem field. */
7933 if (!i.mem_operands)
7934 i.rm.mode = 3;
7935 }
7936
7937 /* Fill in i.rm.reg field with extension opcode (if any). */
7938 if (i.tm.extension_opcode != None)
7939 i.rm.reg = i.tm.extension_opcode;
7940 }
7941 return default_seg;
7942 }
7943
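/* Explanatory note (not in the original source): given the caller's
   current CODE16 state, flip_code16 returns CODE16 if a 66h data size
   prefix flips the branch displacement between 16 and 32 bits (i.e.
   REX.W is absent and the template has a displacement of the other
   size), else 0.  The callers XOR the result into their code16 flag.  */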
7944 static unsigned int
7945 flip_code16 (unsigned int code16)
7946 {
7947 gas_assert (i.tm.operands == 1);
7948
7949 return !(i.prefix[REX_PREFIX] & REX_W)
7950 && (code16 ? i.tm.operand_types[0].bitfield.disp32
7951 || i.tm.operand_types[0].bitfield.disp32s
7952 : i.tm.operand_types[0].bitfield.disp16)
7953 ? CODE16 : 0;
7954 }
7955
7956 static void
7957 output_branch (void)
7958 {
7959 char *p;
7960 int size;
7961 int code16;
7962 int prefix;
7963 relax_substateT subtype;
7964 symbolS *sym;
7965 offsetT off;
7966
7967 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7968 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7969
7970 prefix = 0;
7971 if (i.prefix[DATA_PREFIX] != 0)
7972 {
7973 prefix = 1;
7974 i.prefixes -= 1;
7975 code16 ^= flip_code16(code16);
7976 }
7977 /* Pentium4 branch hints. */
7978 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7979 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7980 {
7981 prefix++;
7982 i.prefixes--;
7983 }
7984 if (i.prefix[REX_PREFIX] != 0)
7985 {
7986 prefix++;
7987 i.prefixes--;
7988 }
7989
7990 /* BND prefixed jump. */
7991 if (i.prefix[BND_PREFIX] != 0)
7992 {
7993 prefix++;
7994 i.prefixes--;
7995 }
7996
7997 if (i.prefixes != 0)
7998 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
7999
8000 /* It's always a symbol; end the frag and set up for relaxation.
8001 Make sure there is enough room in this frag for the largest
8002 instruction we may generate in md_convert_frag. This is 2
8003 bytes for the opcode and room for the prefix and largest
8004 displacement. */
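  /* (Illustrative arithmetic, not in the original source: a conditional
     jump relaxed to its 32-bit form is 0f 8x plus a 4-byte displacement,
     which the 2 opcode bytes and 4 displacement bytes below cover.)  */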
8005 frag_grow (prefix + 2 + 4);
8006 /* Prefix and 1 opcode byte go in fr_fix. */
8007 p = frag_more (prefix + 1);
8008 if (i.prefix[DATA_PREFIX] != 0)
8009 *p++ = DATA_PREFIX_OPCODE;
8010 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8011 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8012 *p++ = i.prefix[SEG_PREFIX];
8013 if (i.prefix[BND_PREFIX] != 0)
8014 *p++ = BND_PREFIX_OPCODE;
8015 if (i.prefix[REX_PREFIX] != 0)
8016 *p++ = i.prefix[REX_PREFIX];
8017 *p = i.tm.base_opcode;
8018
8019 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8020 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8021 else if (cpu_arch_flags.bitfield.cpui386)
8022 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8023 else
8024 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8025 subtype |= code16;
8026
8027 sym = i.op[0].disps->X_add_symbol;
8028 off = i.op[0].disps->X_add_number;
8029
8030 if (i.op[0].disps->X_op != O_constant
8031 && i.op[0].disps->X_op != O_symbol)
8032 {
8033 /* Handle complex expressions. */
8034 sym = make_expr_symbol (i.op[0].disps);
8035 off = 0;
8036 }
8037
8038 /* 1 possible extra opcode + 4 byte displacement go in var part.
8039 Pass reloc in fr_var. */
8040 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8041 }
8042
8043 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8044 /* Return TRUE iff PLT32 relocation should be used for branching to
8045 symbol S. */
8046
8047 static bfd_boolean
8048 need_plt32_p (symbolS *s)
8049 {
8050 /* PLT32 relocation is ELF only. */
8051 if (!IS_ELF)
8052 return FALSE;
8053
8054 #ifdef TE_SOLARIS
8055 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8056 krtld support it. */
8057 return FALSE;
8058 #endif
8059
8060 /* Since there is no need to prepare for a PLT branch on x86-64, we
8061 can generate R_X86_64_PLT32 instead of R_X86_64_PC32, which can
8062 then be used as a marker for 32-bit PC-relative branches. */
8063 if (!object_64bit)
8064 return FALSE;
8065
8066 /* Weak or undefined symbols need a PLT32 relocation. */
8067 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8068 return TRUE;
8069
8070 /* A non-global symbol doesn't need a PLT32 relocation. */
8071 if (! S_IS_EXTERNAL (s))
8072 return FALSE;
8073
8074 /* Other global symbols need a PLT32 relocation. NB: Symbols with
8075 non-default visibility are treated as normal global symbols so
8076 that the PLT32 relocation can be used as a marker for 32-bit
8077 PC-relative branches. This is useful for linker relaxation. */
8078 return TRUE;
8079 }
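
/* Illustrative effect (not from the original source): with 64-bit ELF
   output,

       call foo

   gets its 4-byte displacement field covered by an R_X86_64_PLT32
   relocation against foo when need_plt32_p (foo) returns TRUE, and by
   R_X86_64_PC32 otherwise; the encoded instruction bytes are the same
   either way.  */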
8080 #endif
8081
8082 static void
8083 output_jump (void)
8084 {
8085 char *p;
8086 int size;
8087 fixS *fixP;
8088 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8089
8090 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8091 {
8092 /* This is a loop or jecxz type instruction. */
8093 size = 1;
8094 if (i.prefix[ADDR_PREFIX] != 0)
8095 {
8096 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8097 i.prefixes -= 1;
8098 }
8099 /* Pentium4 branch hints. */
8100 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8101 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8102 {
8103 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8104 i.prefixes--;
8105 }
8106 }
8107 else
8108 {
8109 int code16;
8110
8111 code16 = 0;
8112 if (flag_code == CODE_16BIT)
8113 code16 = CODE16;
8114
8115 if (i.prefix[DATA_PREFIX] != 0)
8116 {
8117 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8118 i.prefixes -= 1;
8119 code16 ^= flip_code16(code16);
8120 }
8121
8122 size = 4;
8123 if (code16)
8124 size = 2;
8125 }
8126
8127 /* BND prefixed jump. */
8128 if (i.prefix[BND_PREFIX] != 0)
8129 {
8130 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8131 i.prefixes -= 1;
8132 }
8133
8134 if (i.prefix[REX_PREFIX] != 0)
8135 {
8136 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8137 i.prefixes -= 1;
8138 }
8139
8140 if (i.prefixes != 0)
8141 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8142
8143 p = frag_more (i.tm.opcode_length + size);
8144 switch (i.tm.opcode_length)
8145 {
8146 case 2:
8147 *p++ = i.tm.base_opcode >> 8;
8148 /* Fall through. */
8149 case 1:
8150 *p++ = i.tm.base_opcode;
8151 break;
8152 default:
8153 abort ();
8154 }
8155
8156 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8157 if (size == 4
8158 && jump_reloc == NO_RELOC
8159 && need_plt32_p (i.op[0].disps->X_add_symbol))
8160 jump_reloc = BFD_RELOC_X86_64_PLT32;
8161 #endif
8162
8163 jump_reloc = reloc (size, 1, 1, jump_reloc);
8164
8165 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8166 i.op[0].disps, 1, jump_reloc);
8167
8168 /* All jumps handled here are signed, but don't use a signed limit
8169 check for 32 and 16 bit jumps as we want to allow wrap around at
8170 4G and 64k respectively. */
8171 if (size == 1)
8172 fixP->fx_signed = 1;
8173 }
8174
8175 static void
8176 output_interseg_jump (void)
8177 {
8178 char *p;
8179 int size;
8180 int prefix;
8181 int code16;
8182
8183 code16 = 0;
8184 if (flag_code == CODE_16BIT)
8185 code16 = CODE16;
8186
8187 prefix = 0;
8188 if (i.prefix[DATA_PREFIX] != 0)
8189 {
8190 prefix = 1;
8191 i.prefixes -= 1;
8192 code16 ^= CODE16;
8193 }
8194
8195 gas_assert (!i.prefix[REX_PREFIX]);
8196
8197 size = 4;
8198 if (code16)
8199 size = 2;
8200
8201 if (i.prefixes != 0)
8202 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8203
8204 /* 1 opcode; 2 segment; offset */
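  /* E.g. (illustrative) ljmp $0x10,$0x12345678 in 32-bit code emits
     ea 78 56 34 12 10 00: the 0xea opcode, the 4-byte offset, then the
     2-byte segment selector.  */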
8205 p = frag_more (prefix + 1 + 2 + size);
8206
8207 if (i.prefix[DATA_PREFIX] != 0)
8208 *p++ = DATA_PREFIX_OPCODE;
8209
8210 if (i.prefix[REX_PREFIX] != 0)
8211 *p++ = i.prefix[REX_PREFIX];
8212
8213 *p++ = i.tm.base_opcode;
8214 if (i.op[1].imms->X_op == O_constant)
8215 {
8216 offsetT n = i.op[1].imms->X_add_number;
8217
8218 if (size == 2
8219 && !fits_in_unsigned_word (n)
8220 && !fits_in_signed_word (n))
8221 {
8222 as_bad (_("16-bit jump out of range"));
8223 return;
8224 }
8225 md_number_to_chars (p, n, size);
8226 }
8227 else
8228 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8229 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8230 if (i.op[0].imms->X_op != O_constant)
8231 as_bad (_("can't handle non absolute segment in `%s'"),
8232 i.tm.name);
8233 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8234 }
8235
8236 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8237 void
8238 x86_cleanup (void)
8239 {
8240 char *p;
8241 asection *seg = now_seg;
8242 subsegT subseg = now_subseg;
8243 asection *sec;
8244 unsigned int alignment, align_size_1;
8245 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8246 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8247 unsigned int padding;
8248
8249 if (!IS_ELF || !x86_used_note)
8250 return;
8251
8252 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8253
8254 /* The .note.gnu.property section layout:
8255
8256 Field Length Contents
8257 ---- ---- ----
8258 n_namsz 4 4
8259 n_descsz 4 The note descriptor size
8260 n_type 4 NT_GNU_PROPERTY_TYPE_0
8261 n_name 4 "GNU"
8262 n_desc n_descsz The program property array
8263 .... .... ....
8264 */
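
  /* Worked size example (illustrative, not in the original source): for
     ELFCLASS64, align_size_1 is 7 below, so each 12-byte (4 + 4 + 4)
     property is padded to 16 bytes; with the two properties emitted here
     descsz = 32 and the whole note is 4 + 4 + 4 + 4 + 32 = 48 bytes.
     For ELFCLASS32 no padding is needed and the note is
     16 + 12 + 12 = 40 bytes.  */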
8265
8266 /* Create the .note.gnu.property section. */
8267 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8268 bfd_set_section_flags (sec,
8269 (SEC_ALLOC
8270 | SEC_LOAD
8271 | SEC_DATA
8272 | SEC_HAS_CONTENTS
8273 | SEC_READONLY));
8274
8275 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8276 {
8277 align_size_1 = 7;
8278 alignment = 3;
8279 }
8280 else
8281 {
8282 align_size_1 = 3;
8283 alignment = 2;
8284 }
8285
8286 bfd_set_section_alignment (sec, alignment);
8287 elf_section_type (sec) = SHT_NOTE;
8288
8289 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8290 + 4-byte data */
8291 isa_1_descsz_raw = 4 + 4 + 4;
8292 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8293 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8294
8295 feature_2_descsz_raw = isa_1_descsz;
8296 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8297 + 4-byte data */
8298 feature_2_descsz_raw += 4 + 4 + 4;
8299 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8300 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8301 & ~align_size_1);
8302
8303 descsz = feature_2_descsz;
8304 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8305 p = frag_more (4 + 4 + 4 + 4 + descsz);
8306
8307 /* Write n_namsz. */
8308 md_number_to_chars (p, (valueT) 4, 4);
8309
8310 /* Write n_descsz. */
8311 md_number_to_chars (p + 4, (valueT) descsz, 4);
8312
8313 /* Write n_type. */
8314 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8315
8316 /* Write n_name. */
8317 memcpy (p + 4 * 3, "GNU", 4);
8318
8319 /* Write 4-byte type. */
8320 md_number_to_chars (p + 4 * 4,
8321 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8322
8323 /* Write 4-byte data size. */
8324 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8325
8326 /* Write 4-byte data. */
8327 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8328
8329 /* Zero out paddings. */
8330 padding = isa_1_descsz - isa_1_descsz_raw;
8331 if (padding)
8332 memset (p + 4 * 7, 0, padding);
8333
8334 /* Write 4-byte type. */
8335 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8336 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8337
8338 /* Write 4-byte data size. */
8339 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8340
8341 /* Write 4-byte data. */
8342 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8343 (valueT) x86_feature_2_used, 4);
8344
8345 /* Zero out paddings. */
8346 padding = feature_2_descsz - feature_2_descsz_raw;
8347 if (padding)
8348 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8349
8350 /* We probably can't restore the current segment, for there likely
8351 isn't one yet... */
8352 if (seg && subseg)
8353 subseg_set (seg, subseg);
8354 }
8355 #endif
8356
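/* Explanatory note (not in the original source): encoding_length sums
   the bytes emitted for the current instruction, i.e. everything from
   START_OFF within START_FRAG up to FRAG_NOW_PTR in the current frag,
   spanning any frags closed off in between.  */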
8357 static unsigned int
8358 encoding_length (const fragS *start_frag, offsetT start_off,
8359 const char *frag_now_ptr)
8360 {
8361 unsigned int len = 0;
8362
8363 if (start_frag != frag_now)
8364 {
8365 const fragS *fr = start_frag;
8366
8367 do {
8368 len += fr->fr_fix;
8369 fr = fr->fr_next;
8370 } while (fr && fr != frag_now);
8371 }
8372
8373 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8374 }
8375
8376 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8377 be macro-fused with conditional jumps. */
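
/* For example (illustrative), on processors that macro-fuse,

     cmpl $0, %eax
     je .L1

   can issue as a single fused compare-and-branch operation, which is why
   the pair should not be split across an alignment boundary.  */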
8378
8379 static int
8380 maybe_fused_with_jcc_p (void)
8381 {
8382 /* No RIP address. */
8383 if (i.base_reg && i.base_reg->reg_num == RegIP)
8384 return 0;
8385
8386 /* No VEX/EVEX encoding. */
8387 if (is_any_vex_encoding (&i.tm))
8388 return 0;
8389
8390 /* and, add, sub with destination register. */
8391 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8392 || i.tm.base_opcode <= 5
8393 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8394 || ((i.tm.base_opcode | 3) == 0x83
8395 && ((i.tm.extension_opcode | 1) == 0x5
8396 || i.tm.extension_opcode == 0x0)))
8397 return (i.types[1].bitfield.class == Reg
8398 || i.types[1].bitfield.instance == Accum);
8399
8400 /* test, cmp with any register. */
8401 if ((i.tm.base_opcode | 1) == 0x85
8402 || (i.tm.base_opcode | 1) == 0xa9
8403 || ((i.tm.base_opcode | 1) == 0xf7
8404 && i.tm.extension_opcode == 0)
8405 || (i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8406 || ((i.tm.base_opcode | 3) == 0x83
8407 && (i.tm.extension_opcode == 0x7)))
8408 return (i.types[0].bitfield.class == Reg
8409 || i.types[0].bitfield.instance == Accum
8410 || i.types[1].bitfield.class == Reg
8411 || i.types[1].bitfield.instance == Accum);
8412
8413 /* inc, dec with any register. */
8414 if ((i.tm.cpu_flags.bitfield.cpuno64
8415 && (i.tm.base_opcode | 0xf) == 0x4f)
8416 || ((i.tm.base_opcode | 1) == 0xff
8417 && i.tm.extension_opcode <= 0x1))
8418 return (i.types[0].bitfield.class == Reg
8419 || i.types[0].bitfield.instance == Accum);
8420
8421 return 0;
8422 }
8423
8424 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8425
8426 static int
8427 add_fused_jcc_padding_frag_p (void)
8428 {
8429 /* NB: This doesn't work with COND_JUMP86 without i386. */
8430 if (!align_branch_power
8431 || now_seg == absolute_section
8432 || !cpu_arch_flags.bitfield.cpui386
8433 || !(align_branch & align_branch_fused_bit))
8434 return 0;
8435
8436 if (maybe_fused_with_jcc_p ())
8437 {
8438 if (last_insn.kind == last_insn_other
8439 || last_insn.seg != now_seg)
8440 return 1;
8441 if (flag_debug)
8442 as_warn_where (last_insn.file, last_insn.line,
8443 _("`%s` skips -malign-branch-boundary on `%s`"),
8444 last_insn.name, i.tm.name);
8445 }
8446
8447 return 0;
8448 }
8449
8450 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8451
8452 static int
8453 add_branch_prefix_frag_p (void)
8454 {
8455 /* NB: This doesn't work with COND_JUMP86 without i386. Don't add a
8456 prefix to PadLock instructions since they include prefixes in their opcode. */
8457 if (!align_branch_power
8458 || !align_branch_prefix_size
8459 || now_seg == absolute_section
8460 || i.tm.cpu_flags.bitfield.cpupadlock
8461 || !cpu_arch_flags.bitfield.cpui386)
8462 return 0;
8463
8464 /* Don't add a prefix if the insn is itself a prefix, or if it has no
8465 operands, in which case a segment prefix may carry special meaning. */
8466 if (!i.operands || i.tm.opcode_modifier.isprefix)
8467 return 0;
8468
8469 if (last_insn.kind == last_insn_other
8470 || last_insn.seg != now_seg)
8471 return 1;
8472
8473 if (flag_debug)
8474 as_warn_where (last_insn.file, last_insn.line,
8475 _("`%s` skips -malign-branch-boundary on `%s`"),
8476 last_insn.name, i.tm.name);
8477
8478 return 0;
8479 }
8480
8481 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8482
8483 static int
8484 add_branch_padding_frag_p (enum align_branch_kind *branch_p)
8485 {
8486 int add_padding;
8487
8488 /* NB: This doesn't work with COND_JUMP86 without i386. */
8489 if (!align_branch_power
8490 || now_seg == absolute_section
8491 || !cpu_arch_flags.bitfield.cpui386)
8492 return 0;
8493
8494 add_padding = 0;
8495
8496 /* Check for jcc and direct jmp. */
8497 if (i.tm.opcode_modifier.jump == JUMP)
8498 {
8499 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8500 {
8501 *branch_p = align_branch_jmp;
8502 add_padding = align_branch & align_branch_jmp_bit;
8503 }
8504 else
8505 {
8506 *branch_p = align_branch_jcc;
8507 if ((align_branch & align_branch_jcc_bit))
8508 add_padding = 1;
8509 }
8510 }
8511 else if (is_any_vex_encoding (&i.tm))
8512 return 0;
8513 else if ((i.tm.base_opcode | 1) == 0xc3)
8514 {
8515 /* Near ret. */
8516 *branch_p = align_branch_ret;
8517 if ((align_branch & align_branch_ret_bit))
8518 add_padding = 1;
8519 }
8520 else
8521 {
8522 /* Check for indirect jmp, direct and indirect calls. */
8523 if (i.tm.base_opcode == 0xe8)
8524 {
8525 /* Direct call. */
8526 *branch_p = align_branch_call;
8527 if ((align_branch & align_branch_call_bit))
8528 add_padding = 1;
8529 }
8530 else if (i.tm.base_opcode == 0xff
8531 && (i.tm.extension_opcode == 2
8532 || i.tm.extension_opcode == 4))
8533 {
8534 /* Indirect call and jmp. */
8535 *branch_p = align_branch_indirect;
8536 if ((align_branch & align_branch_indirect_bit))
8537 add_padding = 1;
8538 }
8539
8540 if (add_padding
8541 && i.disp_operands
8542 && tls_get_addr
8543 && (i.op[0].disps->X_op == O_symbol
8544 || (i.op[0].disps->X_op == O_subtract
8545 && i.op[0].disps->X_op_symbol == GOT_symbol)))
8546 {
8547 symbolS *s = i.op[0].disps->X_add_symbol;
8548 /* No padding for a call to a global or undefined tls_get_addr. */
8549 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8550 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8551 return 0;
8552 }
8553 }
8554
8555 if (add_padding
8556 && last_insn.kind != last_insn_other
8557 && last_insn.seg == now_seg)
8558 {
8559 if (flag_debug)
8560 as_warn_where (last_insn.file, last_insn.line,
8561 _("`%s` skips -malign-branch-boundary on `%s`"),
8562 last_insn.name, i.tm.name);
8563 return 0;
8564 }
8565
8566 return add_padding;
8567 }
8568
8569 static void
8570 output_insn (void)
8571 {
8572 fragS *insn_start_frag;
8573 offsetT insn_start_off;
8574 fragS *fragP = NULL;
8575 enum align_branch_kind branch = align_branch_none;
8576
8577 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8578 if (IS_ELF && x86_used_note)
8579 {
8580 if (i.tm.cpu_flags.bitfield.cpucmov)
8581 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8582 if (i.tm.cpu_flags.bitfield.cpusse)
8583 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8584 if (i.tm.cpu_flags.bitfield.cpusse2)
8585 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8586 if (i.tm.cpu_flags.bitfield.cpusse3)
8587 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8588 if (i.tm.cpu_flags.bitfield.cpussse3)
8589 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8590 if (i.tm.cpu_flags.bitfield.cpusse4_1)
8591 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8592 if (i.tm.cpu_flags.bitfield.cpusse4_2)
8593 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8594 if (i.tm.cpu_flags.bitfield.cpuavx)
8595 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8596 if (i.tm.cpu_flags.bitfield.cpuavx2)
8597 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8598 if (i.tm.cpu_flags.bitfield.cpufma)
8599 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8600 if (i.tm.cpu_flags.bitfield.cpuavx512f)
8601 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8602 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8603 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8604 if (i.tm.cpu_flags.bitfield.cpuavx512er)
8605 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8606 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8607 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8608 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8609 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8610 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8611 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8612 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8613 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8614 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8615 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8616 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8617 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8618 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8619 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8620 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8621 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8622 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8623 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8624 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8625 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8626 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8627 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8628 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8629 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8630
8631 if (i.tm.cpu_flags.bitfield.cpu8087
8632 || i.tm.cpu_flags.bitfield.cpu287
8633 || i.tm.cpu_flags.bitfield.cpu387
8634 || i.tm.cpu_flags.bitfield.cpu687
8635 || i.tm.cpu_flags.bitfield.cpufisttp)
8636 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8637 if (i.has_regmmx
8638 || i.tm.base_opcode == 0xf77 /* emms */
8639 || i.tm.base_opcode == 0xf0e /* femms */)
8640 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8641 if (i.has_regxmm)
8642 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8643 if (i.has_regymm)
8644 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8645 if (i.has_regzmm)
8646 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8647 if (i.tm.cpu_flags.bitfield.cpufxsr)
8648 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8649 if (i.tm.cpu_flags.bitfield.cpuxsave)
8650 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8651 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8652 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8653 if (i.tm.cpu_flags.bitfield.cpuxsavec)
8654 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8655 }
8656 #endif
8657
8658 /* Tie dwarf2 debug info to the address at the start of the insn.
8659 We can't do this after the insn has been output as the current
8660 frag may have been closed off. eg. by frag_var. */
8661 dwarf2_emit_insn (0);
8662
8663 insn_start_frag = frag_now;
8664 insn_start_off = frag_now_fix ();
8665
8666 if (add_branch_padding_frag_p (&branch))
8667 {
8668 char *p;
8669 /* Branch can be 8 bytes. Leave some room for prefixes. */
8670 unsigned int max_branch_padding_size = 14;
8671
8672 /* Align section to boundary. */
8673 record_alignment (now_seg, align_branch_power);
8674
8675 /* Make room for padding. */
8676 frag_grow (max_branch_padding_size);
8677
8678 /* Start of the padding. */
8679 p = frag_more (0);
8680
8681 fragP = frag_now;
8682
8683 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
8684 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
8685 NULL, 0, p);
8686
8687 fragP->tc_frag_data.branch_type = branch;
8688 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
8689 }
8690
8691 /* Output jumps. */
8692 if (i.tm.opcode_modifier.jump == JUMP)
8693 output_branch ();
8694 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
8695 || i.tm.opcode_modifier.jump == JUMP_DWORD)
8696 output_jump ();
8697 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
8698 output_interseg_jump ();
8699 else
8700 {
8701 /* Output normal instructions here. */
8702 char *p;
8703 unsigned char *q;
8704 unsigned int j;
8705 unsigned int prefix;
8706
8707 if (avoid_fence
8708 && (i.tm.base_opcode == 0xfaee8
8709 || i.tm.base_opcode == 0xfaef0
8710 || i.tm.base_opcode == 0xfaef8))
8711 {
8712 /* Encode lfence, mfence, and sfence as
8713 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
8714 offsetT val = 0x240483f0ULL;
8715 p = frag_more (5);
8716 md_number_to_chars (p, val, 5);
8717 return;
8718 }
8719
8720 /* Some processors fail on the LOCK prefix. This option makes the
8721 assembler ignore the LOCK prefix and serves as a workaround. */
8722 if (omit_lock_prefix)
8723 {
8724 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8725 return;
8726 i.prefix[LOCK_PREFIX] = 0;
8727 }
8728
8729 if (branch)
8730 /* Skip if this is a branch. */
8731 ;
8732 else if (add_fused_jcc_padding_frag_p ())
8733 {
8734 /* Make room for padding. */
8735 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
8736 p = frag_more (0);
8737
8738 fragP = frag_now;
8739
8740 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
8741 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
8742 NULL, 0, p);
8743
8744 fragP->tc_frag_data.branch_type = align_branch_fused;
8745 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
8746 }
8747 else if (add_branch_prefix_frag_p ())
8748 {
8749 unsigned int max_prefix_size = align_branch_prefix_size;
8750
8751 /* Make room for padding. */
8752 frag_grow (max_prefix_size);
8753 p = frag_more (0);
8754
8755 fragP = frag_now;
8756
8757 frag_var (rs_machine_dependent, max_prefix_size, 0,
8758 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
8759 NULL, 0, p);
8760
8761 fragP->tc_frag_data.max_bytes = max_prefix_size;
8762 }
8763
8764 /* Since the VEX/EVEX prefix contains the implicit prefix, we
8765 don't need the explicit prefix. */
8766 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8767 {
8768 switch (i.tm.opcode_length)
8769 {
8770 case 3:
8771 if (i.tm.base_opcode & 0xff000000)
8772 {
8773 prefix = (i.tm.base_opcode >> 24) & 0xff;
8774 if (!i.tm.cpu_flags.bitfield.cpupadlock
8775 || prefix != REPE_PREFIX_OPCODE
8776 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8777 add_prefix (prefix);
8778 }
8779 break;
8780 case 2:
8781 if ((i.tm.base_opcode & 0xff0000) != 0)
8782 {
8783 prefix = (i.tm.base_opcode >> 16) & 0xff;
8784 add_prefix (prefix);
8785 }
8786 break;
8787 case 1:
8788 break;
8789 case 0:
8790 /* Check for pseudo prefixes. */
8791 as_bad_where (insn_start_frag->fr_file,
8792 insn_start_frag->fr_line,
8793 _("pseudo prefix without instruction"));
8794 return;
8795 default:
8796 abort ();
8797 }
8798
8799 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8800 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8801 R_X86_64_GOTTPOFF relocation so that linker can safely
8802 perform IE->LE optimization. A dummy REX_OPCODE prefix
8803 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
8804 relocation for GDesc -> IE/LE optimization. */
8805 if (x86_elf_abi == X86_64_X32_ABI
8806 && i.operands == 2
8807 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8808 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
8809 && i.prefix[REX_PREFIX] == 0)
8810 add_prefix (REX_OPCODE);
8811 #endif
8812
8813 /* The prefix bytes. */
8814 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8815 if (*q)
8816 FRAG_APPEND_1_CHAR (*q);
8817 }
8818 else
8819 {
8820 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8821 if (*q)
8822 switch (j)
8823 {
8824 case REX_PREFIX:
8825 /* REX byte is encoded in VEX prefix. */
8826 break;
8827 case SEG_PREFIX:
8828 case ADDR_PREFIX:
8829 FRAG_APPEND_1_CHAR (*q);
8830 break;
8831 default:
8832 /* There should be no other prefixes for instructions
8833 with VEX prefix. */
8834 abort ();
8835 }
8836
8837 /* For EVEX instructions i.vrex should become 0 after
8838 build_evex_prefix. For VEX instructions upper 16 registers
8839 aren't available, so VREX should be 0. */
8840 if (i.vrex)
8841 abort ();
8842 /* Now the VEX prefix. */
8843 p = frag_more (i.vex.length);
8844 for (j = 0; j < i.vex.length; j++)
8845 p[j] = i.vex.bytes[j];
8846 }
8847
8848 /* Now the opcode; be careful about word order here! */
8849 if (i.tm.opcode_length == 1)
8850 {
8851 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8852 }
8853 else
8854 {
8855 switch (i.tm.opcode_length)
8856 {
8857 case 4:
8858 p = frag_more (4);
8859 *p++ = (i.tm.base_opcode >> 24) & 0xff;
8860 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8861 break;
8862 case 3:
8863 p = frag_more (3);
8864 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8865 break;
8866 case 2:
8867 p = frag_more (2);
8868 break;
8869 default:
8870 abort ();
8871 break;
8872 }
8873
8874 /* Put out the high byte first: md_number_to_chars can't be used, as it would emit the bytes in little-endian order. */
8875 *p++ = (i.tm.base_opcode >> 8) & 0xff;
8876 *p = i.tm.base_opcode & 0xff;
8877 }
8878
8879 /* Now the modrm byte and sib byte (if present). */
8880 if (i.tm.opcode_modifier.modrm)
8881 {
8882 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8883 | i.rm.reg << 3
8884 | i.rm.mode << 6));
8885 /* If i.rm.regmem == ESP (4)
8886 && i.rm.mode != (Register mode)
8887 && not 16 bit
8888 ==> need second modrm byte. */
8889 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8890 && i.rm.mode != 3
8891 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8892 FRAG_APPEND_1_CHAR ((i.sib.base << 0
8893 | i.sib.index << 3
8894 | i.sib.scale << 6));
8895 }
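	  /* Worked example (illustrative, not from the original source):
	     4(%eax,%ebx,2) in 32-bit mode yields
	       ModRM: mode 01, r/m 100b (the SIB escape), so 0x44 | reg << 3
	       SIB:   scale 01, index 011b (%ebx), base 000b (%eax) = 0x58
	     followed by the disp8 byte 0x04.  */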
8896
8897 if (i.disp_operands)
8898 output_disp (insn_start_frag, insn_start_off);
8899
8900 if (i.imm_operands)
8901 output_imm (insn_start_frag, insn_start_off);
8902
8903 /*
8904 * frag_now_fix () returns plain abs_section_offset when we're in the
8905 * absolute section, and abs_section_offset is not updated as data is
8906 * added to the frag; that would break the logic below.
8907 */
8908 if (now_seg != absolute_section)
8909 {
8910 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8911 if (j > 15)
8912 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8913 j);
8914 else if (fragP)
8915 {
8916 /* NB: Don't add a prefix with a GOTPC relocation, since
8917 output_disp () above depends on a fixed encoding
8918 length. We can't add a prefix with a TLS relocation
8919 either, since that breaks TLS linker optimization. */
8920 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
8921 /* Prefix count on the current instruction. */
8922 unsigned int count = i.vex.length;
8923 unsigned int k;
8924 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
8925 /* REX byte is encoded in VEX/EVEX prefix. */
8926 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
8927 count++;
8928
8929 /* Count prefixes for extended opcode maps. */
8930 if (!i.vex.length)
8931 switch (i.tm.opcode_length)
8932 {
8933 case 3:
8934 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
8935 {
8936 count++;
8937 switch ((i.tm.base_opcode >> 8) & 0xff)
8938 {
8939 case 0x38:
8940 case 0x3a:
8941 count++;
8942 break;
8943 default:
8944 break;
8945 }
8946 }
8947 break;
8948 case 2:
8949 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
8950 count++;
8951 break;
8952 case 1:
8953 break;
8954 default:
8955 abort ();
8956 }
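	      /* E.g. (illustrative) pcmpeqq, opcode 66 0f 38 29, adds the
		 0f and 38 escape bytes here on top of the 66h prefix
		 counted above, so COUNT rises by 3 in total.  */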
8957
8958 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
8959 == BRANCH_PREFIX)
8960 {
8961 /* Set the maximum prefix size in BRANCH_PREFIX
8962 frag. */
8963 if (fragP->tc_frag_data.max_bytes > max)
8964 fragP->tc_frag_data.max_bytes = max;
8965 if (fragP->tc_frag_data.max_bytes > count)
8966 fragP->tc_frag_data.max_bytes -= count;
8967 else
8968 fragP->tc_frag_data.max_bytes = 0;
8969 }
8970 else
8971 {
8972 /* Remember the maximum prefix size in FUSED_JCC_PADDING
8973 frag. */
8974 unsigned int max_prefix_size;
8975 if (align_branch_prefix_size > max)
8976 max_prefix_size = max;
8977 else
8978 max_prefix_size = align_branch_prefix_size;
8979 if (max_prefix_size > count)
8980 fragP->tc_frag_data.max_prefix_length
8981 = max_prefix_size - count;
8982 }
8983
8984 /* Use existing segment prefix if possible. Use CS
8985 segment prefix in 64-bit mode. In 32-bit mode, use SS
8986 segment prefix with ESP/EBP base register and use DS
8987 segment prefix without ESP/EBP base register. */
8988 if (i.prefix[SEG_PREFIX])
8989 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
8990 else if (flag_code == CODE_64BIT)
8991 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
8992 else if (i.base_reg
8993 && (i.base_reg->reg_num == 4
8994 || i.base_reg->reg_num == 5))
8995 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
8996 else
8997 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
8998 }
8999 }
9000 }
9001
9002 /* NB: This doesn't work with COND_JUMP86 without i386. */
9003 if (align_branch_power
9004 && now_seg != absolute_section
9005 && cpu_arch_flags.bitfield.cpui386)
9006 {
9007 /* Terminate each frag so that we can add prefix and check for
9008 fused jcc. */
9009 frag_wane (frag_now);
9010 frag_new (0);
9011 }
9012
9013 #ifdef DEBUG386
9014 if (flag_debug)
9015 {
9016 pi ("" /*line*/, &i);
9017 }
9018 #endif /* DEBUG386 */
9019 }
9020
9021 /* Return the size of the displacement operand N. */
9022
9023 static int
9024 disp_size (unsigned int n)
9025 {
9026 int size = 4;
9027
9028 if (i.types[n].bitfield.disp64)
9029 size = 8;
9030 else if (i.types[n].bitfield.disp8)
9031 size = 1;
9032 else if (i.types[n].bitfield.disp16)
9033 size = 2;
9034 return size;
9035 }
9036
9037 /* Return the size of the immediate operand N. */
9038
9039 static int
9040 imm_size (unsigned int n)
9041 {
9042 int size = 4;
9043 if (i.types[n].bitfield.imm64)
9044 size = 8;
9045 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9046 size = 1;
9047 else if (i.types[n].bitfield.imm16)
9048 size = 2;
9049 return size;
9050 }
9051
9052 static void
9053 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9054 {
9055 char *p;
9056 unsigned int n;
9057
9058 for (n = 0; n < i.operands; n++)
9059 {
9060 if (operand_type_check (i.types[n], disp))
9061 {
9062 if (i.op[n].disps->X_op == O_constant)
9063 {
9064 int size = disp_size (n);
9065 offsetT val = i.op[n].disps->X_add_number;
9066
9067 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9068 size);
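		  /* (Illustrative note, not in the original source: for
		     EVEX insns using compressed disp8*N addressing,
		     i.memshift holds log2 (N), so the stored byte is the
		     displacement divided by N.)  */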
9069 p = frag_more (size);
9070 md_number_to_chars (p, val, size);
9071 }
9072 else
9073 {
9074 enum bfd_reloc_code_real reloc_type;
9075 int size = disp_size (n);
9076 int sign = i.types[n].bitfield.disp32s;
9077 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9078 fixS *fixP;
9079
9080 /* We can't have 8 bit displacement here. */
9081 gas_assert (!i.types[n].bitfield.disp8);
9082
9083 /* The PC-relative address is computed relative
9084 to the instruction boundary, so if immediate
9085 fields follow, we need to adjust the value. */
9086 if (pcrel && i.imm_operands)
9087 {
9088 unsigned int n1;
9089 int sz = 0;
9090
9091 for (n1 = 0; n1 < i.operands; n1++)
9092 if (operand_type_check (i.types[n1], imm))
9093 {
9094 /* Only one immediate is allowed for PC
9095 relative address. */
9096 gas_assert (sz == 0);
9097 sz = imm_size (n1);
9098 i.op[n].disps->X_add_number -= sz;
9099 }
9100 /* We should find the immediate. */
9101 gas_assert (sz != 0);
9102 }
9103
9104 p = frag_more (size);
9105 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9106 if (GOT_symbol
9107 && GOT_symbol == i.op[n].disps->X_add_symbol
9108 && (((reloc_type == BFD_RELOC_32
9109 || reloc_type == BFD_RELOC_X86_64_32S
9110 || (reloc_type == BFD_RELOC_64
9111 && object_64bit))
9112 && (i.op[n].disps->X_op == O_symbol
9113 || (i.op[n].disps->X_op == O_add
9114 && ((symbol_get_value_expression
9115 (i.op[n].disps->X_op_symbol)->X_op)
9116 == O_subtract))))
9117 || reloc_type == BFD_RELOC_32_PCREL))
9118 {
9119 if (!object_64bit)
9120 {
9121 reloc_type = BFD_RELOC_386_GOTPC;
9122 i.has_gotpc_tls_reloc = TRUE;
9123 i.op[n].imms->X_add_number +=
9124 encoding_length (insn_start_frag, insn_start_off, p);
9125 }
9126 else if (reloc_type == BFD_RELOC_64)
9127 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9128 else
9129 /* Don't do the adjustment for x86-64, as there
9130 the pcrel addressing is relative to the _next_
9131 insn, and that is taken care of in other code. */
9132 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9133 }
9134 else if (align_branch_power)
9135 {
9136 switch (reloc_type)
9137 {
9138 case BFD_RELOC_386_TLS_GD:
9139 case BFD_RELOC_386_TLS_LDM:
9140 case BFD_RELOC_386_TLS_IE:
9141 case BFD_RELOC_386_TLS_IE_32:
9142 case BFD_RELOC_386_TLS_GOTIE:
9143 case BFD_RELOC_386_TLS_GOTDESC:
9144 case BFD_RELOC_386_TLS_DESC_CALL:
9145 case BFD_RELOC_X86_64_TLSGD:
9146 case BFD_RELOC_X86_64_TLSLD:
9147 case BFD_RELOC_X86_64_GOTTPOFF:
9148 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9149 case BFD_RELOC_X86_64_TLSDESC_CALL:
9150 i.has_gotpc_tls_reloc = TRUE;
9151 default:
9152 break;
9153 }
9154 }
9155 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9156 size, i.op[n].disps, pcrel,
9157 reloc_type);
9158 /* Check for "call/jmp *mem", "mov mem, %reg",
9159 "test %reg, mem" and "binop mem, %reg" where binop
9160 is one of adc, add, and, cmp, or, sbb, sub, xor
9161 instructions without data prefix. Always generate
9162 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9163 if (i.prefix[DATA_PREFIX] == 0
9164 && (generate_relax_relocations
9165 || (!object_64bit
9166 && i.rm.mode == 0
9167 && i.rm.regmem == 5))
9168 && (i.rm.mode == 2
9169 || (i.rm.mode == 0 && i.rm.regmem == 5))
9170 && !is_any_vex_encoding(&i.tm)
9171 && ((i.operands == 1
9172 && i.tm.base_opcode == 0xff
9173 && (i.rm.reg == 2 || i.rm.reg == 4))
9174 || (i.operands == 2
9175 && (i.tm.base_opcode == 0x8b
9176 || i.tm.base_opcode == 0x85
9177 || (i.tm.base_opcode & ~0x38) == 0x03))))
9178 {
9179 if (object_64bit)
9180 {
9181 fixP->fx_tcbit = i.rex != 0;
9182 if (i.base_reg
9183 && (i.base_reg->reg_num == RegIP))
9184 fixP->fx_tcbit2 = 1;
9185 }
9186 else
9187 fixP->fx_tcbit2 = 1;
9188 }
9189 }
9190 }
9191 }
9192 }
9193
9194 static void
9195 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9196 {
9197 char *p;
9198 unsigned int n;
9199
9200 for (n = 0; n < i.operands; n++)
9201 {
9202 /* Skip the SAE/RC immediate operand in EVEX; it is already handled. */
9203 if (i.rounding && (int) n == i.rounding->operand)
9204 continue;
9205
9206 if (operand_type_check (i.types[n], imm))
9207 {
9208 if (i.op[n].imms->X_op == O_constant)
9209 {
9210 int size = imm_size (n);
9211 offsetT val;
9212
9213 val = offset_in_range (i.op[n].imms->X_add_number,
9214 size);
9215 p = frag_more (size);
9216 md_number_to_chars (p, val, size);
9217 }
9218 else
9219 {
9220 /* Not absolute_section.
9221 We need a 32-bit fixup (8-bit non-absolute
9222 immediates are not supported). Try to support
9223 other sizes ... */
9224 enum bfd_reloc_code_real reloc_type;
9225 int size = imm_size (n);
9226 int sign;
9227
9228 if (i.types[n].bitfield.imm32s
9229 && (i.suffix == QWORD_MNEM_SUFFIX
9230 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9231 sign = 1;
9232 else
9233 sign = 0;
9234
9235 p = frag_more (size);
9236 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9237
9238 /* This is tough to explain. We end up with this one if we
9239 * have operands that look like
9240 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9241 * obtain the absolute address of the GOT, and it is strongly
9242 * preferable from a performance point of view to avoid using
9243 * a runtime relocation for this. The actual sequence of
9244 * instructions often look something like:
9245 *
9246 * call .L66
9247 * .L66:
9248 * popl %ebx
9249 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9250 *
9251 * The call and pop essentially return the absolute address
9252 * of the label .L66 and store it in %ebx. The linker itself
9253 * will ultimately change the first operand of the addl so
9254 * that %ebx points to the GOT, but to keep things simple, the
9255 * .o file must have this operand set so that it generates not
9256 * the absolute address of .L66, but the absolute address of
9257 * itself. This allows the linker to simply treat a GOTPC
9258 * relocation as asking for a pcrel offset to the GOT to be
9259 * added in, and the addend of the relocation is stored in the
9260 * operand field for the instruction itself.
9261 *
9262 * Our job here is to fix the operand so that it would add
9263 * the correct offset so that %ebx would point to itself. The
9264 * thing that is tricky is that .-.L66 will point to the
9265 * beginning of the instruction, so we need to further modify
9266 * the operand so that it will point to itself. There are
9267 * other cases where you have something like:
9268 *
9269 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9270 *
9271 * and here no correction would be required. Internally in
9272 * the assembler we treat operands of this form as not being
9273 * pcrel since the '.' is explicitly mentioned, and I wonder
9274 * whether it would simplify matters to do it this way. Who
9275 * knows. In earlier versions of the PIC patches, the
9276 * pcrel_adjust field was used to store the correction, but
9277 * since the expression is not pcrel, I felt it would be
9278 * confusing to do it this way. */
9279
9280 if ((reloc_type == BFD_RELOC_32
9281 || reloc_type == BFD_RELOC_X86_64_32S
9282 || reloc_type == BFD_RELOC_64)
9283 && GOT_symbol
9284 && GOT_symbol == i.op[n].imms->X_add_symbol
9285 && (i.op[n].imms->X_op == O_symbol
9286 || (i.op[n].imms->X_op == O_add
9287 && ((symbol_get_value_expression
9288 (i.op[n].imms->X_op_symbol)->X_op)
9289 == O_subtract))))
9290 {
9291 if (!object_64bit)
9292 reloc_type = BFD_RELOC_386_GOTPC;
9293 else if (size == 4)
9294 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9295 else if (size == 8)
9296 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9297 i.has_gotpc_tls_reloc = TRUE;
9298 i.op[n].imms->X_add_number +=
9299 encoding_length (insn_start_frag, insn_start_off, p);
9300 }
9301 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9302 i.op[n].imms, 0, reloc_type);
9303 }
9304 }
9305 }
9306 }
9307 \f
9308 /* x86_cons_fix_new is called via the expression parsing code when a
9309 reloc is needed. We use this hook to get the correct .got reloc. */
9310 static int cons_sign = -1;
9311
9312 void
9313 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9314 expressionS *exp, bfd_reloc_code_real_type r)
9315 {
9316 r = reloc (len, 0, cons_sign, r);
9317
9318 #ifdef TE_PE
9319 if (exp->X_op == O_secrel)
9320 {
9321 exp->X_op = O_symbol;
9322 r = BFD_RELOC_32_SECREL;
9323 }
9324 #endif
9325
9326 fix_new_exp (frag, off, len, exp, 0, r);
9327 }
9328
9329 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9330 purpose of the `.dc.a' internal pseudo-op. */
9331
9332 int
9333 x86_address_bytes (void)
9334 {
9335 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9336 return 4;
9337 return stdoutput->arch_info->bits_per_address / 8;
9338 }
9339
9340 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9341 || defined (LEX_AT)
9342 # define lex_got(reloc, adjust, types) NULL
9343 #else
9344 /* Parse operands of the form
9345 <symbol>@GOTOFF+<nnn>
9346 and similar .plt or .got references.
9347
9348 If we find one, set up the correct relocation in RELOC and copy the
9349 input string, minus the `@GOTOFF' into a malloc'd buffer for
9350 parsing by the calling routine. Return this buffer, and if ADJUST
9351 is non-null set it to the length of the string we removed from the
9352 input line. Otherwise return NULL. */
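
/* For example (illustrative): for an operand of the form foo@GOTOFF+4
   this routine matches "GOTOFF", sets *REL to BFD_RELOC_386_GOTOFF (or
   BFD_RELOC_X86_64_GOTOFF64 for 64-bit output) and returns the buffer
   "foo +4", the reloc token replaced by a blank so that stray trailing
   characters, as in foo@GOTOFF1, are still diagnosed.  */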
9353 static char *
9354 lex_got (enum bfd_reloc_code_real *rel,
9355 int *adjust,
9356 i386_operand_type *types)
9357 {
9358 /* Some of the relocations depend on the size of the field to be
9359 relocated. But in our callers i386_immediate and i386_displacement
9360 we don't yet know the operand size (this will be set by insn
9361 matching). Hence we record the word32 relocation here,
9362 and adjust the reloc according to the real size in reloc(). */
9363 static const struct {
9364 const char *str;
9365 int len;
9366 const enum bfd_reloc_code_real rel[2];
9367 const i386_operand_type types64;
9368 } gotrel[] = {
9369 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9370 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9371 BFD_RELOC_SIZE32 },
9372 OPERAND_TYPE_IMM32_64 },
9373 #endif
9374 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9375 BFD_RELOC_X86_64_PLTOFF64 },
9376 OPERAND_TYPE_IMM64 },
9377 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9378 BFD_RELOC_X86_64_PLT32 },
9379 OPERAND_TYPE_IMM32_32S_DISP32 },
9380 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9381 BFD_RELOC_X86_64_GOTPLT64 },
9382 OPERAND_TYPE_IMM64_DISP64 },
9383 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9384 BFD_RELOC_X86_64_GOTOFF64 },
9385 OPERAND_TYPE_IMM64_DISP64 },
9386 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9387 BFD_RELOC_X86_64_GOTPCREL },
9388 OPERAND_TYPE_IMM32_32S_DISP32 },
9389 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9390 BFD_RELOC_X86_64_TLSGD },
9391 OPERAND_TYPE_IMM32_32S_DISP32 },
9392 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9393 _dummy_first_bfd_reloc_code_real },
9394 OPERAND_TYPE_NONE },
9395 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9396 BFD_RELOC_X86_64_TLSLD },
9397 OPERAND_TYPE_IMM32_32S_DISP32 },
9398 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9399 BFD_RELOC_X86_64_GOTTPOFF },
9400 OPERAND_TYPE_IMM32_32S_DISP32 },
9401 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9402 BFD_RELOC_X86_64_TPOFF32 },
9403 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9404 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9405 _dummy_first_bfd_reloc_code_real },
9406 OPERAND_TYPE_NONE },
9407 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9408 BFD_RELOC_X86_64_DTPOFF32 },
9409 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9410 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9411 _dummy_first_bfd_reloc_code_real },
9412 OPERAND_TYPE_NONE },
9413 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9414 _dummy_first_bfd_reloc_code_real },
9415 OPERAND_TYPE_NONE },
9416 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9417 BFD_RELOC_X86_64_GOT32 },
9418 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9419 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9420 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9421 OPERAND_TYPE_IMM32_32S_DISP32 },
9422 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9423 BFD_RELOC_X86_64_TLSDESC_CALL },
9424 OPERAND_TYPE_IMM32_32S_DISP32 },
9425 };
9426 char *cp;
9427 unsigned int j;
9428
9429 #if defined (OBJ_MAYBE_ELF)
9430 if (!IS_ELF)
9431 return NULL;
9432 #endif
9433
9434 for (cp = input_line_pointer; *cp != '@'; cp++)
9435 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9436 return NULL;
9437
9438 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9439 {
9440 int len = gotrel[j].len;
9441 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9442 {
9443 if (gotrel[j].rel[object_64bit] != 0)
9444 {
9445 int first, second;
9446 char *tmpbuf, *past_reloc;
9447
9448 *rel = gotrel[j].rel[object_64bit];
9449
9450 if (types)
9451 {
9452 if (flag_code != CODE_64BIT)
9453 {
9454 types->bitfield.imm32 = 1;
9455 types->bitfield.disp32 = 1;
9456 }
9457 else
9458 *types = gotrel[j].types64;
9459 }
9460
9461 if (j != 0 && GOT_symbol == NULL)
9462 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9463
9464 /* The length of the first part of our input line. */
9465 first = cp - input_line_pointer;
9466
9467 /* The second part goes from after the reloc token until
9468 (and including) an end_of_line char or comma. */
9469 past_reloc = cp + 1 + len;
9470 cp = past_reloc;
9471 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9472 ++cp;
9473 second = cp + 1 - past_reloc;
9474
9475 /* Allocate and copy string. The trailing NUL shouldn't
9476 be necessary, but be safe. */
9477 tmpbuf = XNEWVEC (char, first + second + 2);
9478 memcpy (tmpbuf, input_line_pointer, first);
9479 if (second != 0 && *past_reloc != ' ')
9480 /* Replace the relocation token with ' ', so that
9481 errors like foo@GOTOFF1 will be detected. */
9482 tmpbuf[first++] = ' ';
9483 else
9484 /* Increment length by 1 if the relocation token is
9485 removed. */
9486 len++;
9487 if (adjust)
9488 *adjust = len;
9489 memcpy (tmpbuf + first, past_reloc, second);
9490 tmpbuf[first + second] = '\0';
9491 return tmpbuf;
9492 }
9493
9494 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9495 gotrel[j].str, 1 << (5 + object_64bit));
9496 return NULL;
9497 }
9498 }
9499
9500 /* Might be a symbol version string. Don't as_bad here. */
9501 return NULL;
9502 }
9503 #endif
9504
9505 #ifdef TE_PE
9506 #ifdef lex_got
9507 #undef lex_got
9508 #endif
9509 /* Parse operands of the form
9510 <symbol>@SECREL32+<nnn>
9511
9512 If we find one, set up the correct relocation in RELOC and copy the
9513 input string, minus the `@SECREL32' into a malloc'd buffer for
9514 parsing by the calling routine. Return this buffer, and if ADJUST
9515 is non-null set it to the length of the string we removed from the
9516 input line. Otherwise return NULL.
9517
9518 This function is copied from the ELF version above, adjusted for PE targets. */
9519
9520 static char *
9521 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9522 int *adjust ATTRIBUTE_UNUSED,
9523 i386_operand_type *types)
9524 {
9525 static const struct
9526 {
9527 const char *str;
9528 int len;
9529 const enum bfd_reloc_code_real rel[2];
9530 const i386_operand_type types64;
9531 }
9532 gotrel[] =
9533 {
9534 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
9535 BFD_RELOC_32_SECREL },
9536 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9537 };
9538
9539 char *cp;
9540 unsigned j;
9541
9542 for (cp = input_line_pointer; *cp != '@'; cp++)
9543 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9544 return NULL;
9545
9546 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9547 {
9548 int len = gotrel[j].len;
9549
9550 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9551 {
9552 if (gotrel[j].rel[object_64bit] != 0)
9553 {
9554 int first, second;
9555 char *tmpbuf, *past_reloc;
9556
9557 *rel = gotrel[j].rel[object_64bit];
9558 if (adjust)
9559 *adjust = len;
9560
9561 if (types)
9562 {
9563 if (flag_code != CODE_64BIT)
9564 {
9565 types->bitfield.imm32 = 1;
9566 types->bitfield.disp32 = 1;
9567 }
9568 else
9569 *types = gotrel[j].types64;
9570 }
9571
9572 /* The length of the first part of our input line. */
9573 first = cp - input_line_pointer;
9574
9575 /* The second part goes from after the reloc token until
9576 (and including) an end_of_line char or comma. */
9577 past_reloc = cp + 1 + len;
9578 cp = past_reloc;
9579 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9580 ++cp;
9581 second = cp + 1 - past_reloc;
9582
9583 /* Allocate and copy string. The trailing NUL shouldn't
9584 be necessary, but be safe. */
9585 tmpbuf = XNEWVEC (char, first + second + 2);
9586 memcpy (tmpbuf, input_line_pointer, first);
9587 if (second != 0 && *past_reloc != ' ')
9588 /* Replace the relocation token with ' ', so that
9589 errors like foo@SECREL321 will be detected. */
9590 tmpbuf[first++] = ' ';
9591 memcpy (tmpbuf + first, past_reloc, second);
9592 tmpbuf[first + second] = '\0';
9593 return tmpbuf;
9594 }
9595
9596 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9597 gotrel[j].str, 1 << (5 + object_64bit));
9598 return NULL;
9599 }
9600 }
9601
9602 /* Might be a symbol version string. Don't as_bad here. */
9603 return NULL;
9604 }
9605
9606 #endif /* TE_PE */
9607
9608 bfd_reloc_code_real_type
9609 x86_cons (expressionS *exp, int size)
9610 {
9611 bfd_reloc_code_real_type got_reloc = NO_RELOC;
9612
9613 intel_syntax = -intel_syntax;
9614
9615 exp->X_md = 0;
9616 if (size == 4 || (object_64bit && size == 8))
9617 {
9618 /* Handle @GOTOFF and the like in an expression. */
9619 char *save;
9620 char *gotfree_input_line;
9621 int adjust = 0;
9622
9623 save = input_line_pointer;
9624 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9625 if (gotfree_input_line)
9626 input_line_pointer = gotfree_input_line;
9627
9628 expression (exp);
9629
9630 if (gotfree_input_line)
9631 {
9632 /* expression () has merrily parsed up to the end of line,
9633 or a comma - in the wrong buffer. Transfer how far
9634 input_line_pointer has moved to the right buffer. */
9635 input_line_pointer = (save
9636 + (input_line_pointer - gotfree_input_line)
9637 + adjust);
9638 free (gotfree_input_line);
9639 if (exp->X_op == O_constant
9640 || exp->X_op == O_absent
9641 || exp->X_op == O_illegal
9642 || exp->X_op == O_register
9643 || exp->X_op == O_big)
9644 {
9645 char c = *input_line_pointer;
9646 *input_line_pointer = 0;
9647 as_bad (_("missing or invalid expression `%s'"), save);
9648 *input_line_pointer = c;
9649 }
9650 else if ((got_reloc == BFD_RELOC_386_PLT32
9651 || got_reloc == BFD_RELOC_X86_64_PLT32)
9652 && exp->X_op != O_symbol)
9653 {
9654 char c = *input_line_pointer;
9655 *input_line_pointer = 0;
9656 as_bad (_("invalid PLT expression `%s'"), save);
9657 *input_line_pointer = c;
9658 }
9659 }
9660 }
9661 else
9662 expression (exp);
9663
9664 intel_syntax = -intel_syntax;
9665
9666 if (intel_syntax)
9667 i386_intel_simplify (exp);
9668
9669 return got_reloc;
9670 }
9671
9672 static void
9673 signed_cons (int size)
9674 {
9675 if (flag_code == CODE_64BIT)
9676 cons_sign = 1;
9677 cons (size);
9678 cons_sign = -1;
9679 }
9680
9681 #ifdef TE_PE
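/* A minimal usage sketch for the .secrel32 directive handled below
   ("table" is a placeholder symbol):

       .secrel32 table
       .secrel32 table, table + 8

   Each comma-separated expression is emitted as a 32-bit value, with
   O_symbol rewritten to O_secrel so that a section-relative (SECREL)
   fixup is generated instead of an absolute one. */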
9682 static void
9683 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9684 {
9685 expressionS exp;
9686
9687 do
9688 {
9689 expression (&exp);
9690 if (exp.X_op == O_symbol)
9691 exp.X_op = O_secrel;
9692
9693 emit_expr (&exp, 4);
9694 }
9695 while (*input_line_pointer++ == ',');
9696
9697 input_line_pointer--;
9698 demand_empty_rest_of_line ();
9699 }
9700 #endif
9701
9702 /* Handle Vector operations. */
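/* That is, the AVX512 operand decorations, e.g. "{1to8}" (memory
   broadcast), "{%k1}" (write mask) and "{z}" (zeroing-masking), as in

       vaddpd (%rax){1to8}, %zmm1, %zmm2{%k1}{z}
*/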
9703
9704 static char *
9705 check_VecOperations (char *op_string, char *op_end)
9706 {
9707 const reg_entry *mask;
9708 const char *saved;
9709 char *end_op;
9710
9711 while (*op_string
9712 && (op_end == NULL || op_string < op_end))
9713 {
9714 saved = op_string;
9715 if (*op_string == '{')
9716 {
9717 op_string++;
9718
9719 /* Check broadcasts. */
9720 if (strncmp (op_string, "1to", 3) == 0)
9721 {
9722 int bcst_type;
9723
9724 if (i.broadcast)
9725 goto duplicated_vec_op;
9726
9727 op_string += 3;
9728 if (*op_string == '8')
9729 bcst_type = 8;
9730 else if (*op_string == '4')
9731 bcst_type = 4;
9732 else if (*op_string == '2')
9733 bcst_type = 2;
9734 else if (*op_string == '1'
9735 && *(op_string+1) == '6')
9736 {
9737 bcst_type = 16;
9738 op_string++;
9739 }
9740 else
9741 {
9742 as_bad (_("Unsupported broadcast: `%s'"), saved);
9743 return NULL;
9744 }
9745 op_string++;
9746
9747 broadcast_op.type = bcst_type;
9748 broadcast_op.operand = this_operand;
9749 broadcast_op.bytes = 0;
9750 i.broadcast = &broadcast_op;
9751 }
9752 /* Check masking operation. */
9753 else if ((mask = parse_register (op_string, &end_op)) != NULL)
9754 {
9755 /* k0 can't be used for write mask. */
9756 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9757 {
9758 as_bad (_("`%s%s' can't be used for write mask"),
9759 register_prefix, mask->reg_name);
9760 return NULL;
9761 }
9762
9763 if (!i.mask)
9764 {
9765 mask_op.mask = mask;
9766 mask_op.zeroing = 0;
9767 mask_op.operand = this_operand;
9768 i.mask = &mask_op;
9769 }
9770 else
9771 {
9772 if (i.mask->mask)
9773 goto duplicated_vec_op;
9774
9775 i.mask->mask = mask;
9776
9777 /* Only "{z}" is allowed here. No need to check
9778 zeroing mask explicitly. */
9779 if (i.mask->operand != this_operand)
9780 {
9781 as_bad (_("invalid write mask `%s'"), saved);
9782 return NULL;
9783 }
9784 }
9785
9786 op_string = end_op;
9787 }
9788 /* Check zeroing-flag for masking operation. */
9789 else if (*op_string == 'z')
9790 {
9791 if (!i.mask)
9792 {
9793 mask_op.mask = NULL;
9794 mask_op.zeroing = 1;
9795 mask_op.operand = this_operand;
9796 i.mask = &mask_op;
9797 }
9798 else
9799 {
9800 if (i.mask->zeroing)
9801 {
9802 duplicated_vec_op:
9803 as_bad (_("duplicated `%s'"), saved);
9804 return NULL;
9805 }
9806
9807 i.mask->zeroing = 1;
9808
9809 /* Only "{%k}" is allowed here. No need to check mask
9810 register explicitly. */
9811 if (i.mask->operand != this_operand)
9812 {
9813 as_bad (_("invalid zeroing-masking `%s'"),
9814 saved);
9815 return NULL;
9816 }
9817 }
9818
9819 op_string++;
9820 }
9821 else
9822 goto unknown_vec_op;
9823
9824 if (*op_string != '}')
9825 {
9826 as_bad (_("missing `}' in `%s'"), saved);
9827 return NULL;
9828 }
9829 op_string++;
9830
9831 /* Strip whitespace since the addition of pseudo prefixes
9832 changed how the scrubber treats '{'. */
9833 if (is_space_char (*op_string))
9834 ++op_string;
9835
9836 continue;
9837 }
9838 unknown_vec_op:
9839 /* We don't know this one. */
9840 as_bad (_("unknown vector operation: `%s'"), saved);
9841 return NULL;
9842 }
9843
9844 if (i.mask && i.mask->zeroing && !i.mask->mask)
9845 {
9846 as_bad (_("zeroing-masking only allowed with write mask"));
9847 return NULL;
9848 }
9849
9850 return op_string;
9851 }
9852
9853 static int
9854 i386_immediate (char *imm_start)
9855 {
9856 char *save_input_line_pointer;
9857 char *gotfree_input_line;
9858 segT exp_seg = 0;
9859 expressionS *exp;
9860 i386_operand_type types;
9861
9862 operand_type_set (&types, ~0);
9863
9864 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9865 {
9866 as_bad (_("at most %d immediate operands are allowed"),
9867 MAX_IMMEDIATE_OPERANDS);
9868 return 0;
9869 }
9870
9871 exp = &im_expressions[i.imm_operands++];
9872 i.op[this_operand].imms = exp;
9873
9874 if (is_space_char (*imm_start))
9875 ++imm_start;
9876
9877 save_input_line_pointer = input_line_pointer;
9878 input_line_pointer = imm_start;
9879
9880 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9881 if (gotfree_input_line)
9882 input_line_pointer = gotfree_input_line;
9883
9884 exp_seg = expression (exp);
9885
9886 SKIP_WHITESPACE ();
9887
9888 /* Handle vector operations. */
9889 if (*input_line_pointer == '{')
9890 {
9891 input_line_pointer = check_VecOperations (input_line_pointer,
9892 NULL);
9893 if (input_line_pointer == NULL)
9894 return 0;
9895 }
9896
9897 if (*input_line_pointer)
9898 as_bad (_("junk `%s' after expression"), input_line_pointer);
9899
9900 input_line_pointer = save_input_line_pointer;
9901 if (gotfree_input_line)
9902 {
9903 free (gotfree_input_line);
9904
9905 if (exp->X_op == O_constant || exp->X_op == O_register)
9906 exp->X_op = O_illegal;
9907 }
9908
9909 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9910 }
9911
9912 static int
9913 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9914 i386_operand_type types, const char *imm_start)
9915 {
9916 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9917 {
9918 if (imm_start)
9919 as_bad (_("missing or invalid immediate expression `%s'"),
9920 imm_start);
9921 return 0;
9922 }
9923 else if (exp->X_op == O_constant)
9924 {
9925 /* Size it properly later. */
9926 i.types[this_operand].bitfield.imm64 = 1;
9927 /* If not 64bit, sign extend val. */
9928 if (flag_code != CODE_64BIT
9929 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9930 exp->X_add_number
9931 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
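	  /* The XOR/subtract pair above sign-extends bit 31 through the
	     upper bits of addressT, e.g. 0xffffffff becomes
	     (addressT) -1. */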
9932 }
9933 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9934 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9935 && exp_seg != absolute_section
9936 && exp_seg != text_section
9937 && exp_seg != data_section
9938 && exp_seg != bss_section
9939 && exp_seg != undefined_section
9940 && !bfd_is_com_section (exp_seg))
9941 {
9942 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9943 return 0;
9944 }
9945 #endif
9946 else if (!intel_syntax && exp_seg == reg_section)
9947 {
9948 if (imm_start)
9949 as_bad (_("illegal immediate register operand %s"), imm_start);
9950 return 0;
9951 }
9952 else
9953 {
9954 /* This is an address. The size of the address will be
9955 determined later, depending on destination register,
9956 suffix, or the default for the section. */
9957 i.types[this_operand].bitfield.imm8 = 1;
9958 i.types[this_operand].bitfield.imm16 = 1;
9959 i.types[this_operand].bitfield.imm32 = 1;
9960 i.types[this_operand].bitfield.imm32s = 1;
9961 i.types[this_operand].bitfield.imm64 = 1;
9962 i.types[this_operand] = operand_type_and (i.types[this_operand],
9963 types);
9964 }
9965
9966 return 1;
9967 }
9968
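/* Parse the scale factor of a base/index memory operand, e.g. the
   "4" in "(%ebx,%ecx,4)"; only 1, 2, 4 and 8 are accepted and are
   stored as their base-2 log (here i.log2_scale_factor == 2). */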
9969 static char *
9970 i386_scale (char *scale)
9971 {
9972 offsetT val;
9973 char *save = input_line_pointer;
9974
9975 input_line_pointer = scale;
9976 val = get_absolute_expression ();
9977
9978 switch (val)
9979 {
9980 case 1:
9981 i.log2_scale_factor = 0;
9982 break;
9983 case 2:
9984 i.log2_scale_factor = 1;
9985 break;
9986 case 4:
9987 i.log2_scale_factor = 2;
9988 break;
9989 case 8:
9990 i.log2_scale_factor = 3;
9991 break;
9992 default:
9993 {
9994 char sep = *input_line_pointer;
9995
9996 *input_line_pointer = '\0';
9997 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9998 scale);
9999 *input_line_pointer = sep;
10000 input_line_pointer = save;
10001 return NULL;
10002 }
10003 }
10004 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10005 {
10006 as_warn (_("scale factor of %d without an index register"),
10007 1 << i.log2_scale_factor);
10008 i.log2_scale_factor = 0;
10009 }
10010 scale = input_line_pointer;
10011 input_line_pointer = save;
10012 return scale;
10013 }
10014
10015 static int
10016 i386_displacement (char *disp_start, char *disp_end)
10017 {
10018 expressionS *exp;
10019 segT exp_seg = 0;
10020 char *save_input_line_pointer;
10021 char *gotfree_input_line;
10022 int override;
10023 i386_operand_type bigdisp, types = anydisp;
10024 int ret;
10025
10026 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10027 {
10028 as_bad (_("at most %d displacement operands are allowed"),
10029 MAX_MEMORY_OPERANDS);
10030 return 0;
10031 }
10032
10033 operand_type_set (&bigdisp, 0);
10034 if (i.jumpabsolute
10035 || i.types[this_operand].bitfield.baseindex
10036 || (current_templates->start->opcode_modifier.jump != JUMP
10037 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10038 {
10039 i386_addressing_mode ();
10040 override = (i.prefix[ADDR_PREFIX] != 0);
10041 if (flag_code == CODE_64BIT)
10042 {
10043 if (!override)
10044 {
10045 bigdisp.bitfield.disp32s = 1;
10046 bigdisp.bitfield.disp64 = 1;
10047 }
10048 else
10049 bigdisp.bitfield.disp32 = 1;
10050 }
10051 else if ((flag_code == CODE_16BIT) ^ override)
10052 bigdisp.bitfield.disp16 = 1;
10053 else
10054 bigdisp.bitfield.disp32 = 1;
10055 }
10056 else
10057 {
10058 /* For PC-relative branches, the width of the displacement may be
10059 dependent upon data size, but is never dependent upon address size.
10060 Also make sure to not unintentionally match against a non-PC-relative
10061 branch template. */
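      /* E.g. in 16-bit code the displacement of "jmp foo" is 16 bits
	 wide, an operand-size (0x66) prefix widens it to 32 bits, and
	 an address-size (0x67) prefix leaves it unchanged ("foo" being
	 a placeholder label). */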
10062 static templates aux_templates;
10063 const insn_template *t = current_templates->start;
10064 bfd_boolean has_intel64 = FALSE;
10065
10066 aux_templates.start = t;
10067 while (++t < current_templates->end)
10068 {
10069 if (t->opcode_modifier.jump
10070 != current_templates->start->opcode_modifier.jump)
10071 break;
10072 if ((t->opcode_modifier.isa64 >= INTEL64))
10073 has_intel64 = TRUE;
10074 }
10075 if (t < current_templates->end)
10076 {
10077 aux_templates.end = t;
10078 current_templates = &aux_templates;
10079 }
10080
10081 override = (i.prefix[DATA_PREFIX] != 0);
10082 if (flag_code == CODE_64BIT)
10083 {
10084 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10085 && (!intel64 || !has_intel64))
10086 bigdisp.bitfield.disp16 = 1;
10087 else
10088 bigdisp.bitfield.disp32s = 1;
10089 }
10090 else
10091 {
10092 if (!override)
10093 override = (i.suffix == (flag_code != CODE_16BIT
10094 ? WORD_MNEM_SUFFIX
10095 : LONG_MNEM_SUFFIX));
10096 bigdisp.bitfield.disp32 = 1;
10097 if ((flag_code == CODE_16BIT) ^ override)
10098 {
10099 bigdisp.bitfield.disp32 = 0;
10100 bigdisp.bitfield.disp16 = 1;
10101 }
10102 }
10103 }
10104 i.types[this_operand] = operand_type_or (i.types[this_operand],
10105 bigdisp);
10106
10107 exp = &disp_expressions[i.disp_operands];
10108 i.op[this_operand].disps = exp;
10109 i.disp_operands++;
10110 save_input_line_pointer = input_line_pointer;
10111 input_line_pointer = disp_start;
10112 END_STRING_AND_SAVE (disp_end);
10113
10114 #ifndef GCC_ASM_O_HACK
10115 #define GCC_ASM_O_HACK 0
10116 #endif
10117 #if GCC_ASM_O_HACK
10118 END_STRING_AND_SAVE (disp_end + 1);
10119 if (i.types[this_operand].bitfield.baseIndex
10120 && displacement_string_end[-1] == '+')
10121 {
10122 /* This hack is to avoid a warning when using the "o"
10123 constraint within gcc asm statements.
10124 For instance:
10125
10126 #define _set_tssldt_desc(n,addr,limit,type) \
10127 __asm__ __volatile__ ( \
10128 "movw %w2,%0\n\t" \
10129 "movw %w1,2+%0\n\t" \
10130 "rorl $16,%1\n\t" \
10131 "movb %b1,4+%0\n\t" \
10132 "movb %4,5+%0\n\t" \
10133 "movb $0,6+%0\n\t" \
10134 "movb %h1,7+%0\n\t" \
10135 "rorl $16,%1" \
10136 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10137
10138 This works great except that the output assembler ends
10139 up looking a bit weird if it turns out that there is
10140 no offset. You end up producing code that looks like:
10141
10142 #APP
10143 movw $235,(%eax)
10144 movw %dx,2+(%eax)
10145 rorl $16,%edx
10146 movb %dl,4+(%eax)
10147 movb $137,5+(%eax)
10148 movb $0,6+(%eax)
10149 movb %dh,7+(%eax)
10150 rorl $16,%edx
10151 #NO_APP
10152
10153 So here we provide the missing zero. */
10154
10155 *displacement_string_end = '0';
10156 }
10157 #endif
10158 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10159 if (gotfree_input_line)
10160 input_line_pointer = gotfree_input_line;
10161
10162 exp_seg = expression (exp);
10163
10164 SKIP_WHITESPACE ();
10165 if (*input_line_pointer)
10166 as_bad (_("junk `%s' after expression"), input_line_pointer);
10167 #if GCC_ASM_O_HACK
10168 RESTORE_END_STRING (disp_end + 1);
10169 #endif
10170 input_line_pointer = save_input_line_pointer;
10171 if (gotfree_input_line)
10172 {
10173 free (gotfree_input_line);
10174
10175 if (exp->X_op == O_constant || exp->X_op == O_register)
10176 exp->X_op = O_illegal;
10177 }
10178
10179 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10180
10181 RESTORE_END_STRING (disp_end);
10182
10183 return ret;
10184 }
10185
10186 static int
10187 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10188 i386_operand_type types, const char *disp_start)
10189 {
10190 i386_operand_type bigdisp;
10191 int ret = 1;
10192
10193 /* We do this to make sure that the section symbol is in
10194 the symbol table. We will ultimately change the relocation
10195 to be relative to the beginning of the section. */
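      /* E.g. for "movl foo@GOTOFF(%ebx), %eax" the displacement is
	 rewritten below as the difference foo - _GLOBAL_OFFSET_TABLE_
	 (GOT_symbol), with a plain BFD_RELOC_32 in 32-bit mode.  Here
	 "foo" is a placeholder symbol. */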
10196 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10197 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10198 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10199 {
10200 if (exp->X_op != O_symbol)
10201 goto inv_disp;
10202
10203 if (S_IS_LOCAL (exp->X_add_symbol)
10204 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10205 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10206 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10207 exp->X_op = O_subtract;
10208 exp->X_op_symbol = GOT_symbol;
10209 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10210 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10211 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10212 i.reloc[this_operand] = BFD_RELOC_64;
10213 else
10214 i.reloc[this_operand] = BFD_RELOC_32;
10215 }
10216
10217 else if (exp->X_op == O_absent
10218 || exp->X_op == O_illegal
10219 || exp->X_op == O_big)
10220 {
10221 inv_disp:
10222 as_bad (_("missing or invalid displacement expression `%s'"),
10223 disp_start);
10224 ret = 0;
10225 }
10226
10227 else if (flag_code == CODE_64BIT
10228 && !i.prefix[ADDR_PREFIX]
10229 && exp->X_op == O_constant)
10230 {
10231 /* Since the displacement is sign-extended to 64bit, don't allow
10232 disp32, and turn off disp32s if it is out of range. */
10233 i.types[this_operand].bitfield.disp32 = 0;
10234 if (!fits_in_signed_long (exp->X_add_number))
10235 {
10236 i.types[this_operand].bitfield.disp32s = 0;
10237 if (i.types[this_operand].bitfield.baseindex)
10238 {
10239 as_bad (_("0x%lx out of range of signed 32bit displacement"),
10240 (long) exp->X_add_number);
10241 ret = 0;
10242 }
10243 }
10244 }
10245
10246 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10247 else if (exp->X_op != O_constant
10248 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10249 && exp_seg != absolute_section
10250 && exp_seg != text_section
10251 && exp_seg != data_section
10252 && exp_seg != bss_section
10253 && exp_seg != undefined_section
10254 && !bfd_is_com_section (exp_seg))
10255 {
10256 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10257 ret = 0;
10258 }
10259 #endif
10260
10261 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10262 /* Constants get taken care of by optimize_disp(). */
10263 && exp->X_op != O_constant)
10264 i.types[this_operand].bitfield.disp8 = 1;
10265
10266 /* Check if this is a displacement only operand. */
10267 bigdisp = i.types[this_operand];
10268 bigdisp.bitfield.disp8 = 0;
10269 bigdisp.bitfield.disp16 = 0;
10270 bigdisp.bitfield.disp32 = 0;
10271 bigdisp.bitfield.disp32s = 0;
10272 bigdisp.bitfield.disp64 = 0;
10273 if (operand_type_all_zero (&bigdisp))
10274 i.types[this_operand] = operand_type_and (i.types[this_operand],
10275 types);
10276
10277 return ret;
10278 }
10279
10280 /* Return the active addressing mode, taking address override and
10281 registers forming the address into consideration. Update the
10282 address override prefix if necessary. */
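/* E.g. "mov %ax, (%ebx)" assembled in 16-bit code uses a 32-bit base
   register, so an address-size (0x67) prefix is inferred below and
   the mode reported is CODE_32BIT. */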
10283
10284 static enum flag_code
10285 i386_addressing_mode (void)
10286 {
10287 enum flag_code addr_mode;
10288
10289 if (i.prefix[ADDR_PREFIX])
10290 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10291 else
10292 {
10293 addr_mode = flag_code;
10294
10295 #if INFER_ADDR_PREFIX
10296 if (i.mem_operands == 0)
10297 {
10298 /* Infer address prefix from the first memory operand. */
10299 const reg_entry *addr_reg = i.base_reg;
10300
10301 if (addr_reg == NULL)
10302 addr_reg = i.index_reg;
10303
10304 if (addr_reg)
10305 {
10306 if (addr_reg->reg_type.bitfield.dword)
10307 addr_mode = CODE_32BIT;
10308 else if (flag_code != CODE_64BIT
10309 && addr_reg->reg_type.bitfield.word)
10310 addr_mode = CODE_16BIT;
10311
10312 if (addr_mode != flag_code)
10313 {
10314 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10315 i.prefixes += 1;
10316 /* Change the size of any displacement too. At most one
10317 of Disp16 or Disp32 is set.
10318 FIXME. There doesn't seem to be any real need for
10319 separate Disp16 and Disp32 flags. The same goes for
10320 Imm16 and Imm32. Removing them would probably clean
10321 up the code quite a lot. */
10322 if (flag_code != CODE_64BIT
10323 && (i.types[this_operand].bitfield.disp16
10324 || i.types[this_operand].bitfield.disp32))
10325 i.types[this_operand]
10326 = operand_type_xor (i.types[this_operand], disp16_32);
10327 }
10328 }
10329 }
10330 #endif
10331 }
10332
10333 return addr_mode;
10334 }
10335
10336 /* Make sure the memory operand we've been dealt is valid.
10337 Return 1 on success, 0 on a failure. */
10338
10339 static int
10340 i386_index_check (const char *operand_string)
10341 {
10342 const char *kind = "base/index";
10343 enum flag_code addr_mode = i386_addressing_mode ();
10344
10345 if (current_templates->start->opcode_modifier.isstring
10346 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10347 && (current_templates->end[-1].opcode_modifier.isstring
10348 || i.mem_operands))
10349 {
10350 /* Memory operands of string insns are special in that they only allow
10351 a single register (rDI, rSI, or rBX) as their memory address. */
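      /* E.g. "movsb (%esi), (%edi)" is accepted here, whereas
	 "movsb (%eax), (%edi)" only draws the warning issued further
	 down. */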
10352 const reg_entry *expected_reg;
10353 static const char *di_si[][2] =
10354 {
10355 { "esi", "edi" },
10356 { "si", "di" },
10357 { "rsi", "rdi" }
10358 };
10359 static const char *bx[] = { "ebx", "bx", "rbx" };
10360
10361 kind = "string address";
10362
10363 if (current_templates->start->opcode_modifier.repprefixok)
10364 {
10365 int es_op = current_templates->end[-1].opcode_modifier.isstring
10366 - IS_STRING_ES_OP0;
10367 int op = 0;
10368
10369 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10370 || ((!i.mem_operands != !intel_syntax)
10371 && current_templates->end[-1].operand_types[1]
10372 .bitfield.baseindex))
10373 op = 1;
10374 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10375 }
10376 else
10377 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10378
10379 if (i.base_reg != expected_reg
10380 || i.index_reg
10381 || operand_type_check (i.types[this_operand], disp))
10382 {
10383 /* The second memory operand must have the same size as
10384 the first one. */
10385 if (i.mem_operands
10386 && i.base_reg
10387 && !((addr_mode == CODE_64BIT
10388 && i.base_reg->reg_type.bitfield.qword)
10389 || (addr_mode == CODE_32BIT
10390 ? i.base_reg->reg_type.bitfield.dword
10391 : i.base_reg->reg_type.bitfield.word)))
10392 goto bad_address;
10393
10394 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10395 operand_string,
10396 intel_syntax ? '[' : '(',
10397 register_prefix,
10398 expected_reg->reg_name,
10399 intel_syntax ? ']' : ')');
10400 return 1;
10401 }
10402 else
10403 return 1;
10404
10405 bad_address:
10406 as_bad (_("`%s' is not a valid %s expression"),
10407 operand_string, kind);
10408 return 0;
10409 }
10410 else
10411 {
10412 if (addr_mode != CODE_16BIT)
10413 {
10414 /* 32-bit/64-bit checks. */
10415 if ((i.base_reg
10416 && ((addr_mode == CODE_64BIT
10417 ? !i.base_reg->reg_type.bitfield.qword
10418 : !i.base_reg->reg_type.bitfield.dword)
10419 || (i.index_reg && i.base_reg->reg_num == RegIP)
10420 || i.base_reg->reg_num == RegIZ))
10421 || (i.index_reg
10422 && !i.index_reg->reg_type.bitfield.xmmword
10423 && !i.index_reg->reg_type.bitfield.ymmword
10424 && !i.index_reg->reg_type.bitfield.zmmword
10425 && ((addr_mode == CODE_64BIT
10426 ? !i.index_reg->reg_type.bitfield.qword
10427 : !i.index_reg->reg_type.bitfield.dword)
10428 || !i.index_reg->reg_type.bitfield.baseindex)))
10429 goto bad_address;
10430
10431 /* bndmk, bndldx, and bndstx have special restrictions. */
10432 if (current_templates->start->base_opcode == 0xf30f1b
10433 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10434 {
10435 /* They cannot use RIP-relative addressing. */
10436 if (i.base_reg && i.base_reg->reg_num == RegIP)
10437 {
10438 as_bad (_("`%s' cannot be used here"), operand_string);
10439 return 0;
10440 }
10441
10442 /* bndldx and bndstx ignore their scale factor. */
10443 if (current_templates->start->base_opcode != 0xf30f1b
10444 && i.log2_scale_factor)
10445 as_warn (_("register scaling is being ignored here"));
10446 }
10447 }
10448 else
10449 {
10450 /* 16-bit checks. */
10451 if ((i.base_reg
10452 && (!i.base_reg->reg_type.bitfield.word
10453 || !i.base_reg->reg_type.bitfield.baseindex))
10454 || (i.index_reg
10455 && (!i.index_reg->reg_type.bitfield.word
10456 || !i.index_reg->reg_type.bitfield.baseindex
10457 || !(i.base_reg
10458 && i.base_reg->reg_num < 6
10459 && i.index_reg->reg_num >= 6
10460 && i.log2_scale_factor == 0))))
10461 goto bad_address;
10462 }
10463 }
10464 return 1;
10465 }
10466
10467 /* Handle vector immediates. */
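/* That is, the embedded rounding-control / SAE pseudo-operands
   "{rn-sae}", "{rd-sae}", "{ru-sae}", "{rz-sae}" and "{sae}", e.g.

       vaddpd {rn-sae}, %zmm4, %zmm5, %zmm6

   Each occupies an immediate (imm8) operand slot and is encoded later
   from i.rounding. */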
10468
10469 static int
10470 RC_SAE_immediate (const char *imm_start)
10471 {
10472 unsigned int match_found, j;
10473 const char *pstr = imm_start;
10474 expressionS *exp;
10475
10476 if (*pstr != '{')
10477 return 0;
10478
10479 pstr++;
10480 match_found = 0;
10481 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10482 {
10483 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10484 {
10485 if (!i.rounding)
10486 {
10487 rc_op.type = RC_NamesTable[j].type;
10488 rc_op.operand = this_operand;
10489 i.rounding = &rc_op;
10490 }
10491 else
10492 {
10493 as_bad (_("duplicated `%s'"), imm_start);
10494 return 0;
10495 }
10496 pstr += RC_NamesTable[j].len;
10497 match_found = 1;
10498 break;
10499 }
10500 }
10501 if (!match_found)
10502 return 0;
10503
10504 if (*pstr++ != '}')
10505 {
10506 as_bad (_("Missing '}': '%s'"), imm_start);
10507 return 0;
10508 }
10509 /* RC/SAE immediate string should contain nothing more. */
10510 if (*pstr != 0)
10511 {
10512 as_bad (_("Junk after '}': '%s'"), imm_start);
10513 return 0;
10514 }
10515
10516 exp = &im_expressions[i.imm_operands++];
10517 i.op[this_operand].imms = exp;
10518
10519 exp->X_op = O_constant;
10520 exp->X_add_number = 0;
10521 exp->X_add_symbol = (symbolS *) 0;
10522 exp->X_op_symbol = (symbolS *) 0;
10523
10524 i.types[this_operand].bitfield.imm8 = 1;
10525 return 1;
10526 }
10527
10528 /* Only string instructions can have a second memory operand, so
10529 reduce current_templates to just those if it contains any. */
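/* E.g. "movsd" names both the string move and the SSE2 scalar double
   move; once a first memory operand has been seen, only the string
   templates can legitimately take a second one. */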
10530 static int
10531 maybe_adjust_templates (void)
10532 {
10533 const insn_template *t;
10534
10535 gas_assert (i.mem_operands == 1);
10536
10537 for (t = current_templates->start; t < current_templates->end; ++t)
10538 if (t->opcode_modifier.isstring)
10539 break;
10540
10541 if (t < current_templates->end)
10542 {
10543 static templates aux_templates;
10544 bfd_boolean recheck;
10545
10546 aux_templates.start = t;
10547 for (; t < current_templates->end; ++t)
10548 if (!t->opcode_modifier.isstring)
10549 break;
10550 aux_templates.end = t;
10551
10552 /* Determine whether to re-check the first memory operand. */
10553 recheck = (aux_templates.start != current_templates->start
10554 || t != current_templates->end);
10555
10556 current_templates = &aux_templates;
10557
10558 if (recheck)
10559 {
10560 i.mem_operands = 0;
10561 if (i.memop1_string != NULL
10562 && i386_index_check (i.memop1_string) == 0)
10563 return 0;
10564 i.mem_operands = 1;
10565 }
10566 }
10567
10568 return 1;
10569 }
10570
10571 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
10572 on error. */
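/* Forms handled here include, for example:

     %eax                   register
     $42                    immediate
     *%rax                  absolute jump/call target
     %fs:16(%ebx,%esi,4)    segment:disp(base,index,scale) memory ref
     (%rax){1to8}           memory ref with an AVX512 decoration  */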
10573
10574 static int
10575 i386_att_operand (char *operand_string)
10576 {
10577 const reg_entry *r;
10578 char *end_op;
10579 char *op_string = operand_string;
10580
10581 if (is_space_char (*op_string))
10582 ++op_string;
10583
10584 /* We check for an absolute prefix (differentiating,
10585 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'). */
10586 if (*op_string == ABSOLUTE_PREFIX)
10587 {
10588 ++op_string;
10589 if (is_space_char (*op_string))
10590 ++op_string;
10591 i.jumpabsolute = TRUE;
10592 }
10593
10594 /* Check if operand is a register. */
10595 if ((r = parse_register (op_string, &end_op)) != NULL)
10596 {
10597 i386_operand_type temp;
10598
10599 /* Check for a segment override by searching for ':' after a
10600 segment register. */
10601 op_string = end_op;
10602 if (is_space_char (*op_string))
10603 ++op_string;
10604 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10605 {
10606 switch (r->reg_num)
10607 {
10608 case 0:
10609 i.seg[i.mem_operands] = &es;
10610 break;
10611 case 1:
10612 i.seg[i.mem_operands] = &cs;
10613 break;
10614 case 2:
10615 i.seg[i.mem_operands] = &ss;
10616 break;
10617 case 3:
10618 i.seg[i.mem_operands] = &ds;
10619 break;
10620 case 4:
10621 i.seg[i.mem_operands] = &fs;
10622 break;
10623 case 5:
10624 i.seg[i.mem_operands] = &gs;
10625 break;
10626 }
10627
10628 /* Skip the ':' and whitespace. */
10629 ++op_string;
10630 if (is_space_char (*op_string))
10631 ++op_string;
10632
10633 if (!is_digit_char (*op_string)
10634 && !is_identifier_char (*op_string)
10635 && *op_string != '('
10636 && *op_string != ABSOLUTE_PREFIX)
10637 {
10638 as_bad (_("bad memory operand `%s'"), op_string);
10639 return 0;
10640 }
10641 /* Handle case of %es:*foo. */
10642 if (*op_string == ABSOLUTE_PREFIX)
10643 {
10644 ++op_string;
10645 if (is_space_char (*op_string))
10646 ++op_string;
10647 i.jumpabsolute = TRUE;
10648 }
10649 goto do_memory_reference;
10650 }
10651
10652 /* Handle vector operations. */
10653 if (*op_string == '{')
10654 {
10655 op_string = check_VecOperations (op_string, NULL);
10656 if (op_string == NULL)
10657 return 0;
10658 }
10659
10660 if (*op_string)
10661 {
10662 as_bad (_("junk `%s' after register"), op_string);
10663 return 0;
10664 }
10665 temp = r->reg_type;
10666 temp.bitfield.baseindex = 0;
10667 i.types[this_operand] = operand_type_or (i.types[this_operand],
10668 temp);
10669 i.types[this_operand].bitfield.unspecified = 0;
10670 i.op[this_operand].regs = r;
10671 i.reg_operands++;
10672 }
10673 else if (*op_string == REGISTER_PREFIX)
10674 {
10675 as_bad (_("bad register name `%s'"), op_string);
10676 return 0;
10677 }
10678 else if (*op_string == IMMEDIATE_PREFIX)
10679 {
10680 ++op_string;
10681 if (i.jumpabsolute)
10682 {
10683 as_bad (_("immediate operand illegal with absolute jump"));
10684 return 0;
10685 }
10686 if (!i386_immediate (op_string))
10687 return 0;
10688 }
10689 else if (RC_SAE_immediate (operand_string))
10690 {
10691 /* If it is a RC or SAE immediate, do nothing. */
10692 ;
10693 }
10694 else if (is_digit_char (*op_string)
10695 || is_identifier_char (*op_string)
10696 || *op_string == '"'
10697 || *op_string == '(')
10698 {
10699 /* This is a memory reference of some sort. */
10700 char *base_string;
10701
10702 /* Start and end of displacement string expression (if found). */
10703 char *displacement_string_start;
10704 char *displacement_string_end;
10705 char *vop_start;
10706
10707 do_memory_reference:
10708 if (i.mem_operands == 1 && !maybe_adjust_templates ())
10709 return 0;
10710 if ((i.mem_operands == 1
10711 && !current_templates->start->opcode_modifier.isstring)
10712 || i.mem_operands == 2)
10713 {
10714 as_bad (_("too many memory references for `%s'"),
10715 current_templates->start->name);
10716 return 0;
10717 }
10718
10719 /* Check for base index form. We detect the base index form by
10720 looking for an ')' at the end of the operand, searching
10721 for the '(' matching it, and finding a REGISTER_PREFIX or ','
10722 after the '('. */
10723 base_string = op_string + strlen (op_string);
10724
10725 /* Handle vector operations. */
10726 vop_start = strchr (op_string, '{');
10727 if (vop_start && vop_start < base_string)
10728 {
10729 if (check_VecOperations (vop_start, base_string) == NULL)
10730 return 0;
10731 base_string = vop_start;
10732 }
10733
10734 --base_string;
10735 if (is_space_char (*base_string))
10736 --base_string;
10737
10738 /* If we only have a displacement, set up for it to be parsed later. */
10739 displacement_string_start = op_string;
10740 displacement_string_end = base_string + 1;
10741
10742 if (*base_string == ')')
10743 {
10744 char *temp_string;
10745 unsigned int parens_balanced = 1;
10746 /* We've already checked that the number of left & right ()'s are
10747 equal, so this loop will not be infinite. */
10748 do
10749 {
10750 base_string--;
10751 if (*base_string == ')')
10752 parens_balanced++;
10753 if (*base_string == '(')
10754 parens_balanced--;
10755 }
10756 while (parens_balanced);
10757
10758 temp_string = base_string;
10759
10760 /* Skip past '(' and whitespace. */
10761 ++base_string;
10762 if (is_space_char (*base_string))
10763 ++base_string;
10764
10765 if (*base_string == ','
10766 || ((i.base_reg = parse_register (base_string, &end_op))
10767 != NULL))
10768 {
10769 displacement_string_end = temp_string;
10770
10771 i.types[this_operand].bitfield.baseindex = 1;
10772
10773 if (i.base_reg)
10774 {
10775 base_string = end_op;
10776 if (is_space_char (*base_string))
10777 ++base_string;
10778 }
10779
10780 /* There may be an index reg or scale factor here. */
10781 if (*base_string == ',')
10782 {
10783 ++base_string;
10784 if (is_space_char (*base_string))
10785 ++base_string;
10786
10787 if ((i.index_reg = parse_register (base_string, &end_op))
10788 != NULL)
10789 {
10790 base_string = end_op;
10791 if (is_space_char (*base_string))
10792 ++base_string;
10793 if (*base_string == ',')
10794 {
10795 ++base_string;
10796 if (is_space_char (*base_string))
10797 ++base_string;
10798 }
10799 else if (*base_string != ')')
10800 {
10801 as_bad (_("expecting `,' or `)' "
10802 "after index register in `%s'"),
10803 operand_string);
10804 return 0;
10805 }
10806 }
10807 else if (*base_string == REGISTER_PREFIX)
10808 {
10809 end_op = strchr (base_string, ',');
10810 if (end_op)
10811 *end_op = '\0';
10812 as_bad (_("bad register name `%s'"), base_string);
10813 return 0;
10814 }
10815
10816 /* Check for scale factor. */
10817 if (*base_string != ')')
10818 {
10819 char *end_scale = i386_scale (base_string);
10820
10821 if (!end_scale)
10822 return 0;
10823
10824 base_string = end_scale;
10825 if (is_space_char (*base_string))
10826 ++base_string;
10827 if (*base_string != ')')
10828 {
10829 as_bad (_("expecting `)' "
10830 "after scale factor in `%s'"),
10831 operand_string);
10832 return 0;
10833 }
10834 }
10835 else if (!i.index_reg)
10836 {
10837 as_bad (_("expecting index register or scale factor "
10838 "after `,'; got '%c'"),
10839 *base_string);
10840 return 0;
10841 }
10842 }
10843 else if (*base_string != ')')
10844 {
10845 as_bad (_("expecting `,' or `)' "
10846 "after base register in `%s'"),
10847 operand_string);
10848 return 0;
10849 }
10850 }
10851 else if (*base_string == REGISTER_PREFIX)
10852 {
10853 end_op = strchr (base_string, ',');
10854 if (end_op)
10855 *end_op = '\0';
10856 as_bad (_("bad register name `%s'"), base_string);
10857 return 0;
10858 }
10859 }
10860
10861 /* If there's an expression beginning the operand, parse it,
10862 assuming displacement_string_start and
10863 displacement_string_end are meaningful. */
10864 if (displacement_string_start != displacement_string_end)
10865 {
10866 if (!i386_displacement (displacement_string_start,
10867 displacement_string_end))
10868 return 0;
10869 }
10870
10871 /* Special case for (%dx) while doing input/output op. */
10872 if (i.base_reg
10873 && i.base_reg->reg_type.bitfield.instance == RegD
10874 && i.base_reg->reg_type.bitfield.word
10875 && i.index_reg == 0
10876 && i.log2_scale_factor == 0
10877 && i.seg[i.mem_operands] == 0
10878 && !operand_type_check (i.types[this_operand], disp))
10879 {
10880 i.types[this_operand] = i.base_reg->reg_type;
10881 return 1;
10882 }
10883
10884 if (i386_index_check (operand_string) == 0)
10885 return 0;
10886 i.flags[this_operand] |= Operand_Mem;
10887 if (i.mem_operands == 0)
10888 i.memop1_string = xstrdup (operand_string);
10889 i.mem_operands++;
10890 }
10891 else
10892 {
10893 /* It's not a memory operand; argh! */
10894 as_bad (_("invalid char %s beginning operand %d `%s'"),
10895 output_invalid (*op_string),
10896 this_operand + 1,
10897 op_string);
10898 return 0;
10899 }
10900 return 1; /* Normal return. */
10901 }
10902 \f
10903 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10904 that an rs_machine_dependent frag may reach. */
10905
10906 unsigned int
10907 i386_frag_max_var (fragS *frag)
10908 {
10909 /* The only relaxable frags are for jumps.
10910 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
10911 gas_assert (frag->fr_type == rs_machine_dependent);
10912 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10913 }
10914
10915 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10916 static int
10917 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10918 {
10919 /* STT_GNU_IFUNC symbol must go through PLT. */
10920 if ((symbol_get_bfdsym (fr_symbol)->flags
10921 & BSF_GNU_INDIRECT_FUNCTION) != 0)
10922 return 0;
10923
10924 if (!S_IS_EXTERNAL (fr_symbol))
10925 /* Symbol may be weak or local. */
10926 return !S_IS_WEAK (fr_symbol);
10927
10928 /* Global symbols with non-default visibility can't be preempted. */
10929 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10930 return 1;
10931
10932 if (fr_var != NO_RELOC)
10933 switch ((enum bfd_reloc_code_real) fr_var)
10934 {
10935 case BFD_RELOC_386_PLT32:
10936 case BFD_RELOC_X86_64_PLT32:
10937 /* Symbol with PLT relocation may be preempted. */
10938 return 0;
10939 default:
10940 abort ();
10941 }
10942
10943 /* Global symbols with default visibility in a shared library may be
10944 preempted by another definition. */
10945 return !shared;
10946 }
10947 #endif
10948
10949 /* Return the next non-empty frag. */
10950
10951 static fragS *
10952 i386_next_non_empty_frag (fragS *fragP)
10953 {
10954 /* There may be a frag with a ".fill 0" when there is no room in
10955 the current frag for frag_grow in output_insn. */
10956 for (fragP = fragP->fr_next;
10957 (fragP != NULL
10958 && fragP->fr_type == rs_fill
10959 && fragP->fr_fix == 0);
10960 fragP = fragP->fr_next)
10961 ;
10962 return fragP;
10963 }
10964
10965 /* Return the next jcc frag after BRANCH_PADDING. */
10966
10967 static fragS *
10968 i386_next_jcc_frag (fragS *fragP)
10969 {
10970 if (!fragP)
10971 return NULL;
10972
10973 if (fragP->fr_type == rs_machine_dependent
10974 && (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10975 == BRANCH_PADDING))
10976 {
10977 fragP = i386_next_non_empty_frag (fragP);
10978 if (fragP->fr_type != rs_machine_dependent)
10979 return NULL;
10980 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == COND_JUMP)
10981 return fragP;
10982 }
10983
10984 return NULL;
10985 }
10986
10987 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
10988
10989 static void
10990 i386_classify_machine_dependent_frag (fragS *fragP)
10991 {
10992 fragS *cmp_fragP;
10993 fragS *pad_fragP;
10994 fragS *branch_fragP;
10995 fragS *next_fragP;
10996 unsigned int max_prefix_length;
10997
10998 if (fragP->tc_frag_data.classified)
10999 return;
11000
11001 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11002 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11003 for (next_fragP = fragP;
11004 next_fragP != NULL;
11005 next_fragP = next_fragP->fr_next)
11006 {
11007 next_fragP->tc_frag_data.classified = 1;
11008 if (next_fragP->fr_type == rs_machine_dependent)
11009 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11010 {
11011 case BRANCH_PADDING:
11012 /* The BRANCH_PADDING frag must be followed by a branch
11013 frag. */
11014 branch_fragP = i386_next_non_empty_frag (next_fragP);
11015 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11016 break;
11017 case FUSED_JCC_PADDING:
11018 /* Check if this is a fused jcc:
11019 FUSED_JCC_PADDING
11020 CMP like instruction
11021 BRANCH_PADDING
11022 COND_JUMP
11023 */
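	    /* E.g. "cmp %eax, %ebx" followed by "je label" (a pair many
	       Intel cores can macro-fuse) is padded as a single unit so
	       the fused pair does not cross the alignment boundary. */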
11024 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11025 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11026 branch_fragP = i386_next_jcc_frag (pad_fragP);
11027 if (branch_fragP)
11028 {
11029 /* The BRANCH_PADDING frag is merged with the
11030 FUSED_JCC_PADDING frag. */
11031 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11032 /* CMP like instruction size. */
11033 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11034 frag_wane (pad_fragP);
11035 /* Skip to branch_fragP. */
11036 next_fragP = branch_fragP;
11037 }
11038 else if (next_fragP->tc_frag_data.max_prefix_length)
11039 {
11040 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11041 a fused jcc. */
11042 next_fragP->fr_subtype
11043 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11044 next_fragP->tc_frag_data.max_bytes
11045 = next_fragP->tc_frag_data.max_prefix_length;
11046 /* This will be updated in the BRANCH_PREFIX scan. */
11047 next_fragP->tc_frag_data.max_prefix_length = 0;
11048 }
11049 else
11050 frag_wane (next_fragP);
11051 break;
11052 }
11053 }
11054
11055 /* Stop if there is no BRANCH_PREFIX. */
11056 if (!align_branch_prefix_size)
11057 return;
11058
11059 /* Scan for BRANCH_PREFIX. */
11060 for (; fragP != NULL; fragP = fragP->fr_next)
11061 {
11062 if (fragP->fr_type != rs_machine_dependent
11063 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11064 != BRANCH_PREFIX))
11065 continue;
11066
11067 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11068 COND_JUMP_PREFIX. */
11069 max_prefix_length = 0;
11070 for (next_fragP = fragP;
11071 next_fragP != NULL;
11072 next_fragP = next_fragP->fr_next)
11073 {
11074 if (next_fragP->fr_type == rs_fill)
11075 /* Skip rs_fill frags. */
11076 continue;
11077 else if (next_fragP->fr_type != rs_machine_dependent)
11078 /* Stop for all other frags. */
11079 break;
11080
11081 /* rs_machine_dependent frags. */
11082 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11083 == BRANCH_PREFIX)
11084 {
11085 /* Count BRANCH_PREFIX frags. */
11086 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11087 {
11088 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11089 frag_wane (next_fragP);
11090 }
11091 else
11092 max_prefix_length
11093 += next_fragP->tc_frag_data.max_bytes;
11094 }
11095 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11096 == BRANCH_PADDING)
11097 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11098 == FUSED_JCC_PADDING))
11099 {
11100 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11101 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11102 break;
11103 }
11104 else
11105 /* Stop for other rs_machine_dependent frags. */
11106 break;
11107 }
11108
11109 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11110
11111 /* Skip to the next frag. */
11112 fragP = next_fragP;
11113 }
11114 }
11115
11116 /* Compute padding size for
11117
11118 FUSED_JCC_PADDING
11119 CMP like instruction
11120 BRANCH_PADDING
11121 COND_JUMP/UNCOND_JUMP
11122
11123 or
11124
11125 BRANCH_PADDING
11126 COND_JUMP/UNCOND_JUMP
11127 */
11128
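/* A worked example, assuming -malign-branch-boundary=32
   (i.e. align_branch_power == 5): a 5-byte branch whose padding frag
   ends at offset 30 of a 32-byte window gives offset + size == 35,
   which is >= 32, so padding_size = 32 - 30 = 2 bytes are inserted to
   push the branch into the next window. */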
11129 static int
11130 i386_branch_padding_size (fragS *fragP, offsetT address)
11131 {
11132 unsigned int offset, size, padding_size;
11133 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11134
11135 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11136 if (!address)
11137 address = fragP->fr_address;
11138 address += fragP->fr_fix;
11139
11140 /* CMP like instruction size. */
11141 size = fragP->tc_frag_data.cmp_size;
11142
11143 /* The base size of the branch frag. */
11144 size += branch_fragP->fr_fix;
11145
11146 /* Add opcode and displacement bytes for the rs_machine_dependent
11147 branch frag. */
11148 if (branch_fragP->fr_type == rs_machine_dependent)
11149 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11150
11151 /* Check if branch is within boundary and doesn't end at the last
11152 byte. */
11153 offset = address & ((1U << align_branch_power) - 1);
11154 if ((offset + size) >= (1U << align_branch_power))
11155 /* Padding needed to avoid crossing boundary. */
11156 padding_size = (1U << align_branch_power) - offset;
11157 else
11158 /* No padding needed. */
11159 padding_size = 0;
11160
11161 /* The return value may be saved in tc_frag_data.length which is
11162 an unsigned byte. */
11163 if (!fits_in_unsigned_byte (padding_size))
11164 abort ();
11165
11166 return padding_size;
11167 }
11168
11169 /* i386_generic_table_relax_frag()
11170
11171 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11172 grow/shrink padding to align branch frags. Hand others to
11173 relax_frag(). */
11174
11175 long
11176 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11177 {
11178 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11179 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11180 {
11181 long padding_size = i386_branch_padding_size (fragP, 0);
11182 long grow = padding_size - fragP->tc_frag_data.length;
11183
11184 /* When the BRANCH_PREFIX frag is used, the computed address
11185 must match the actual address and there should be no padding. */
11186 if (fragP->tc_frag_data.padding_address
11187 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11188 || padding_size))
11189 abort ();
11190
11191 /* Update the padding size. */
11192 if (grow)
11193 fragP->tc_frag_data.length = padding_size;
11194
11195 return grow;
11196 }
11197 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11198 {
11199 fragS *padding_fragP, *next_fragP;
11200 long padding_size, left_size, last_size;
11201
11202 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11203 if (!padding_fragP)
11204 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11205 return (fragP->tc_frag_data.length
11206 - fragP->tc_frag_data.last_length);
11207
11208 /* Compute the relative address of the padding frag the very first
11209 time through, when the BRANCH_PREFIX frag sizes are zero. */
11210 if (!fragP->tc_frag_data.padding_address)
11211 fragP->tc_frag_data.padding_address
11212 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11213
11214 /* First update the last length from the previous iteration. */
11215 left_size = fragP->tc_frag_data.prefix_length;
11216 for (next_fragP = fragP;
11217 next_fragP != padding_fragP;
11218 next_fragP = next_fragP->fr_next)
11219 if (next_fragP->fr_type == rs_machine_dependent
11220 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11221 == BRANCH_PREFIX))
11222 {
11223 if (left_size)
11224 {
11225 int max = next_fragP->tc_frag_data.max_bytes;
11226 if (max)
11227 {
11228 int size;
11229 if (max > left_size)
11230 size = left_size;
11231 else
11232 size = max;
11233 left_size -= size;
11234 next_fragP->tc_frag_data.last_length = size;
11235 }
11236 }
11237 else
11238 next_fragP->tc_frag_data.last_length = 0;
11239 }
11240
11241 /* Check the padding size for the padding frag. */
11242 padding_size = i386_branch_padding_size
11243 (padding_fragP, (fragP->fr_address
11244 + fragP->tc_frag_data.padding_address));
11245
11246 last_size = fragP->tc_frag_data.prefix_length;
11247 /* Check if there is any change from the last iteration. */
11248 if (padding_size == last_size)
11249 {
11250 /* Update the expected address of the padding frag. */
11251 padding_fragP->tc_frag_data.padding_address
11252 = (fragP->fr_address + padding_size
11253 + fragP->tc_frag_data.padding_address);
11254 return 0;
11255 }
11256
11257 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11258 {
11259 /* No padding if there is insufficient room. Clear the
11260 expected address of the padding frag. */
11261 padding_fragP->tc_frag_data.padding_address = 0;
11262 padding_size = 0;
11263 }
11264 else
11265 /* Store the expected address of the padding frag. */
11266 padding_fragP->tc_frag_data.padding_address
11267 = (fragP->fr_address + padding_size
11268 + fragP->tc_frag_data.padding_address);
11269
11270 fragP->tc_frag_data.prefix_length = padding_size;
11271
11272 /* Update the length for the current iteration. */
11273 left_size = padding_size;
11274 for (next_fragP = fragP;
11275 next_fragP != padding_fragP;
11276 next_fragP = next_fragP->fr_next)
11277 if (next_fragP->fr_type == rs_machine_dependent
11278 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11279 == BRANCH_PREFIX))
11280 {
11281 if (left_size)
11282 {
11283 int max = next_fragP->tc_frag_data.max_bytes;
11284 if (max)
11285 {
11286 int size;
11287 if (max > left_size)
11288 size = left_size;
11289 else
11290 size = max;
11291 left_size -= size;
11292 next_fragP->tc_frag_data.length = size;
11293 }
11294 }
11295 else
11296 next_fragP->tc_frag_data.length = 0;
11297 }
11298
11299 return (fragP->tc_frag_data.length
11300 - fragP->tc_frag_data.last_length);
11301 }
11302 return relax_frag (segment, fragP, stretch);
11303 }
11304
11305 /* md_estimate_size_before_relax()
11306
11307 Called just before relax() for rs_machine_dependent frags. The x86
11308 assembler uses these frags to handle variable size jump
11309 instructions.
11310
11311 Any symbol that is now undefined will not become defined.
11312 Return the correct fr_subtype in the frag.
11313 Return the initial "guess for variable size of frag" to caller.
11314 The guess is actually the growth beyond the fixed part. Whatever
11315 we do to grow the fixed or variable part contributes to our
11316 returned value. */
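/* For example, a "jmp foo" to an undefined symbol that was assembled
   in its 2-byte short form (0xEB, disp8) is rewritten below to 0xE9
   with a 4-byte pc-relative displacement in 32-bit code, so the frag
   grows by 4 bytes ("foo" being a placeholder symbol). */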
11317
11318 int
11319 md_estimate_size_before_relax (fragS *fragP, segT segment)
11320 {
11321 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11322 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11323 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11324 {
11325 i386_classify_machine_dependent_frag (fragP);
11326 return fragP->tc_frag_data.length;
11327 }
11328
11329 /* We've already got fragP->fr_subtype right; all we have to do is
11330 check for un-relaxable symbols. On an ELF system, we can't relax
11331 an externally visible symbol, because it may be overridden by a
11332 shared library. */
11333 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11334 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11335 || (IS_ELF
11336 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11337 fragP->fr_var))
11338 #endif
11339 #if defined (OBJ_COFF) && defined (TE_PE)
11340 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11341 && S_IS_WEAK (fragP->fr_symbol))
11342 #endif
11343 )
11344 {
11345 /* Symbol is undefined in this segment, or we need to keep a
11346 reloc so that weak symbols can be overridden. */
11347 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11348 enum bfd_reloc_code_real reloc_type;
11349 unsigned char *opcode;
11350 int old_fr_fix;
11351
11352 if (fragP->fr_var != NO_RELOC)
11353 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11354 else if (size == 2)
11355 reloc_type = BFD_RELOC_16_PCREL;
11356 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11357 else if (need_plt32_p (fragP->fr_symbol))
11358 reloc_type = BFD_RELOC_X86_64_PLT32;
11359 #endif
11360 else
11361 reloc_type = BFD_RELOC_32_PCREL;
11362
11363 old_fr_fix = fragP->fr_fix;
11364 opcode = (unsigned char *) fragP->fr_opcode;
11365
11366 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11367 {
11368 case UNCOND_JUMP:
11369 /* Make jmp (0xeb) a (d)word displacement jump. */
11370 opcode[0] = 0xe9;
11371 fragP->fr_fix += size;
11372 fix_new (fragP, old_fr_fix, size,
11373 fragP->fr_symbol,
11374 fragP->fr_offset, 1,
11375 reloc_type);
11376 break;
11377
11378 case COND_JUMP86:
11379 if (size == 2
11380 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11381 {
11382 /* Negate the condition, and branch past an
11383 unconditional jump. */
11384 opcode[0] ^= 1;
11385 opcode[1] = 3;
11386 /* Insert an unconditional jump. */
11387 opcode[2] = 0xe9;
11388 /* We added two extra opcode bytes, and have a two byte
11389 offset. */
11390 fragP->fr_fix += 2 + 2;
11391 fix_new (fragP, old_fr_fix + 2, 2,
11392 fragP->fr_symbol,
11393 fragP->fr_offset, 1,
11394 reloc_type);
11395 break;
11396 }
11397 /* Fall through. */
11398
11399 case COND_JUMP:
11400 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11401 {
11402 fixS *fixP;
11403
11404 fragP->fr_fix += 1;
11405 fixP = fix_new (fragP, old_fr_fix, 1,
11406 fragP->fr_symbol,
11407 fragP->fr_offset, 1,
11408 BFD_RELOC_8_PCREL);
11409 fixP->fx_signed = 1;
11410 break;
11411 }
11412
11413 /* This changes the byte-displacement jump 0x7N
11414 to the (d)word-displacement jump 0x0f,0x8N. */
11415 opcode[1] = opcode[0] + 0x10;
11416 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11417 /* We've added an opcode byte. */
11418 fragP->fr_fix += 1 + size;
11419 fix_new (fragP, old_fr_fix + 1, size,
11420 fragP->fr_symbol,
11421 fragP->fr_offset, 1,
11422 reloc_type);
11423 break;
11424
11425 default:
11426 BAD_CASE (fragP->fr_subtype);
11427 break;
11428 }
11429 frag_wane (fragP);
11430 return fragP->fr_fix - old_fr_fix;
11431 }
11432
11433 /* Guess size depending on current relax state. Initially the relax
11434 state will correspond to a short jump and we return 1, because
11435 the variable part of the frag (the branch offset) is one byte
11436 long. However, we can relax a section more than once and in that
11437 case we must either set fr_subtype back to the unrelaxed state,
11438 or return the value for the appropriate branch. */
11439 return md_relax_table[fragP->fr_subtype].rlx_length;
11440 }
11441
11442 /* Called after relax() is finished.
11443
11444 In: Address of frag.
11445 fr_type == rs_machine_dependent.
11446 fr_subtype is what the address relaxed to.
11447
11448 Out: Any fixSs and constants are set up.
11449 Caller will turn frag into a ".space 0". */
11450
11451 void
11452 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11453 fragS *fragP)
11454 {
11455 unsigned char *opcode;
11456 unsigned char *where_to_put_displacement = NULL;
11457 offsetT target_address;
11458 offsetT opcode_address;
11459 unsigned int extension = 0;
11460 offsetT displacement_from_opcode_start;
11461
11462 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11463 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11464 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11465 {
11466 /* Generate nop padding. */
11467 unsigned int size = fragP->tc_frag_data.length;
11468 if (size)
11469 {
11470 if (size > fragP->tc_frag_data.max_bytes)
11471 abort ();
11472
11473 if (flag_debug)
11474 {
11475 const char *msg;
11476 const char *branch = "branch";
11477 const char *prefix = "";
11478 fragS *padding_fragP;
11479 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11480 == BRANCH_PREFIX)
11481 {
11482 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11483 switch (fragP->tc_frag_data.default_prefix)
11484 {
11485 default:
11486 abort ();
11487 break;
11488 case CS_PREFIX_OPCODE:
11489 prefix = " cs";
11490 break;
11491 case DS_PREFIX_OPCODE:
11492 prefix = " ds";
11493 break;
11494 case ES_PREFIX_OPCODE:
11495 prefix = " es";
11496 break;
11497 case FS_PREFIX_OPCODE:
11498 prefix = " fs";
11499 break;
11500 case GS_PREFIX_OPCODE:
11501 prefix = " gs";
11502 break;
11503 case SS_PREFIX_OPCODE:
11504 prefix = " ss";
11505 break;
11506 }
11507 if (padding_fragP)
11508 msg = _("%s:%u: add %d%s at 0x%llx to align "
11509 "%s within %d-byte boundary\n");
11510 else
11511 msg = _("%s:%u: add additional %d%s at 0x%llx to "
11512 "align %s within %d-byte boundary\n");
11513 }
11514 else
11515 {
11516 padding_fragP = fragP;
11517 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11518 "%s within %d-byte boundary\n");
11519 }
11520
11521 if (padding_fragP)
11522 switch (padding_fragP->tc_frag_data.branch_type)
11523 {
11524 case align_branch_jcc:
11525 branch = "jcc";
11526 break;
11527 case align_branch_fused:
11528 branch = "fused jcc";
11529 break;
11530 case align_branch_jmp:
11531 branch = "jmp";
11532 break;
11533 case align_branch_call:
11534 branch = "call";
11535 break;
11536 case align_branch_indirect:
11537 branch = "indirect branch";
11538 break;
11539 case align_branch_ret:
11540 branch = "ret";
11541 break;
11542 default:
11543 break;
11544 }
11545
11546 fprintf (stdout, msg,
11547 fragP->fr_file, fragP->fr_line, size, prefix,
11548 (long long) fragP->fr_address, branch,
11549 1 << align_branch_power);
11550 }
11551 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11552 memset (fragP->fr_opcode,
11553 fragP->tc_frag_data.default_prefix, size);
11554 else
11555 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
11556 size, 0);
11557 fragP->fr_fix += size;
11558 }
11559 return;
11560 }
11561
11562 opcode = (unsigned char *) fragP->fr_opcode;
11563
11564 /* Address we want to reach in file space. */
11565 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
11566
11567 /* Address opcode resides at in file space. */
11568 opcode_address = fragP->fr_address + fragP->fr_fix;
11569
11570 /* Displacement from opcode start to fill into instruction. */
11571 displacement_from_opcode_start = target_address - opcode_address;
11572
11573 if ((fragP->fr_subtype & BIG) == 0)
11574 {
11575 /* Don't have to change opcode. */
11576 extension = 1; /* 1 opcode + 1 displacement */
11577 where_to_put_displacement = &opcode[1];
11578 }
11579 else
11580 {
11581 if (no_cond_jump_promotion
11582 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
11583 as_warn_where (fragP->fr_file, fragP->fr_line,
11584 _("long jump required"));
11585
11586 switch (fragP->fr_subtype)
11587 {
11588 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
11589 extension = 4; /* 1 opcode + 4 displacement */
11590 opcode[0] = 0xe9;
11591 where_to_put_displacement = &opcode[1];
11592 break;
11593
11594 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
11595 extension = 2; /* 1 opcode + 2 displacement */
11596 opcode[0] = 0xe9;
11597 where_to_put_displacement = &opcode[1];
11598 break;
11599
11600 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
11601 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
11602 extension = 5; /* 2 opcode + 4 displacement */
11603 opcode[1] = opcode[0] + 0x10;
11604 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11605 where_to_put_displacement = &opcode[2];
11606 break;
11607
11608 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
11609 extension = 3; /* 2 opcode + 2 displacement */
11610 opcode[1] = opcode[0] + 0x10;
11611 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11612 where_to_put_displacement = &opcode[2];
11613 break;
11614
11615 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
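	  /* There is no conditional jump with a 16-bit displacement,
	     so synthesize one: invert the condition (bit 0 of the Jcc
	     opcode), hop over the next three bytes, and emit an
	     unconditional jmp (0xe9) with a rel16 displacement
	     there.  */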
11616 extension = 4;
11617 opcode[0] ^= 1;
11618 opcode[1] = 3;
11619 opcode[2] = 0xe9;
11620 where_to_put_displacement = &opcode[3];
11621 break;
11622
11623 default:
11624 BAD_CASE (fragP->fr_subtype);
11625 break;
11626 }
11627 }
11628
11629   /* If the size is less than four we are sure that the operand fits,
11630      but if it's 4, then it could be that the displacement is larger
11631      than +/- 2GB.  */
11632 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
11633 && object_64bit
11634 && ((addressT) (displacement_from_opcode_start - extension
11635 + ((addressT) 1 << 31))
11636 > (((addressT) 2 << 31) - 1)))
11637 {
11638 as_bad_where (fragP->fr_file, fragP->fr_line,
11639 _("jump target out of range"));
11640 /* Make us emit 0. */
11641 displacement_from_opcode_start = extension;
11642 }
11643 /* Now put displacement after opcode. */
11644 md_number_to_chars ((char *) where_to_put_displacement,
11645 (valueT) (displacement_from_opcode_start - extension),
11646 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
11647 fragP->fr_fix += extension;
11648 }
11649 \f
11650 /* Apply a fixup (fixP) to segment data, once it has been determined
11651 by our caller that we have all the info we need to fix it up.
11652
11653 Parameter valP is the pointer to the value of the bits.
11654
11655 On the 386, immediates, displacements, and data pointers are all in
11656 the same (little-endian) format, so we don't need to care about which
11657 we are handling. */
11658
11659 void
11660 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
11661 {
11662 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
11663 valueT value = *valP;
11664
11665 #if !defined (TE_Mach)
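  /* If the fixup is PC-relative, switch plain absolute relocation
     types to their PC-relative counterparts.  */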
11666 if (fixP->fx_pcrel)
11667 {
11668 switch (fixP->fx_r_type)
11669 {
11670 default:
11671 break;
11672
11673 case BFD_RELOC_64:
11674 fixP->fx_r_type = BFD_RELOC_64_PCREL;
11675 break;
11676 case BFD_RELOC_32:
11677 case BFD_RELOC_X86_64_32S:
11678 fixP->fx_r_type = BFD_RELOC_32_PCREL;
11679 break;
11680 case BFD_RELOC_16:
11681 fixP->fx_r_type = BFD_RELOC_16_PCREL;
11682 break;
11683 case BFD_RELOC_8:
11684 fixP->fx_r_type = BFD_RELOC_8_PCREL;
11685 break;
11686 }
11687 }
11688
11689 if (fixP->fx_addsy != NULL
11690 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
11691 || fixP->fx_r_type == BFD_RELOC_64_PCREL
11692 || fixP->fx_r_type == BFD_RELOC_16_PCREL
11693 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
11694 && !use_rela_relocations)
11695 {
11696 /* This is a hack. There should be a better way to handle this.
11697 This covers for the fact that bfd_install_relocation will
11698 subtract the current location (for partial_inplace, PC relative
11699 relocations); see more below. */
11700 #ifndef OBJ_AOUT
11701 if (IS_ELF
11702 #ifdef TE_PE
11703 || OUTPUT_FLAVOR == bfd_target_coff_flavour
11704 #endif
11705 )
11706 value += fixP->fx_where + fixP->fx_frag->fr_address;
11707 #endif
11708 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11709 if (IS_ELF)
11710 {
11711 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
11712
11713 if ((sym_seg == seg
11714 || (symbol_section_p (fixP->fx_addsy)
11715 && sym_seg != absolute_section))
11716 && !generic_force_reloc (fixP))
11717 {
11718 /* Yes, we add the values in twice. This is because
11719 bfd_install_relocation subtracts them out again. I think
11720 bfd_install_relocation is broken, but I don't dare change
11721 it. FIXME. */
11722 value += fixP->fx_where + fixP->fx_frag->fr_address;
11723 }
11724 }
11725 #endif
11726 #if defined (OBJ_COFF) && defined (TE_PE)
11727 /* For some reason, the PE format does not store a
11728 section address offset for a PC relative symbol. */
11729 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
11730 || S_IS_WEAK (fixP->fx_addsy))
11731 value += md_pcrel_from (fixP);
11732 #endif
11733 }
11734 #if defined (OBJ_COFF) && defined (TE_PE)
11735 if (fixP->fx_addsy != NULL
11736 && S_IS_WEAK (fixP->fx_addsy)
11737 /* PR 16858: Do not modify weak function references. */
11738 && ! fixP->fx_pcrel)
11739 {
11740 #if !defined (TE_PEP)
11741       /* For x86 PE, weak function symbols are neither PC-relative
11742 	 nor do they set S_IS_FUNCTION.  So the only reliable way
11743 	 to detect them is to check the flags of their containing
11744 	 section.  */
11745 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
11746 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
11747 ;
11748 else
11749 #endif
11750 value -= S_GET_VALUE (fixP->fx_addsy);
11751 }
11752 #endif
11753
11754 /* Fix a few things - the dynamic linker expects certain values here,
11755 and we must not disappoint it. */
11756 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11757 if (IS_ELF && fixP->fx_addsy)
11758 switch (fixP->fx_r_type)
11759 {
11760 case BFD_RELOC_386_PLT32:
11761 case BFD_RELOC_X86_64_PLT32:
11762 /* Make the jump instruction point to the address of the operand.
11763 At runtime we merely add the offset to the actual PLT entry.
11764 NB: Subtract the offset size only for jump instructions. */
11765 if (fixP->fx_pcrel)
11766 value = -4;
11767 break;
11768
11769 case BFD_RELOC_386_TLS_GD:
11770 case BFD_RELOC_386_TLS_LDM:
11771 case BFD_RELOC_386_TLS_IE_32:
11772 case BFD_RELOC_386_TLS_IE:
11773 case BFD_RELOC_386_TLS_GOTIE:
11774 case BFD_RELOC_386_TLS_GOTDESC:
11775 case BFD_RELOC_X86_64_TLSGD:
11776 case BFD_RELOC_X86_64_TLSLD:
11777 case BFD_RELOC_X86_64_GOTTPOFF:
11778 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11779 value = 0; /* Fully resolved at runtime. No addend. */
11780 /* Fallthrough */
11781 case BFD_RELOC_386_TLS_LE:
11782 case BFD_RELOC_386_TLS_LDO_32:
11783 case BFD_RELOC_386_TLS_LE_32:
11784 case BFD_RELOC_X86_64_DTPOFF32:
11785 case BFD_RELOC_X86_64_DTPOFF64:
11786 case BFD_RELOC_X86_64_TPOFF32:
11787 case BFD_RELOC_X86_64_TPOFF64:
11788 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11789 break;
11790
11791 case BFD_RELOC_386_TLS_DESC_CALL:
11792 case BFD_RELOC_X86_64_TLSDESC_CALL:
11793 value = 0; /* Fully resolved at runtime. No addend. */
11794 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11795 fixP->fx_done = 0;
11796 return;
11797
11798 case BFD_RELOC_VTABLE_INHERIT:
11799 case BFD_RELOC_VTABLE_ENTRY:
11800 fixP->fx_done = 0;
11801 return;
11802
11803 default:
11804 break;
11805 }
11806 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
11807 *valP = value;
11808 #endif /* !defined (TE_Mach) */
11809
11810 /* Are we finished with this relocation now? */
11811 if (fixP->fx_addsy == NULL)
11812 fixP->fx_done = 1;
11813 #if defined (OBJ_COFF) && defined (TE_PE)
11814 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
11815 {
11816 fixP->fx_done = 0;
11817 /* Remember value for tc_gen_reloc. */
11818 fixP->fx_addnumber = value;
11819 /* Clear out the frag for now. */
11820 value = 0;
11821 }
11822 #endif
11823 else if (use_rela_relocations)
11824 {
11825 fixP->fx_no_overflow = 1;
11826 /* Remember value for tc_gen_reloc. */
11827 fixP->fx_addnumber = value;
11828 value = 0;
11829 }
11830
11831 md_number_to_chars (p, value, fixP->fx_size);
11832 }
11833 \f
11834 const char *
11835 md_atof (int type, char *litP, int *sizeP)
11836 {
11837   /* This outputs the LITTLENUMs in REVERSE order,
11838      as required by the little-endian 386.  */
11839 return ieee_md_atof (type, litP, sizeP, FALSE);
11840 }
11841 \f
11842 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
11843
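/* Return a printable representation of character C, for use in
   diagnostics.  */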
11844 static char *
11845 output_invalid (int c)
11846 {
11847 if (ISPRINT (c))
11848 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11849 "'%c'", c);
11850 else
11851 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11852 "(0x%x)", (unsigned char) c);
11853 return output_invalid_buf;
11854 }
11855
11856 /* REG_STRING starts *before* REGISTER_PREFIX. */
11857
11858 static const reg_entry *
11859 parse_real_register (char *reg_string, char **end_op)
11860 {
11861 char *s = reg_string;
11862 char *p;
11863 char reg_name_given[MAX_REG_NAME_SIZE + 1];
11864 const reg_entry *r;
11865
11866 /* Skip possible REGISTER_PREFIX and possible whitespace. */
11867 if (*s == REGISTER_PREFIX)
11868 ++s;
11869
11870 if (is_space_char (*s))
11871 ++s;
11872
11873 p = reg_name_given;
11874 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
11875 {
11876 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
11877 return (const reg_entry *) NULL;
11878 s++;
11879 }
11880
11881 /* For naked regs, make sure that we are not dealing with an identifier.
11882 This prevents confusing an identifier like `eax_var' with register
11883 `eax'. */
11884 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
11885 return (const reg_entry *) NULL;
11886
11887 *end_op = s;
11888
11889 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
11890
11891 /* Handle floating point regs, allowing spaces in the (i) part. */
11892 if (r == i386_regtab /* %st is first entry of table */)
11893 {
11894 if (!cpu_arch_flags.bitfield.cpu8087
11895 && !cpu_arch_flags.bitfield.cpu287
11896 && !cpu_arch_flags.bitfield.cpu387)
11897 return (const reg_entry *) NULL;
11898
11899 if (is_space_char (*s))
11900 ++s;
11901 if (*s == '(')
11902 {
11903 ++s;
11904 if (is_space_char (*s))
11905 ++s;
11906 if (*s >= '0' && *s <= '7')
11907 {
11908 int fpr = *s - '0';
11909 ++s;
11910 if (is_space_char (*s))
11911 ++s;
11912 if (*s == ')')
11913 {
11914 *end_op = s + 1;
11915 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
11916 know (r);
11917 return r + fpr;
11918 }
11919 }
11920 /* We have "%st(" then garbage. */
11921 return (const reg_entry *) NULL;
11922 }
11923 }
11924
11925 if (r == NULL || allow_pseudo_reg)
11926 return r;
11927
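  /* Past this point, reject registers that the selected CPU and
     ISA extensions do not provide.  */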
11928 if (operand_type_all_zero (&r->reg_type))
11929 return (const reg_entry *) NULL;
11930
11931 if ((r->reg_type.bitfield.dword
11932 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
11933 || r->reg_type.bitfield.class == RegCR
11934 || r->reg_type.bitfield.class == RegDR
11935 || r->reg_type.bitfield.class == RegTR)
11936 && !cpu_arch_flags.bitfield.cpui386)
11937 return (const reg_entry *) NULL;
11938
11939 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
11940 return (const reg_entry *) NULL;
11941
11942 if (!cpu_arch_flags.bitfield.cpuavx512f)
11943 {
11944 if (r->reg_type.bitfield.zmmword
11945 || r->reg_type.bitfield.class == RegMask)
11946 return (const reg_entry *) NULL;
11947
11948 if (!cpu_arch_flags.bitfield.cpuavx)
11949 {
11950 if (r->reg_type.bitfield.ymmword)
11951 return (const reg_entry *) NULL;
11952
11953 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
11954 return (const reg_entry *) NULL;
11955 }
11956 }
11957
11958 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
11959 return (const reg_entry *) NULL;
11960
11961   /* Don't allow the fake index register unless allow_index_reg is non-zero.  */
11962 if (!allow_index_reg && r->reg_num == RegIZ)
11963 return (const reg_entry *) NULL;
11964
11965 /* Upper 16 vector registers are only available with VREX in 64bit
11966 mode, and require EVEX encoding. */
11967 if (r->reg_flags & RegVRex)
11968 {
11969 if (!cpu_arch_flags.bitfield.cpuavx512f
11970 || flag_code != CODE_64BIT)
11971 return (const reg_entry *) NULL;
11972
11973 i.vec_encoding = vex_encoding_evex;
11974 }
11975
11976 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
11977 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
11978 && flag_code != CODE_64BIT)
11979 return (const reg_entry *) NULL;
11980
11981 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
11982 && !intel_syntax)
11983 return (const reg_entry *) NULL;
11984
11985 return r;
11986 }
11987
11988 /* REG_STRING starts *before* REGISTER_PREFIX. */
11989
11990 static const reg_entry *
11991 parse_register (char *reg_string, char **end_op)
11992 {
11993 const reg_entry *r;
11994
11995 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
11996 r = parse_real_register (reg_string, end_op);
11997 else
11998 r = NULL;
11999 if (!r)
12000 {
12001 char *save = input_line_pointer;
12002 char c;
12003 symbolS *symbolP;
12004
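      /* The name may be an equate whose value is a register (such
	 symbols are placed in reg_section).  */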
12005 input_line_pointer = reg_string;
12006 c = get_symbol_name (&reg_string);
12007 symbolP = symbol_find (reg_string);
12008 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12009 {
12010 const expressionS *e = symbol_get_value_expression (symbolP);
12011
12012 know (e->X_op == O_register);
12013 know (e->X_add_number >= 0
12014 && (valueT) e->X_add_number < i386_regtab_size);
12015 r = i386_regtab + e->X_add_number;
12016 if ((r->reg_flags & RegVRex))
12017 i.vec_encoding = vex_encoding_evex;
12018 *end_op = input_line_pointer;
12019 }
12020 *input_line_pointer = c;
12021 input_line_pointer = save;
12022 }
12023 return r;
12024 }
12025
12026 int
12027 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12028 {
12029 const reg_entry *r;
12030 char *end = input_line_pointer;
12031
12032 *end = *nextcharP;
12033 r = parse_register (name, &input_line_pointer);
12034 if (r && end <= input_line_pointer)
12035 {
12036 *nextcharP = *input_line_pointer;
12037 *input_line_pointer = 0;
12038 e->X_op = O_register;
12039 e->X_add_number = r - i386_regtab;
12040 return 1;
12041 }
12042 input_line_pointer = end;
12043 *end = 0;
12044 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12045 }
12046
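/* Handle machine-dependent operand syntax: a bare register, or, in
   Intel mode, a bracketed expression.  */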
12047 void
12048 md_operand (expressionS *e)
12049 {
12050 char *end;
12051 const reg_entry *r;
12052
12053 switch (*input_line_pointer)
12054 {
12055 case REGISTER_PREFIX:
12056 r = parse_real_register (input_line_pointer, &end);
12057 if (r)
12058 {
12059 e->X_op = O_register;
12060 e->X_add_number = r - i386_regtab;
12061 input_line_pointer = end;
12062 }
12063 break;
12064
12065 case '[':
12066 gas_assert (intel_syntax);
12067 end = input_line_pointer++;
12068 expression (e);
12069 if (*input_line_pointer == ']')
12070 {
12071 ++input_line_pointer;
12072 e->X_op_symbol = make_expr_symbol (e);
12073 e->X_add_symbol = NULL;
12074 e->X_add_number = 0;
12075 e->X_op = O_index;
12076 }
12077 else
12078 {
12079 e->X_op = O_absent;
12080 input_line_pointer = end;
12081 }
12082 break;
12083 }
12084 }
12085
12086 \f
12087 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12088 const char *md_shortopts = "kVQ:sqnO::";
12089 #else
12090 const char *md_shortopts = "qnO::";
12091 #endif
12092
12093 #define OPTION_32 (OPTION_MD_BASE + 0)
12094 #define OPTION_64 (OPTION_MD_BASE + 1)
12095 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12096 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12097 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12098 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12099 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12100 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12101 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12102 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12103 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12104 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12105 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12106 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12107 #define OPTION_X32 (OPTION_MD_BASE + 14)
12108 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12109 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12110 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12111 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12112 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12113 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12114 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12115 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12116 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12117 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12118 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12119 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12120 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12121 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12122 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12123 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12124
12125 struct option md_longopts[] =
12126 {
12127 {"32", no_argument, NULL, OPTION_32},
12128 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12129 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12130 {"64", no_argument, NULL, OPTION_64},
12131 #endif
12132 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12133 {"x32", no_argument, NULL, OPTION_X32},
12134 {"mshared", no_argument, NULL, OPTION_MSHARED},
12135 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12136 #endif
12137 {"divide", no_argument, NULL, OPTION_DIVIDE},
12138 {"march", required_argument, NULL, OPTION_MARCH},
12139 {"mtune", required_argument, NULL, OPTION_MTUNE},
12140 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12141 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12142 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12143 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12144 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12145 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12146 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12147 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12148 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12149 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12150 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12151 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12152 # if defined (TE_PE) || defined (TE_PEP)
12153 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12154 #endif
12155 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12156 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12157 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12158 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12159 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12160 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12161 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12162 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12163 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12164 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12165 {NULL, no_argument, NULL, 0}
12166 };
12167 size_t md_longopts_size = sizeof (md_longopts);
12168
12169 int
12170 md_parse_option (int c, const char *arg)
12171 {
12172 unsigned int j;
12173 char *arch, *next, *saved, *type;
12174
12175 switch (c)
12176 {
12177 case 'n':
12178 optimize_align_code = 0;
12179 break;
12180
12181 case 'q':
12182 quiet_warnings = 1;
12183 break;
12184
12185 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12186 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12187 should be emitted or not. FIXME: Not implemented. */
12188 case 'Q':
12189 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12190 return 0;
12191 break;
12192
12193 /* -V: SVR4 argument to print version ID. */
12194 case 'V':
12195 print_version_id ();
12196 break;
12197
12198 /* -k: Ignore for FreeBSD compatibility. */
12199 case 'k':
12200 break;
12201
12202 case 's':
12203 /* -s: On i386 Solaris, this tells the native assembler to use
12204 .stab instead of .stab.excl. We always use .stab anyhow. */
12205 break;
12206
12207 case OPTION_MSHARED:
12208 shared = 1;
12209 break;
12210
12211 case OPTION_X86_USED_NOTE:
12212 if (strcasecmp (arg, "yes") == 0)
12213 x86_used_note = 1;
12214 else if (strcasecmp (arg, "no") == 0)
12215 x86_used_note = 0;
12216 else
12217 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12218 break;
12219
12220
12221 #endif
12222 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12223 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12224 case OPTION_64:
12225 {
12226 const char **list, **l;
12227
12228 list = bfd_target_list ();
12229 for (l = list; *l != NULL; l++)
12230 if (CONST_STRNEQ (*l, "elf64-x86-64")
12231 || strcmp (*l, "coff-x86-64") == 0
12232 || strcmp (*l, "pe-x86-64") == 0
12233 || strcmp (*l, "pei-x86-64") == 0
12234 || strcmp (*l, "mach-o-x86-64") == 0)
12235 {
12236 default_arch = "x86_64";
12237 break;
12238 }
12239 if (*l == NULL)
12240 as_fatal (_("no compiled in support for x86_64"));
12241 free (list);
12242 }
12243 break;
12244 #endif
12245
12246 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12247 case OPTION_X32:
12248 if (IS_ELF)
12249 {
12250 const char **list, **l;
12251
12252 list = bfd_target_list ();
12253 for (l = list; *l != NULL; l++)
12254 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12255 {
12256 default_arch = "x86_64:32";
12257 break;
12258 }
12259 if (*l == NULL)
12260 as_fatal (_("no compiled in support for 32bit x86_64"));
12261 free (list);
12262 }
12263 else
12264 as_fatal (_("32bit x86_64 is only supported for ELF"));
12265 break;
12266 #endif
12267
12268 case OPTION_32:
12269 default_arch = "i386";
12270 break;
12271
12272 case OPTION_DIVIDE:
12273 #ifdef SVR4_COMMENT_CHARS
12274 {
12275 char *n, *t;
12276 const char *s;
12277
12278 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12279 t = n;
12280 for (s = i386_comment_chars; *s != '\0'; s++)
12281 if (*s != '/')
12282 *t++ = *s;
12283 *t = '\0';
12284 i386_comment_chars = n;
12285 }
12286 #endif
12287 break;
12288
12289 case OPTION_MARCH:
12290 saved = xstrdup (arg);
12291 arch = saved;
12292 /* Allow -march=+nosse. */
12293 if (*arch == '+')
12294 arch++;
12295 do
12296 {
12297 if (*arch == '.')
12298 as_fatal (_("invalid -march= option: `%s'"), arg);
12299 next = strchr (arch, '+');
12300 if (next)
12301 *next++ = '\0';
12302 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12303 {
12304 if (strcmp (arch, cpu_arch [j].name) == 0)
12305 {
12306 /* Processor. */
12307 if (! cpu_arch[j].flags.bitfield.cpui386)
12308 continue;
12309
12310 cpu_arch_name = cpu_arch[j].name;
12311 cpu_sub_arch_name = NULL;
12312 cpu_arch_flags = cpu_arch[j].flags;
12313 cpu_arch_isa = cpu_arch[j].type;
12314 cpu_arch_isa_flags = cpu_arch[j].flags;
12315 if (!cpu_arch_tune_set)
12316 {
12317 cpu_arch_tune = cpu_arch_isa;
12318 cpu_arch_tune_flags = cpu_arch_isa_flags;
12319 }
12320 break;
12321 }
12322 else if (*cpu_arch [j].name == '.'
12323 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12324 {
12325 /* ISA extension. */
12326 i386_cpu_flags flags;
12327
12328 flags = cpu_flags_or (cpu_arch_flags,
12329 cpu_arch[j].flags);
12330
12331 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12332 {
12333 if (cpu_sub_arch_name)
12334 {
12335 char *name = cpu_sub_arch_name;
12336 cpu_sub_arch_name = concat (name,
12337 cpu_arch[j].name,
12338 (const char *) NULL);
12339 free (name);
12340 }
12341 else
12342 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12343 cpu_arch_flags = flags;
12344 cpu_arch_isa_flags = flags;
12345 }
12346 else
12347 cpu_arch_isa_flags
12348 = cpu_flags_or (cpu_arch_isa_flags,
12349 cpu_arch[j].flags);
12350 break;
12351 }
12352 }
12353
12354 if (j >= ARRAY_SIZE (cpu_arch))
12355 {
12356 /* Disable an ISA extension. */
12357 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12358 if (strcmp (arch, cpu_noarch [j].name) == 0)
12359 {
12360 i386_cpu_flags flags;
12361
12362 flags = cpu_flags_and_not (cpu_arch_flags,
12363 cpu_noarch[j].flags);
12364 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12365 {
12366 if (cpu_sub_arch_name)
12367 {
12368 char *name = cpu_sub_arch_name;
12369 			  cpu_sub_arch_name = concat (name, arch,
12370 						      (const char *) NULL);
12371 free (name);
12372 }
12373 else
12374 cpu_sub_arch_name = xstrdup (arch);
12375 cpu_arch_flags = flags;
12376 cpu_arch_isa_flags = flags;
12377 }
12378 break;
12379 }
12380
12381 if (j >= ARRAY_SIZE (cpu_noarch))
12382 j = ARRAY_SIZE (cpu_arch);
12383 }
12384
12385 if (j >= ARRAY_SIZE (cpu_arch))
12386 as_fatal (_("invalid -march= option: `%s'"), arg);
12387
12388 arch = next;
12389 }
12390 while (next != NULL);
12391 free (saved);
12392 break;
12393
12394 case OPTION_MTUNE:
12395 if (*arg == '.')
12396 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12397 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12398 {
12399 if (strcmp (arg, cpu_arch [j].name) == 0)
12400 {
12401 cpu_arch_tune_set = 1;
12402 cpu_arch_tune = cpu_arch [j].type;
12403 cpu_arch_tune_flags = cpu_arch[j].flags;
12404 break;
12405 }
12406 }
12407 if (j >= ARRAY_SIZE (cpu_arch))
12408 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12409 break;
12410
12411 case OPTION_MMNEMONIC:
12412 if (strcasecmp (arg, "att") == 0)
12413 intel_mnemonic = 0;
12414 else if (strcasecmp (arg, "intel") == 0)
12415 intel_mnemonic = 1;
12416 else
12417 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12418 break;
12419
12420 case OPTION_MSYNTAX:
12421 if (strcasecmp (arg, "att") == 0)
12422 intel_syntax = 0;
12423 else if (strcasecmp (arg, "intel") == 0)
12424 intel_syntax = 1;
12425 else
12426 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12427 break;
12428
12429 case OPTION_MINDEX_REG:
12430 allow_index_reg = 1;
12431 break;
12432
12433 case OPTION_MNAKED_REG:
12434 allow_naked_reg = 1;
12435 break;
12436
12437 case OPTION_MSSE2AVX:
12438 sse2avx = 1;
12439 break;
12440
12441 case OPTION_MSSE_CHECK:
12442 if (strcasecmp (arg, "error") == 0)
12443 sse_check = check_error;
12444 else if (strcasecmp (arg, "warning") == 0)
12445 sse_check = check_warning;
12446 else if (strcasecmp (arg, "none") == 0)
12447 sse_check = check_none;
12448 else
12449 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12450 break;
12451
12452 case OPTION_MOPERAND_CHECK:
12453 if (strcasecmp (arg, "error") == 0)
12454 operand_check = check_error;
12455 else if (strcasecmp (arg, "warning") == 0)
12456 operand_check = check_warning;
12457 else if (strcasecmp (arg, "none") == 0)
12458 operand_check = check_none;
12459 else
12460 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12461 break;
12462
12463 case OPTION_MAVXSCALAR:
12464 if (strcasecmp (arg, "128") == 0)
12465 avxscalar = vex128;
12466 else if (strcasecmp (arg, "256") == 0)
12467 avxscalar = vex256;
12468 else
12469 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12470 break;
12471
12472 case OPTION_MVEXWIG:
12473 if (strcmp (arg, "0") == 0)
12474 vexwig = vexw0;
12475 else if (strcmp (arg, "1") == 0)
12476 vexwig = vexw1;
12477 else
12478 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12479 break;
12480
12481 case OPTION_MADD_BND_PREFIX:
12482 add_bnd_prefix = 1;
12483 break;
12484
12485 case OPTION_MEVEXLIG:
12486 if (strcmp (arg, "128") == 0)
12487 evexlig = evexl128;
12488 else if (strcmp (arg, "256") == 0)
12489 evexlig = evexl256;
12490 else if (strcmp (arg, "512") == 0)
12491 evexlig = evexl512;
12492 else
12493 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
12494 break;
12495
12496 case OPTION_MEVEXRCIG:
12497 if (strcmp (arg, "rne") == 0)
12498 evexrcig = rne;
12499 else if (strcmp (arg, "rd") == 0)
12500 evexrcig = rd;
12501 else if (strcmp (arg, "ru") == 0)
12502 evexrcig = ru;
12503 else if (strcmp (arg, "rz") == 0)
12504 evexrcig = rz;
12505 else
12506 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
12507 break;
12508
12509 case OPTION_MEVEXWIG:
12510 if (strcmp (arg, "0") == 0)
12511 evexwig = evexw0;
12512 else if (strcmp (arg, "1") == 0)
12513 evexwig = evexw1;
12514 else
12515 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
12516 break;
12517
12518 # if defined (TE_PE) || defined (TE_PEP)
12519 case OPTION_MBIG_OBJ:
12520 use_big_obj = 1;
12521 break;
12522 #endif
12523
12524 case OPTION_MOMIT_LOCK_PREFIX:
12525 if (strcasecmp (arg, "yes") == 0)
12526 omit_lock_prefix = 1;
12527 else if (strcasecmp (arg, "no") == 0)
12528 omit_lock_prefix = 0;
12529 else
12530 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
12531 break;
12532
12533 case OPTION_MFENCE_AS_LOCK_ADD:
12534 if (strcasecmp (arg, "yes") == 0)
12535 avoid_fence = 1;
12536 else if (strcasecmp (arg, "no") == 0)
12537 avoid_fence = 0;
12538 else
12539 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
12540 break;
12541
12542 case OPTION_MRELAX_RELOCATIONS:
12543 if (strcasecmp (arg, "yes") == 0)
12544 generate_relax_relocations = 1;
12545 else if (strcasecmp (arg, "no") == 0)
12546 generate_relax_relocations = 0;
12547 else
12548 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
12549 break;
12550
12551 case OPTION_MALIGN_BRANCH_BOUNDARY:
12552 {
12553 char *end;
12554 long int align = strtoul (arg, &end, 0);
12555 if (*end == '\0')
12556 {
12557 if (align == 0)
12558 {
12559 align_branch_power = 0;
12560 break;
12561 }
12562 else if (align >= 16)
12563 {
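	      /* Compute log2 of the boundary; only a power of two
		 (exactly one set bit) is accepted.  */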
12564 int align_power;
12565 for (align_power = 0;
12566 (align & 1) == 0;
12567 align >>= 1, align_power++)
12568 continue;
12569 /* Limit alignment power to 31. */
12570 if (align == 1 && align_power < 32)
12571 {
12572 align_branch_power = align_power;
12573 break;
12574 }
12575 }
12576 }
12577 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
12578 }
12579 break;
12580
12581 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
12582 {
12583 char *end;
12584 int align = strtoul (arg, &end, 0);
12585 /* Some processors only support 5 prefixes. */
12586 if (*end == '\0' && align >= 0 && align < 6)
12587 {
12588 align_branch_prefix_size = align;
12589 break;
12590 }
12591 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
12592 arg);
12593 }
12594 break;
12595
12596 case OPTION_MALIGN_BRANCH:
12597 align_branch = 0;
12598 saved = xstrdup (arg);
12599 type = saved;
12600 do
12601 {
12602 next = strchr (type, '+');
12603 if (next)
12604 *next++ = '\0';
12605 if (strcasecmp (type, "jcc") == 0)
12606 align_branch |= align_branch_jcc_bit;
12607 else if (strcasecmp (type, "fused") == 0)
12608 align_branch |= align_branch_fused_bit;
12609 else if (strcasecmp (type, "jmp") == 0)
12610 align_branch |= align_branch_jmp_bit;
12611 else if (strcasecmp (type, "call") == 0)
12612 align_branch |= align_branch_call_bit;
12613 else if (strcasecmp (type, "ret") == 0)
12614 align_branch |= align_branch_ret_bit;
12615 else if (strcasecmp (type, "indirect") == 0)
12616 align_branch |= align_branch_indirect_bit;
12617 else
12618 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
12619 type = next;
12620 }
12621 while (next != NULL);
12622 free (saved);
12623 break;
12624
12625 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
12626 align_branch_power = 5;
12627 align_branch_prefix_size = 5;
12628 align_branch = (align_branch_jcc_bit
12629 | align_branch_fused_bit
12630 | align_branch_jmp_bit);
12631 break;
12632
12633 case OPTION_MAMD64:
12634 isa64 = amd64;
12635 break;
12636
12637 case OPTION_MINTEL64:
12638 isa64 = intel64;
12639 break;
12640
12641 case 'O':
12642 if (arg == NULL)
12643 {
12644 optimize = 1;
12645 /* Turn off -Os. */
12646 optimize_for_space = 0;
12647 }
12648 else if (*arg == 's')
12649 {
12650 optimize_for_space = 1;
12651 /* Turn on all encoding optimizations. */
12652 optimize = INT_MAX;
12653 }
12654 else
12655 {
12656 optimize = atoi (arg);
12657 /* Turn off -Os. */
12658 optimize_for_space = 0;
12659 }
12660 break;
12661
12662 default:
12663 return 0;
12664 }
12665 return 1;
12666 }
12667
12668 #define MESSAGE_TEMPLATE \
12669 " "
12670
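/* Append NAME (LEN characters) to the diagnostic being built at P
   inside MESSAGE; if fewer than LEN + 2 characters remain, flush
   the current line to STREAM and start a new one.  */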
12671 static char *
12672 output_message (FILE *stream, char *p, char *message, char *start,
12673 int *left_p, const char *name, int len)
12674 {
12675 int size = sizeof (MESSAGE_TEMPLATE);
12676 int left = *left_p;
12677
12678 /* Reserve 2 spaces for ", " or ",\0" */
12679 left -= len + 2;
12680
12681 /* Check if there is any room. */
12682 if (left >= 0)
12683 {
12684 if (p != start)
12685 {
12686 *p++ = ',';
12687 *p++ = ' ';
12688 }
12689 p = mempcpy (p, name, len);
12690 }
12691 else
12692 {
12693 /* Output the current message now and start a new one. */
12694 *p++ = ',';
12695 *p = '\0';
12696 fprintf (stream, "%s\n", message);
12697 p = start;
12698 left = size - (start - message) - len - 2;
12699
12700 gas_assert (left >= 0);
12701
12702 p = mempcpy (p, name, len);
12703 }
12704
12705 *left_p = left;
12706 return p;
12707 }
12708
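/* Print the comma-separated list of known processor names (EXT == 0)
   or ISA extension names (EXT != 0) to STREAM.  With CHECK set, omit
   processors that cannot be used with -march=.  */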
12709 static void
12710 show_arch (FILE *stream, int ext, int check)
12711 {
12712 static char message[] = MESSAGE_TEMPLATE;
12713 char *start = message + 27;
12714 char *p;
12715 int size = sizeof (MESSAGE_TEMPLATE);
12716 int left;
12717 const char *name;
12718 int len;
12719 unsigned int j;
12720
12721 p = start;
12722 left = size - (start - message);
12723 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12724 {
12725 /* Should it be skipped? */
12726 if (cpu_arch [j].skip)
12727 continue;
12728
12729 name = cpu_arch [j].name;
12730 len = cpu_arch [j].len;
12731 if (*name == '.')
12732 {
12733 /* It is an extension. Skip if we aren't asked to show it. */
12734 if (ext)
12735 {
12736 name++;
12737 len--;
12738 }
12739 else
12740 continue;
12741 }
12742 else if (ext)
12743 {
12744 	  /* It is a processor.  Skip it if we only show extensions.  */
12745 continue;
12746 }
12747 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
12748 {
12749 /* It is an impossible processor - skip. */
12750 continue;
12751 }
12752
12753 p = output_message (stream, p, message, start, &left, name, len);
12754 }
12755
12756 /* Display disabled extensions. */
12757 if (ext)
12758 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12759 {
12760 name = cpu_noarch [j].name;
12761 len = cpu_noarch [j].len;
12762 p = output_message (stream, p, message, start, &left, name,
12763 len);
12764 }
12765
12766 *p = '\0';
12767 fprintf (stream, "%s\n", message);
12768 }
12769
12770 void
12771 md_show_usage (FILE *stream)
12772 {
12773 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12774 fprintf (stream, _("\
12775 -Qy, -Qn ignored\n\
12776 -V print assembler version number\n\
12777 -k ignored\n"));
12778 #endif
12779 fprintf (stream, _("\
12780 -n Do not optimize code alignment\n\
12781 -q quieten some warnings\n"));
12782 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12783 fprintf (stream, _("\
12784 -s ignored\n"));
12785 #endif
12786 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12787 || defined (TE_PE) || defined (TE_PEP))
12788 fprintf (stream, _("\
12789 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
12790 #endif
12791 #ifdef SVR4_COMMENT_CHARS
12792 fprintf (stream, _("\
12793 --divide do not treat `/' as a comment character\n"));
12794 #else
12795 fprintf (stream, _("\
12796 --divide ignored\n"));
12797 #endif
12798 fprintf (stream, _("\
12799 -march=CPU[,+EXTENSION...]\n\
12800 generate code for CPU and EXTENSION, CPU is one of:\n"));
12801 show_arch (stream, 0, 1);
12802 fprintf (stream, _("\
12803 EXTENSION is combination of:\n"));
12804 show_arch (stream, 1, 0);
12805 fprintf (stream, _("\
12806 -mtune=CPU optimize for CPU, CPU is one of:\n"));
12807 show_arch (stream, 0, 0);
12808 fprintf (stream, _("\
12809 -msse2avx encode SSE instructions with VEX prefix\n"));
12810 fprintf (stream, _("\
12811 -msse-check=[none|error|warning] (default: warning)\n\
12812 check SSE instructions\n"));
12813 fprintf (stream, _("\
12814 -moperand-check=[none|error|warning] (default: warning)\n\
12815 check operand combinations for validity\n"));
12816 fprintf (stream, _("\
12817 -mavxscalar=[128|256] (default: 128)\n\
12818 encode scalar AVX instructions with specific vector\n\
12819 length\n"));
12820 fprintf (stream, _("\
12821 -mvexwig=[0|1] (default: 0)\n\
12822 encode VEX instructions with specific VEX.W value\n\
12823 for VEX.W bit ignored instructions\n"));
12824 fprintf (stream, _("\
12825 -mevexlig=[128|256|512] (default: 128)\n\
12826 encode scalar EVEX instructions with specific vector\n\
12827 length\n"));
12828 fprintf (stream, _("\
12829 -mevexwig=[0|1] (default: 0)\n\
12830 encode EVEX instructions with specific EVEX.W value\n\
12831 for EVEX.W bit ignored instructions\n"));
12832 fprintf (stream, _("\
12833 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
12834 encode EVEX instructions with specific EVEX.RC value\n\
12835 for SAE-only ignored instructions\n"));
12836 fprintf (stream, _("\
12837 -mmnemonic=[att|intel] "));
12838 if (SYSV386_COMPAT)
12839 fprintf (stream, _("(default: att)\n"));
12840 else
12841 fprintf (stream, _("(default: intel)\n"));
12842 fprintf (stream, _("\
12843 use AT&T/Intel mnemonic\n"));
12844 fprintf (stream, _("\
12845 -msyntax=[att|intel] (default: att)\n\
12846 use AT&T/Intel syntax\n"));
12847 fprintf (stream, _("\
12848 -mindex-reg support pseudo index registers\n"));
12849 fprintf (stream, _("\
12850 -mnaked-reg don't require `%%' prefix for registers\n"));
12851 fprintf (stream, _("\
12852 -madd-bnd-prefix add BND prefix for all valid branches\n"));
12853 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12854 fprintf (stream, _("\
12855 -mshared disable branch optimization for shared code\n"));
12856 fprintf (stream, _("\
12857 -mx86-used-note=[no|yes] "));
12858 if (DEFAULT_X86_USED_NOTE)
12859 fprintf (stream, _("(default: yes)\n"));
12860 else
12861 fprintf (stream, _("(default: no)\n"));
12862 fprintf (stream, _("\
12863 generate x86 used ISA and feature properties\n"));
12864 #endif
12865 #if defined (TE_PE) || defined (TE_PEP)
12866 fprintf (stream, _("\
12867 -mbig-obj generate big object files\n"));
12868 #endif
12869 fprintf (stream, _("\
12870 -momit-lock-prefix=[no|yes] (default: no)\n\
12871 strip all lock prefixes\n"));
12872 fprintf (stream, _("\
12873 -mfence-as-lock-add=[no|yes] (default: no)\n\
12874 encode lfence, mfence and sfence as\n\
12875 lock addl $0x0, (%%{re}sp)\n"));
12876 fprintf (stream, _("\
12877 -mrelax-relocations=[no|yes] "));
12878 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
12879 fprintf (stream, _("(default: yes)\n"));
12880 else
12881 fprintf (stream, _("(default: no)\n"));
12882 fprintf (stream, _("\
12883 generate relax relocations\n"));
12884 fprintf (stream, _("\
12885 -malign-branch-boundary=NUM (default: 0)\n\
12886 align branches within NUM byte boundary\n"));
12887 fprintf (stream, _("\
12888 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
12889 TYPE is combination of jcc, fused, jmp, call, ret,\n\
12890 indirect\n\
12891 specify types of branches to align\n"));
12892 fprintf (stream, _("\
12893 -malign-branch-prefix-size=NUM (default: 5)\n\
12894 align branches with NUM prefixes per instruction\n"));
12895 fprintf (stream, _("\
12896 -mbranches-within-32B-boundaries\n\
12897 align branches within 32 byte boundary\n"));
12898 fprintf (stream, _("\
12899 -mamd64 accept only AMD64 ISA [default]\n"));
12900 fprintf (stream, _("\
12901 -mintel64 accept only Intel64 ISA\n"));
12902 }
12903
12904 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
12905 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12906 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12907
12908 /* Pick the target format to use. */
12909
12910 const char *
12911 i386_target_format (void)
12912 {
12913 if (!strncmp (default_arch, "x86_64", 6))
12914 {
12915 update_code_flag (CODE_64BIT, 1);
12916 if (default_arch[6] == '\0')
12917 x86_elf_abi = X86_64_ABI;
12918 else
12919 x86_elf_abi = X86_64_X32_ABI;
12920 }
12921 else if (!strcmp (default_arch, "i386"))
12922 update_code_flag (CODE_32BIT, 1);
12923 else if (!strcmp (default_arch, "iamcu"))
12924 {
12925 update_code_flag (CODE_32BIT, 1);
12926 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
12927 {
12928 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
12929 cpu_arch_name = "iamcu";
12930 cpu_sub_arch_name = NULL;
12931 cpu_arch_flags = iamcu_flags;
12932 cpu_arch_isa = PROCESSOR_IAMCU;
12933 cpu_arch_isa_flags = iamcu_flags;
12934 if (!cpu_arch_tune_set)
12935 {
12936 cpu_arch_tune = cpu_arch_isa;
12937 cpu_arch_tune_flags = cpu_arch_isa_flags;
12938 }
12939 }
12940 else if (cpu_arch_isa != PROCESSOR_IAMCU)
12941 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
12942 cpu_arch_name);
12943 }
12944 else
12945 as_fatal (_("unknown architecture"));
12946
12947 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
12948 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12949 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
12950 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12951
12952 switch (OUTPUT_FLAVOR)
12953 {
12954 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
12955 case bfd_target_aout_flavour:
12956 return AOUT_TARGET_FORMAT;
12957 #endif
12958 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
12959 # if defined (TE_PE) || defined (TE_PEP)
12960 case bfd_target_coff_flavour:
12961 if (flag_code == CODE_64BIT)
12962 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
12963 else
12964 return "pe-i386";
12965 # elif defined (TE_GO32)
12966 case bfd_target_coff_flavour:
12967 return "coff-go32";
12968 # else
12969 case bfd_target_coff_flavour:
12970 return "coff-i386";
12971 # endif
12972 #endif
12973 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12974 case bfd_target_elf_flavour:
12975 {
12976 const char *format;
12977
12978 switch (x86_elf_abi)
12979 {
12980 default:
12981 format = ELF_TARGET_FORMAT;
12982 #ifndef TE_SOLARIS
12983 tls_get_addr = "___tls_get_addr";
12984 #endif
12985 break;
12986 case X86_64_ABI:
12987 use_rela_relocations = 1;
12988 object_64bit = 1;
12989 #ifndef TE_SOLARIS
12990 tls_get_addr = "__tls_get_addr";
12991 #endif
12992 format = ELF_TARGET_FORMAT64;
12993 break;
12994 case X86_64_X32_ABI:
12995 use_rela_relocations = 1;
12996 object_64bit = 1;
12997 #ifndef TE_SOLARIS
12998 tls_get_addr = "__tls_get_addr";
12999 #endif
13000 disallow_64bit_reloc = 1;
13001 format = ELF_TARGET_FORMAT32;
13002 break;
13003 }
13004 if (cpu_arch_isa == PROCESSOR_L1OM)
13005 {
13006 if (x86_elf_abi != X86_64_ABI)
13007 as_fatal (_("Intel L1OM is 64bit only"));
13008 return ELF_TARGET_L1OM_FORMAT;
13009 }
13010 else if (cpu_arch_isa == PROCESSOR_K1OM)
13011 {
13012 if (x86_elf_abi != X86_64_ABI)
13013 as_fatal (_("Intel K1OM is 64bit only"));
13014 return ELF_TARGET_K1OM_FORMAT;
13015 }
13016 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13017 {
13018 if (x86_elf_abi != I386_ABI)
13019 as_fatal (_("Intel MCU is 32bit only"));
13020 return ELF_TARGET_IAMCU_FORMAT;
13021 }
13022 else
13023 return format;
13024 }
13025 #endif
13026 #if defined (OBJ_MACH_O)
13027 case bfd_target_mach_o_flavour:
13028 if (flag_code == CODE_64BIT)
13029 {
13030 use_rela_relocations = 1;
13031 object_64bit = 1;
13032 return "mach-o-x86-64";
13033 }
13034 else
13035 return "mach-o-i386";
13036 #endif
13037 default:
13038 abort ();
13039 return NULL;
13040 }
13041 }
13042
13043 #endif /* OBJ_MAYBE_ more than one */
13044 \f
13045 symbolS *
13046 md_undefined_symbol (char *name)
13047 {
13048 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13049 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13050 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13051 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13052 {
13053 if (!GOT_symbol)
13054 {
13055 if (symbol_find (name))
13056 as_bad (_("GOT already in symbol table"));
13057 GOT_symbol = symbol_new (name, undefined_section,
13058 (valueT) 0, &zero_address_frag);
13059 	}
13060 return GOT_symbol;
13061 }
13062 return 0;
13063 }
13064
13065 /* Round up a section size to the appropriate boundary. */
13066
13067 valueT
13068 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13069 {
13070 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13071 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13072 {
13073 /* For a.out, force the section size to be aligned. If we don't do
13074 this, BFD will align it for us, but it will not write out the
13075 final bytes of the section. This may be a bug in BFD, but it is
13076 easier to fix it here since that is how the other a.out targets
13077 work. */
13078 int align;
13079
13080 align = bfd_section_alignment (segment);
13081 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13082 }
13083 #endif
13084
13085 return size;
13086 }
13087
13088 /* On the i386, PC-relative offsets are relative to the start of the
13089 next instruction. That is, the address of the offset, plus its
13090 size, since the offset is always the last part of the insn. */
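/* For instance, a 4-byte displacement at offset 0x10 of a frag at
   address 0x100 yields 0x100 + 0x10 + 4 = 0x114, the address of the
   byte following the instruction.  */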
13091
13092 long
13093 md_pcrel_from (fixS *fixP)
13094 {
13095 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13096 }
13097
13098 #ifndef I386COFF
13099
13100 static void
13101 s_bss (int ignore ATTRIBUTE_UNUSED)
13102 {
13103 int temp;
13104
13105 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13106 if (IS_ELF)
13107 obj_elf_section_change_hook ();
13108 #endif
13109 temp = get_absolute_expression ();
13110 subseg_set (bss_section, (subsegT) temp);
13111 demand_empty_rest_of_line ();
13112 }
13113
13114 #endif
13115
13116 /* Remember constant directive. */
13117
13118 void
13119 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13120 {
13121 if (last_insn.kind != last_insn_directive
13122 && (bfd_section_flags (now_seg) & SEC_CODE))
13123 {
13124 last_insn.seg = now_seg;
13125 last_insn.kind = last_insn_directive;
13126 last_insn.name = "constant directive";
13127 last_insn.file = as_where (&last_insn.line);
13128 }
13129 }
13130
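/* Adjust a fixup before relocation processing: a subtraction of the
   GOT symbol becomes the corresponding GOT-relative relocation, and
   386 GOT32 may relax to GOT32X.  */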
13131 void
13132 i386_validate_fix (fixS *fixp)
13133 {
13134 if (fixp->fx_subsy)
13135 {
13136 if (fixp->fx_subsy == GOT_symbol)
13137 {
13138 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13139 {
13140 if (!object_64bit)
13141 abort ();
13142 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13143 if (fixp->fx_tcbit2)
13144 fixp->fx_r_type = (fixp->fx_tcbit
13145 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13146 : BFD_RELOC_X86_64_GOTPCRELX);
13147 else
13148 #endif
13149 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13150 }
13151 else
13152 {
13153 if (!object_64bit)
13154 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13155 else
13156 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13157 }
13158 fixp->fx_subsy = 0;
13159 }
13160 }
13161 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13162 else if (!object_64bit)
13163 {
13164 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13165 && fixp->fx_tcbit2)
13166 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13167 }
13168 #endif
13169 }
13170
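/* Translate the internal fixup FIXP into a relocation entry that BFD
   can emit, choosing the relocation code and addend.  */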
13171 arelent *
13172 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13173 {
13174 arelent *rel;
13175 bfd_reloc_code_real_type code;
13176
13177 switch (fixp->fx_r_type)
13178 {
13179 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13180 case BFD_RELOC_SIZE32:
13181 case BFD_RELOC_SIZE64:
13182 if (S_IS_DEFINED (fixp->fx_addsy)
13183 && !S_IS_EXTERNAL (fixp->fx_addsy))
13184 {
13185 /* Resolve size relocation against local symbol to size of
13186 the symbol plus addend. */
13187 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13188 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13189 && !fits_in_unsigned_long (value))
13190 as_bad_where (fixp->fx_file, fixp->fx_line,
13191 _("symbol size computation overflow"));
13192 fixp->fx_addsy = NULL;
13193 fixp->fx_subsy = NULL;
13194 md_apply_fix (fixp, (valueT *) &value, NULL);
13195 return NULL;
13196 }
13197 #endif
13198 /* Fall through. */
13199
13200 case BFD_RELOC_X86_64_PLT32:
13201 case BFD_RELOC_X86_64_GOT32:
13202 case BFD_RELOC_X86_64_GOTPCREL:
13203 case BFD_RELOC_X86_64_GOTPCRELX:
13204 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13205 case BFD_RELOC_386_PLT32:
13206 case BFD_RELOC_386_GOT32:
13207 case BFD_RELOC_386_GOT32X:
13208 case BFD_RELOC_386_GOTOFF:
13209 case BFD_RELOC_386_GOTPC:
13210 case BFD_RELOC_386_TLS_GD:
13211 case BFD_RELOC_386_TLS_LDM:
13212 case BFD_RELOC_386_TLS_LDO_32:
13213 case BFD_RELOC_386_TLS_IE_32:
13214 case BFD_RELOC_386_TLS_IE:
13215 case BFD_RELOC_386_TLS_GOTIE:
13216 case BFD_RELOC_386_TLS_LE_32:
13217 case BFD_RELOC_386_TLS_LE:
13218 case BFD_RELOC_386_TLS_GOTDESC:
13219 case BFD_RELOC_386_TLS_DESC_CALL:
13220 case BFD_RELOC_X86_64_TLSGD:
13221 case BFD_RELOC_X86_64_TLSLD:
13222 case BFD_RELOC_X86_64_DTPOFF32:
13223 case BFD_RELOC_X86_64_DTPOFF64:
13224 case BFD_RELOC_X86_64_GOTTPOFF:
13225 case BFD_RELOC_X86_64_TPOFF32:
13226 case BFD_RELOC_X86_64_TPOFF64:
13227 case BFD_RELOC_X86_64_GOTOFF64:
13228 case BFD_RELOC_X86_64_GOTPC32:
13229 case BFD_RELOC_X86_64_GOT64:
13230 case BFD_RELOC_X86_64_GOTPCREL64:
13231 case BFD_RELOC_X86_64_GOTPC64:
13232 case BFD_RELOC_X86_64_GOTPLT64:
13233 case BFD_RELOC_X86_64_PLTOFF64:
13234 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13235 case BFD_RELOC_X86_64_TLSDESC_CALL:
13236 case BFD_RELOC_RVA:
13237 case BFD_RELOC_VTABLE_ENTRY:
13238 case BFD_RELOC_VTABLE_INHERIT:
13239 #ifdef TE_PE
13240 case BFD_RELOC_32_SECREL:
13241 #endif
13242 code = fixp->fx_r_type;
13243 break;
13244 case BFD_RELOC_X86_64_32S:
13245 if (!fixp->fx_pcrel)
13246 {
13247 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13248 code = fixp->fx_r_type;
13249 break;
13250 }
13251 /* Fall through. */
13252 default:
13253 if (fixp->fx_pcrel)
13254 {
13255 switch (fixp->fx_size)
13256 {
13257 default:
13258 as_bad_where (fixp->fx_file, fixp->fx_line,
13259 _("can not do %d byte pc-relative relocation"),
13260 fixp->fx_size);
13261 code = BFD_RELOC_32_PCREL;
13262 break;
13263 case 1: code = BFD_RELOC_8_PCREL; break;
13264 case 2: code = BFD_RELOC_16_PCREL; break;
13265 case 4: code = BFD_RELOC_32_PCREL; break;
13266 #ifdef BFD64
13267 case 8: code = BFD_RELOC_64_PCREL; break;
13268 #endif
13269 }
13270 }
13271 else
13272 {
13273 switch (fixp->fx_size)
13274 {
13275 default:
13276 as_bad_where (fixp->fx_file, fixp->fx_line,
13277 _("can not do %d byte relocation"),
13278 fixp->fx_size);
13279 code = BFD_RELOC_32;
13280 break;
13281 case 1: code = BFD_RELOC_8; break;
13282 case 2: code = BFD_RELOC_16; break;
13283 case 4: code = BFD_RELOC_32; break;
13284 #ifdef BFD64
13285 case 8: code = BFD_RELOC_64; break;
13286 #endif
13287 }
13288 }
13289 break;
13290 }
13291
13292 if ((code == BFD_RELOC_32
13293 || code == BFD_RELOC_32_PCREL
13294 || code == BFD_RELOC_X86_64_32S)
13295 && GOT_symbol
13296 && fixp->fx_addsy == GOT_symbol)
13297 {
13298 if (!object_64bit)
13299 code = BFD_RELOC_386_GOTPC;
13300 else
13301 code = BFD_RELOC_X86_64_GOTPC32;
13302 }
13303 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13304 && GOT_symbol
13305 && fixp->fx_addsy == GOT_symbol)
13306 {
13307 code = BFD_RELOC_X86_64_GOTPC64;
13308 }
13309
13310 rel = XNEW (arelent);
13311 rel->sym_ptr_ptr = XNEW (asymbol *);
13312 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13313
13314 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13315
13316 if (!use_rela_relocations)
13317 {
13318 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13319 vtable entry to be used in the relocation's section offset. */
13320 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13321 rel->address = fixp->fx_offset;
13322 #if defined (OBJ_COFF) && defined (TE_PE)
13323 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13324 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13325 else
13326 #endif
13327 rel->addend = 0;
13328 }
13329   /* Use rela relocations in 64-bit mode.  */
13330 else
13331 {
13332 if (disallow_64bit_reloc)
13333 switch (code)
13334 {
13335 case BFD_RELOC_X86_64_DTPOFF64:
13336 case BFD_RELOC_X86_64_TPOFF64:
13337 case BFD_RELOC_64_PCREL:
13338 case BFD_RELOC_X86_64_GOTOFF64:
13339 case BFD_RELOC_X86_64_GOT64:
13340 case BFD_RELOC_X86_64_GOTPCREL64:
13341 case BFD_RELOC_X86_64_GOTPC64:
13342 case BFD_RELOC_X86_64_GOTPLT64:
13343 case BFD_RELOC_X86_64_PLTOFF64:
13344 as_bad_where (fixp->fx_file, fixp->fx_line,
13345 _("cannot represent relocation type %s in x32 mode"),
13346 bfd_get_reloc_code_name (code));
13347 break;
13348 default:
13349 break;
13350 }
13351
13352 if (!fixp->fx_pcrel)
13353 rel->addend = fixp->fx_offset;
13354 else
13355 switch (code)
13356 {
13357 case BFD_RELOC_X86_64_PLT32:
13358 case BFD_RELOC_X86_64_GOT32:
13359 case BFD_RELOC_X86_64_GOTPCREL:
13360 case BFD_RELOC_X86_64_GOTPCRELX:
13361 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13362 case BFD_RELOC_X86_64_TLSGD:
13363 case BFD_RELOC_X86_64_TLSLD:
13364 case BFD_RELOC_X86_64_GOTTPOFF:
13365 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13366 case BFD_RELOC_X86_64_TLSDESC_CALL:
13367 rel->addend = fixp->fx_offset - fixp->fx_size;
13368 break;
13369 default:
13370 rel->addend = (section->vma
13371 - fixp->fx_size
13372 + fixp->fx_addnumber
13373 + md_pcrel_from (fixp));
13374 break;
13375 }
13376 }
13377
13378 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13379 if (rel->howto == NULL)
13380 {
13381 as_bad_where (fixp->fx_file, fixp->fx_line,
13382 _("cannot represent relocation type %s"),
13383 bfd_get_reloc_code_name (code));
13384 /* Set howto to a garbage value so that we can keep going. */
13385 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13386 gas_assert (rel->howto != NULL);
13387 }
13388
13389 return rel;
13390 }
13391
13392 #include "tc-i386-intel.c"
13393
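/* Parse a register name from the input and replace EXP with its
   DWARF2 register number, for use by CFI pseudo-ops.  */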
13394 void
13395 tc_x86_parse_to_dw2regnum (expressionS *exp)
13396 {
13397 int saved_naked_reg;
13398 char saved_register_dot;
13399
13400 saved_naked_reg = allow_naked_reg;
13401 allow_naked_reg = 1;
13402 saved_register_dot = register_chars['.'];
13403 register_chars['.'] = '.';
13404 allow_pseudo_reg = 1;
13405 expression_and_evaluate (exp);
13406 allow_pseudo_reg = 0;
13407 register_chars['.'] = saved_register_dot;
13408 allow_naked_reg = saved_naked_reg;
13409
13410 if (exp->X_op == O_register && exp->X_add_number >= 0)
13411 {
13412 if ((addressT) exp->X_add_number < i386_regtab_size)
13413 {
13414 exp->X_op = O_constant;
13415 exp->X_add_number = i386_regtab[exp->X_add_number]
13416 .dw2_regnum[flag_code >> 1];
13417 }
13418 else
13419 exp->X_op = O_illegal;
13420 }
13421 }
13422
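/* Emit the initial CFI state: the CFA is relative to %esp/%rsp, and
   the return address is recorded at the DWARF return column.  */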
13423 void
13424 tc_x86_frame_initial_instructions (void)
13425 {
13426 static unsigned int sp_regno[2];
13427
13428 if (!sp_regno[flag_code >> 1])
13429 {
13430 char *saved_input = input_line_pointer;
13431 char sp[][4] = {"esp", "rsp"};
13432 expressionS exp;
13433
13434 input_line_pointer = sp[flag_code >> 1];
13435 tc_x86_parse_to_dw2regnum (&exp);
13436 gas_assert (exp.X_op == O_constant);
13437 sp_regno[flag_code >> 1] = exp.X_add_number;
13438 input_line_pointer = saved_input;
13439 }
13440
13441 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
13442 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
13443 }
13444
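/* Size of an address for DWARF purposes: 4 bytes for the x32 ABI,
   otherwise the target's native address size.  */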
13445 int
13446 x86_dwarf2_addr_size (void)
13447 {
13448 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13449 if (x86_elf_abi == X86_64_X32_ABI)
13450 return 4;
13451 #endif
13452 return bfd_arch_bits_per_address (stdoutput) / 8;
13453 }
13454
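/* Recognize the "unwind" section type (SHT_X86_64_UNWIND) in 64-bit
   mode.  */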
13455 int
13456 i386_elf_section_type (const char *str, size_t len)
13457 {
13458 if (flag_code == CODE_64BIT
13459 && len == sizeof ("unwind") - 1
13460 && strncmp (str, "unwind", 6) == 0)
13461 return SHT_X86_64_UNWIND;
13462
13463 return -1;
13464 }
13465
13466 #ifdef TE_SOLARIS
13467 void
13468 i386_solaris_fix_up_eh_frame (segT sec)
13469 {
13470 if (flag_code == CODE_64BIT)
13471 elf_section_type (sec) = SHT_X86_64_UNWIND;
13472 }
13473 #endif
13474
13475 #ifdef TE_PE
13476 void
13477 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
13478 {
13479 expressionS exp;
13480
13481 exp.X_op = O_secrel;
13482 exp.X_add_symbol = symbol;
13483 exp.X_add_number = 0;
13484 emit_expr (&exp, size);
13485 }
13486 #endif
13487
13488 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13489 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
13490
13491 bfd_vma
13492 x86_64_section_letter (int letter, const char **ptr_msg)
13493 {
13494 if (flag_code == CODE_64BIT)
13495 {
13496 if (letter == 'l')
13497 return SHF_X86_64_LARGE;
13498
13499 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
13500 }
13501 else
13502 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
13503 return -1;
13504 }
13505
13506 bfd_vma
13507 x86_64_section_word (char *str, size_t len)
13508 {
13509 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
13510 return SHF_X86_64_LARGE;
13511
13512 return -1;
13513 }
13514
13515 static void
13516 handle_large_common (int small ATTRIBUTE_UNUSED)
13517 {
13518 if (flag_code != CODE_64BIT)
13519 {
13520 s_comm_internal (0, elf_common_parse);
13521 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
13522 }
13523 else
13524 {
13525 static segT lbss_section;
13526 asection *saved_com_section_ptr = elf_com_section_ptr;
13527 asection *saved_bss_section = bss_section;
13528
13529 if (lbss_section == NULL)
13530 {
13531 flagword applicable;
13532 segT seg = now_seg;
13533 subsegT subseg = now_subseg;
13534
13535 /* The .lbss section is for local .largecomm symbols. */
13536 lbss_section = subseg_new (".lbss", 0);
13537 applicable = bfd_applicable_section_flags (stdoutput);
13538 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
13539 seg_info (lbss_section)->bss = 1;
13540
13541 subseg_set (seg, subseg);
13542 }
13543
13544 elf_com_section_ptr = &_bfd_elf_large_com_section;
13545 bss_section = lbss_section;
13546
13547 s_comm_internal (0, elf_common_parse);
13548
13549 elf_com_section_ptr = saved_com_section_ptr;
13550 bss_section = saved_bss_section;
13551 }
13552 }
13553 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */