Indent labels
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64 WAIT_PREFIX must be the first prefix since FWAIT is really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax. Use a non-ascii letter since since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* This struct describes rounding control and SAE in the instruction. */
214 struct RC_Operation
215 {
216 enum rc_type
217 {
218 rne = 0,
219 rd,
220 ru,
221 rz,
222 saeonly
223 } type;
224 int operand;
225 };
226
227 static struct RC_Operation rc_op;
228
229 /* The struct describes masking, applied to OPERAND in the instruction.
230 MASK is a pointer to the corresponding mask register. ZEROING tells
231 whether merging or zeroing mask is used. */
232 struct Mask_Operation
233 {
234 const reg_entry *mask;
235 unsigned int zeroing;
236 /* The operand where this operation is associated. */
237 int operand;
238 };
239
240 static struct Mask_Operation mask_op;
241
242 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
243 broadcast factor. */
244 struct Broadcast_Operation
245 {
246 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
247 int type;
248
249 /* Index of broadcasted operand. */
250 int operand;
251
252 /* Number of bytes to broadcast. */
253 int bytes;
254 };
255
256 static struct Broadcast_Operation broadcast_op;
257
258 /* VEX prefix. */
259 typedef struct
260 {
261 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
262 unsigned char bytes[4];
263 unsigned int length;
264 /* Destination or source register specifier. */
265 const reg_entry *register_specifier;
266 } vex_prefix;
267
268 /* 'md_assemble ()' gathers together information and puts it into a
269 i386_insn. */
270
271 union i386_op
272 {
273 expressionS *disps;
274 expressionS *imms;
275 const reg_entry *regs;
276 };
277
278 enum i386_error
279 {
280 operand_size_mismatch,
281 operand_type_mismatch,
282 register_type_mismatch,
283 number_of_operands_mismatch,
284 invalid_instruction_suffix,
285 bad_imm4,
286 unsupported_with_intel_mnemonic,
287 unsupported_syntax,
288 unsupported,
289 invalid_vsib_address,
290 invalid_vector_register_set,
291 unsupported_vector_index_register,
292 unsupported_broadcast,
293 broadcast_needed,
294 unsupported_masking,
295 mask_not_on_destination,
296 no_default_mask,
297 unsupported_rc_sae,
298 rc_sae_operand_not_last_imm,
299 invalid_register_operand,
300 };
301
302 struct _i386_insn
303 {
304 /* TM holds the template for the insn were currently assembling. */
305 insn_template tm;
306
307 /* SUFFIX holds the instruction size suffix for byte, word, dword
308 or qword, if given. */
309 char suffix;
310
311 /* OPERANDS gives the number of given operands. */
312 unsigned int operands;
313
314 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
315 of given register, displacement, memory operands and immediate
316 operands. */
317 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
318
319 /* TYPES [i] is the type (see above #defines) which tells us how to
320 use OP[i] for the corresponding operand. */
321 i386_operand_type types[MAX_OPERANDS];
322
323 /* Displacement expression, immediate expression, or register for each
324 operand. */
325 union i386_op op[MAX_OPERANDS];
326
327 /* Flags for operands. */
328 unsigned int flags[MAX_OPERANDS];
329 #define Operand_PCrel 1
330 #define Operand_Mem 2
331
332 /* Relocation type for operand */
333 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
334
335 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
336 the base index byte below. */
337 const reg_entry *base_reg;
338 const reg_entry *index_reg;
339 unsigned int log2_scale_factor;
340
341 /* SEG gives the seg_entries of this insn. They are zero unless
342 explicit segment overrides are given. */
343 const seg_entry *seg[2];
344
345 /* Copied first memory operand string, for re-checking. */
346 char *memop1_string;
347
348 /* PREFIX holds all the given prefix opcodes (usually null).
349 PREFIXES is the number of prefix opcodes. */
350 unsigned int prefixes;
351 unsigned char prefix[MAX_PREFIXES];
352
353 /* Register is in low 3 bits of opcode. */
354 bfd_boolean short_form;
355
356 /* The operand to a branch insn indicates an absolute branch. */
357 bfd_boolean jumpabsolute;
358
359 /* Has MMX register operands. */
360 bfd_boolean has_regmmx;
361
362 /* Has XMM register operands. */
363 bfd_boolean has_regxmm;
364
365 /* Has YMM register operands. */
366 bfd_boolean has_regymm;
367
368 /* Has ZMM register operands. */
369 bfd_boolean has_regzmm;
370
371 /* Has GOTPC or TLS relocation. */
372 bfd_boolean has_gotpc_tls_reloc;
373
374 /* RM and SIB are the modrm byte and the sib byte where the
375 addressing modes of this insn are encoded. */
376 modrm_byte rm;
377 rex_byte rex;
378 rex_byte vrex;
379 sib_byte sib;
380 vex_prefix vex;
381
382 /* Masking attributes. */
383 struct Mask_Operation *mask;
384
385 /* Rounding control and SAE attributes. */
386 struct RC_Operation *rounding;
387
388 /* Broadcasting attributes. */
389 struct Broadcast_Operation *broadcast;
390
391 /* Compressed disp8*N attribute. */
392 unsigned int memshift;
393
394 /* Prefer load or store in encoding. */
395 enum
396 {
397 dir_encoding_default = 0,
398 dir_encoding_load,
399 dir_encoding_store,
400 dir_encoding_swap
401 } dir_encoding;
402
403 /* Prefer 8bit or 32bit displacement in encoding. */
404 enum
405 {
406 disp_encoding_default = 0,
407 disp_encoding_8bit,
408 disp_encoding_32bit
409 } disp_encoding;
410
411 /* Prefer the REX byte in encoding. */
412 bfd_boolean rex_encoding;
413
414 /* Disable instruction size optimization. */
415 bfd_boolean no_optimize;
416
417 /* How to encode vector instructions. */
418 enum
419 {
420 vex_encoding_default = 0,
421 vex_encoding_vex,
422 vex_encoding_vex3,
423 vex_encoding_evex
424 } vec_encoding;
425
426 /* REP prefix. */
427 const char *rep_prefix;
428
429 /* HLE prefix. */
430 const char *hle_prefix;
431
432 /* Have BND prefix. */
433 const char *bnd_prefix;
434
435 /* Have NOTRACK prefix. */
436 const char *notrack_prefix;
437
438 /* Error message. */
439 enum i386_error error;
440 };
441
442 typedef struct _i386_insn i386_insn;
443
444 /* Link RC type with corresponding string, that'll be looked for in
445 asm. */
446 struct RC_name
447 {
448 enum rc_type type;
449 const char *name;
450 unsigned int len;
451 };
452
453 static const struct RC_name RC_NamesTable[] =
454 {
455 { rne, STRING_COMMA_LEN ("rn-sae") },
456 { rd, STRING_COMMA_LEN ("rd-sae") },
457 { ru, STRING_COMMA_LEN ("ru-sae") },
458 { rz, STRING_COMMA_LEN ("rz-sae") },
459 { saeonly, STRING_COMMA_LEN ("sae") },
460 };
461
462 /* List of chars besides those in app.c:symbol_chars that can start an
463 operand. Used to prevent the scrubber eating vital white-space. */
464 const char extra_symbol_chars[] = "*%-([{}"
465 #ifdef LEX_AT
466 "@"
467 #endif
468 #ifdef LEX_QM
469 "?"
470 #endif
471 ;
472
473 #if (defined (TE_I386AIX) \
474 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
475 && !defined (TE_GNU) \
476 && !defined (TE_LINUX) \
477 && !defined (TE_NACL) \
478 && !defined (TE_FreeBSD) \
479 && !defined (TE_DragonFly) \
480 && !defined (TE_NetBSD)))
481 /* This array holds the chars that always start a comment. If the
482 pre-processor is disabled, these aren't very useful. The option
483 --divide will remove '/' from this list. */
484 const char *i386_comment_chars = "#/";
485 #define SVR4_COMMENT_CHARS 1
486 #define PREFIX_SEPARATOR '\\'
487
488 #else
489 const char *i386_comment_chars = "#";
490 #define PREFIX_SEPARATOR '/'
491 #endif
492
493 /* This array holds the chars that only start a comment at the beginning of
494 a line. If the line seems to have the form '# 123 filename'
495 .line and .file directives will appear in the pre-processed output.
496 Note that input_file.c hand checks for '#' at the beginning of the
497 first line of the input file. This is because the compiler outputs
498 #NO_APP at the beginning of its output.
499 Also note that comments started like this one will always work if
500 '/' isn't otherwise defined. */
501 const char line_comment_chars[] = "#/";
502
503 const char line_separator_chars[] = ";";
504
505 /* Chars that can be used to separate mant from exp in floating point
506 nums. */
507 const char EXP_CHARS[] = "eE";
508
509 /* Chars that mean this number is a floating point constant
510 As in 0f12.456
511 or 0d1.2345e12. */
512 const char FLT_CHARS[] = "fFdDxX";
513
514 /* Tables for lexical analysis. */
515 static char mnemonic_chars[256];
516 static char register_chars[256];
517 static char operand_chars[256];
518 static char identifier_chars[256];
519 static char digit_chars[256];
520
521 /* Lexical macros. */
522 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
523 #define is_operand_char(x) (operand_chars[(unsigned char) x])
524 #define is_register_char(x) (register_chars[(unsigned char) x])
525 #define is_space_char(x) ((x) == ' ')
526 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
527 #define is_digit_char(x) (digit_chars[(unsigned char) x])
528
529 /* All non-digit non-letter characters that may occur in an operand. */
530 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
531
532 /* md_assemble() always leaves the strings it's passed unaltered. To
533 effect this we maintain a stack of saved characters that we've smashed
534 with '\0's (indicating end of strings for various sub-fields of the
535 assembler instruction). */
536 static char save_stack[32];
537 static char *save_stack_p;
538 #define END_STRING_AND_SAVE(s) \
539 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
540 #define RESTORE_END_STRING(s) \
541 do { *(s) = *--save_stack_p; } while (0)
542
543 /* The instruction we're assembling. */
544 static i386_insn i;
545
546 /* Possible templates for current insn. */
547 static const templates *current_templates;
548
549 /* Per instruction expressionS buffers: max displacements & immediates. */
550 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
551 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
552
553 /* Current operand we are working on. */
554 static int this_operand = -1;
555
556 /* We support four different modes. FLAG_CODE variable is used to distinguish
557 these. */
558
559 enum flag_code {
560 CODE_32BIT,
561 CODE_16BIT,
562 CODE_64BIT };
563
564 static enum flag_code flag_code;
565 static unsigned int object_64bit;
566 static unsigned int disallow_64bit_reloc;
567 static int use_rela_relocations = 0;
568 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
569 static const char *tls_get_addr;
570
571 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
572 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
573 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
574
575 /* The ELF ABI to use. */
576 enum x86_elf_abi
577 {
578 I386_ABI,
579 X86_64_ABI,
580 X86_64_X32_ABI
581 };
582
583 static enum x86_elf_abi x86_elf_abi = I386_ABI;
584 #endif
585
586 #if defined (TE_PE) || defined (TE_PEP)
587 /* Use big object file format. */
588 static int use_big_obj = 0;
589 #endif
590
591 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
592 /* 1 if generating code for a shared library. */
593 static int shared = 0;
594 #endif
595
596 /* 1 for intel syntax,
597 0 if att syntax. */
598 static int intel_syntax = 0;
599
600 static enum x86_64_isa
601 {
602 amd64 = 1, /* AMD64 ISA. */
603 intel64 /* Intel64 ISA. */
604 } isa64;
605
606 /* 1 for intel mnemonic,
607 0 if att mnemonic. */
608 static int intel_mnemonic = !SYSV386_COMPAT;
609
610 /* 1 if pseudo registers are permitted. */
611 static int allow_pseudo_reg = 0;
612
613 /* 1 if register prefix % not required. */
614 static int allow_naked_reg = 0;
615
616 /* 1 if the assembler should add BND prefix for all control-transferring
617 instructions supporting it, even if this prefix wasn't specified
618 explicitly. */
619 static int add_bnd_prefix = 0;
620
621 /* 1 if pseudo index register, eiz/riz, is allowed . */
622 static int allow_index_reg = 0;
623
624 /* 1 if the assembler should ignore LOCK prefix, even if it was
625 specified explicitly. */
626 static int omit_lock_prefix = 0;
627
628 /* 1 if the assembler should encode lfence, mfence, and sfence as
629 "lock addl $0, (%{re}sp)". */
630 static int avoid_fence = 0;
631
632 /* Type of the previous instruction. */
633 static struct
634 {
635 segT seg;
636 const char *file;
637 const char *name;
638 unsigned int line;
639 enum last_insn_kind
640 {
641 last_insn_other = 0,
642 last_insn_directive,
643 last_insn_prefix
644 } kind;
645 } last_insn;
646
647 /* 1 if the assembler should generate relax relocations. */
648
649 static int generate_relax_relocations
650 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
651
652 static enum check_kind
653 {
654 check_none = 0,
655 check_warning,
656 check_error
657 }
658 sse_check, operand_check = check_warning;
659
660 /* Non-zero if branches should be aligned within power of 2 boundary. */
661 static int align_branch_power = 0;
662
663 /* Types of branches to align. */
664 enum align_branch_kind
665 {
666 align_branch_none = 0,
667 align_branch_jcc = 1,
668 align_branch_fused = 2,
669 align_branch_jmp = 3,
670 align_branch_call = 4,
671 align_branch_indirect = 5,
672 align_branch_ret = 6
673 };
674
675 /* Type bits of branches to align. */
676 enum align_branch_bit
677 {
678 align_branch_jcc_bit = 1 << align_branch_jcc,
679 align_branch_fused_bit = 1 << align_branch_fused,
680 align_branch_jmp_bit = 1 << align_branch_jmp,
681 align_branch_call_bit = 1 << align_branch_call,
682 align_branch_indirect_bit = 1 << align_branch_indirect,
683 align_branch_ret_bit = 1 << align_branch_ret
684 };
685
686 static unsigned int align_branch = (align_branch_jcc_bit
687 | align_branch_fused_bit
688 | align_branch_jmp_bit);
689
690 /* The maximum padding size for fused jcc. CMP like instruction can
691 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
692 prefixes. */
693 #define MAX_FUSED_JCC_PADDING_SIZE 20
694
695 /* The maximum number of prefixes added for an instruction. */
696 static unsigned int align_branch_prefix_size = 5;
697
698 /* Optimization:
699 1. Clear the REX_W bit with register operand if possible.
700 2. Above plus use 128bit vector instruction to clear the full vector
701 register.
702 */
703 static int optimize = 0;
704
705 /* Optimization:
706 1. Clear the REX_W bit with register operand if possible.
707 2. Above plus use 128bit vector instruction to clear the full vector
708 register.
709 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
710 "testb $imm7,%r8".
711 */
712 static int optimize_for_space = 0;
713
714 /* Register prefix used for error message. */
715 static const char *register_prefix = "%";
716
717 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
718 leave, push, and pop instructions so that gcc has the same stack
719 frame as in 32 bit mode. */
720 static char stackop_size = '\0';
721
722 /* Non-zero to optimize code alignment. */
723 int optimize_align_code = 1;
724
725 /* Non-zero to quieten some warnings. */
726 static int quiet_warnings = 0;
727
728 /* CPU name. */
729 static const char *cpu_arch_name = NULL;
730 static char *cpu_sub_arch_name = NULL;
731
732 /* CPU feature flags. */
733 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
734
735 /* If we have selected a cpu we are generating instructions for. */
736 static int cpu_arch_tune_set = 0;
737
738 /* Cpu we are generating instructions for. */
739 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
740
741 /* CPU feature flags of cpu we are generating instructions for. */
742 static i386_cpu_flags cpu_arch_tune_flags;
743
744 /* CPU instruction set architecture used. */
745 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
746
747 /* CPU feature flags of instruction set architecture used. */
748 i386_cpu_flags cpu_arch_isa_flags;
749
750 /* If set, conditional jumps are not automatically promoted to handle
751 larger than a byte offset. */
752 static unsigned int no_cond_jump_promotion = 0;
753
754 /* Encode SSE instructions with VEX prefix. */
755 static unsigned int sse2avx;
756
757 /* Encode scalar AVX instructions with specific vector length. */
758 static enum
759 {
760 vex128 = 0,
761 vex256
762 } avxscalar;
763
764 /* Encode VEX WIG instructions with specific vex.w. */
765 static enum
766 {
767 vexw0 = 0,
768 vexw1
769 } vexwig;
770
771 /* Encode scalar EVEX LIG instructions with specific vector length. */
772 static enum
773 {
774 evexl128 = 0,
775 evexl256,
776 evexl512
777 } evexlig;
778
779 /* Encode EVEX WIG instructions with specific evex.w. */
780 static enum
781 {
782 evexw0 = 0,
783 evexw1
784 } evexwig;
785
786 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
787 static enum rc_type evexrcig = rne;
788
789 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
790 static symbolS *GOT_symbol;
791
792 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
793 unsigned int x86_dwarf2_return_column;
794
795 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
796 int x86_cie_data_alignment;
797
798 /* Interface to relax_segment.
799 There are 3 major relax states for 386 jump insns because the
800 different types of jumps add different sizes to frags when we're
801 figuring out what sort of jump to choose to reach a given label.
802
803 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
804 branches which are handled by md_estimate_size_before_relax() and
805 i386_generic_table_relax_frag(). */
806
807 /* Types. */
808 #define UNCOND_JUMP 0
809 #define COND_JUMP 1
810 #define COND_JUMP86 2
811 #define BRANCH_PADDING 3
812 #define BRANCH_PREFIX 4
813 #define FUSED_JCC_PADDING 5
814
815 /* Sizes. */
816 #define CODE16 1
817 #define SMALL 0
818 #define SMALL16 (SMALL | CODE16)
819 #define BIG 2
820 #define BIG16 (BIG | CODE16)
821
822 #ifndef INLINE
823 #ifdef __GNUC__
824 #define INLINE __inline__
825 #else
826 #define INLINE
827 #endif
828 #endif
829
830 #define ENCODE_RELAX_STATE(type, size) \
831 ((relax_substateT) (((type) << 2) | (size)))
832 #define TYPE_FROM_RELAX_STATE(s) \
833 ((s) >> 2)
834 #define DISP_SIZE_FROM_RELAX_STATE(s) \
835 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
836
837 /* This table is used by relax_frag to promote short jumps to long
838 ones where necessary. SMALL (short) jumps may be promoted to BIG
839 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
840 don't allow a short jump in a 32 bit code segment to be promoted to
841 a 16 bit offset jump because it's slower (requires data size
842 prefix), and doesn't work, unless the destination is in the bottom
843 64k of the code segment (The top 16 bits of eip are zeroed). */
844
845 const relax_typeS md_relax_table[] =
846 {
847 /* The fields are:
848 1) most positive reach of this state,
849 2) most negative reach of this state,
850 3) how many bytes this mode will have in the variable part of the frag
851 4) which index into the table to try if we can't fit into this one. */
852
853 /* UNCOND_JUMP states. */
854 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
855 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
856 /* dword jmp adds 4 bytes to frag:
857 0 extra opcode bytes, 4 displacement bytes. */
858 {0, 0, 4, 0},
859 /* word jmp adds 2 byte2 to frag:
860 0 extra opcode bytes, 2 displacement bytes. */
861 {0, 0, 2, 0},
862
863 /* COND_JUMP states. */
864 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
865 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
866 /* dword conditionals adds 5 bytes to frag:
867 1 extra opcode byte, 4 displacement bytes. */
868 {0, 0, 5, 0},
869 /* word conditionals add 3 bytes to frag:
870 1 extra opcode byte, 2 displacement bytes. */
871 {0, 0, 3, 0},
872
873 /* COND_JUMP86 states. */
874 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
875 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
876 /* dword conditionals adds 5 bytes to frag:
877 1 extra opcode byte, 4 displacement bytes. */
878 {0, 0, 5, 0},
879 /* word conditionals add 4 bytes to frag:
880 1 displacement byte and a 3 byte long branch insn. */
881 {0, 0, 4, 0}
882 };
883
884 static const arch_entry cpu_arch[] =
885 {
886 /* Do not replace the first two entries - i386_target_format()
887 relies on them being there in this order. */
888 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
889 CPU_GENERIC32_FLAGS, 0 },
890 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
891 CPU_GENERIC64_FLAGS, 0 },
892 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
893 CPU_NONE_FLAGS, 0 },
894 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
895 CPU_I186_FLAGS, 0 },
896 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
897 CPU_I286_FLAGS, 0 },
898 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
899 CPU_I386_FLAGS, 0 },
900 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
901 CPU_I486_FLAGS, 0 },
902 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
903 CPU_I586_FLAGS, 0 },
904 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
905 CPU_I686_FLAGS, 0 },
906 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
907 CPU_I586_FLAGS, 0 },
908 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
909 CPU_PENTIUMPRO_FLAGS, 0 },
910 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
911 CPU_P2_FLAGS, 0 },
912 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
913 CPU_P3_FLAGS, 0 },
914 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
915 CPU_P4_FLAGS, 0 },
916 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
917 CPU_CORE_FLAGS, 0 },
918 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
919 CPU_NOCONA_FLAGS, 0 },
920 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
921 CPU_CORE_FLAGS, 1 },
922 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
923 CPU_CORE_FLAGS, 0 },
924 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
925 CPU_CORE2_FLAGS, 1 },
926 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
927 CPU_CORE2_FLAGS, 0 },
928 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
929 CPU_COREI7_FLAGS, 0 },
930 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
931 CPU_L1OM_FLAGS, 0 },
932 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
933 CPU_K1OM_FLAGS, 0 },
934 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
935 CPU_IAMCU_FLAGS, 0 },
936 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
937 CPU_K6_FLAGS, 0 },
938 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
939 CPU_K6_2_FLAGS, 0 },
940 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
941 CPU_ATHLON_FLAGS, 0 },
942 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
943 CPU_K8_FLAGS, 1 },
944 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
945 CPU_K8_FLAGS, 0 },
946 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
947 CPU_K8_FLAGS, 0 },
948 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
949 CPU_AMDFAM10_FLAGS, 0 },
950 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
951 CPU_BDVER1_FLAGS, 0 },
952 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
953 CPU_BDVER2_FLAGS, 0 },
954 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
955 CPU_BDVER3_FLAGS, 0 },
956 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
957 CPU_BDVER4_FLAGS, 0 },
958 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
959 CPU_ZNVER1_FLAGS, 0 },
960 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
961 CPU_ZNVER2_FLAGS, 0 },
962 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
963 CPU_BTVER1_FLAGS, 0 },
964 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
965 CPU_BTVER2_FLAGS, 0 },
966 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
967 CPU_8087_FLAGS, 0 },
968 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
969 CPU_287_FLAGS, 0 },
970 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
971 CPU_387_FLAGS, 0 },
972 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
973 CPU_687_FLAGS, 0 },
974 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
975 CPU_CMOV_FLAGS, 0 },
976 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
977 CPU_FXSR_FLAGS, 0 },
978 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
979 CPU_MMX_FLAGS, 0 },
980 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
981 CPU_SSE_FLAGS, 0 },
982 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
983 CPU_SSE2_FLAGS, 0 },
984 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
985 CPU_SSE3_FLAGS, 0 },
986 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
987 CPU_SSE4A_FLAGS, 0 },
988 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
989 CPU_SSSE3_FLAGS, 0 },
990 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
991 CPU_SSE4_1_FLAGS, 0 },
992 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
993 CPU_SSE4_2_FLAGS, 0 },
994 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
995 CPU_SSE4_2_FLAGS, 0 },
996 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
997 CPU_AVX_FLAGS, 0 },
998 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
999 CPU_AVX2_FLAGS, 0 },
1000 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1001 CPU_AVX512F_FLAGS, 0 },
1002 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1003 CPU_AVX512CD_FLAGS, 0 },
1004 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1005 CPU_AVX512ER_FLAGS, 0 },
1006 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1007 CPU_AVX512PF_FLAGS, 0 },
1008 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1009 CPU_AVX512DQ_FLAGS, 0 },
1010 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1011 CPU_AVX512BW_FLAGS, 0 },
1012 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1013 CPU_AVX512VL_FLAGS, 0 },
1014 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1015 CPU_VMX_FLAGS, 0 },
1016 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1017 CPU_VMFUNC_FLAGS, 0 },
1018 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1019 CPU_SMX_FLAGS, 0 },
1020 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1021 CPU_XSAVE_FLAGS, 0 },
1022 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1023 CPU_XSAVEOPT_FLAGS, 0 },
1024 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1025 CPU_XSAVEC_FLAGS, 0 },
1026 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1027 CPU_XSAVES_FLAGS, 0 },
1028 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1029 CPU_AES_FLAGS, 0 },
1030 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1031 CPU_PCLMUL_FLAGS, 0 },
1032 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1033 CPU_PCLMUL_FLAGS, 1 },
1034 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1035 CPU_FSGSBASE_FLAGS, 0 },
1036 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1037 CPU_RDRND_FLAGS, 0 },
1038 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1039 CPU_F16C_FLAGS, 0 },
1040 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1041 CPU_BMI2_FLAGS, 0 },
1042 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1043 CPU_FMA_FLAGS, 0 },
1044 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1045 CPU_FMA4_FLAGS, 0 },
1046 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1047 CPU_XOP_FLAGS, 0 },
1048 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1049 CPU_LWP_FLAGS, 0 },
1050 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1051 CPU_MOVBE_FLAGS, 0 },
1052 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1053 CPU_CX16_FLAGS, 0 },
1054 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1055 CPU_EPT_FLAGS, 0 },
1056 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1057 CPU_LZCNT_FLAGS, 0 },
1058 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1059 CPU_POPCNT_FLAGS, 0 },
1060 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1061 CPU_HLE_FLAGS, 0 },
1062 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1063 CPU_RTM_FLAGS, 0 },
1064 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1065 CPU_INVPCID_FLAGS, 0 },
1066 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1067 CPU_CLFLUSH_FLAGS, 0 },
1068 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1069 CPU_NOP_FLAGS, 0 },
1070 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1071 CPU_SYSCALL_FLAGS, 0 },
1072 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1073 CPU_RDTSCP_FLAGS, 0 },
1074 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1075 CPU_3DNOW_FLAGS, 0 },
1076 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1077 CPU_3DNOWA_FLAGS, 0 },
1078 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1079 CPU_PADLOCK_FLAGS, 0 },
1080 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1081 CPU_SVME_FLAGS, 1 },
1082 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1083 CPU_SVME_FLAGS, 0 },
1084 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1085 CPU_SSE4A_FLAGS, 0 },
1086 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1087 CPU_ABM_FLAGS, 0 },
1088 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1089 CPU_BMI_FLAGS, 0 },
1090 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1091 CPU_TBM_FLAGS, 0 },
1092 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1093 CPU_ADX_FLAGS, 0 },
1094 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1095 CPU_RDSEED_FLAGS, 0 },
1096 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1097 CPU_PRFCHW_FLAGS, 0 },
1098 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1099 CPU_SMAP_FLAGS, 0 },
1100 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1101 CPU_MPX_FLAGS, 0 },
1102 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1103 CPU_SHA_FLAGS, 0 },
1104 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1105 CPU_CLFLUSHOPT_FLAGS, 0 },
1106 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1107 CPU_PREFETCHWT1_FLAGS, 0 },
1108 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1109 CPU_SE1_FLAGS, 0 },
1110 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1111 CPU_CLWB_FLAGS, 0 },
1112 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1113 CPU_AVX512IFMA_FLAGS, 0 },
1114 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1115 CPU_AVX512VBMI_FLAGS, 0 },
1116 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1117 CPU_AVX512_4FMAPS_FLAGS, 0 },
1118 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1119 CPU_AVX512_4VNNIW_FLAGS, 0 },
1120 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1121 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1122 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1123 CPU_AVX512_VBMI2_FLAGS, 0 },
1124 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1125 CPU_AVX512_VNNI_FLAGS, 0 },
1126 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1127 CPU_AVX512_BITALG_FLAGS, 0 },
1128 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1129 CPU_CLZERO_FLAGS, 0 },
1130 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1131 CPU_MWAITX_FLAGS, 0 },
1132 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1133 CPU_OSPKE_FLAGS, 0 },
1134 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1135 CPU_RDPID_FLAGS, 0 },
1136 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1137 CPU_PTWRITE_FLAGS, 0 },
1138 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1139 CPU_IBT_FLAGS, 0 },
1140 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1141 CPU_SHSTK_FLAGS, 0 },
1142 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1143 CPU_GFNI_FLAGS, 0 },
1144 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1145 CPU_VAES_FLAGS, 0 },
1146 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1147 CPU_VPCLMULQDQ_FLAGS, 0 },
1148 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1149 CPU_WBNOINVD_FLAGS, 0 },
1150 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1151 CPU_PCONFIG_FLAGS, 0 },
1152 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1153 CPU_WAITPKG_FLAGS, 0 },
1154 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1155 CPU_CLDEMOTE_FLAGS, 0 },
1156 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1157 CPU_MOVDIRI_FLAGS, 0 },
1158 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1159 CPU_MOVDIR64B_FLAGS, 0 },
1160 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1161 CPU_AVX512_BF16_FLAGS, 0 },
1162 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1163 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1164 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1165 CPU_ENQCMD_FLAGS, 0 },
1166 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1167 CPU_RDPRU_FLAGS, 0 },
1168 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1169 CPU_MCOMMIT_FLAGS, 0 },
1170 };
1171
1172 static const noarch_entry cpu_noarch[] =
1173 {
1174 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1175 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1176 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1177 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1178 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1179 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1180 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1181 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1182 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1183 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1184 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1185 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1186 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1187 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1188 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1189 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1190 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1191 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1192 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1193 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1194 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1195 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1196 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1197 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1198 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1199 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1200 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1201 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1202 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1203 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1204 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1205 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1206 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1207 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1208 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1209 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1210 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1211 { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1212 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1213 };
1214
1215 #ifdef I386COFF
1216 /* Like s_lcomm_internal in gas/read.c but the alignment string
1217 is allowed to be optional. */
1218
1219 static symbolS *
1220 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1221 {
1222 addressT align = 0;
1223
1224 SKIP_WHITESPACE ();
1225
1226 if (needs_align
1227 && *input_line_pointer == ',')
1228 {
1229 align = parse_align (needs_align - 1);
1230
1231 if (align == (addressT) -1)
1232 return NULL;
1233 }
1234 else
1235 {
1236 if (size >= 8)
1237 align = 3;
1238 else if (size >= 4)
1239 align = 2;
1240 else if (size >= 2)
1241 align = 1;
1242 else
1243 align = 0;
1244 }
1245
1246 bss_alloc (symbolP, size, align);
1247 return symbolP;
1248 }
1249
1250 static void
1251 pe_lcomm (int needs_align)
1252 {
1253 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1254 }
1255 #endif
1256
1257 const pseudo_typeS md_pseudo_table[] =
1258 {
1259 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1260 {"align", s_align_bytes, 0},
1261 #else
1262 {"align", s_align_ptwo, 0},
1263 #endif
1264 {"arch", set_cpu_arch, 0},
1265 #ifndef I386COFF
1266 {"bss", s_bss, 0},
1267 #else
1268 {"lcomm", pe_lcomm, 1},
1269 #endif
1270 {"ffloat", float_cons, 'f'},
1271 {"dfloat", float_cons, 'd'},
1272 {"tfloat", float_cons, 'x'},
1273 {"value", cons, 2},
1274 {"slong", signed_cons, 4},
1275 {"noopt", s_ignore, 0},
1276 {"optim", s_ignore, 0},
1277 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1278 {"code16", set_code_flag, CODE_16BIT},
1279 {"code32", set_code_flag, CODE_32BIT},
1280 #ifdef BFD64
1281 {"code64", set_code_flag, CODE_64BIT},
1282 #endif
1283 {"intel_syntax", set_intel_syntax, 1},
1284 {"att_syntax", set_intel_syntax, 0},
1285 {"intel_mnemonic", set_intel_mnemonic, 1},
1286 {"att_mnemonic", set_intel_mnemonic, 0},
1287 {"allow_index_reg", set_allow_index_reg, 1},
1288 {"disallow_index_reg", set_allow_index_reg, 0},
1289 {"sse_check", set_check, 0},
1290 {"operand_check", set_check, 1},
1291 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1292 {"largecomm", handle_large_common, 0},
1293 #else
1294 {"file", dwarf2_directive_file, 0},
1295 {"loc", dwarf2_directive_loc, 0},
1296 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1297 #endif
1298 #ifdef TE_PE
1299 {"secrel32", pe_directive_secrel, 0},
1300 #endif
1301 {0, 0, 0}
1302 };
1303
1304 /* For interface with expression (). */
1305 extern char *input_line_pointer;
1306
1307 /* Hash table for instruction mnemonic lookup. */
1308 static struct hash_control *op_hash;
1309
1310 /* Hash table for register lookup. */
1311 static struct hash_control *reg_hash;
1312 \f
1313 /* Various efficient no-op patterns for aligning code labels.
1314 Note: Don't try to assemble the instructions in the comments.
1315 0L and 0w are not legal. */
1316 static const unsigned char f32_1[] =
1317 {0x90}; /* nop */
1318 static const unsigned char f32_2[] =
1319 {0x66,0x90}; /* xchg %ax,%ax */
1320 static const unsigned char f32_3[] =
1321 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1322 static const unsigned char f32_4[] =
1323 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1324 static const unsigned char f32_6[] =
1325 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1326 static const unsigned char f32_7[] =
1327 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1328 static const unsigned char f16_3[] =
1329 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1330 static const unsigned char f16_4[] =
1331 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1332 static const unsigned char jump_disp8[] =
1333 {0xeb}; /* jmp disp8 */
1334 static const unsigned char jump32_disp32[] =
1335 {0xe9}; /* jmp disp32 */
1336 static const unsigned char jump16_disp32[] =
1337 {0x66,0xe9}; /* jmp disp32 */
1338 /* 32-bit NOPs patterns. */
1339 static const unsigned char *const f32_patt[] = {
1340 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1341 };
1342 /* 16-bit NOPs patterns. */
1343 static const unsigned char *const f16_patt[] = {
1344 f32_1, f32_2, f16_3, f16_4
1345 };
1346 /* nopl (%[re]ax) */
1347 static const unsigned char alt_3[] =
1348 {0x0f,0x1f,0x00};
1349 /* nopl 0(%[re]ax) */
1350 static const unsigned char alt_4[] =
1351 {0x0f,0x1f,0x40,0x00};
1352 /* nopl 0(%[re]ax,%[re]ax,1) */
1353 static const unsigned char alt_5[] =
1354 {0x0f,0x1f,0x44,0x00,0x00};
1355 /* nopw 0(%[re]ax,%[re]ax,1) */
1356 static const unsigned char alt_6[] =
1357 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1358 /* nopl 0L(%[re]ax) */
1359 static const unsigned char alt_7[] =
1360 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1361 /* nopl 0L(%[re]ax,%[re]ax,1) */
1362 static const unsigned char alt_8[] =
1363 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1364 /* nopw 0L(%[re]ax,%[re]ax,1) */
1365 static const unsigned char alt_9[] =
1366 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1367 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1368 static const unsigned char alt_10[] =
1369 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1370 /* data16 nopw %cs:0L(%eax,%eax,1) */
1371 static const unsigned char alt_11[] =
1372 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1373 /* 32-bit and 64-bit NOPs patterns. */
1374 static const unsigned char *const alt_patt[] = {
1375 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1376 alt_9, alt_10, alt_11
1377 };
1378
1379 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1380 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1381
1382 static void
1383 i386_output_nops (char *where, const unsigned char *const *patt,
1384 int count, int max_single_nop_size)
1385
1386 {
1387 /* Place the longer NOP first. */
1388 int last;
1389 int offset;
1390 const unsigned char *nops;
1391
1392 if (max_single_nop_size < 1)
1393 {
1394 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1395 max_single_nop_size);
1396 return;
1397 }
1398
1399 nops = patt[max_single_nop_size - 1];
1400
1401 /* Use the smaller one if the requsted one isn't available. */
1402 if (nops == NULL)
1403 {
1404 max_single_nop_size--;
1405 nops = patt[max_single_nop_size - 1];
1406 }
1407
1408 last = count % max_single_nop_size;
1409
1410 count -= last;
1411 for (offset = 0; offset < count; offset += max_single_nop_size)
1412 memcpy (where + offset, nops, max_single_nop_size);
1413
1414 if (last)
1415 {
1416 nops = patt[last - 1];
1417 if (nops == NULL)
1418 {
1419 /* Use the smaller one plus one-byte NOP if the needed one
1420 isn't available. */
1421 last--;
1422 nops = patt[last - 1];
1423 memcpy (where + offset, nops, last);
1424 where[offset + last] = *patt[0];
1425 }
1426 else
1427 memcpy (where + offset, nops, last);
1428 }
1429 }
1430
1431 static INLINE int
1432 fits_in_imm7 (offsetT num)
1433 {
1434 return (num & 0x7f) == num;
1435 }
1436
1437 static INLINE int
1438 fits_in_imm31 (offsetT num)
1439 {
1440 return (num & 0x7fffffff) == num;
1441 }
1442
1443 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1444 single NOP instruction LIMIT. */
1445
1446 void
1447 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1448 {
1449 const unsigned char *const *patt = NULL;
1450 int max_single_nop_size;
1451 /* Maximum number of NOPs before switching to jump over NOPs. */
1452 int max_number_of_nops;
1453
1454 switch (fragP->fr_type)
1455 {
1456 case rs_fill_nop:
1457 case rs_align_code:
1458 break;
1459 case rs_machine_dependent:
1460 /* Allow NOP padding for jumps and calls. */
1461 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1462 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1463 break;
1464 /* Fall through. */
1465 default:
1466 return;
1467 }
1468
1469 /* We need to decide which NOP sequence to use for 32bit and
1470 64bit. When -mtune= is used:
1471
1472 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1473 PROCESSOR_GENERIC32, f32_patt will be used.
1474 2. For the rest, alt_patt will be used.
1475
1476 When -mtune= isn't used, alt_patt will be used if
1477 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1478 be used.
1479
1480 When -march= or .arch is used, we can't use anything beyond
1481 cpu_arch_isa_flags. */
1482
1483 if (flag_code == CODE_16BIT)
1484 {
1485 patt = f16_patt;
1486 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1487 /* Limit number of NOPs to 2 in 16-bit mode. */
1488 max_number_of_nops = 2;
1489 }
1490 else
1491 {
1492 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1493 {
1494 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1495 switch (cpu_arch_tune)
1496 {
1497 case PROCESSOR_UNKNOWN:
1498 /* We use cpu_arch_isa_flags to check if we SHOULD
1499 optimize with nops. */
1500 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1501 patt = alt_patt;
1502 else
1503 patt = f32_patt;
1504 break;
1505 case PROCESSOR_PENTIUM4:
1506 case PROCESSOR_NOCONA:
1507 case PROCESSOR_CORE:
1508 case PROCESSOR_CORE2:
1509 case PROCESSOR_COREI7:
1510 case PROCESSOR_L1OM:
1511 case PROCESSOR_K1OM:
1512 case PROCESSOR_GENERIC64:
1513 case PROCESSOR_K6:
1514 case PROCESSOR_ATHLON:
1515 case PROCESSOR_K8:
1516 case PROCESSOR_AMDFAM10:
1517 case PROCESSOR_BD:
1518 case PROCESSOR_ZNVER:
1519 case PROCESSOR_BT:
1520 patt = alt_patt;
1521 break;
1522 case PROCESSOR_I386:
1523 case PROCESSOR_I486:
1524 case PROCESSOR_PENTIUM:
1525 case PROCESSOR_PENTIUMPRO:
1526 case PROCESSOR_IAMCU:
1527 case PROCESSOR_GENERIC32:
1528 patt = f32_patt;
1529 break;
1530 }
1531 }
1532 else
1533 {
1534 switch (fragP->tc_frag_data.tune)
1535 {
1536 case PROCESSOR_UNKNOWN:
1537 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1538 PROCESSOR_UNKNOWN. */
1539 abort ();
1540 break;
1541
1542 case PROCESSOR_I386:
1543 case PROCESSOR_I486:
1544 case PROCESSOR_PENTIUM:
1545 case PROCESSOR_IAMCU:
1546 case PROCESSOR_K6:
1547 case PROCESSOR_ATHLON:
1548 case PROCESSOR_K8:
1549 case PROCESSOR_AMDFAM10:
1550 case PROCESSOR_BD:
1551 case PROCESSOR_ZNVER:
1552 case PROCESSOR_BT:
1553 case PROCESSOR_GENERIC32:
1554 /* We use cpu_arch_isa_flags to check if we CAN optimize
1555 with nops. */
1556 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1557 patt = alt_patt;
1558 else
1559 patt = f32_patt;
1560 break;
1561 case PROCESSOR_PENTIUMPRO:
1562 case PROCESSOR_PENTIUM4:
1563 case PROCESSOR_NOCONA:
1564 case PROCESSOR_CORE:
1565 case PROCESSOR_CORE2:
1566 case PROCESSOR_COREI7:
1567 case PROCESSOR_L1OM:
1568 case PROCESSOR_K1OM:
1569 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1570 patt = alt_patt;
1571 else
1572 patt = f32_patt;
1573 break;
1574 case PROCESSOR_GENERIC64:
1575 patt = alt_patt;
1576 break;
1577 }
1578 }
1579
1580 if (patt == f32_patt)
1581 {
1582 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1583 /* Limit number of NOPs to 2 for older processors. */
1584 max_number_of_nops = 2;
1585 }
1586 else
1587 {
1588 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1589 /* Limit number of NOPs to 7 for newer processors. */
1590 max_number_of_nops = 7;
1591 }
1592 }
1593
1594 if (limit == 0)
1595 limit = max_single_nop_size;
1596
1597 if (fragP->fr_type == rs_fill_nop)
1598 {
1599 /* Output NOPs for .nop directive. */
1600 if (limit > max_single_nop_size)
1601 {
1602 as_bad_where (fragP->fr_file, fragP->fr_line,
1603 _("invalid single nop size: %d "
1604 "(expect within [0, %d])"),
1605 limit, max_single_nop_size);
1606 return;
1607 }
1608 }
1609 else if (fragP->fr_type != rs_machine_dependent)
1610 fragP->fr_var = count;
1611
1612 if ((count / max_single_nop_size) > max_number_of_nops)
1613 {
1614 /* Generate jump over NOPs. */
1615 offsetT disp = count - 2;
1616 if (fits_in_imm7 (disp))
1617 {
1618 /* Use "jmp disp8" if possible. */
1619 count = disp;
1620 where[0] = jump_disp8[0];
1621 where[1] = count;
1622 where += 2;
1623 }
1624 else
1625 {
1626 unsigned int size_of_jump;
1627
1628 if (flag_code == CODE_16BIT)
1629 {
1630 where[0] = jump16_disp32[0];
1631 where[1] = jump16_disp32[1];
1632 size_of_jump = 2;
1633 }
1634 else
1635 {
1636 where[0] = jump32_disp32[0];
1637 size_of_jump = 1;
1638 }
1639
1640 count -= size_of_jump + 4;
1641 if (!fits_in_imm31 (count))
1642 {
1643 as_bad_where (fragP->fr_file, fragP->fr_line,
1644 _("jump over nop padding out of range"));
1645 return;
1646 }
1647
1648 md_number_to_chars (where + size_of_jump, count, 4);
1649 where += size_of_jump + 4;
1650 }
1651 }
1652
1653 /* Generate multiple NOPs. */
1654 i386_output_nops (where, patt, count, limit);
1655 }
1656
1657 static INLINE int
1658 operand_type_all_zero (const union i386_operand_type *x)
1659 {
1660 switch (ARRAY_SIZE(x->array))
1661 {
1662 case 3:
1663 if (x->array[2])
1664 return 0;
1665 /* Fall through. */
1666 case 2:
1667 if (x->array[1])
1668 return 0;
1669 /* Fall through. */
1670 case 1:
1671 return !x->array[0];
1672 default:
1673 abort ();
1674 }
1675 }
1676
1677 static INLINE void
1678 operand_type_set (union i386_operand_type *x, unsigned int v)
1679 {
1680 switch (ARRAY_SIZE(x->array))
1681 {
1682 case 3:
1683 x->array[2] = v;
1684 /* Fall through. */
1685 case 2:
1686 x->array[1] = v;
1687 /* Fall through. */
1688 case 1:
1689 x->array[0] = v;
1690 /* Fall through. */
1691 break;
1692 default:
1693 abort ();
1694 }
1695
1696 x->bitfield.class = ClassNone;
1697 x->bitfield.instance = InstanceNone;
1698 }
1699
1700 static INLINE int
1701 operand_type_equal (const union i386_operand_type *x,
1702 const union i386_operand_type *y)
1703 {
1704 switch (ARRAY_SIZE(x->array))
1705 {
1706 case 3:
1707 if (x->array[2] != y->array[2])
1708 return 0;
1709 /* Fall through. */
1710 case 2:
1711 if (x->array[1] != y->array[1])
1712 return 0;
1713 /* Fall through. */
1714 case 1:
1715 return x->array[0] == y->array[0];
1716 break;
1717 default:
1718 abort ();
1719 }
1720 }
1721
1722 static INLINE int
1723 cpu_flags_all_zero (const union i386_cpu_flags *x)
1724 {
1725 switch (ARRAY_SIZE(x->array))
1726 {
1727 case 4:
1728 if (x->array[3])
1729 return 0;
1730 /* Fall through. */
1731 case 3:
1732 if (x->array[2])
1733 return 0;
1734 /* Fall through. */
1735 case 2:
1736 if (x->array[1])
1737 return 0;
1738 /* Fall through. */
1739 case 1:
1740 return !x->array[0];
1741 default:
1742 abort ();
1743 }
1744 }
1745
1746 static INLINE int
1747 cpu_flags_equal (const union i386_cpu_flags *x,
1748 const union i386_cpu_flags *y)
1749 {
1750 switch (ARRAY_SIZE(x->array))
1751 {
1752 case 4:
1753 if (x->array[3] != y->array[3])
1754 return 0;
1755 /* Fall through. */
1756 case 3:
1757 if (x->array[2] != y->array[2])
1758 return 0;
1759 /* Fall through. */
1760 case 2:
1761 if (x->array[1] != y->array[1])
1762 return 0;
1763 /* Fall through. */
1764 case 1:
1765 return x->array[0] == y->array[0];
1766 break;
1767 default:
1768 abort ();
1769 }
1770 }
1771
1772 static INLINE int
1773 cpu_flags_check_cpu64 (i386_cpu_flags f)
1774 {
1775 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1776 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1777 }
1778
1779 static INLINE i386_cpu_flags
1780 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1781 {
1782 switch (ARRAY_SIZE (x.array))
1783 {
1784 case 4:
1785 x.array [3] &= y.array [3];
1786 /* Fall through. */
1787 case 3:
1788 x.array [2] &= y.array [2];
1789 /* Fall through. */
1790 case 2:
1791 x.array [1] &= y.array [1];
1792 /* Fall through. */
1793 case 1:
1794 x.array [0] &= y.array [0];
1795 break;
1796 default:
1797 abort ();
1798 }
1799 return x;
1800 }
1801
1802 static INLINE i386_cpu_flags
1803 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1804 {
1805 switch (ARRAY_SIZE (x.array))
1806 {
1807 case 4:
1808 x.array [3] |= y.array [3];
1809 /* Fall through. */
1810 case 3:
1811 x.array [2] |= y.array [2];
1812 /* Fall through. */
1813 case 2:
1814 x.array [1] |= y.array [1];
1815 /* Fall through. */
1816 case 1:
1817 x.array [0] |= y.array [0];
1818 break;
1819 default:
1820 abort ();
1821 }
1822 return x;
1823 }
1824
1825 static INLINE i386_cpu_flags
1826 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1827 {
1828 switch (ARRAY_SIZE (x.array))
1829 {
1830 case 4:
1831 x.array [3] &= ~y.array [3];
1832 /* Fall through. */
1833 case 3:
1834 x.array [2] &= ~y.array [2];
1835 /* Fall through. */
1836 case 2:
1837 x.array [1] &= ~y.array [1];
1838 /* Fall through. */
1839 case 1:
1840 x.array [0] &= ~y.array [0];
1841 break;
1842 default:
1843 abort ();
1844 }
1845 return x;
1846 }
1847
1848 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1849
1850 #define CPU_FLAGS_ARCH_MATCH 0x1
1851 #define CPU_FLAGS_64BIT_MATCH 0x2
1852
1853 #define CPU_FLAGS_PERFECT_MATCH \
1854 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1855
1856 /* Return CPU flags match bits. */
1857
1858 static int
1859 cpu_flags_match (const insn_template *t)
1860 {
1861 i386_cpu_flags x = t->cpu_flags;
1862 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1863
1864 x.bitfield.cpu64 = 0;
1865 x.bitfield.cpuno64 = 0;
1866
1867 if (cpu_flags_all_zero (&x))
1868 {
1869 /* This instruction is available on all archs. */
1870 match |= CPU_FLAGS_ARCH_MATCH;
1871 }
1872 else
1873 {
1874 /* This instruction is available only on some archs. */
1875 i386_cpu_flags cpu = cpu_arch_flags;
1876
1877 /* AVX512VL is no standalone feature - match it and then strip it. */
1878 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1879 return match;
1880 x.bitfield.cpuavx512vl = 0;
1881
1882 cpu = cpu_flags_and (x, cpu);
1883 if (!cpu_flags_all_zero (&cpu))
1884 {
1885 if (x.bitfield.cpuavx)
1886 {
1887 /* We need to check a few extra flags with AVX. */
1888 if (cpu.bitfield.cpuavx
1889 && (!t->opcode_modifier.sse2avx || sse2avx)
1890 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1891 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1892 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1893 match |= CPU_FLAGS_ARCH_MATCH;
1894 }
1895 else if (x.bitfield.cpuavx512f)
1896 {
1897 /* We need to check a few extra flags with AVX512F. */
1898 if (cpu.bitfield.cpuavx512f
1899 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1900 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1901 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1902 match |= CPU_FLAGS_ARCH_MATCH;
1903 }
1904 else
1905 match |= CPU_FLAGS_ARCH_MATCH;
1906 }
1907 }
1908 return match;
1909 }
1910
1911 static INLINE i386_operand_type
1912 operand_type_and (i386_operand_type x, i386_operand_type y)
1913 {
1914 if (x.bitfield.class != y.bitfield.class)
1915 x.bitfield.class = ClassNone;
1916 if (x.bitfield.instance != y.bitfield.instance)
1917 x.bitfield.instance = InstanceNone;
1918
1919 switch (ARRAY_SIZE (x.array))
1920 {
1921 case 3:
1922 x.array [2] &= y.array [2];
1923 /* Fall through. */
1924 case 2:
1925 x.array [1] &= y.array [1];
1926 /* Fall through. */
1927 case 1:
1928 x.array [0] &= y.array [0];
1929 break;
1930 default:
1931 abort ();
1932 }
1933 return x;
1934 }
1935
1936 static INLINE i386_operand_type
1937 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1938 {
1939 gas_assert (y.bitfield.class == ClassNone);
1940 gas_assert (y.bitfield.instance == InstanceNone);
1941
1942 switch (ARRAY_SIZE (x.array))
1943 {
1944 case 3:
1945 x.array [2] &= ~y.array [2];
1946 /* Fall through. */
1947 case 2:
1948 x.array [1] &= ~y.array [1];
1949 /* Fall through. */
1950 case 1:
1951 x.array [0] &= ~y.array [0];
1952 break;
1953 default:
1954 abort ();
1955 }
1956 return x;
1957 }
1958
1959 static INLINE i386_operand_type
1960 operand_type_or (i386_operand_type x, i386_operand_type y)
1961 {
1962 gas_assert (x.bitfield.class == ClassNone ||
1963 y.bitfield.class == ClassNone ||
1964 x.bitfield.class == y.bitfield.class);
1965 gas_assert (x.bitfield.instance == InstanceNone ||
1966 y.bitfield.instance == InstanceNone ||
1967 x.bitfield.instance == y.bitfield.instance);
1968
1969 switch (ARRAY_SIZE (x.array))
1970 {
1971 case 3:
1972 x.array [2] |= y.array [2];
1973 /* Fall through. */
1974 case 2:
1975 x.array [1] |= y.array [1];
1976 /* Fall through. */
1977 case 1:
1978 x.array [0] |= y.array [0];
1979 break;
1980 default:
1981 abort ();
1982 }
1983 return x;
1984 }
1985
1986 static INLINE i386_operand_type
1987 operand_type_xor (i386_operand_type x, i386_operand_type y)
1988 {
1989 gas_assert (y.bitfield.class == ClassNone);
1990 gas_assert (y.bitfield.instance == InstanceNone);
1991
1992 switch (ARRAY_SIZE (x.array))
1993 {
1994 case 3:
1995 x.array [2] ^= y.array [2];
1996 /* Fall through. */
1997 case 2:
1998 x.array [1] ^= y.array [1];
1999 /* Fall through. */
2000 case 1:
2001 x.array [0] ^= y.array [0];
2002 break;
2003 default:
2004 abort ();
2005 }
2006 return x;
2007 }
2008
2009 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2010 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2011 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2012 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2013 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2014 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2015 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2016 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2017 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2018 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2019 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2020 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2021 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2022 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2023 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2024 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2025 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2026
2027 enum operand_type
2028 {
2029 reg,
2030 imm,
2031 disp,
2032 anymem
2033 };
2034
2035 static INLINE int
2036 operand_type_check (i386_operand_type t, enum operand_type c)
2037 {
2038 switch (c)
2039 {
2040 case reg:
2041 return t.bitfield.class == Reg;
2042
2043 case imm:
2044 return (t.bitfield.imm8
2045 || t.bitfield.imm8s
2046 || t.bitfield.imm16
2047 || t.bitfield.imm32
2048 || t.bitfield.imm32s
2049 || t.bitfield.imm64);
2050
2051 case disp:
2052 return (t.bitfield.disp8
2053 || t.bitfield.disp16
2054 || t.bitfield.disp32
2055 || t.bitfield.disp32s
2056 || t.bitfield.disp64);
2057
2058 case anymem:
2059 return (t.bitfield.disp8
2060 || t.bitfield.disp16
2061 || t.bitfield.disp32
2062 || t.bitfield.disp32s
2063 || t.bitfield.disp64
2064 || t.bitfield.baseindex);
2065
2066 default:
2067 abort ();
2068 }
2069
2070 return 0;
2071 }
2072
2073 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2074 between operand GIVEN and opeand WANTED for instruction template T. */
2075
2076 static INLINE int
2077 match_operand_size (const insn_template *t, unsigned int wanted,
2078 unsigned int given)
2079 {
2080 return !((i.types[given].bitfield.byte
2081 && !t->operand_types[wanted].bitfield.byte)
2082 || (i.types[given].bitfield.word
2083 && !t->operand_types[wanted].bitfield.word)
2084 || (i.types[given].bitfield.dword
2085 && !t->operand_types[wanted].bitfield.dword)
2086 || (i.types[given].bitfield.qword
2087 && !t->operand_types[wanted].bitfield.qword)
2088 || (i.types[given].bitfield.tbyte
2089 && !t->operand_types[wanted].bitfield.tbyte));
2090 }
2091
2092 /* Return 1 if there is no conflict in SIMD register between operand
2093 GIVEN and opeand WANTED for instruction template T. */
2094
2095 static INLINE int
2096 match_simd_size (const insn_template *t, unsigned int wanted,
2097 unsigned int given)
2098 {
2099 return !((i.types[given].bitfield.xmmword
2100 && !t->operand_types[wanted].bitfield.xmmword)
2101 || (i.types[given].bitfield.ymmword
2102 && !t->operand_types[wanted].bitfield.ymmword)
2103 || (i.types[given].bitfield.zmmword
2104 && !t->operand_types[wanted].bitfield.zmmword));
2105 }
2106
2107 /* Return 1 if there is no conflict in any size between operand GIVEN
2108 and opeand WANTED for instruction template T. */
2109
2110 static INLINE int
2111 match_mem_size (const insn_template *t, unsigned int wanted,
2112 unsigned int given)
2113 {
2114 return (match_operand_size (t, wanted, given)
2115 && !((i.types[given].bitfield.unspecified
2116 && !i.broadcast
2117 && !t->operand_types[wanted].bitfield.unspecified)
2118 || (i.types[given].bitfield.fword
2119 && !t->operand_types[wanted].bitfield.fword)
2120 /* For scalar opcode templates to allow register and memory
2121 operands at the same time, some special casing is needed
2122 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2123 down-conversion vpmov*. */
2124 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2125 && !t->opcode_modifier.broadcast
2126 && (t->operand_types[wanted].bitfield.byte
2127 || t->operand_types[wanted].bitfield.word
2128 || t->operand_types[wanted].bitfield.dword
2129 || t->operand_types[wanted].bitfield.qword))
2130 ? (i.types[given].bitfield.xmmword
2131 || i.types[given].bitfield.ymmword
2132 || i.types[given].bitfield.zmmword)
2133 : !match_simd_size(t, wanted, given))));
2134 }
2135
2136 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2137 operands for instruction template T, and it has MATCH_REVERSE set if there
2138 is no size conflict on any operands for the template with operands reversed
2139 (and the template allows for reversing in the first place). */
2140
2141 #define MATCH_STRAIGHT 1
2142 #define MATCH_REVERSE 2
2143
2144 static INLINE unsigned int
2145 operand_size_match (const insn_template *t)
2146 {
2147 unsigned int j, match = MATCH_STRAIGHT;
2148
2149 /* Don't check non-absolute jump instructions. */
2150 if (t->opcode_modifier.jump
2151 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2152 return match;
2153
2154 /* Check memory and accumulator operand size. */
2155 for (j = 0; j < i.operands; j++)
2156 {
2157 if (i.types[j].bitfield.class != Reg
2158 && i.types[j].bitfield.class != RegSIMD
2159 && t->opcode_modifier.anysize)
2160 continue;
2161
2162 if (t->operand_types[j].bitfield.class == Reg
2163 && !match_operand_size (t, j, j))
2164 {
2165 match = 0;
2166 break;
2167 }
2168
2169 if (t->operand_types[j].bitfield.class == RegSIMD
2170 && !match_simd_size (t, j, j))
2171 {
2172 match = 0;
2173 break;
2174 }
2175
2176 if (t->operand_types[j].bitfield.instance == Accum
2177 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2178 {
2179 match = 0;
2180 break;
2181 }
2182
2183 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2184 {
2185 match = 0;
2186 break;
2187 }
2188 }
2189
2190 if (!t->opcode_modifier.d)
2191 {
2192 mismatch:
2193 if (!match)
2194 i.error = operand_size_mismatch;
2195 return match;
2196 }
2197
2198 /* Check reverse. */
2199 gas_assert (i.operands >= 2 && i.operands <= 3);
2200
2201 for (j = 0; j < i.operands; j++)
2202 {
2203 unsigned int given = i.operands - j - 1;
2204
2205 if (t->operand_types[j].bitfield.class == Reg
2206 && !match_operand_size (t, j, given))
2207 goto mismatch;
2208
2209 if (t->operand_types[j].bitfield.class == RegSIMD
2210 && !match_simd_size (t, j, given))
2211 goto mismatch;
2212
2213 if (t->operand_types[j].bitfield.instance == Accum
2214 && (!match_operand_size (t, j, given)
2215 || !match_simd_size (t, j, given)))
2216 goto mismatch;
2217
2218 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2219 goto mismatch;
2220 }
2221
2222 return match | MATCH_REVERSE;
2223 }
2224
2225 static INLINE int
2226 operand_type_match (i386_operand_type overlap,
2227 i386_operand_type given)
2228 {
2229 i386_operand_type temp = overlap;
2230
2231 temp.bitfield.unspecified = 0;
2232 temp.bitfield.byte = 0;
2233 temp.bitfield.word = 0;
2234 temp.bitfield.dword = 0;
2235 temp.bitfield.fword = 0;
2236 temp.bitfield.qword = 0;
2237 temp.bitfield.tbyte = 0;
2238 temp.bitfield.xmmword = 0;
2239 temp.bitfield.ymmword = 0;
2240 temp.bitfield.zmmword = 0;
2241 if (operand_type_all_zero (&temp))
2242 goto mismatch;
2243
2244 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2245 return 1;
2246
2247 mismatch:
2248 i.error = operand_type_mismatch;
2249 return 0;
2250 }
2251
2252 /* If given types g0 and g1 are registers they must be of the same type
2253 unless the expected operand type register overlap is null.
2254 Some Intel syntax memory operand size checking also happens here. */
2255
2256 static INLINE int
2257 operand_type_register_match (i386_operand_type g0,
2258 i386_operand_type t0,
2259 i386_operand_type g1,
2260 i386_operand_type t1)
2261 {
2262 if (g0.bitfield.class != Reg
2263 && g0.bitfield.class != RegSIMD
2264 && (!operand_type_check (g0, anymem)
2265 || g0.bitfield.unspecified
2266 || (t0.bitfield.class != Reg
2267 && t0.bitfield.class != RegSIMD)))
2268 return 1;
2269
2270 if (g1.bitfield.class != Reg
2271 && g1.bitfield.class != RegSIMD
2272 && (!operand_type_check (g1, anymem)
2273 || g1.bitfield.unspecified
2274 || (t1.bitfield.class != Reg
2275 && t1.bitfield.class != RegSIMD)))
2276 return 1;
2277
2278 if (g0.bitfield.byte == g1.bitfield.byte
2279 && g0.bitfield.word == g1.bitfield.word
2280 && g0.bitfield.dword == g1.bitfield.dword
2281 && g0.bitfield.qword == g1.bitfield.qword
2282 && g0.bitfield.xmmword == g1.bitfield.xmmword
2283 && g0.bitfield.ymmword == g1.bitfield.ymmword
2284 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2285 return 1;
2286
2287 if (!(t0.bitfield.byte & t1.bitfield.byte)
2288 && !(t0.bitfield.word & t1.bitfield.word)
2289 && !(t0.bitfield.dword & t1.bitfield.dword)
2290 && !(t0.bitfield.qword & t1.bitfield.qword)
2291 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2292 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2293 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2294 return 1;
2295
2296 i.error = register_type_mismatch;
2297
2298 return 0;
2299 }
2300
2301 static INLINE unsigned int
2302 register_number (const reg_entry *r)
2303 {
2304 unsigned int nr = r->reg_num;
2305
2306 if (r->reg_flags & RegRex)
2307 nr += 8;
2308
2309 if (r->reg_flags & RegVRex)
2310 nr += 16;
2311
2312 return nr;
2313 }
2314
2315 static INLINE unsigned int
2316 mode_from_disp_size (i386_operand_type t)
2317 {
2318 if (t.bitfield.disp8)
2319 return 1;
2320 else if (t.bitfield.disp16
2321 || t.bitfield.disp32
2322 || t.bitfield.disp32s)
2323 return 2;
2324 else
2325 return 0;
2326 }
2327
2328 static INLINE int
2329 fits_in_signed_byte (addressT num)
2330 {
2331 return num + 0x80 <= 0xff;
2332 }
2333
2334 static INLINE int
2335 fits_in_unsigned_byte (addressT num)
2336 {
2337 return num <= 0xff;
2338 }
2339
2340 static INLINE int
2341 fits_in_unsigned_word (addressT num)
2342 {
2343 return num <= 0xffff;
2344 }
2345
2346 static INLINE int
2347 fits_in_signed_word (addressT num)
2348 {
2349 return num + 0x8000 <= 0xffff;
2350 }
2351
2352 static INLINE int
2353 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2354 {
2355 #ifndef BFD64
2356 return 1;
2357 #else
2358 return num + 0x80000000 <= 0xffffffff;
2359 #endif
2360 } /* fits_in_signed_long() */
2361
2362 static INLINE int
2363 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2364 {
2365 #ifndef BFD64
2366 return 1;
2367 #else
2368 return num <= 0xffffffff;
2369 #endif
2370 } /* fits_in_unsigned_long() */
2371
2372 static INLINE int
2373 fits_in_disp8 (offsetT num)
2374 {
2375 int shift = i.memshift;
2376 unsigned int mask;
2377
2378 if (shift == -1)
2379 abort ();
2380
2381 mask = (1 << shift) - 1;
2382
2383 /* Return 0 if NUM isn't properly aligned. */
2384 if ((num & mask))
2385 return 0;
2386
2387 /* Check if NUM will fit in 8bit after shift. */
2388 return fits_in_signed_byte (num >> shift);
2389 }
2390
2391 static INLINE int
2392 fits_in_imm4 (offsetT num)
2393 {
2394 return (num & 0xf) == num;
2395 }
2396
2397 static i386_operand_type
2398 smallest_imm_type (offsetT num)
2399 {
2400 i386_operand_type t;
2401
2402 operand_type_set (&t, 0);
2403 t.bitfield.imm64 = 1;
2404
2405 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2406 {
2407 /* This code is disabled on the 486 because all the Imm1 forms
2408 in the opcode table are slower on the i486. They're the
2409 versions with the implicitly specified single-position
2410 displacement, which has another syntax if you really want to
2411 use that form. */
2412 t.bitfield.imm1 = 1;
2413 t.bitfield.imm8 = 1;
2414 t.bitfield.imm8s = 1;
2415 t.bitfield.imm16 = 1;
2416 t.bitfield.imm32 = 1;
2417 t.bitfield.imm32s = 1;
2418 }
2419 else if (fits_in_signed_byte (num))
2420 {
2421 t.bitfield.imm8 = 1;
2422 t.bitfield.imm8s = 1;
2423 t.bitfield.imm16 = 1;
2424 t.bitfield.imm32 = 1;
2425 t.bitfield.imm32s = 1;
2426 }
2427 else if (fits_in_unsigned_byte (num))
2428 {
2429 t.bitfield.imm8 = 1;
2430 t.bitfield.imm16 = 1;
2431 t.bitfield.imm32 = 1;
2432 t.bitfield.imm32s = 1;
2433 }
2434 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2435 {
2436 t.bitfield.imm16 = 1;
2437 t.bitfield.imm32 = 1;
2438 t.bitfield.imm32s = 1;
2439 }
2440 else if (fits_in_signed_long (num))
2441 {
2442 t.bitfield.imm32 = 1;
2443 t.bitfield.imm32s = 1;
2444 }
2445 else if (fits_in_unsigned_long (num))
2446 t.bitfield.imm32 = 1;
2447
2448 return t;
2449 }
2450
2451 static offsetT
2452 offset_in_range (offsetT val, int size)
2453 {
2454 addressT mask;
2455
2456 switch (size)
2457 {
2458 case 1: mask = ((addressT) 1 << 8) - 1; break;
2459 case 2: mask = ((addressT) 1 << 16) - 1; break;
2460 case 4: mask = ((addressT) 2 << 31) - 1; break;
2461 #ifdef BFD64
2462 case 8: mask = ((addressT) 2 << 63) - 1; break;
2463 #endif
2464 default: abort ();
2465 }
2466
2467 #ifdef BFD64
2468 /* If BFD64, sign extend val for 32bit address mode. */
2469 if (flag_code != CODE_64BIT
2470 || i.prefix[ADDR_PREFIX])
2471 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2472 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2473 #endif
2474
2475 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2476 {
2477 char buf1[40], buf2[40];
2478
2479 sprint_value (buf1, val);
2480 sprint_value (buf2, val & mask);
2481 as_warn (_("%s shortened to %s"), buf1, buf2);
2482 }
2483 return val & mask;
2484 }
2485
2486 enum PREFIX_GROUP
2487 {
2488 PREFIX_EXIST = 0,
2489 PREFIX_LOCK,
2490 PREFIX_REP,
2491 PREFIX_DS,
2492 PREFIX_OTHER
2493 };
2494
2495 /* Returns
2496 a. PREFIX_EXIST if attempting to add a prefix where one from the
2497 same class already exists.
2498 b. PREFIX_LOCK if lock prefix is added.
2499 c. PREFIX_REP if rep/repne prefix is added.
2500 d. PREFIX_DS if ds prefix is added.
2501 e. PREFIX_OTHER if other prefix is added.
2502 */
2503
2504 static enum PREFIX_GROUP
2505 add_prefix (unsigned int prefix)
2506 {
2507 enum PREFIX_GROUP ret = PREFIX_OTHER;
2508 unsigned int q;
2509
2510 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2511 && flag_code == CODE_64BIT)
2512 {
2513 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2514 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2515 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2516 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2517 ret = PREFIX_EXIST;
2518 q = REX_PREFIX;
2519 }
2520 else
2521 {
2522 switch (prefix)
2523 {
2524 default:
2525 abort ();
2526
2527 case DS_PREFIX_OPCODE:
2528 ret = PREFIX_DS;
2529 /* Fall through. */
2530 case CS_PREFIX_OPCODE:
2531 case ES_PREFIX_OPCODE:
2532 case FS_PREFIX_OPCODE:
2533 case GS_PREFIX_OPCODE:
2534 case SS_PREFIX_OPCODE:
2535 q = SEG_PREFIX;
2536 break;
2537
2538 case REPNE_PREFIX_OPCODE:
2539 case REPE_PREFIX_OPCODE:
2540 q = REP_PREFIX;
2541 ret = PREFIX_REP;
2542 break;
2543
2544 case LOCK_PREFIX_OPCODE:
2545 q = LOCK_PREFIX;
2546 ret = PREFIX_LOCK;
2547 break;
2548
2549 case FWAIT_OPCODE:
2550 q = WAIT_PREFIX;
2551 break;
2552
2553 case ADDR_PREFIX_OPCODE:
2554 q = ADDR_PREFIX;
2555 break;
2556
2557 case DATA_PREFIX_OPCODE:
2558 q = DATA_PREFIX;
2559 break;
2560 }
2561 if (i.prefix[q] != 0)
2562 ret = PREFIX_EXIST;
2563 }
2564
2565 if (ret)
2566 {
2567 if (!i.prefix[q])
2568 ++i.prefixes;
2569 i.prefix[q] |= prefix;
2570 }
2571 else
2572 as_bad (_("same type of prefix used twice"));
2573
2574 return ret;
2575 }
2576
2577 static void
2578 update_code_flag (int value, int check)
2579 {
2580 PRINTF_LIKE ((*as_error));
2581
2582 flag_code = (enum flag_code) value;
2583 if (flag_code == CODE_64BIT)
2584 {
2585 cpu_arch_flags.bitfield.cpu64 = 1;
2586 cpu_arch_flags.bitfield.cpuno64 = 0;
2587 }
2588 else
2589 {
2590 cpu_arch_flags.bitfield.cpu64 = 0;
2591 cpu_arch_flags.bitfield.cpuno64 = 1;
2592 }
2593 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2594 {
2595 if (check)
2596 as_error = as_fatal;
2597 else
2598 as_error = as_bad;
2599 (*as_error) (_("64bit mode not supported on `%s'."),
2600 cpu_arch_name ? cpu_arch_name : default_arch);
2601 }
2602 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2603 {
2604 if (check)
2605 as_error = as_fatal;
2606 else
2607 as_error = as_bad;
2608 (*as_error) (_("32bit mode not supported on `%s'."),
2609 cpu_arch_name ? cpu_arch_name : default_arch);
2610 }
2611 stackop_size = '\0';
2612 }
2613
2614 static void
2615 set_code_flag (int value)
2616 {
2617 update_code_flag (value, 0);
2618 }
2619
2620 static void
2621 set_16bit_gcc_code_flag (int new_code_flag)
2622 {
2623 flag_code = (enum flag_code) new_code_flag;
2624 if (flag_code != CODE_16BIT)
2625 abort ();
2626 cpu_arch_flags.bitfield.cpu64 = 0;
2627 cpu_arch_flags.bitfield.cpuno64 = 1;
2628 stackop_size = LONG_MNEM_SUFFIX;
2629 }
2630
2631 static void
2632 set_intel_syntax (int syntax_flag)
2633 {
2634 /* Find out if register prefixing is specified. */
2635 int ask_naked_reg = 0;
2636
2637 SKIP_WHITESPACE ();
2638 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2639 {
2640 char *string;
2641 int e = get_symbol_name (&string);
2642
2643 if (strcmp (string, "prefix") == 0)
2644 ask_naked_reg = 1;
2645 else if (strcmp (string, "noprefix") == 0)
2646 ask_naked_reg = -1;
2647 else
2648 as_bad (_("bad argument to syntax directive."));
2649 (void) restore_line_pointer (e);
2650 }
2651 demand_empty_rest_of_line ();
2652
2653 intel_syntax = syntax_flag;
2654
2655 if (ask_naked_reg == 0)
2656 allow_naked_reg = (intel_syntax
2657 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2658 else
2659 allow_naked_reg = (ask_naked_reg < 0);
2660
2661 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2662
2663 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2664 identifier_chars['$'] = intel_syntax ? '$' : 0;
2665 register_prefix = allow_naked_reg ? "" : "%";
2666 }
2667
2668 static void
2669 set_intel_mnemonic (int mnemonic_flag)
2670 {
2671 intel_mnemonic = mnemonic_flag;
2672 }
2673
2674 static void
2675 set_allow_index_reg (int flag)
2676 {
2677 allow_index_reg = flag;
2678 }
2679
2680 static void
2681 set_check (int what)
2682 {
2683 enum check_kind *kind;
2684 const char *str;
2685
2686 if (what)
2687 {
2688 kind = &operand_check;
2689 str = "operand";
2690 }
2691 else
2692 {
2693 kind = &sse_check;
2694 str = "sse";
2695 }
2696
2697 SKIP_WHITESPACE ();
2698
2699 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2700 {
2701 char *string;
2702 int e = get_symbol_name (&string);
2703
2704 if (strcmp (string, "none") == 0)
2705 *kind = check_none;
2706 else if (strcmp (string, "warning") == 0)
2707 *kind = check_warning;
2708 else if (strcmp (string, "error") == 0)
2709 *kind = check_error;
2710 else
2711 as_bad (_("bad argument to %s_check directive."), str);
2712 (void) restore_line_pointer (e);
2713 }
2714 else
2715 as_bad (_("missing argument for %s_check directive"), str);
2716
2717 demand_empty_rest_of_line ();
2718 }
2719
2720 static void
2721 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2722 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2723 {
2724 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2725 static const char *arch;
2726
2727 /* Intel LIOM is only supported on ELF. */
2728 if (!IS_ELF)
2729 return;
2730
2731 if (!arch)
2732 {
2733 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2734 use default_arch. */
2735 arch = cpu_arch_name;
2736 if (!arch)
2737 arch = default_arch;
2738 }
2739
2740 /* If we are targeting Intel MCU, we must enable it. */
2741 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2742 || new_flag.bitfield.cpuiamcu)
2743 return;
2744
2745 /* If we are targeting Intel L1OM, we must enable it. */
2746 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2747 || new_flag.bitfield.cpul1om)
2748 return;
2749
2750 /* If we are targeting Intel K1OM, we must enable it. */
2751 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2752 || new_flag.bitfield.cpuk1om)
2753 return;
2754
2755 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2756 #endif
2757 }
2758
2759 static void
2760 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2761 {
2762 SKIP_WHITESPACE ();
2763
2764 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2765 {
2766 char *string;
2767 int e = get_symbol_name (&string);
2768 unsigned int j;
2769 i386_cpu_flags flags;
2770
2771 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2772 {
2773 if (strcmp (string, cpu_arch[j].name) == 0)
2774 {
2775 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2776
2777 if (*string != '.')
2778 {
2779 cpu_arch_name = cpu_arch[j].name;
2780 cpu_sub_arch_name = NULL;
2781 cpu_arch_flags = cpu_arch[j].flags;
2782 if (flag_code == CODE_64BIT)
2783 {
2784 cpu_arch_flags.bitfield.cpu64 = 1;
2785 cpu_arch_flags.bitfield.cpuno64 = 0;
2786 }
2787 else
2788 {
2789 cpu_arch_flags.bitfield.cpu64 = 0;
2790 cpu_arch_flags.bitfield.cpuno64 = 1;
2791 }
2792 cpu_arch_isa = cpu_arch[j].type;
2793 cpu_arch_isa_flags = cpu_arch[j].flags;
2794 if (!cpu_arch_tune_set)
2795 {
2796 cpu_arch_tune = cpu_arch_isa;
2797 cpu_arch_tune_flags = cpu_arch_isa_flags;
2798 }
2799 break;
2800 }
2801
2802 flags = cpu_flags_or (cpu_arch_flags,
2803 cpu_arch[j].flags);
2804
2805 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2806 {
2807 if (cpu_sub_arch_name)
2808 {
2809 char *name = cpu_sub_arch_name;
2810 cpu_sub_arch_name = concat (name,
2811 cpu_arch[j].name,
2812 (const char *) NULL);
2813 free (name);
2814 }
2815 else
2816 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2817 cpu_arch_flags = flags;
2818 cpu_arch_isa_flags = flags;
2819 }
2820 else
2821 cpu_arch_isa_flags
2822 = cpu_flags_or (cpu_arch_isa_flags,
2823 cpu_arch[j].flags);
2824 (void) restore_line_pointer (e);
2825 demand_empty_rest_of_line ();
2826 return;
2827 }
2828 }
2829
2830 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2831 {
2832 /* Disable an ISA extension. */
2833 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2834 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2835 {
2836 flags = cpu_flags_and_not (cpu_arch_flags,
2837 cpu_noarch[j].flags);
2838 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2839 {
2840 if (cpu_sub_arch_name)
2841 {
2842 char *name = cpu_sub_arch_name;
2843 cpu_sub_arch_name = concat (name, string,
2844 (const char *) NULL);
2845 free (name);
2846 }
2847 else
2848 cpu_sub_arch_name = xstrdup (string);
2849 cpu_arch_flags = flags;
2850 cpu_arch_isa_flags = flags;
2851 }
2852 (void) restore_line_pointer (e);
2853 demand_empty_rest_of_line ();
2854 return;
2855 }
2856
2857 j = ARRAY_SIZE (cpu_arch);
2858 }
2859
2860 if (j >= ARRAY_SIZE (cpu_arch))
2861 as_bad (_("no such architecture: `%s'"), string);
2862
2863 *input_line_pointer = e;
2864 }
2865 else
2866 as_bad (_("missing cpu architecture"));
2867
2868 no_cond_jump_promotion = 0;
2869 if (*input_line_pointer == ','
2870 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2871 {
2872 char *string;
2873 char e;
2874
2875 ++input_line_pointer;
2876 e = get_symbol_name (&string);
2877
2878 if (strcmp (string, "nojumps") == 0)
2879 no_cond_jump_promotion = 1;
2880 else if (strcmp (string, "jumps") == 0)
2881 ;
2882 else
2883 as_bad (_("no such architecture modifier: `%s'"), string);
2884
2885 (void) restore_line_pointer (e);
2886 }
2887
2888 demand_empty_rest_of_line ();
2889 }
2890
2891 enum bfd_architecture
2892 i386_arch (void)
2893 {
2894 if (cpu_arch_isa == PROCESSOR_L1OM)
2895 {
2896 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2897 || flag_code != CODE_64BIT)
2898 as_fatal (_("Intel L1OM is 64bit ELF only"));
2899 return bfd_arch_l1om;
2900 }
2901 else if (cpu_arch_isa == PROCESSOR_K1OM)
2902 {
2903 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2904 || flag_code != CODE_64BIT)
2905 as_fatal (_("Intel K1OM is 64bit ELF only"));
2906 return bfd_arch_k1om;
2907 }
2908 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2909 {
2910 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2911 || flag_code == CODE_64BIT)
2912 as_fatal (_("Intel MCU is 32bit ELF only"));
2913 return bfd_arch_iamcu;
2914 }
2915 else
2916 return bfd_arch_i386;
2917 }
2918
2919 unsigned long
2920 i386_mach (void)
2921 {
2922 if (!strncmp (default_arch, "x86_64", 6))
2923 {
2924 if (cpu_arch_isa == PROCESSOR_L1OM)
2925 {
2926 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2927 || default_arch[6] != '\0')
2928 as_fatal (_("Intel L1OM is 64bit ELF only"));
2929 return bfd_mach_l1om;
2930 }
2931 else if (cpu_arch_isa == PROCESSOR_K1OM)
2932 {
2933 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2934 || default_arch[6] != '\0')
2935 as_fatal (_("Intel K1OM is 64bit ELF only"));
2936 return bfd_mach_k1om;
2937 }
2938 else if (default_arch[6] == '\0')
2939 return bfd_mach_x86_64;
2940 else
2941 return bfd_mach_x64_32;
2942 }
2943 else if (!strcmp (default_arch, "i386")
2944 || !strcmp (default_arch, "iamcu"))
2945 {
2946 if (cpu_arch_isa == PROCESSOR_IAMCU)
2947 {
2948 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2949 as_fatal (_("Intel MCU is 32bit ELF only"));
2950 return bfd_mach_i386_iamcu;
2951 }
2952 else
2953 return bfd_mach_i386_i386;
2954 }
2955 else
2956 as_fatal (_("unknown architecture"));
2957 }
2958 \f
2959 void
2960 md_begin (void)
2961 {
2962 const char *hash_err;
2963
2964 /* Support pseudo prefixes like {disp32}. */
2965 lex_type ['{'] = LEX_BEGIN_NAME;
2966
2967 /* Initialize op_hash hash table. */
2968 op_hash = hash_new ();
2969
2970 {
2971 const insn_template *optab;
2972 templates *core_optab;
2973
2974 /* Setup for loop. */
2975 optab = i386_optab;
2976 core_optab = XNEW (templates);
2977 core_optab->start = optab;
2978
2979 while (1)
2980 {
2981 ++optab;
2982 if (optab->name == NULL
2983 || strcmp (optab->name, (optab - 1)->name) != 0)
2984 {
2985 /* different name --> ship out current template list;
2986 add to hash table; & begin anew. */
2987 core_optab->end = optab;
2988 hash_err = hash_insert (op_hash,
2989 (optab - 1)->name,
2990 (void *) core_optab);
2991 if (hash_err)
2992 {
2993 as_fatal (_("can't hash %s: %s"),
2994 (optab - 1)->name,
2995 hash_err);
2996 }
2997 if (optab->name == NULL)
2998 break;
2999 core_optab = XNEW (templates);
3000 core_optab->start = optab;
3001 }
3002 }
3003 }
3004
3005 /* Initialize reg_hash hash table. */
3006 reg_hash = hash_new ();
3007 {
3008 const reg_entry *regtab;
3009 unsigned int regtab_size = i386_regtab_size;
3010
3011 for (regtab = i386_regtab; regtab_size--; regtab++)
3012 {
3013 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3014 if (hash_err)
3015 as_fatal (_("can't hash %s: %s"),
3016 regtab->reg_name,
3017 hash_err);
3018 }
3019 }
3020
3021 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3022 {
3023 int c;
3024 char *p;
3025
3026 for (c = 0; c < 256; c++)
3027 {
3028 if (ISDIGIT (c))
3029 {
3030 digit_chars[c] = c;
3031 mnemonic_chars[c] = c;
3032 register_chars[c] = c;
3033 operand_chars[c] = c;
3034 }
3035 else if (ISLOWER (c))
3036 {
3037 mnemonic_chars[c] = c;
3038 register_chars[c] = c;
3039 operand_chars[c] = c;
3040 }
3041 else if (ISUPPER (c))
3042 {
3043 mnemonic_chars[c] = TOLOWER (c);
3044 register_chars[c] = mnemonic_chars[c];
3045 operand_chars[c] = c;
3046 }
3047 else if (c == '{' || c == '}')
3048 {
3049 mnemonic_chars[c] = c;
3050 operand_chars[c] = c;
3051 }
3052
3053 if (ISALPHA (c) || ISDIGIT (c))
3054 identifier_chars[c] = c;
3055 else if (c >= 128)
3056 {
3057 identifier_chars[c] = c;
3058 operand_chars[c] = c;
3059 }
3060 }
3061
3062 #ifdef LEX_AT
3063 identifier_chars['@'] = '@';
3064 #endif
3065 #ifdef LEX_QM
3066 identifier_chars['?'] = '?';
3067 operand_chars['?'] = '?';
3068 #endif
3069 digit_chars['-'] = '-';
3070 mnemonic_chars['_'] = '_';
3071 mnemonic_chars['-'] = '-';
3072 mnemonic_chars['.'] = '.';
3073 identifier_chars['_'] = '_';
3074 identifier_chars['.'] = '.';
3075
3076 for (p = operand_special_chars; *p != '\0'; p++)
3077 operand_chars[(unsigned char) *p] = *p;
3078 }
3079
3080 if (flag_code == CODE_64BIT)
3081 {
3082 #if defined (OBJ_COFF) && defined (TE_PE)
3083 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3084 ? 32 : 16);
3085 #else
3086 x86_dwarf2_return_column = 16;
3087 #endif
3088 x86_cie_data_alignment = -8;
3089 }
3090 else
3091 {
3092 x86_dwarf2_return_column = 8;
3093 x86_cie_data_alignment = -4;
3094 }
3095
3096 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3097 can be turned into BRANCH_PREFIX frag. */
3098 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3099 abort ();
3100 }
3101
3102 void
3103 i386_print_statistics (FILE *file)
3104 {
3105 hash_print_statistics (file, "i386 opcode", op_hash);
3106 hash_print_statistics (file, "i386 register", reg_hash);
3107 }
3108 \f
3109 #ifdef DEBUG386
3110
3111 /* Debugging routines for md_assemble. */
3112 static void pte (insn_template *);
3113 static void pt (i386_operand_type);
3114 static void pe (expressionS *);
3115 static void ps (symbolS *);
3116
3117 static void
3118 pi (const char *line, i386_insn *x)
3119 {
3120 unsigned int j;
3121
3122 fprintf (stdout, "%s: template ", line);
3123 pte (&x->tm);
3124 fprintf (stdout, " address: base %s index %s scale %x\n",
3125 x->base_reg ? x->base_reg->reg_name : "none",
3126 x->index_reg ? x->index_reg->reg_name : "none",
3127 x->log2_scale_factor);
3128 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3129 x->rm.mode, x->rm.reg, x->rm.regmem);
3130 fprintf (stdout, " sib: base %x index %x scale %x\n",
3131 x->sib.base, x->sib.index, x->sib.scale);
3132 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3133 (x->rex & REX_W) != 0,
3134 (x->rex & REX_R) != 0,
3135 (x->rex & REX_X) != 0,
3136 (x->rex & REX_B) != 0);
3137 for (j = 0; j < x->operands; j++)
3138 {
3139 fprintf (stdout, " #%d: ", j + 1);
3140 pt (x->types[j]);
3141 fprintf (stdout, "\n");
3142 if (x->types[j].bitfield.class == Reg
3143 || x->types[j].bitfield.class == RegMMX
3144 || x->types[j].bitfield.class == RegSIMD
3145 || x->types[j].bitfield.class == SReg
3146 || x->types[j].bitfield.class == RegCR
3147 || x->types[j].bitfield.class == RegDR
3148 || x->types[j].bitfield.class == RegTR)
3149 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3150 if (operand_type_check (x->types[j], imm))
3151 pe (x->op[j].imms);
3152 if (operand_type_check (x->types[j], disp))
3153 pe (x->op[j].disps);
3154 }
3155 }
3156
3157 static void
3158 pte (insn_template *t)
3159 {
3160 unsigned int j;
3161 fprintf (stdout, " %d operands ", t->operands);
3162 fprintf (stdout, "opcode %x ", t->base_opcode);
3163 if (t->extension_opcode != None)
3164 fprintf (stdout, "ext %x ", t->extension_opcode);
3165 if (t->opcode_modifier.d)
3166 fprintf (stdout, "D");
3167 if (t->opcode_modifier.w)
3168 fprintf (stdout, "W");
3169 fprintf (stdout, "\n");
3170 for (j = 0; j < t->operands; j++)
3171 {
3172 fprintf (stdout, " #%d type ", j + 1);
3173 pt (t->operand_types[j]);
3174 fprintf (stdout, "\n");
3175 }
3176 }
3177
3178 static void
3179 pe (expressionS *e)
3180 {
3181 fprintf (stdout, " operation %d\n", e->X_op);
3182 fprintf (stdout, " add_number %ld (%lx)\n",
3183 (long) e->X_add_number, (long) e->X_add_number);
3184 if (e->X_add_symbol)
3185 {
3186 fprintf (stdout, " add_symbol ");
3187 ps (e->X_add_symbol);
3188 fprintf (stdout, "\n");
3189 }
3190 if (e->X_op_symbol)
3191 {
3192 fprintf (stdout, " op_symbol ");
3193 ps (e->X_op_symbol);
3194 fprintf (stdout, "\n");
3195 }
3196 }
3197
3198 static void
3199 ps (symbolS *s)
3200 {
3201 fprintf (stdout, "%s type %s%s",
3202 S_GET_NAME (s),
3203 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3204 segment_name (S_GET_SEGMENT (s)));
3205 }
3206
3207 static struct type_name
3208 {
3209 i386_operand_type mask;
3210 const char *name;
3211 }
3212 const type_names[] =
3213 {
3214 { OPERAND_TYPE_REG8, "r8" },
3215 { OPERAND_TYPE_REG16, "r16" },
3216 { OPERAND_TYPE_REG32, "r32" },
3217 { OPERAND_TYPE_REG64, "r64" },
3218 { OPERAND_TYPE_ACC8, "acc8" },
3219 { OPERAND_TYPE_ACC16, "acc16" },
3220 { OPERAND_TYPE_ACC32, "acc32" },
3221 { OPERAND_TYPE_ACC64, "acc64" },
3222 { OPERAND_TYPE_IMM8, "i8" },
3223 { OPERAND_TYPE_IMM8, "i8s" },
3224 { OPERAND_TYPE_IMM16, "i16" },
3225 { OPERAND_TYPE_IMM32, "i32" },
3226 { OPERAND_TYPE_IMM32S, "i32s" },
3227 { OPERAND_TYPE_IMM64, "i64" },
3228 { OPERAND_TYPE_IMM1, "i1" },
3229 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3230 { OPERAND_TYPE_DISP8, "d8" },
3231 { OPERAND_TYPE_DISP16, "d16" },
3232 { OPERAND_TYPE_DISP32, "d32" },
3233 { OPERAND_TYPE_DISP32S, "d32s" },
3234 { OPERAND_TYPE_DISP64, "d64" },
3235 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3236 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3237 { OPERAND_TYPE_CONTROL, "control reg" },
3238 { OPERAND_TYPE_TEST, "test reg" },
3239 { OPERAND_TYPE_DEBUG, "debug reg" },
3240 { OPERAND_TYPE_FLOATREG, "FReg" },
3241 { OPERAND_TYPE_FLOATACC, "FAcc" },
3242 { OPERAND_TYPE_SREG, "SReg" },
3243 { OPERAND_TYPE_REGMMX, "rMMX" },
3244 { OPERAND_TYPE_REGXMM, "rXMM" },
3245 { OPERAND_TYPE_REGYMM, "rYMM" },
3246 { OPERAND_TYPE_REGZMM, "rZMM" },
3247 { OPERAND_TYPE_REGMASK, "Mask reg" },
3248 };
3249
3250 static void
3251 pt (i386_operand_type t)
3252 {
3253 unsigned int j;
3254 i386_operand_type a;
3255
3256 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3257 {
3258 a = operand_type_and (t, type_names[j].mask);
3259 if (operand_type_equal (&a, &type_names[j].mask))
3260 fprintf (stdout, "%s, ", type_names[j].name);
3261 }
3262 fflush (stdout);
3263 }
3264
3265 #endif /* DEBUG386 */
3266 \f
3267 static bfd_reloc_code_real_type
3268 reloc (unsigned int size,
3269 int pcrel,
3270 int sign,
3271 bfd_reloc_code_real_type other)
3272 {
3273 if (other != NO_RELOC)
3274 {
3275 reloc_howto_type *rel;
3276
3277 if (size == 8)
3278 switch (other)
3279 {
3280 case BFD_RELOC_X86_64_GOT32:
3281 return BFD_RELOC_X86_64_GOT64;
3282 break;
3283 case BFD_RELOC_X86_64_GOTPLT64:
3284 return BFD_RELOC_X86_64_GOTPLT64;
3285 break;
3286 case BFD_RELOC_X86_64_PLTOFF64:
3287 return BFD_RELOC_X86_64_PLTOFF64;
3288 break;
3289 case BFD_RELOC_X86_64_GOTPC32:
3290 other = BFD_RELOC_X86_64_GOTPC64;
3291 break;
3292 case BFD_RELOC_X86_64_GOTPCREL:
3293 other = BFD_RELOC_X86_64_GOTPCREL64;
3294 break;
3295 case BFD_RELOC_X86_64_TPOFF32:
3296 other = BFD_RELOC_X86_64_TPOFF64;
3297 break;
3298 case BFD_RELOC_X86_64_DTPOFF32:
3299 other = BFD_RELOC_X86_64_DTPOFF64;
3300 break;
3301 default:
3302 break;
3303 }
3304
3305 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3306 if (other == BFD_RELOC_SIZE32)
3307 {
3308 if (size == 8)
3309 other = BFD_RELOC_SIZE64;
3310 if (pcrel)
3311 {
3312 as_bad (_("there are no pc-relative size relocations"));
3313 return NO_RELOC;
3314 }
3315 }
3316 #endif
3317
3318 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3319 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3320 sign = -1;
3321
3322 rel = bfd_reloc_type_lookup (stdoutput, other);
3323 if (!rel)
3324 as_bad (_("unknown relocation (%u)"), other);
3325 else if (size != bfd_get_reloc_size (rel))
3326 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3327 bfd_get_reloc_size (rel),
3328 size);
3329 else if (pcrel && !rel->pc_relative)
3330 as_bad (_("non-pc-relative relocation for pc-relative field"));
3331 else if ((rel->complain_on_overflow == complain_overflow_signed
3332 && !sign)
3333 || (rel->complain_on_overflow == complain_overflow_unsigned
3334 && sign > 0))
3335 as_bad (_("relocated field and relocation type differ in signedness"));
3336 else
3337 return other;
3338 return NO_RELOC;
3339 }
3340
3341 if (pcrel)
3342 {
3343 if (!sign)
3344 as_bad (_("there are no unsigned pc-relative relocations"));
3345 switch (size)
3346 {
3347 case 1: return BFD_RELOC_8_PCREL;
3348 case 2: return BFD_RELOC_16_PCREL;
3349 case 4: return BFD_RELOC_32_PCREL;
3350 case 8: return BFD_RELOC_64_PCREL;
3351 }
3352 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3353 }
3354 else
3355 {
3356 if (sign > 0)
3357 switch (size)
3358 {
3359 case 4: return BFD_RELOC_X86_64_32S;
3360 }
3361 else
3362 switch (size)
3363 {
3364 case 1: return BFD_RELOC_8;
3365 case 2: return BFD_RELOC_16;
3366 case 4: return BFD_RELOC_32;
3367 case 8: return BFD_RELOC_64;
3368 }
3369 as_bad (_("cannot do %s %u byte relocation"),
3370 sign > 0 ? "signed" : "unsigned", size);
3371 }
3372
3373 return NO_RELOC;
3374 }
3375
3376 /* Here we decide which fixups can be adjusted to make them relative to
3377 the beginning of the section instead of the symbol. Basically we need
3378 to make sure that the dynamic relocations are done correctly, so in
3379 some cases we force the original symbol to be used. */
3380
3381 int
3382 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3383 {
3384 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3385 if (!IS_ELF)
3386 return 1;
3387
3388 /* Don't adjust pc-relative references to merge sections in 64-bit
3389 mode. */
3390 if (use_rela_relocations
3391 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3392 && fixP->fx_pcrel)
3393 return 0;
3394
3395 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3396 and changed later by validate_fix. */
3397 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3398 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3399 return 0;
3400
3401 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3402 for size relocations. */
3403 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3404 || fixP->fx_r_type == BFD_RELOC_SIZE64
3405 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3406 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3407 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3408 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3409 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3410 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3411 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3412 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3413 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3414 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3415 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3416 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3417 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3418 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3419 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3420 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3421 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3422 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3423 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3424 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3425 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3426 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3427 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3428 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3429 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3430 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3431 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3432 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3433 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3434 return 0;
3435 #endif
3436 return 1;
3437 }
3438
3439 static int
3440 intel_float_operand (const char *mnemonic)
3441 {
3442 /* Note that the value returned is meaningful only for opcodes with (memory)
3443 operands, hence the code here is free to improperly handle opcodes that
3444 have no operands (for better performance and smaller code). */
3445
3446 if (mnemonic[0] != 'f')
3447 return 0; /* non-math */
3448
3449 switch (mnemonic[1])
3450 {
3451 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3452 the fs segment override prefix not currently handled because no
3453 call path can make opcodes without operands get here */
3454 case 'i':
3455 return 2 /* integer op */;
3456 case 'l':
3457 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3458 return 3; /* fldcw/fldenv */
3459 break;
3460 case 'n':
3461 if (mnemonic[2] != 'o' /* fnop */)
3462 return 3; /* non-waiting control op */
3463 break;
3464 case 'r':
3465 if (mnemonic[2] == 's')
3466 return 3; /* frstor/frstpm */
3467 break;
3468 case 's':
3469 if (mnemonic[2] == 'a')
3470 return 3; /* fsave */
3471 if (mnemonic[2] == 't')
3472 {
3473 switch (mnemonic[3])
3474 {
3475 case 'c': /* fstcw */
3476 case 'd': /* fstdw */
3477 case 'e': /* fstenv */
3478 case 's': /* fsts[gw] */
3479 return 3;
3480 }
3481 }
3482 break;
3483 case 'x':
3484 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3485 return 0; /* fxsave/fxrstor are not really math ops */
3486 break;
3487 }
3488
3489 return 1;
3490 }
3491
3492 /* Build the VEX prefix. */
3493
3494 static void
3495 build_vex_prefix (const insn_template *t)
3496 {
3497 unsigned int register_specifier;
3498 unsigned int implied_prefix;
3499 unsigned int vector_length;
3500 unsigned int w;
3501
3502 /* Check register specifier. */
3503 if (i.vex.register_specifier)
3504 {
3505 register_specifier =
3506 ~register_number (i.vex.register_specifier) & 0xf;
3507 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3508 }
3509 else
3510 register_specifier = 0xf;
3511
3512 /* Use 2-byte VEX prefix by swapping destination and source operand
3513 if there are more than 1 register operand. */
3514 if (i.reg_operands > 1
3515 && i.vec_encoding != vex_encoding_vex3
3516 && i.dir_encoding == dir_encoding_default
3517 && i.operands == i.reg_operands
3518 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3519 && i.tm.opcode_modifier.vexopcode == VEX0F
3520 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3521 && i.rex == REX_B)
3522 {
3523 unsigned int xchg = i.operands - 1;
3524 union i386_op temp_op;
3525 i386_operand_type temp_type;
3526
3527 temp_type = i.types[xchg];
3528 i.types[xchg] = i.types[0];
3529 i.types[0] = temp_type;
3530 temp_op = i.op[xchg];
3531 i.op[xchg] = i.op[0];
3532 i.op[0] = temp_op;
3533
3534 gas_assert (i.rm.mode == 3);
3535
3536 i.rex = REX_R;
3537 xchg = i.rm.regmem;
3538 i.rm.regmem = i.rm.reg;
3539 i.rm.reg = xchg;
3540
3541 if (i.tm.opcode_modifier.d)
3542 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3543 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3544 else /* Use the next insn. */
3545 i.tm = t[1];
3546 }
3547
3548 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3549 are no memory operands and at least 3 register ones. */
3550 if (i.reg_operands >= 3
3551 && i.vec_encoding != vex_encoding_vex3
3552 && i.reg_operands == i.operands - i.imm_operands
3553 && i.tm.opcode_modifier.vex
3554 && i.tm.opcode_modifier.commutative
3555 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3556 && i.rex == REX_B
3557 && i.vex.register_specifier
3558 && !(i.vex.register_specifier->reg_flags & RegRex))
3559 {
3560 unsigned int xchg = i.operands - i.reg_operands;
3561 union i386_op temp_op;
3562 i386_operand_type temp_type;
3563
3564 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3565 gas_assert (!i.tm.opcode_modifier.sae);
3566 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3567 &i.types[i.operands - 3]));
3568 gas_assert (i.rm.mode == 3);
3569
3570 temp_type = i.types[xchg];
3571 i.types[xchg] = i.types[xchg + 1];
3572 i.types[xchg + 1] = temp_type;
3573 temp_op = i.op[xchg];
3574 i.op[xchg] = i.op[xchg + 1];
3575 i.op[xchg + 1] = temp_op;
3576
3577 i.rex = 0;
3578 xchg = i.rm.regmem | 8;
3579 i.rm.regmem = ~register_specifier & 0xf;
3580 gas_assert (!(i.rm.regmem & 8));
3581 i.vex.register_specifier += xchg - i.rm.regmem;
3582 register_specifier = ~xchg & 0xf;
3583 }
3584
3585 if (i.tm.opcode_modifier.vex == VEXScalar)
3586 vector_length = avxscalar;
3587 else if (i.tm.opcode_modifier.vex == VEX256)
3588 vector_length = 1;
3589 else
3590 {
3591 unsigned int op;
3592
3593 /* Determine vector length from the last multi-length vector
3594 operand. */
3595 vector_length = 0;
3596 for (op = t->operands; op--;)
3597 if (t->operand_types[op].bitfield.xmmword
3598 && t->operand_types[op].bitfield.ymmword
3599 && i.types[op].bitfield.ymmword)
3600 {
3601 vector_length = 1;
3602 break;
3603 }
3604 }
3605
3606 switch ((i.tm.base_opcode >> 8) & 0xff)
3607 {
3608 case 0:
3609 implied_prefix = 0;
3610 break;
3611 case DATA_PREFIX_OPCODE:
3612 implied_prefix = 1;
3613 break;
3614 case REPE_PREFIX_OPCODE:
3615 implied_prefix = 2;
3616 break;
3617 case REPNE_PREFIX_OPCODE:
3618 implied_prefix = 3;
3619 break;
3620 default:
3621 abort ();
3622 }
3623
3624 /* Check the REX.W bit and VEXW. */
3625 if (i.tm.opcode_modifier.vexw == VEXWIG)
3626 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3627 else if (i.tm.opcode_modifier.vexw)
3628 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3629 else
3630 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3631
3632 /* Use 2-byte VEX prefix if possible. */
3633 if (w == 0
3634 && i.vec_encoding != vex_encoding_vex3
3635 && i.tm.opcode_modifier.vexopcode == VEX0F
3636 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3637 {
3638 /* 2-byte VEX prefix. */
3639 unsigned int r;
3640
3641 i.vex.length = 2;
3642 i.vex.bytes[0] = 0xc5;
3643
3644 /* Check the REX.R bit. */
3645 r = (i.rex & REX_R) ? 0 : 1;
3646 i.vex.bytes[1] = (r << 7
3647 | register_specifier << 3
3648 | vector_length << 2
3649 | implied_prefix);
3650 }
3651 else
3652 {
3653 /* 3-byte VEX prefix. */
3654 unsigned int m;
3655
3656 i.vex.length = 3;
3657
3658 switch (i.tm.opcode_modifier.vexopcode)
3659 {
3660 case VEX0F:
3661 m = 0x1;
3662 i.vex.bytes[0] = 0xc4;
3663 break;
3664 case VEX0F38:
3665 m = 0x2;
3666 i.vex.bytes[0] = 0xc4;
3667 break;
3668 case VEX0F3A:
3669 m = 0x3;
3670 i.vex.bytes[0] = 0xc4;
3671 break;
3672 case XOP08:
3673 m = 0x8;
3674 i.vex.bytes[0] = 0x8f;
3675 break;
3676 case XOP09:
3677 m = 0x9;
3678 i.vex.bytes[0] = 0x8f;
3679 break;
3680 case XOP0A:
3681 m = 0xa;
3682 i.vex.bytes[0] = 0x8f;
3683 break;
3684 default:
3685 abort ();
3686 }
3687
3688 /* The high 3 bits of the second VEX byte are 1's compliment
3689 of RXB bits from REX. */
3690 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3691
3692 i.vex.bytes[2] = (w << 7
3693 | register_specifier << 3
3694 | vector_length << 2
3695 | implied_prefix);
3696 }
3697 }
3698
3699 static INLINE bfd_boolean
3700 is_evex_encoding (const insn_template *t)
3701 {
3702 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3703 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3704 || t->opcode_modifier.sae;
3705 }
3706
3707 static INLINE bfd_boolean
3708 is_any_vex_encoding (const insn_template *t)
3709 {
3710 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3711 || is_evex_encoding (t);
3712 }
3713
3714 /* Build the EVEX prefix. */
3715
3716 static void
3717 build_evex_prefix (void)
3718 {
3719 unsigned int register_specifier;
3720 unsigned int implied_prefix;
3721 unsigned int m, w;
3722 rex_byte vrex_used = 0;
3723
3724 /* Check register specifier. */
3725 if (i.vex.register_specifier)
3726 {
3727 gas_assert ((i.vrex & REX_X) == 0);
3728
3729 register_specifier = i.vex.register_specifier->reg_num;
3730 if ((i.vex.register_specifier->reg_flags & RegRex))
3731 register_specifier += 8;
3732 /* The upper 16 registers are encoded in the fourth byte of the
3733 EVEX prefix. */
3734 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3735 i.vex.bytes[3] = 0x8;
3736 register_specifier = ~register_specifier & 0xf;
3737 }
3738 else
3739 {
3740 register_specifier = 0xf;
3741
3742 /* Encode upper 16 vector index register in the fourth byte of
3743 the EVEX prefix. */
3744 if (!(i.vrex & REX_X))
3745 i.vex.bytes[3] = 0x8;
3746 else
3747 vrex_used |= REX_X;
3748 }
3749
3750 switch ((i.tm.base_opcode >> 8) & 0xff)
3751 {
3752 case 0:
3753 implied_prefix = 0;
3754 break;
3755 case DATA_PREFIX_OPCODE:
3756 implied_prefix = 1;
3757 break;
3758 case REPE_PREFIX_OPCODE:
3759 implied_prefix = 2;
3760 break;
3761 case REPNE_PREFIX_OPCODE:
3762 implied_prefix = 3;
3763 break;
3764 default:
3765 abort ();
3766 }
3767
3768 /* 4 byte EVEX prefix. */
3769 i.vex.length = 4;
3770 i.vex.bytes[0] = 0x62;
3771
3772 /* mmmm bits. */
3773 switch (i.tm.opcode_modifier.vexopcode)
3774 {
3775 case VEX0F:
3776 m = 1;
3777 break;
3778 case VEX0F38:
3779 m = 2;
3780 break;
3781 case VEX0F3A:
3782 m = 3;
3783 break;
3784 default:
3785 abort ();
3786 break;
3787 }
3788
3789 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3790 bits from REX. */
3791 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3792
3793 /* The fifth bit of the second EVEX byte is 1's compliment of the
3794 REX_R bit in VREX. */
3795 if (!(i.vrex & REX_R))
3796 i.vex.bytes[1] |= 0x10;
3797 else
3798 vrex_used |= REX_R;
3799
3800 if ((i.reg_operands + i.imm_operands) == i.operands)
3801 {
3802 /* When all operands are registers, the REX_X bit in REX is not
3803 used. We reuse it to encode the upper 16 registers, which is
3804 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3805 as 1's compliment. */
3806 if ((i.vrex & REX_B))
3807 {
3808 vrex_used |= REX_B;
3809 i.vex.bytes[1] &= ~0x40;
3810 }
3811 }
3812
3813 /* EVEX instructions shouldn't need the REX prefix. */
3814 i.vrex &= ~vrex_used;
3815 gas_assert (i.vrex == 0);
3816
3817 /* Check the REX.W bit and VEXW. */
3818 if (i.tm.opcode_modifier.vexw == VEXWIG)
3819 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3820 else if (i.tm.opcode_modifier.vexw)
3821 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3822 else
3823 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3824
3825 /* Encode the U bit. */
3826 implied_prefix |= 0x4;
3827
3828 /* The third byte of the EVEX prefix. */
3829 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3830
3831 /* The fourth byte of the EVEX prefix. */
3832 /* The zeroing-masking bit. */
3833 if (i.mask && i.mask->zeroing)
3834 i.vex.bytes[3] |= 0x80;
3835
3836 /* Don't always set the broadcast bit if there is no RC. */
3837 if (!i.rounding)
3838 {
3839 /* Encode the vector length. */
3840 unsigned int vec_length;
3841
3842 if (!i.tm.opcode_modifier.evex
3843 || i.tm.opcode_modifier.evex == EVEXDYN)
3844 {
3845 unsigned int op;
3846
3847 /* Determine vector length from the last multi-length vector
3848 operand. */
3849 vec_length = 0;
3850 for (op = i.operands; op--;)
3851 if (i.tm.operand_types[op].bitfield.xmmword
3852 + i.tm.operand_types[op].bitfield.ymmword
3853 + i.tm.operand_types[op].bitfield.zmmword > 1)
3854 {
3855 if (i.types[op].bitfield.zmmword)
3856 {
3857 i.tm.opcode_modifier.evex = EVEX512;
3858 break;
3859 }
3860 else if (i.types[op].bitfield.ymmword)
3861 {
3862 i.tm.opcode_modifier.evex = EVEX256;
3863 break;
3864 }
3865 else if (i.types[op].bitfield.xmmword)
3866 {
3867 i.tm.opcode_modifier.evex = EVEX128;
3868 break;
3869 }
3870 else if (i.broadcast && (int) op == i.broadcast->operand)
3871 {
3872 switch (i.broadcast->bytes)
3873 {
3874 case 64:
3875 i.tm.opcode_modifier.evex = EVEX512;
3876 break;
3877 case 32:
3878 i.tm.opcode_modifier.evex = EVEX256;
3879 break;
3880 case 16:
3881 i.tm.opcode_modifier.evex = EVEX128;
3882 break;
3883 default:
3884 abort ();
3885 }
3886 break;
3887 }
3888 }
3889
3890 if (op >= MAX_OPERANDS)
3891 abort ();
3892 }
3893
3894 switch (i.tm.opcode_modifier.evex)
3895 {
3896 case EVEXLIG: /* LL' is ignored */
3897 vec_length = evexlig << 5;
3898 break;
3899 case EVEX128:
3900 vec_length = 0 << 5;
3901 break;
3902 case EVEX256:
3903 vec_length = 1 << 5;
3904 break;
3905 case EVEX512:
3906 vec_length = 2 << 5;
3907 break;
3908 default:
3909 abort ();
3910 break;
3911 }
3912 i.vex.bytes[3] |= vec_length;
3913 /* Encode the broadcast bit. */
3914 if (i.broadcast)
3915 i.vex.bytes[3] |= 0x10;
3916 }
3917 else
3918 {
3919 if (i.rounding->type != saeonly)
3920 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3921 else
3922 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3923 }
3924
3925 if (i.mask && i.mask->mask)
3926 i.vex.bytes[3] |= i.mask->mask->reg_num;
3927 }
3928
3929 static void
3930 process_immext (void)
3931 {
3932 expressionS *exp;
3933
3934 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3935 which is coded in the same place as an 8-bit immediate field
3936 would be. Here we fake an 8-bit immediate operand from the
3937 opcode suffix stored in tm.extension_opcode.
3938
3939 AVX instructions also use this encoding, for some of
3940 3 argument instructions. */
3941
3942 gas_assert (i.imm_operands <= 1
3943 && (i.operands <= 2
3944 || (is_any_vex_encoding (&i.tm)
3945 && i.operands <= 4)));
3946
3947 exp = &im_expressions[i.imm_operands++];
3948 i.op[i.operands].imms = exp;
3949 i.types[i.operands] = imm8;
3950 i.operands++;
3951 exp->X_op = O_constant;
3952 exp->X_add_number = i.tm.extension_opcode;
3953 i.tm.extension_opcode = None;
3954 }
3955
3956
3957 static int
3958 check_hle (void)
3959 {
3960 switch (i.tm.opcode_modifier.hleprefixok)
3961 {
3962 default:
3963 abort ();
3964 case HLEPrefixNone:
3965 as_bad (_("invalid instruction `%s' after `%s'"),
3966 i.tm.name, i.hle_prefix);
3967 return 0;
3968 case HLEPrefixLock:
3969 if (i.prefix[LOCK_PREFIX])
3970 return 1;
3971 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3972 return 0;
3973 case HLEPrefixAny:
3974 return 1;
3975 case HLEPrefixRelease:
3976 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3977 {
3978 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3979 i.tm.name);
3980 return 0;
3981 }
3982 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3983 {
3984 as_bad (_("memory destination needed for instruction `%s'"
3985 " after `xrelease'"), i.tm.name);
3986 return 0;
3987 }
3988 return 1;
3989 }
3990 }
3991
3992 /* Try the shortest encoding by shortening operand size. */
3993
3994 static void
3995 optimize_encoding (void)
3996 {
3997 unsigned int j;
3998
3999 if (optimize_for_space
4000 && !is_any_vex_encoding (&i.tm)
4001 && i.reg_operands == 1
4002 && i.imm_operands == 1
4003 && !i.types[1].bitfield.byte
4004 && i.op[0].imms->X_op == O_constant
4005 && fits_in_imm7 (i.op[0].imms->X_add_number)
4006 && (i.tm.base_opcode == 0xa8
4007 || (i.tm.base_opcode == 0xf6
4008 && i.tm.extension_opcode == 0x0)))
4009 {
4010 /* Optimize: -Os:
4011 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4012 */
4013 unsigned int base_regnum = i.op[1].regs->reg_num;
4014 if (flag_code == CODE_64BIT || base_regnum < 4)
4015 {
4016 i.types[1].bitfield.byte = 1;
4017 /* Ignore the suffix. */
4018 i.suffix = 0;
4019 /* Convert to byte registers. */
4020 if (i.types[1].bitfield.word)
4021 j = 16;
4022 else if (i.types[1].bitfield.dword)
4023 j = 32;
4024 else
4025 j = 48;
4026 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4027 j += 8;
4028 i.op[1].regs -= j;
4029 }
4030 }
4031 else if (flag_code == CODE_64BIT
4032 && !is_any_vex_encoding (&i.tm)
4033 && ((i.types[1].bitfield.qword
4034 && i.reg_operands == 1
4035 && i.imm_operands == 1
4036 && i.op[0].imms->X_op == O_constant
4037 && ((i.tm.base_opcode == 0xb8
4038 && i.tm.extension_opcode == None
4039 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4040 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4041 && ((i.tm.base_opcode == 0x24
4042 || i.tm.base_opcode == 0xa8)
4043 || (i.tm.base_opcode == 0x80
4044 && i.tm.extension_opcode == 0x4)
4045 || ((i.tm.base_opcode == 0xf6
4046 || (i.tm.base_opcode | 1) == 0xc7)
4047 && i.tm.extension_opcode == 0x0)))
4048 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4049 && i.tm.base_opcode == 0x83
4050 && i.tm.extension_opcode == 0x4)))
4051 || (i.types[0].bitfield.qword
4052 && ((i.reg_operands == 2
4053 && i.op[0].regs == i.op[1].regs
4054 && (i.tm.base_opcode == 0x30
4055 || i.tm.base_opcode == 0x28))
4056 || (i.reg_operands == 1
4057 && i.operands == 1
4058 && i.tm.base_opcode == 0x30)))))
4059 {
4060 /* Optimize: -O:
4061 andq $imm31, %r64 -> andl $imm31, %r32
4062 andq $imm7, %r64 -> andl $imm7, %r32
4063 testq $imm31, %r64 -> testl $imm31, %r32
4064 xorq %r64, %r64 -> xorl %r32, %r32
4065 subq %r64, %r64 -> subl %r32, %r32
4066 movq $imm31, %r64 -> movl $imm31, %r32
4067 movq $imm32, %r64 -> movl $imm32, %r32
4068 */
4069 i.tm.opcode_modifier.norex64 = 1;
4070 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4071 {
4072 /* Handle
4073 movq $imm31, %r64 -> movl $imm31, %r32
4074 movq $imm32, %r64 -> movl $imm32, %r32
4075 */
4076 i.tm.operand_types[0].bitfield.imm32 = 1;
4077 i.tm.operand_types[0].bitfield.imm32s = 0;
4078 i.tm.operand_types[0].bitfield.imm64 = 0;
4079 i.types[0].bitfield.imm32 = 1;
4080 i.types[0].bitfield.imm32s = 0;
4081 i.types[0].bitfield.imm64 = 0;
4082 i.types[1].bitfield.dword = 1;
4083 i.types[1].bitfield.qword = 0;
4084 if ((i.tm.base_opcode | 1) == 0xc7)
4085 {
4086 /* Handle
4087 movq $imm31, %r64 -> movl $imm31, %r32
4088 */
4089 i.tm.base_opcode = 0xb8;
4090 i.tm.extension_opcode = None;
4091 i.tm.opcode_modifier.w = 0;
4092 i.tm.opcode_modifier.modrm = 0;
4093 }
4094 }
4095 }
4096 else if (optimize > 1
4097 && !optimize_for_space
4098 && !is_any_vex_encoding (&i.tm)
4099 && i.reg_operands == 2
4100 && i.op[0].regs == i.op[1].regs
4101 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4102 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4103 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4104 {
4105 /* Optimize: -O2:
4106 andb %rN, %rN -> testb %rN, %rN
4107 andw %rN, %rN -> testw %rN, %rN
4108 andq %rN, %rN -> testq %rN, %rN
4109 orb %rN, %rN -> testb %rN, %rN
4110 orw %rN, %rN -> testw %rN, %rN
4111 orq %rN, %rN -> testq %rN, %rN
4112
4113 and outside of 64-bit mode
4114
4115 andl %rN, %rN -> testl %rN, %rN
4116 orl %rN, %rN -> testl %rN, %rN
4117 */
4118 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4119 }
4120 else if (i.reg_operands == 3
4121 && i.op[0].regs == i.op[1].regs
4122 && !i.types[2].bitfield.xmmword
4123 && (i.tm.opcode_modifier.vex
4124 || ((!i.mask || i.mask->zeroing)
4125 && !i.rounding
4126 && is_evex_encoding (&i.tm)
4127 && (i.vec_encoding != vex_encoding_evex
4128 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4129 || i.tm.cpu_flags.bitfield.cpuavx512vl
4130 || (i.tm.operand_types[2].bitfield.zmmword
4131 && i.types[2].bitfield.ymmword))))
4132 && ((i.tm.base_opcode == 0x55
4133 || i.tm.base_opcode == 0x6655
4134 || i.tm.base_opcode == 0x66df
4135 || i.tm.base_opcode == 0x57
4136 || i.tm.base_opcode == 0x6657
4137 || i.tm.base_opcode == 0x66ef
4138 || i.tm.base_opcode == 0x66f8
4139 || i.tm.base_opcode == 0x66f9
4140 || i.tm.base_opcode == 0x66fa
4141 || i.tm.base_opcode == 0x66fb
4142 || i.tm.base_opcode == 0x42
4143 || i.tm.base_opcode == 0x6642
4144 || i.tm.base_opcode == 0x47
4145 || i.tm.base_opcode == 0x6647)
4146 && i.tm.extension_opcode == None))
4147 {
4148 /* Optimize: -O1:
4149 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4150 vpsubq and vpsubw:
4151 EVEX VOP %zmmM, %zmmM, %zmmN
4152 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4153 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4154 EVEX VOP %ymmM, %ymmM, %ymmN
4155 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4156 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4157 VEX VOP %ymmM, %ymmM, %ymmN
4158 -> VEX VOP %xmmM, %xmmM, %xmmN
4159 VOP, one of vpandn and vpxor:
4160 VEX VOP %ymmM, %ymmM, %ymmN
4161 -> VEX VOP %xmmM, %xmmM, %xmmN
4162 VOP, one of vpandnd and vpandnq:
4163 EVEX VOP %zmmM, %zmmM, %zmmN
4164 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4165 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4166 EVEX VOP %ymmM, %ymmM, %ymmN
4167 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4168 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4169 VOP, one of vpxord and vpxorq:
4170 EVEX VOP %zmmM, %zmmM, %zmmN
4171 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4172 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4173 EVEX VOP %ymmM, %ymmM, %ymmN
4174 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4175 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4176 VOP, one of kxord and kxorq:
4177 VEX VOP %kM, %kM, %kN
4178 -> VEX kxorw %kM, %kM, %kN
4179 VOP, one of kandnd and kandnq:
4180 VEX VOP %kM, %kM, %kN
4181 -> VEX kandnw %kM, %kM, %kN
4182 */
4183 if (is_evex_encoding (&i.tm))
4184 {
4185 if (i.vec_encoding != vex_encoding_evex)
4186 {
4187 i.tm.opcode_modifier.vex = VEX128;
4188 i.tm.opcode_modifier.vexw = VEXW0;
4189 i.tm.opcode_modifier.evex = 0;
4190 }
4191 else if (optimize > 1)
4192 i.tm.opcode_modifier.evex = EVEX128;
4193 else
4194 return;
4195 }
4196 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4197 {
4198 i.tm.base_opcode &= 0xff;
4199 i.tm.opcode_modifier.vexw = VEXW0;
4200 }
4201 else
4202 i.tm.opcode_modifier.vex = VEX128;
4203
4204 if (i.tm.opcode_modifier.vex)
4205 for (j = 0; j < 3; j++)
4206 {
4207 i.types[j].bitfield.xmmword = 1;
4208 i.types[j].bitfield.ymmword = 0;
4209 }
4210 }
4211 else if (i.vec_encoding != vex_encoding_evex
4212 && !i.types[0].bitfield.zmmword
4213 && !i.types[1].bitfield.zmmword
4214 && !i.mask
4215 && !i.broadcast
4216 && is_evex_encoding (&i.tm)
4217 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4218 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4219 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4220 || (i.tm.base_opcode & ~4) == 0x66db
4221 || (i.tm.base_opcode & ~4) == 0x66eb)
4222 && i.tm.extension_opcode == None)
4223 {
4224 /* Optimize: -O1:
4225 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4226 vmovdqu32 and vmovdqu64:
4227 EVEX VOP %xmmM, %xmmN
4228 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4229 EVEX VOP %ymmM, %ymmN
4230 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4231 EVEX VOP %xmmM, mem
4232 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4233 EVEX VOP %ymmM, mem
4234 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4235 EVEX VOP mem, %xmmN
4236 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4237 EVEX VOP mem, %ymmN
4238 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4239 VOP, one of vpand, vpandn, vpor, vpxor:
4240 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4241 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4242 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4243 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4244 EVEX VOP{d,q} mem, %xmmM, %xmmN
4245 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4246 EVEX VOP{d,q} mem, %ymmM, %ymmN
4247 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4248 */
4249 for (j = 0; j < i.operands; j++)
4250 if (operand_type_check (i.types[j], disp)
4251 && i.op[j].disps->X_op == O_constant)
4252 {
4253 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4254 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4255 bytes, we choose EVEX Disp8 over VEX Disp32. */
4256 int evex_disp8, vex_disp8;
4257 unsigned int memshift = i.memshift;
4258 offsetT n = i.op[j].disps->X_add_number;
4259
4260 evex_disp8 = fits_in_disp8 (n);
4261 i.memshift = 0;
4262 vex_disp8 = fits_in_disp8 (n);
4263 if (evex_disp8 != vex_disp8)
4264 {
4265 i.memshift = memshift;
4266 return;
4267 }
4268
4269 i.types[j].bitfield.disp8 = vex_disp8;
4270 break;
4271 }
4272 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4273 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4274 i.tm.opcode_modifier.vex
4275 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4276 i.tm.opcode_modifier.vexw = VEXW0;
4277 /* VPAND, VPOR, and VPXOR are commutative. */
4278 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4279 i.tm.opcode_modifier.commutative = 1;
4280 i.tm.opcode_modifier.evex = 0;
4281 i.tm.opcode_modifier.masking = 0;
4282 i.tm.opcode_modifier.broadcast = 0;
4283 i.tm.opcode_modifier.disp8memshift = 0;
4284 i.memshift = 0;
4285 if (j < i.operands)
4286 i.types[j].bitfield.disp8
4287 = fits_in_disp8 (i.op[j].disps->X_add_number);
4288 }
4289 }
4290
4291 /* This is the guts of the machine-dependent assembler. LINE points to a
4292 machine dependent instruction. This function is supposed to emit
4293 the frags/bytes it assembles to. */
4294
4295 void
4296 md_assemble (char *line)
4297 {
4298 unsigned int j;
4299 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4300 const insn_template *t;
4301
4302 /* Initialize globals. */
4303 memset (&i, '\0', sizeof (i));
4304 for (j = 0; j < MAX_OPERANDS; j++)
4305 i.reloc[j] = NO_RELOC;
4306 memset (disp_expressions, '\0', sizeof (disp_expressions));
4307 memset (im_expressions, '\0', sizeof (im_expressions));
4308 save_stack_p = save_stack;
4309
4310 /* First parse an instruction mnemonic & call i386_operand for the operands.
4311 We assume that the scrubber has arranged it so that line[0] is the valid
4312 start of a (possibly prefixed) mnemonic. */
4313
4314 line = parse_insn (line, mnemonic);
4315 if (line == NULL)
4316 return;
4317 mnem_suffix = i.suffix;
4318
4319 line = parse_operands (line, mnemonic);
4320 this_operand = -1;
4321 xfree (i.memop1_string);
4322 i.memop1_string = NULL;
4323 if (line == NULL)
4324 return;
4325
4326 /* Now we've parsed the mnemonic into a set of templates, and have the
4327 operands at hand. */
4328
4329 /* All Intel opcodes have reversed operands except for "bound", "enter"
4330 "monitor*", and "mwait*". We also don't reverse intersegment "jmp"
4331 and "call" instructions with 2 immediate operands so that the immediate
4332 segment precedes the offset, as it does when in AT&T mode. */
4333 if (intel_syntax
4334 && i.operands > 1
4335 && (strcmp (mnemonic, "bound") != 0)
4336 && (strcmp (mnemonic, "invlpga") != 0)
4337 && (strncmp (mnemonic, "monitor", 7) != 0)
4338 && (strncmp (mnemonic, "mwait", 5) != 0)
4339 && !(operand_type_check (i.types[0], imm)
4340 && operand_type_check (i.types[1], imm)))
4341 swap_operands ();
4342
4343 /* The order of the immediates should be reversed
4344 for 2 immediates extrq and insertq instructions */
4345 if (i.imm_operands == 2
4346 && (strcmp (mnemonic, "extrq") == 0
4347 || strcmp (mnemonic, "insertq") == 0))
4348 swap_2_operands (0, 1);
4349
4350 if (i.imm_operands)
4351 optimize_imm ();
4352
4353 /* Don't optimize displacement for movabs since it only takes 64bit
4354 displacement. */
4355 if (i.disp_operands
4356 && i.disp_encoding != disp_encoding_32bit
4357 && (flag_code != CODE_64BIT
4358 || strcmp (mnemonic, "movabs") != 0))
4359 optimize_disp ();
4360
4361 /* Next, we find a template that matches the given insn,
4362 making sure the overlap of the given operands types is consistent
4363 with the template operand types. */
4364
4365 if (!(t = match_template (mnem_suffix)))
4366 return;
4367
4368 if (sse_check != check_none
4369 && !i.tm.opcode_modifier.noavx
4370 && !i.tm.cpu_flags.bitfield.cpuavx
4371 && !i.tm.cpu_flags.bitfield.cpuavx512f
4372 && (i.tm.cpu_flags.bitfield.cpusse
4373 || i.tm.cpu_flags.bitfield.cpusse2
4374 || i.tm.cpu_flags.bitfield.cpusse3
4375 || i.tm.cpu_flags.bitfield.cpussse3
4376 || i.tm.cpu_flags.bitfield.cpusse4_1
4377 || i.tm.cpu_flags.bitfield.cpusse4_2
4378 || i.tm.cpu_flags.bitfield.cpusse4a
4379 || i.tm.cpu_flags.bitfield.cpupclmul
4380 || i.tm.cpu_flags.bitfield.cpuaes
4381 || i.tm.cpu_flags.bitfield.cpusha
4382 || i.tm.cpu_flags.bitfield.cpugfni))
4383 {
4384 (sse_check == check_warning
4385 ? as_warn
4386 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4387 }
4388
4389 if (i.tm.opcode_modifier.fwait)
4390 if (!add_prefix (FWAIT_OPCODE))
4391 return;
4392
4393 /* Check if REP prefix is OK. */
4394 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4395 {
4396 as_bad (_("invalid instruction `%s' after `%s'"),
4397 i.tm.name, i.rep_prefix);
4398 return;
4399 }
4400
4401 /* Check for lock without a lockable instruction. Destination operand
4402 must be memory unless it is xchg (0x86). */
4403 if (i.prefix[LOCK_PREFIX]
4404 && (!i.tm.opcode_modifier.islockable
4405 || i.mem_operands == 0
4406 || (i.tm.base_opcode != 0x86
4407 && !(i.flags[i.operands - 1] & Operand_Mem))))
4408 {
4409 as_bad (_("expecting lockable instruction after `lock'"));
4410 return;
4411 }
4412
4413 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4414 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4415 {
4416 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4417 return;
4418 }
4419
4420 /* Check if HLE prefix is OK. */
4421 if (i.hle_prefix && !check_hle ())
4422 return;
4423
4424 /* Check BND prefix. */
4425 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4426 as_bad (_("expecting valid branch instruction after `bnd'"));
4427
4428 /* Check NOTRACK prefix. */
4429 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4430 as_bad (_("expecting indirect branch instruction after `notrack'"));
4431
4432 if (i.tm.cpu_flags.bitfield.cpumpx)
4433 {
4434 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4435 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4436 else if (flag_code != CODE_16BIT
4437 ? i.prefix[ADDR_PREFIX]
4438 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4439 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4440 }
4441
4442 /* Insert BND prefix. */
4443 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4444 {
4445 if (!i.prefix[BND_PREFIX])
4446 add_prefix (BND_PREFIX_OPCODE);
4447 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4448 {
4449 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4450 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4451 }
4452 }
4453
4454 /* Check string instruction segment overrides. */
4455 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4456 {
4457 gas_assert (i.mem_operands);
4458 if (!check_string ())
4459 return;
4460 i.disp_operands = 0;
4461 }
4462
4463 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4464 optimize_encoding ();
4465
4466 if (!process_suffix ())
4467 return;
4468
4469 /* Update operand types. */
4470 for (j = 0; j < i.operands; j++)
4471 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4472
4473 /* Make still unresolved immediate matches conform to size of immediate
4474 given in i.suffix. */
4475 if (!finalize_imm ())
4476 return;
4477
4478 if (i.types[0].bitfield.imm1)
4479 i.imm_operands = 0; /* kludge for shift insns. */
4480
4481 /* We only need to check those implicit registers for instructions
4482 with 3 operands or less. */
4483 if (i.operands <= 3)
4484 for (j = 0; j < i.operands; j++)
4485 if (i.types[j].bitfield.instance != InstanceNone
4486 && !i.types[j].bitfield.xmmword)
4487 i.reg_operands--;
4488
4489 /* ImmExt should be processed after SSE2AVX. */
4490 if (!i.tm.opcode_modifier.sse2avx
4491 && i.tm.opcode_modifier.immext)
4492 process_immext ();
4493
4494 /* For insns with operands there are more diddles to do to the opcode. */
4495 if (i.operands)
4496 {
4497 if (!process_operands ())
4498 return;
4499 }
4500 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4501 {
4502 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4503 as_warn (_("translating to `%sp'"), i.tm.name);
4504 }
4505
4506 if (is_any_vex_encoding (&i.tm))
4507 {
4508 if (!cpu_arch_flags.bitfield.cpui286)
4509 {
4510 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4511 i.tm.name);
4512 return;
4513 }
4514
4515 if (i.tm.opcode_modifier.vex)
4516 build_vex_prefix (t);
4517 else
4518 build_evex_prefix ();
4519 }
4520
4521 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4522 instructions may define INT_OPCODE as well, so avoid this corner
4523 case for those instructions that use MODRM. */
4524 if (i.tm.base_opcode == INT_OPCODE
4525 && !i.tm.opcode_modifier.modrm
4526 && i.op[0].imms->X_add_number == 3)
4527 {
4528 i.tm.base_opcode = INT3_OPCODE;
4529 i.imm_operands = 0;
4530 }
4531
4532 if ((i.tm.opcode_modifier.jump == JUMP
4533 || i.tm.opcode_modifier.jump == JUMP_BYTE
4534 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4535 && i.op[0].disps->X_op == O_constant)
4536 {
4537 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4538 the absolute address given by the constant. Since ix86 jumps and
4539 calls are pc relative, we need to generate a reloc. */
4540 i.op[0].disps->X_add_symbol = &abs_symbol;
4541 i.op[0].disps->X_op = O_symbol;
4542 }
4543
4544 if (i.tm.opcode_modifier.rex64)
4545 i.rex |= REX_W;
4546
4547 /* For 8 bit registers we need an empty rex prefix. Also if the
4548 instruction already has a prefix, we need to convert old
4549 registers to new ones. */
4550
4551 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4552 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4553 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4554 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4555 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4556 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4557 && i.rex != 0))
4558 {
4559 int x;
4560
4561 i.rex |= REX_OPCODE;
4562 for (x = 0; x < 2; x++)
4563 {
4564 /* Look for 8 bit operand that uses old registers. */
4565 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4566 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4567 {
4568 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4569 /* In case it is "hi" register, give up. */
4570 if (i.op[x].regs->reg_num > 3)
4571 as_bad (_("can't encode register '%s%s' in an "
4572 "instruction requiring REX prefix."),
4573 register_prefix, i.op[x].regs->reg_name);
4574
4575 /* Otherwise it is equivalent to the extended register.
4576 Since the encoding doesn't change this is merely
4577 cosmetic cleanup for debug output. */
4578
4579 i.op[x].regs = i.op[x].regs + 8;
4580 }
4581 }
4582 }
4583
4584 if (i.rex == 0 && i.rex_encoding)
4585 {
4586 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4587 that uses legacy register. If it is "hi" register, don't add
4588 the REX_OPCODE byte. */
4589 int x;
4590 for (x = 0; x < 2; x++)
4591 if (i.types[x].bitfield.class == Reg
4592 && i.types[x].bitfield.byte
4593 && (i.op[x].regs->reg_flags & RegRex64) == 0
4594 && i.op[x].regs->reg_num > 3)
4595 {
4596 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4597 i.rex_encoding = FALSE;
4598 break;
4599 }
4600
4601 if (i.rex_encoding)
4602 i.rex = REX_OPCODE;
4603 }
4604
4605 if (i.rex != 0)
4606 add_prefix (REX_OPCODE | i.rex);
4607
4608 /* We are ready to output the insn. */
4609 output_insn ();
4610
4611 last_insn.seg = now_seg;
4612
4613 if (i.tm.opcode_modifier.isprefix)
4614 {
4615 last_insn.kind = last_insn_prefix;
4616 last_insn.name = i.tm.name;
4617 last_insn.file = as_where (&last_insn.line);
4618 }
4619 else
4620 last_insn.kind = last_insn_other;
4621 }
4622
4623 static char *
4624 parse_insn (char *line, char *mnemonic)
4625 {
4626 char *l = line;
4627 char *token_start = l;
4628 char *mnem_p;
4629 int supported;
4630 const insn_template *t;
4631 char *dot_p = NULL;
4632
4633 while (1)
4634 {
4635 mnem_p = mnemonic;
4636 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4637 {
4638 if (*mnem_p == '.')
4639 dot_p = mnem_p;
4640 mnem_p++;
4641 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4642 {
4643 as_bad (_("no such instruction: `%s'"), token_start);
4644 return NULL;
4645 }
4646 l++;
4647 }
4648 if (!is_space_char (*l)
4649 && *l != END_OF_INSN
4650 && (intel_syntax
4651 || (*l != PREFIX_SEPARATOR
4652 && *l != ',')))
4653 {
4654 as_bad (_("invalid character %s in mnemonic"),
4655 output_invalid (*l));
4656 return NULL;
4657 }
4658 if (token_start == l)
4659 {
4660 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4661 as_bad (_("expecting prefix; got nothing"));
4662 else
4663 as_bad (_("expecting mnemonic; got nothing"));
4664 return NULL;
4665 }
4666
4667 /* Look up instruction (or prefix) via hash table. */
4668 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4669
4670 if (*l != END_OF_INSN
4671 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4672 && current_templates
4673 && current_templates->start->opcode_modifier.isprefix)
4674 {
4675 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4676 {
4677 as_bad ((flag_code != CODE_64BIT
4678 ? _("`%s' is only supported in 64-bit mode")
4679 : _("`%s' is not supported in 64-bit mode")),
4680 current_templates->start->name);
4681 return NULL;
4682 }
4683 /* If we are in 16-bit mode, do not allow addr16 or data16.
4684 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4685 if ((current_templates->start->opcode_modifier.size == SIZE16
4686 || current_templates->start->opcode_modifier.size == SIZE32)
4687 && flag_code != CODE_64BIT
4688 && ((current_templates->start->opcode_modifier.size == SIZE32)
4689 ^ (flag_code == CODE_16BIT)))
4690 {
4691 as_bad (_("redundant %s prefix"),
4692 current_templates->start->name);
4693 return NULL;
4694 }
4695 if (current_templates->start->opcode_length == 0)
4696 {
4697 /* Handle pseudo prefixes. */
4698 switch (current_templates->start->base_opcode)
4699 {
4700 case 0x0:
4701 /* {disp8} */
4702 i.disp_encoding = disp_encoding_8bit;
4703 break;
4704 case 0x1:
4705 /* {disp32} */
4706 i.disp_encoding = disp_encoding_32bit;
4707 break;
4708 case 0x2:
4709 /* {load} */
4710 i.dir_encoding = dir_encoding_load;
4711 break;
4712 case 0x3:
4713 /* {store} */
4714 i.dir_encoding = dir_encoding_store;
4715 break;
4716 case 0x4:
4717 /* {vex} */
4718 i.vec_encoding = vex_encoding_vex;
4719 break;
4720 case 0x5:
4721 /* {vex3} */
4722 i.vec_encoding = vex_encoding_vex3;
4723 break;
4724 case 0x6:
4725 /* {evex} */
4726 i.vec_encoding = vex_encoding_evex;
4727 break;
4728 case 0x7:
4729 /* {rex} */
4730 i.rex_encoding = TRUE;
4731 break;
4732 case 0x8:
4733 /* {nooptimize} */
4734 i.no_optimize = TRUE;
4735 break;
4736 default:
4737 abort ();
4738 }
4739 }
4740 else
4741 {
4742 /* Add prefix, checking for repeated prefixes. */
4743 switch (add_prefix (current_templates->start->base_opcode))
4744 {
4745 case PREFIX_EXIST:
4746 return NULL;
4747 case PREFIX_DS:
4748 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4749 i.notrack_prefix = current_templates->start->name;
4750 break;
4751 case PREFIX_REP:
4752 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4753 i.hle_prefix = current_templates->start->name;
4754 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4755 i.bnd_prefix = current_templates->start->name;
4756 else
4757 i.rep_prefix = current_templates->start->name;
4758 break;
4759 default:
4760 break;
4761 }
4762 }
4763 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4764 token_start = ++l;
4765 }
4766 else
4767 break;
4768 }
4769
4770 if (!current_templates)
4771 {
4772 /* Deprecated functionality (new code should use pseudo-prefixes instead):
4773 Check if we should swap operand or force 32bit displacement in
4774 encoding. */
4775 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4776 i.dir_encoding = dir_encoding_swap;
4777 else if (mnem_p - 3 == dot_p
4778 && dot_p[1] == 'd'
4779 && dot_p[2] == '8')
4780 i.disp_encoding = disp_encoding_8bit;
4781 else if (mnem_p - 4 == dot_p
4782 && dot_p[1] == 'd'
4783 && dot_p[2] == '3'
4784 && dot_p[3] == '2')
4785 i.disp_encoding = disp_encoding_32bit;
4786 else
4787 goto check_suffix;
4788 mnem_p = dot_p;
4789 *dot_p = '\0';
4790 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4791 }
4792
4793 if (!current_templates)
4794 {
4795 check_suffix:
4796 if (mnem_p > mnemonic)
4797 {
4798 /* See if we can get a match by trimming off a suffix. */
4799 switch (mnem_p[-1])
4800 {
4801 case WORD_MNEM_SUFFIX:
4802 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4803 i.suffix = SHORT_MNEM_SUFFIX;
4804 else
4805 /* Fall through. */
4806 case BYTE_MNEM_SUFFIX:
4807 case QWORD_MNEM_SUFFIX:
4808 i.suffix = mnem_p[-1];
4809 mnem_p[-1] = '\0';
4810 current_templates = (const templates *) hash_find (op_hash,
4811 mnemonic);
4812 break;
4813 case SHORT_MNEM_SUFFIX:
4814 case LONG_MNEM_SUFFIX:
4815 if (!intel_syntax)
4816 {
4817 i.suffix = mnem_p[-1];
4818 mnem_p[-1] = '\0';
4819 current_templates = (const templates *) hash_find (op_hash,
4820 mnemonic);
4821 }
4822 break;
4823
4824 /* Intel Syntax. */
4825 case 'd':
4826 if (intel_syntax)
4827 {
4828 if (intel_float_operand (mnemonic) == 1)
4829 i.suffix = SHORT_MNEM_SUFFIX;
4830 else
4831 i.suffix = LONG_MNEM_SUFFIX;
4832 mnem_p[-1] = '\0';
4833 current_templates = (const templates *) hash_find (op_hash,
4834 mnemonic);
4835 }
4836 break;
4837 }
4838 }
4839
4840 if (!current_templates)
4841 {
4842 as_bad (_("no such instruction: `%s'"), token_start);
4843 return NULL;
4844 }
4845 }
4846
4847 if (current_templates->start->opcode_modifier.jump == JUMP
4848 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
4849 {
4850 /* Check for a branch hint. We allow ",pt" and ",pn" for
4851 predict taken and predict not taken respectively.
4852 I'm not sure that branch hints actually do anything on loop
4853 and jcxz insns (JumpByte) for current Pentium4 chips. They
4854 may work in the future and it doesn't hurt to accept them
4855 now. */
4856 if (l[0] == ',' && l[1] == 'p')
4857 {
4858 if (l[2] == 't')
4859 {
4860 if (!add_prefix (DS_PREFIX_OPCODE))
4861 return NULL;
4862 l += 3;
4863 }
4864 else if (l[2] == 'n')
4865 {
4866 if (!add_prefix (CS_PREFIX_OPCODE))
4867 return NULL;
4868 l += 3;
4869 }
4870 }
4871 }
4872 /* Any other comma loses. */
4873 if (*l == ',')
4874 {
4875 as_bad (_("invalid character %s in mnemonic"),
4876 output_invalid (*l));
4877 return NULL;
4878 }
4879
4880 /* Check if instruction is supported on specified architecture. */
4881 supported = 0;
4882 for (t = current_templates->start; t < current_templates->end; ++t)
4883 {
4884 supported |= cpu_flags_match (t);
4885 if (supported == CPU_FLAGS_PERFECT_MATCH)
4886 {
4887 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4888 as_warn (_("use .code16 to ensure correct addressing mode"));
4889
4890 return l;
4891 }
4892 }
4893
4894 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4895 as_bad (flag_code == CODE_64BIT
4896 ? _("`%s' is not supported in 64-bit mode")
4897 : _("`%s' is only supported in 64-bit mode"),
4898 current_templates->start->name);
4899 else
4900 as_bad (_("`%s' is not supported on `%s%s'"),
4901 current_templates->start->name,
4902 cpu_arch_name ? cpu_arch_name : default_arch,
4903 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4904
4905 return NULL;
4906 }
4907
4908 static char *
4909 parse_operands (char *l, const char *mnemonic)
4910 {
4911 char *token_start;
4912
4913 /* 1 if operand is pending after ','. */
4914 unsigned int expecting_operand = 0;
4915
4916 /* Non-zero if operand parens not balanced. */
4917 unsigned int paren_not_balanced;
4918
4919 while (*l != END_OF_INSN)
4920 {
4921 /* Skip optional white space before operand. */
4922 if (is_space_char (*l))
4923 ++l;
4924 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4925 {
4926 as_bad (_("invalid character %s before operand %d"),
4927 output_invalid (*l),
4928 i.operands + 1);
4929 return NULL;
4930 }
4931 token_start = l; /* After white space. */
4932 paren_not_balanced = 0;
4933 while (paren_not_balanced || *l != ',')
4934 {
4935 if (*l == END_OF_INSN)
4936 {
4937 if (paren_not_balanced)
4938 {
4939 if (!intel_syntax)
4940 as_bad (_("unbalanced parenthesis in operand %d."),
4941 i.operands + 1);
4942 else
4943 as_bad (_("unbalanced brackets in operand %d."),
4944 i.operands + 1);
4945 return NULL;
4946 }
4947 else
4948 break; /* we are done */
4949 }
4950 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4951 {
4952 as_bad (_("invalid character %s in operand %d"),
4953 output_invalid (*l),
4954 i.operands + 1);
4955 return NULL;
4956 }
4957 if (!intel_syntax)
4958 {
4959 if (*l == '(')
4960 ++paren_not_balanced;
4961 if (*l == ')')
4962 --paren_not_balanced;
4963 }
4964 else
4965 {
4966 if (*l == '[')
4967 ++paren_not_balanced;
4968 if (*l == ']')
4969 --paren_not_balanced;
4970 }
4971 l++;
4972 }
4973 if (l != token_start)
4974 { /* Yes, we've read in another operand. */
4975 unsigned int operand_ok;
4976 this_operand = i.operands++;
4977 if (i.operands > MAX_OPERANDS)
4978 {
4979 as_bad (_("spurious operands; (%d operands/instruction max)"),
4980 MAX_OPERANDS);
4981 return NULL;
4982 }
4983 i.types[this_operand].bitfield.unspecified = 1;
4984 /* Now parse operand adding info to 'i' as we go along. */
4985 END_STRING_AND_SAVE (l);
4986
4987 if (i.mem_operands > 1)
4988 {
4989 as_bad (_("too many memory references for `%s'"),
4990 mnemonic);
4991 return 0;
4992 }
4993
4994 if (intel_syntax)
4995 operand_ok =
4996 i386_intel_operand (token_start,
4997 intel_float_operand (mnemonic));
4998 else
4999 operand_ok = i386_att_operand (token_start);
5000
5001 RESTORE_END_STRING (l);
5002 if (!operand_ok)
5003 return NULL;
5004 }
5005 else
5006 {
5007 if (expecting_operand)
5008 {
5009 expecting_operand_after_comma:
5010 as_bad (_("expecting operand after ','; got nothing"));
5011 return NULL;
5012 }
5013 if (*l == ',')
5014 {
5015 as_bad (_("expecting operand before ','; got nothing"));
5016 return NULL;
5017 }
5018 }
5019
5020 /* Now *l must be either ',' or END_OF_INSN. */
5021 if (*l == ',')
5022 {
5023 if (*++l == END_OF_INSN)
5024 {
5025 /* Just skip it, if it's \n complain. */
5026 goto expecting_operand_after_comma;
5027 }
5028 expecting_operand = 1;
5029 }
5030 }
5031 return l;
5032 }
5033
5034 static void
5035 swap_2_operands (int xchg1, int xchg2)
5036 {
5037 union i386_op temp_op;
5038 i386_operand_type temp_type;
5039 unsigned int temp_flags;
5040 enum bfd_reloc_code_real temp_reloc;
5041
5042 temp_type = i.types[xchg2];
5043 i.types[xchg2] = i.types[xchg1];
5044 i.types[xchg1] = temp_type;
5045
5046 temp_flags = i.flags[xchg2];
5047 i.flags[xchg2] = i.flags[xchg1];
5048 i.flags[xchg1] = temp_flags;
5049
5050 temp_op = i.op[xchg2];
5051 i.op[xchg2] = i.op[xchg1];
5052 i.op[xchg1] = temp_op;
5053
5054 temp_reloc = i.reloc[xchg2];
5055 i.reloc[xchg2] = i.reloc[xchg1];
5056 i.reloc[xchg1] = temp_reloc;
5057
5058 if (i.mask)
5059 {
5060 if (i.mask->operand == xchg1)
5061 i.mask->operand = xchg2;
5062 else if (i.mask->operand == xchg2)
5063 i.mask->operand = xchg1;
5064 }
5065 if (i.broadcast)
5066 {
5067 if (i.broadcast->operand == xchg1)
5068 i.broadcast->operand = xchg2;
5069 else if (i.broadcast->operand == xchg2)
5070 i.broadcast->operand = xchg1;
5071 }
5072 if (i.rounding)
5073 {
5074 if (i.rounding->operand == xchg1)
5075 i.rounding->operand = xchg2;
5076 else if (i.rounding->operand == xchg2)
5077 i.rounding->operand = xchg1;
5078 }
5079 }
5080
5081 static void
5082 swap_operands (void)
5083 {
5084 switch (i.operands)
5085 {
5086 case 5:
5087 case 4:
5088 swap_2_operands (1, i.operands - 2);
5089 /* Fall through. */
5090 case 3:
5091 case 2:
5092 swap_2_operands (0, i.operands - 1);
5093 break;
5094 default:
5095 abort ();
5096 }
5097
5098 if (i.mem_operands == 2)
5099 {
5100 const seg_entry *temp_seg;
5101 temp_seg = i.seg[0];
5102 i.seg[0] = i.seg[1];
5103 i.seg[1] = temp_seg;
5104 }
5105 }
5106
5107 /* Try to ensure constant immediates are represented in the smallest
5108 opcode possible. */
5109 static void
5110 optimize_imm (void)
5111 {
5112 char guess_suffix = 0;
5113 int op;
5114
5115 if (i.suffix)
5116 guess_suffix = i.suffix;
5117 else if (i.reg_operands)
5118 {
5119 /* Figure out a suffix from the last register operand specified.
5120 We can't do this properly yet, i.e. excluding special register
5121 instances, but the following works for instructions with
5122 immediates. In any case, we can't set i.suffix yet. */
5123 for (op = i.operands; --op >= 0;)
5124 if (i.types[op].bitfield.class != Reg)
5125 continue;
5126 else if (i.types[op].bitfield.byte)
5127 {
5128 guess_suffix = BYTE_MNEM_SUFFIX;
5129 break;
5130 }
5131 else if (i.types[op].bitfield.word)
5132 {
5133 guess_suffix = WORD_MNEM_SUFFIX;
5134 break;
5135 }
5136 else if (i.types[op].bitfield.dword)
5137 {
5138 guess_suffix = LONG_MNEM_SUFFIX;
5139 break;
5140 }
5141 else if (i.types[op].bitfield.qword)
5142 {
5143 guess_suffix = QWORD_MNEM_SUFFIX;
5144 break;
5145 }
5146 }
5147 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5148 guess_suffix = WORD_MNEM_SUFFIX;
5149
5150 for (op = i.operands; --op >= 0;)
5151 if (operand_type_check (i.types[op], imm))
5152 {
5153 switch (i.op[op].imms->X_op)
5154 {
5155 case O_constant:
5156 /* If a suffix is given, this operand may be shortened. */
5157 switch (guess_suffix)
5158 {
5159 case LONG_MNEM_SUFFIX:
5160 i.types[op].bitfield.imm32 = 1;
5161 i.types[op].bitfield.imm64 = 1;
5162 break;
5163 case WORD_MNEM_SUFFIX:
5164 i.types[op].bitfield.imm16 = 1;
5165 i.types[op].bitfield.imm32 = 1;
5166 i.types[op].bitfield.imm32s = 1;
5167 i.types[op].bitfield.imm64 = 1;
5168 break;
5169 case BYTE_MNEM_SUFFIX:
5170 i.types[op].bitfield.imm8 = 1;
5171 i.types[op].bitfield.imm8s = 1;
5172 i.types[op].bitfield.imm16 = 1;
5173 i.types[op].bitfield.imm32 = 1;
5174 i.types[op].bitfield.imm32s = 1;
5175 i.types[op].bitfield.imm64 = 1;
5176 break;
5177 }
5178
5179 /* If this operand is at most 16 bits, convert it
5180 to a signed 16 bit number before trying to see
5181 whether it will fit in an even smaller size.
5182 This allows a 16-bit operand such as $0xffe0 to
5183 be recognised as within Imm8S range. */
5184 if ((i.types[op].bitfield.imm16)
5185 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5186 {
5187 i.op[op].imms->X_add_number =
5188 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5189 }
5190 #ifdef BFD64
5191 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5192 if ((i.types[op].bitfield.imm32)
5193 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5194 == 0))
5195 {
5196 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5197 ^ ((offsetT) 1 << 31))
5198 - ((offsetT) 1 << 31));
5199 }
5200 #endif
5201 i.types[op]
5202 = operand_type_or (i.types[op],
5203 smallest_imm_type (i.op[op].imms->X_add_number));
5204
5205 /* We must avoid matching of Imm32 templates when 64bit
5206 only immediate is available. */
5207 if (guess_suffix == QWORD_MNEM_SUFFIX)
5208 i.types[op].bitfield.imm32 = 0;
5209 break;
5210
5211 case O_absent:
5212 case O_register:
5213 abort ();
5214
5215 /* Symbols and expressions. */
5216 default:
5217 /* Convert symbolic operand to proper sizes for matching, but don't
5218 prevent matching a set of insns that only supports sizes other
5219 than those matching the insn suffix. */
5220 {
5221 i386_operand_type mask, allowed;
5222 const insn_template *t;
5223
5224 operand_type_set (&mask, 0);
5225 operand_type_set (&allowed, 0);
5226
5227 for (t = current_templates->start;
5228 t < current_templates->end;
5229 ++t)
5230 {
5231 allowed = operand_type_or (allowed, t->operand_types[op]);
5232 allowed = operand_type_and (allowed, anyimm);
5233 }
5234 switch (guess_suffix)
5235 {
5236 case QWORD_MNEM_SUFFIX:
5237 mask.bitfield.imm64 = 1;
5238 mask.bitfield.imm32s = 1;
5239 break;
5240 case LONG_MNEM_SUFFIX:
5241 mask.bitfield.imm32 = 1;
5242 break;
5243 case WORD_MNEM_SUFFIX:
5244 mask.bitfield.imm16 = 1;
5245 break;
5246 case BYTE_MNEM_SUFFIX:
5247 mask.bitfield.imm8 = 1;
5248 break;
5249 default:
5250 break;
5251 }
5252 allowed = operand_type_and (mask, allowed);
5253 if (!operand_type_all_zero (&allowed))
5254 i.types[op] = operand_type_and (i.types[op], mask);
5255 }
5256 break;
5257 }
5258 }
5259 }
5260
5261 /* Try to use the smallest displacement type too. */
5262 static void
5263 optimize_disp (void)
5264 {
5265 int op;
5266
5267 for (op = i.operands; --op >= 0;)
5268 if (operand_type_check (i.types[op], disp))
5269 {
5270 if (i.op[op].disps->X_op == O_constant)
5271 {
5272 offsetT op_disp = i.op[op].disps->X_add_number;
5273
5274 if (i.types[op].bitfield.disp16
5275 && (op_disp & ~(offsetT) 0xffff) == 0)
5276 {
5277 /* If this operand is at most 16 bits, convert
5278 to a signed 16 bit number and don't use 64bit
5279 displacement. */
5280 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5281 i.types[op].bitfield.disp64 = 0;
5282 }
5283 #ifdef BFD64
5284 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5285 if (i.types[op].bitfield.disp32
5286 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5287 {
5288 /* If this operand is at most 32 bits, convert
5289 to a signed 32 bit number and don't use 64bit
5290 displacement. */
5291 op_disp &= (((offsetT) 2 << 31) - 1);
5292 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5293 i.types[op].bitfield.disp64 = 0;
5294 }
5295 #endif
5296 if (!op_disp && i.types[op].bitfield.baseindex)
5297 {
5298 i.types[op].bitfield.disp8 = 0;
5299 i.types[op].bitfield.disp16 = 0;
5300 i.types[op].bitfield.disp32 = 0;
5301 i.types[op].bitfield.disp32s = 0;
5302 i.types[op].bitfield.disp64 = 0;
5303 i.op[op].disps = 0;
5304 i.disp_operands--;
5305 }
5306 else if (flag_code == CODE_64BIT)
5307 {
5308 if (fits_in_signed_long (op_disp))
5309 {
5310 i.types[op].bitfield.disp64 = 0;
5311 i.types[op].bitfield.disp32s = 1;
5312 }
5313 if (i.prefix[ADDR_PREFIX]
5314 && fits_in_unsigned_long (op_disp))
5315 i.types[op].bitfield.disp32 = 1;
5316 }
5317 if ((i.types[op].bitfield.disp32
5318 || i.types[op].bitfield.disp32s
5319 || i.types[op].bitfield.disp16)
5320 && fits_in_disp8 (op_disp))
5321 i.types[op].bitfield.disp8 = 1;
5322 }
5323 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5324 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5325 {
5326 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5327 i.op[op].disps, 0, i.reloc[op]);
5328 i.types[op].bitfield.disp8 = 0;
5329 i.types[op].bitfield.disp16 = 0;
5330 i.types[op].bitfield.disp32 = 0;
5331 i.types[op].bitfield.disp32s = 0;
5332 i.types[op].bitfield.disp64 = 0;
5333 }
5334 else
5335 /* We only support 64bit displacement on constants. */
5336 i.types[op].bitfield.disp64 = 0;
5337 }
5338 }
5339
5340 /* Return 1 if there is a match in broadcast bytes between operand
5341 GIVEN and instruction template T. */
5342
5343 static INLINE int
5344 match_broadcast_size (const insn_template *t, unsigned int given)
5345 {
5346 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5347 && i.types[given].bitfield.byte)
5348 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5349 && i.types[given].bitfield.word)
5350 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5351 && i.types[given].bitfield.dword)
5352 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5353 && i.types[given].bitfield.qword));
5354 }
5355
5356 /* Check if operands are valid for the instruction. */
5357
5358 static int
5359 check_VecOperands (const insn_template *t)
5360 {
5361 unsigned int op;
5362 i386_cpu_flags cpu;
5363
5364 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5365 any one operand are implicity requiring AVX512VL support if the actual
5366 operand size is YMMword or XMMword. Since this function runs after
5367 template matching, there's no need to check for YMMword/XMMword in
5368 the template. */
5369 cpu = cpu_flags_and (t->cpu_flags, avx512);
5370 if (!cpu_flags_all_zero (&cpu)
5371 && !t->cpu_flags.bitfield.cpuavx512vl
5372 && !cpu_arch_flags.bitfield.cpuavx512vl)
5373 {
5374 for (op = 0; op < t->operands; ++op)
5375 {
5376 if (t->operand_types[op].bitfield.zmmword
5377 && (i.types[op].bitfield.ymmword
5378 || i.types[op].bitfield.xmmword))
5379 {
5380 i.error = unsupported;
5381 return 1;
5382 }
5383 }
5384 }
5385
5386 /* Without VSIB byte, we can't have a vector register for index. */
5387 if (!t->opcode_modifier.vecsib
5388 && i.index_reg
5389 && (i.index_reg->reg_type.bitfield.xmmword
5390 || i.index_reg->reg_type.bitfield.ymmword
5391 || i.index_reg->reg_type.bitfield.zmmword))
5392 {
5393 i.error = unsupported_vector_index_register;
5394 return 1;
5395 }
5396
5397 /* Check if default mask is allowed. */
5398 if (t->opcode_modifier.nodefmask
5399 && (!i.mask || i.mask->mask->reg_num == 0))
5400 {
5401 i.error = no_default_mask;
5402 return 1;
5403 }
5404
5405 /* For VSIB byte, we need a vector register for index, and all vector
5406 registers must be distinct. */
5407 if (t->opcode_modifier.vecsib)
5408 {
5409 if (!i.index_reg
5410 || !((t->opcode_modifier.vecsib == VecSIB128
5411 && i.index_reg->reg_type.bitfield.xmmword)
5412 || (t->opcode_modifier.vecsib == VecSIB256
5413 && i.index_reg->reg_type.bitfield.ymmword)
5414 || (t->opcode_modifier.vecsib == VecSIB512
5415 && i.index_reg->reg_type.bitfield.zmmword)))
5416 {
5417 i.error = invalid_vsib_address;
5418 return 1;
5419 }
5420
5421 gas_assert (i.reg_operands == 2 || i.mask);
5422 if (i.reg_operands == 2 && !i.mask)
5423 {
5424 gas_assert (i.types[0].bitfield.class == RegSIMD);
5425 gas_assert (i.types[0].bitfield.xmmword
5426 || i.types[0].bitfield.ymmword);
5427 gas_assert (i.types[2].bitfield.class == RegSIMD);
5428 gas_assert (i.types[2].bitfield.xmmword
5429 || i.types[2].bitfield.ymmword);
5430 if (operand_check == check_none)
5431 return 0;
5432 if (register_number (i.op[0].regs)
5433 != register_number (i.index_reg)
5434 && register_number (i.op[2].regs)
5435 != register_number (i.index_reg)
5436 && register_number (i.op[0].regs)
5437 != register_number (i.op[2].regs))
5438 return 0;
5439 if (operand_check == check_error)
5440 {
5441 i.error = invalid_vector_register_set;
5442 return 1;
5443 }
5444 as_warn (_("mask, index, and destination registers should be distinct"));
5445 }
5446 else if (i.reg_operands == 1 && i.mask)
5447 {
5448 if (i.types[1].bitfield.class == RegSIMD
5449 && (i.types[1].bitfield.xmmword
5450 || i.types[1].bitfield.ymmword
5451 || i.types[1].bitfield.zmmword)
5452 && (register_number (i.op[1].regs)
5453 == register_number (i.index_reg)))
5454 {
5455 if (operand_check == check_error)
5456 {
5457 i.error = invalid_vector_register_set;
5458 return 1;
5459 }
5460 if (operand_check != check_none)
5461 as_warn (_("index and destination registers should be distinct"));
5462 }
5463 }
5464 }
5465
5466 /* Check if broadcast is supported by the instruction and is applied
5467 to the memory operand. */
5468 if (i.broadcast)
5469 {
5470 i386_operand_type type, overlap;
5471
5472 /* Check if specified broadcast is supported in this instruction,
5473 and its broadcast bytes match the memory operand. */
5474 op = i.broadcast->operand;
5475 if (!t->opcode_modifier.broadcast
5476 || !(i.flags[op] & Operand_Mem)
5477 || (!i.types[op].bitfield.unspecified
5478 && !match_broadcast_size (t, op)))
5479 {
5480 bad_broadcast:
5481 i.error = unsupported_broadcast;
5482 return 1;
5483 }
5484
5485 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5486 * i.broadcast->type);
5487 operand_type_set (&type, 0);
5488 switch (i.broadcast->bytes)
5489 {
5490 case 2:
5491 type.bitfield.word = 1;
5492 break;
5493 case 4:
5494 type.bitfield.dword = 1;
5495 break;
5496 case 8:
5497 type.bitfield.qword = 1;
5498 break;
5499 case 16:
5500 type.bitfield.xmmword = 1;
5501 break;
5502 case 32:
5503 type.bitfield.ymmword = 1;
5504 break;
5505 case 64:
5506 type.bitfield.zmmword = 1;
5507 break;
5508 default:
5509 goto bad_broadcast;
5510 }
5511
5512 overlap = operand_type_and (type, t->operand_types[op]);
5513 if (operand_type_all_zero (&overlap))
5514 goto bad_broadcast;
5515
5516 if (t->opcode_modifier.checkregsize)
5517 {
5518 unsigned int j;
5519
5520 type.bitfield.baseindex = 1;
5521 for (j = 0; j < i.operands; ++j)
5522 {
5523 if (j != op
5524 && !operand_type_register_match(i.types[j],
5525 t->operand_types[j],
5526 type,
5527 t->operand_types[op]))
5528 goto bad_broadcast;
5529 }
5530 }
5531 }
5532 /* If broadcast is supported in this instruction, we need to check if
5533 operand of one-element size isn't specified without broadcast. */
5534 else if (t->opcode_modifier.broadcast && i.mem_operands)
5535 {
5536 /* Find memory operand. */
5537 for (op = 0; op < i.operands; op++)
5538 if (i.flags[op] & Operand_Mem)
5539 break;
5540 gas_assert (op < i.operands);
5541 /* Check size of the memory operand. */
5542 if (match_broadcast_size (t, op))
5543 {
5544 i.error = broadcast_needed;
5545 return 1;
5546 }
5547 }
5548 else
5549 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5550
5551 /* Check if requested masking is supported. */
5552 if (i.mask)
5553 {
5554 switch (t->opcode_modifier.masking)
5555 {
5556 case BOTH_MASKING:
5557 break;
5558 case MERGING_MASKING:
5559 if (i.mask->zeroing)
5560 {
5561 case 0:
5562 i.error = unsupported_masking;
5563 return 1;
5564 }
5565 break;
5566 case DYNAMIC_MASKING:
5567 /* Memory destinations allow only merging masking. */
5568 if (i.mask->zeroing && i.mem_operands)
5569 {
5570 /* Find memory operand. */
5571 for (op = 0; op < i.operands; op++)
5572 if (i.flags[op] & Operand_Mem)
5573 break;
5574 gas_assert (op < i.operands);
5575 if (op == i.operands - 1)
5576 {
5577 i.error = unsupported_masking;
5578 return 1;
5579 }
5580 }
5581 break;
5582 default:
5583 abort ();
5584 }
5585 }
5586
5587 /* Check if masking is applied to dest operand. */
5588 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5589 {
5590 i.error = mask_not_on_destination;
5591 return 1;
5592 }
5593
5594 /* Check RC/SAE. */
5595 if (i.rounding)
5596 {
5597 if (!t->opcode_modifier.sae
5598 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5599 {
5600 i.error = unsupported_rc_sae;
5601 return 1;
5602 }
5603 /* If the instruction has several immediate operands and one of
5604 them is rounding, the rounding operand should be the last
5605 immediate operand. */
5606 if (i.imm_operands > 1
5607 && i.rounding->operand != (int) (i.imm_operands - 1))
5608 {
5609 i.error = rc_sae_operand_not_last_imm;
5610 return 1;
5611 }
5612 }
5613
5614 /* Check vector Disp8 operand. */
5615 if (t->opcode_modifier.disp8memshift
5616 && i.disp_encoding != disp_encoding_32bit)
5617 {
5618 if (i.broadcast)
5619 i.memshift = t->opcode_modifier.broadcast - 1;
5620 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5621 i.memshift = t->opcode_modifier.disp8memshift;
5622 else
5623 {
5624 const i386_operand_type *type = NULL;
5625
5626 i.memshift = 0;
5627 for (op = 0; op < i.operands; op++)
5628 if (i.flags[op] & Operand_Mem)
5629 {
5630 if (t->opcode_modifier.evex == EVEXLIG)
5631 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5632 else if (t->operand_types[op].bitfield.xmmword
5633 + t->operand_types[op].bitfield.ymmword
5634 + t->operand_types[op].bitfield.zmmword <= 1)
5635 type = &t->operand_types[op];
5636 else if (!i.types[op].bitfield.unspecified)
5637 type = &i.types[op];
5638 }
5639 else if (i.types[op].bitfield.class == RegSIMD
5640 && t->opcode_modifier.evex != EVEXLIG)
5641 {
5642 if (i.types[op].bitfield.zmmword)
5643 i.memshift = 6;
5644 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5645 i.memshift = 5;
5646 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5647 i.memshift = 4;
5648 }
5649
5650 if (type)
5651 {
5652 if (type->bitfield.zmmword)
5653 i.memshift = 6;
5654 else if (type->bitfield.ymmword)
5655 i.memshift = 5;
5656 else if (type->bitfield.xmmword)
5657 i.memshift = 4;
5658 }
5659
5660 /* For the check in fits_in_disp8(). */
5661 if (i.memshift == 0)
5662 i.memshift = -1;
5663 }
5664
5665 for (op = 0; op < i.operands; op++)
5666 if (operand_type_check (i.types[op], disp)
5667 && i.op[op].disps->X_op == O_constant)
5668 {
5669 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5670 {
5671 i.types[op].bitfield.disp8 = 1;
5672 return 0;
5673 }
5674 i.types[op].bitfield.disp8 = 0;
5675 }
5676 }
5677
5678 i.memshift = 0;
5679
5680 return 0;
5681 }
5682
5683 /* Check if operands are valid for the instruction. Update VEX
5684 operand types. */
5685
5686 static int
5687 VEX_check_operands (const insn_template *t)
5688 {
5689 if (i.vec_encoding == vex_encoding_evex)
5690 {
5691 /* This instruction must be encoded with EVEX prefix. */
5692 if (!is_evex_encoding (t))
5693 {
5694 i.error = unsupported;
5695 return 1;
5696 }
5697 return 0;
5698 }
5699
5700 if (!t->opcode_modifier.vex)
5701 {
5702 /* This instruction template doesn't have VEX prefix. */
5703 if (i.vec_encoding != vex_encoding_default)
5704 {
5705 i.error = unsupported;
5706 return 1;
5707 }
5708 return 0;
5709 }
5710
5711 /* Check the special Imm4 cases; must be the first operand. */
5712 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5713 {
5714 if (i.op[0].imms->X_op != O_constant
5715 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5716 {
5717 i.error = bad_imm4;
5718 return 1;
5719 }
5720
5721 /* Turn off Imm<N> so that update_imm won't complain. */
5722 operand_type_set (&i.types[0], 0);
5723 }
5724
5725 return 0;
5726 }
5727
5728 static const insn_template *
5729 match_template (char mnem_suffix)
5730 {
5731 /* Points to template once we've found it. */
5732 const insn_template *t;
5733 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5734 i386_operand_type overlap4;
5735 unsigned int found_reverse_match;
5736 i386_opcode_modifier suffix_check;
5737 i386_operand_type operand_types [MAX_OPERANDS];
5738 int addr_prefix_disp;
5739 unsigned int j, size_match, check_register;
5740 enum i386_error specific_error = 0;
5741
5742 #if MAX_OPERANDS != 5
5743 # error "MAX_OPERANDS must be 5."
5744 #endif
5745
5746 found_reverse_match = 0;
5747 addr_prefix_disp = -1;
5748
5749 /* Prepare for mnemonic suffix check. */
5750 memset (&suffix_check, 0, sizeof (suffix_check));
5751 switch (mnem_suffix)
5752 {
5753 case BYTE_MNEM_SUFFIX:
5754 suffix_check.no_bsuf = 1;
5755 break;
5756 case WORD_MNEM_SUFFIX:
5757 suffix_check.no_wsuf = 1;
5758 break;
5759 case SHORT_MNEM_SUFFIX:
5760 suffix_check.no_ssuf = 1;
5761 break;
5762 case LONG_MNEM_SUFFIX:
5763 suffix_check.no_lsuf = 1;
5764 break;
5765 case QWORD_MNEM_SUFFIX:
5766 suffix_check.no_qsuf = 1;
5767 break;
5768 default:
5769 /* NB: In Intel syntax, normally we can check for memory operand
5770 size when there is no mnemonic suffix. But jmp and call have
5771 2 different encodings with Dword memory operand size, one with
5772 No_ldSuf and the other without. i.suffix is set to
5773 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
5774 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5775 suffix_check.no_ldsuf = 1;
5776 }
5777
5778 /* Must have right number of operands. */
5779 i.error = number_of_operands_mismatch;
5780
5781 for (t = current_templates->start; t < current_templates->end; t++)
5782 {
5783 addr_prefix_disp = -1;
5784 found_reverse_match = 0;
5785
5786 if (i.operands != t->operands)
5787 continue;
5788
5789 /* Check processor support. */
5790 i.error = unsupported;
5791 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
5792 continue;
5793
5794 /* Check AT&T mnemonic. */
5795 i.error = unsupported_with_intel_mnemonic;
5796 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5797 continue;
5798
5799 /* Check AT&T/Intel syntax. */
5800 i.error = unsupported_syntax;
5801 if ((intel_syntax && t->opcode_modifier.attsyntax)
5802 || (!intel_syntax && t->opcode_modifier.intelsyntax))
5803 continue;
5804
5805 /* Check Intel64/AMD64 ISA. */
5806 switch (isa64)
5807 {
5808 default:
5809 /* Default: Don't accept Intel64. */
5810 if (t->opcode_modifier.isa64 == INTEL64)
5811 continue;
5812 break;
5813 case amd64:
5814 /* -mamd64: Don't accept Intel64 and Intel64 only. */
5815 if (t->opcode_modifier.isa64 >= INTEL64)
5816 continue;
5817 break;
5818 case intel64:
5819 /* -mintel64: Don't accept AMD64. */
5820 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
5821 continue;
5822 break;
5823 }
5824
5825 /* Check the suffix. */
5826 i.error = invalid_instruction_suffix;
5827 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5828 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5829 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5830 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5831 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5832 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5833 continue;
5834
5835 size_match = operand_size_match (t);
5836 if (!size_match)
5837 continue;
5838
5839 /* This is intentionally not
5840
5841 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
5842
5843 as the case of a missing * on the operand is accepted (perhaps with
5844 a warning, issued further down). */
5845 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5846 {
5847 i.error = operand_type_mismatch;
5848 continue;
5849 }
5850
5851 for (j = 0; j < MAX_OPERANDS; j++)
5852 operand_types[j] = t->operand_types[j];
5853
5854 /* In general, don't allow 64-bit operands in 32-bit mode. */
5855 if (i.suffix == QWORD_MNEM_SUFFIX
5856 && flag_code != CODE_64BIT
5857 && (intel_syntax
5858 ? (!t->opcode_modifier.ignoresize
5859 && !t->opcode_modifier.broadcast
5860 && !intel_float_operand (t->name))
5861 : intel_float_operand (t->name) != 2)
5862 && ((operand_types[0].bitfield.class != RegMMX
5863 && operand_types[0].bitfield.class != RegSIMD)
5864 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5865 && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5866 && (t->base_opcode != 0x0fc7
5867 || t->extension_opcode != 1 /* cmpxchg8b */))
5868 continue;
5869
5870 /* In general, don't allow 32-bit operands on pre-386. */
5871 else if (i.suffix == LONG_MNEM_SUFFIX
5872 && !cpu_arch_flags.bitfield.cpui386
5873 && (intel_syntax
5874 ? (!t->opcode_modifier.ignoresize
5875 && !intel_float_operand (t->name))
5876 : intel_float_operand (t->name) != 2)
5877 && ((operand_types[0].bitfield.class != RegMMX
5878 && operand_types[0].bitfield.class != RegSIMD)
5879 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5880 && operand_types[t->operands > 1].bitfield.class
5881 != RegSIMD)))
5882 continue;
5883
5884 /* Do not verify operands when there are none. */
5885 else
5886 {
5887 if (!t->operands)
5888 /* We've found a match; break out of loop. */
5889 break;
5890 }
5891
5892 if (!t->opcode_modifier.jump
5893 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
5894 {
5895 /* There should be only one Disp operand. */
5896 for (j = 0; j < MAX_OPERANDS; j++)
5897 if (operand_type_check (operand_types[j], disp))
5898 break;
5899 if (j < MAX_OPERANDS)
5900 {
5901 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
5902
5903 addr_prefix_disp = j;
5904
5905 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
5906 operand into Disp32/Disp32/Disp16/Disp32 operand. */
5907 switch (flag_code)
5908 {
5909 case CODE_16BIT:
5910 override = !override;
5911 /* Fall through. */
5912 case CODE_32BIT:
5913 if (operand_types[j].bitfield.disp32
5914 && operand_types[j].bitfield.disp16)
5915 {
5916 operand_types[j].bitfield.disp16 = override;
5917 operand_types[j].bitfield.disp32 = !override;
5918 }
5919 operand_types[j].bitfield.disp32s = 0;
5920 operand_types[j].bitfield.disp64 = 0;
5921 break;
5922
5923 case CODE_64BIT:
5924 if (operand_types[j].bitfield.disp32s
5925 || operand_types[j].bitfield.disp64)
5926 {
5927 operand_types[j].bitfield.disp64 &= !override;
5928 operand_types[j].bitfield.disp32s &= !override;
5929 operand_types[j].bitfield.disp32 = override;
5930 }
5931 operand_types[j].bitfield.disp16 = 0;
5932 break;
5933 }
5934 }
5935 }
5936
5937 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5938 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5939 continue;
5940
5941 /* We check register size if needed. */
5942 if (t->opcode_modifier.checkregsize)
5943 {
5944 check_register = (1 << t->operands) - 1;
5945 if (i.broadcast)
5946 check_register &= ~(1 << i.broadcast->operand);
5947 }
5948 else
5949 check_register = 0;
5950
5951 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5952 switch (t->operands)
5953 {
5954 case 1:
5955 if (!operand_type_match (overlap0, i.types[0]))
5956 continue;
5957 break;
5958 case 2:
5959 /* xchg %eax, %eax is a special case. It is an alias for nop
5960 only in 32bit mode and we can use opcode 0x90. In 64bit
5961 mode, we can't use 0x90 for xchg %eax, %eax since it should
5962 zero-extend %eax to %rax. */
5963 if (flag_code == CODE_64BIT
5964 && t->base_opcode == 0x90
5965 && i.types[0].bitfield.instance == Accum
5966 && i.types[0].bitfield.dword
5967 && i.types[1].bitfield.instance == Accum
5968 && i.types[1].bitfield.dword)
5969 continue;
5970 /* xrelease mov %eax, <disp> is another special case. It must not
5971 match the accumulator-only encoding of mov. */
5972 if (flag_code != CODE_64BIT
5973 && i.hle_prefix
5974 && t->base_opcode == 0xa0
5975 && i.types[0].bitfield.instance == Accum
5976 && (i.flags[1] & Operand_Mem))
5977 continue;
5978 /* Fall through. */
5979
5980 case 3:
5981 if (!(size_match & MATCH_STRAIGHT))
5982 goto check_reverse;
5983 /* Reverse direction of operands if swapping is possible in the first
5984 place (operands need to be symmetric) and
5985 - the load form is requested, and the template is a store form,
5986 - the store form is requested, and the template is a load form,
5987 - the non-default (swapped) form is requested. */
5988 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5989 if (t->opcode_modifier.d && i.reg_operands == i.operands
5990 && !operand_type_all_zero (&overlap1))
5991 switch (i.dir_encoding)
5992 {
5993 case dir_encoding_load:
5994 if (operand_type_check (operand_types[i.operands - 1], anymem)
5995 || t->opcode_modifier.regmem)
5996 goto check_reverse;
5997 break;
5998
5999 case dir_encoding_store:
6000 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6001 && !t->opcode_modifier.regmem)
6002 goto check_reverse;
6003 break;
6004
6005 case dir_encoding_swap:
6006 goto check_reverse;
6007
6008 case dir_encoding_default:
6009 break;
6010 }
6011 /* If we want store form, we skip the current load. */
6012 if ((i.dir_encoding == dir_encoding_store
6013 || i.dir_encoding == dir_encoding_swap)
6014 && i.mem_operands == 0
6015 && t->opcode_modifier.load)
6016 continue;
6017 /* Fall through. */
6018 case 4:
6019 case 5:
6020 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6021 if (!operand_type_match (overlap0, i.types[0])
6022 || !operand_type_match (overlap1, i.types[1])
6023 || ((check_register & 3) == 3
6024 && !operand_type_register_match (i.types[0],
6025 operand_types[0],
6026 i.types[1],
6027 operand_types[1])))
6028 {
6029 /* Check if other direction is valid ... */
6030 if (!t->opcode_modifier.d)
6031 continue;
6032
6033 check_reverse:
6034 if (!(size_match & MATCH_REVERSE))
6035 continue;
6036 /* Try reversing direction of operands. */
6037 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6038 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6039 if (!operand_type_match (overlap0, i.types[0])
6040 || !operand_type_match (overlap1, i.types[i.operands - 1])
6041 || (check_register
6042 && !operand_type_register_match (i.types[0],
6043 operand_types[i.operands - 1],
6044 i.types[i.operands - 1],
6045 operand_types[0])))
6046 {
6047 /* Does not match either direction. */
6048 continue;
6049 }
6050 /* found_reverse_match holds which of D or FloatR
6051 we've found. */
6052 if (!t->opcode_modifier.d)
6053 found_reverse_match = 0;
6054 else if (operand_types[0].bitfield.tbyte)
6055 found_reverse_match = Opcode_FloatD;
6056 else if (operand_types[0].bitfield.xmmword
6057 || operand_types[i.operands - 1].bitfield.xmmword
6058 || operand_types[0].bitfield.class == RegMMX
6059 || operand_types[i.operands - 1].bitfield.class == RegMMX
6060 || is_any_vex_encoding(t))
6061 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6062 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6063 else
6064 found_reverse_match = Opcode_D;
6065 if (t->opcode_modifier.floatr)
6066 found_reverse_match |= Opcode_FloatR;
6067 }
6068 else
6069 {
6070 /* Found a forward 2 operand match here. */
6071 switch (t->operands)
6072 {
6073 case 5:
6074 overlap4 = operand_type_and (i.types[4],
6075 operand_types[4]);
6076 /* Fall through. */
6077 case 4:
6078 overlap3 = operand_type_and (i.types[3],
6079 operand_types[3]);
6080 /* Fall through. */
6081 case 3:
6082 overlap2 = operand_type_and (i.types[2],
6083 operand_types[2]);
6084 break;
6085 }
6086
6087 switch (t->operands)
6088 {
6089 case 5:
6090 if (!operand_type_match (overlap4, i.types[4])
6091 || !operand_type_register_match (i.types[3],
6092 operand_types[3],
6093 i.types[4],
6094 operand_types[4]))
6095 continue;
6096 /* Fall through. */
6097 case 4:
6098 if (!operand_type_match (overlap3, i.types[3])
6099 || ((check_register & 0xa) == 0xa
6100 && !operand_type_register_match (i.types[1],
6101 operand_types[1],
6102 i.types[3],
6103 operand_types[3]))
6104 || ((check_register & 0xc) == 0xc
6105 && !operand_type_register_match (i.types[2],
6106 operand_types[2],
6107 i.types[3],
6108 operand_types[3])))
6109 continue;
6110 /* Fall through. */
6111 case 3:
6112 /* Here we make use of the fact that there are no
6113 reverse match 3 operand instructions. */
6114 if (!operand_type_match (overlap2, i.types[2])
6115 || ((check_register & 5) == 5
6116 && !operand_type_register_match (i.types[0],
6117 operand_types[0],
6118 i.types[2],
6119 operand_types[2]))
6120 || ((check_register & 6) == 6
6121 && !operand_type_register_match (i.types[1],
6122 operand_types[1],
6123 i.types[2],
6124 operand_types[2])))
6125 continue;
6126 break;
6127 }
6128 }
6129 /* Found either forward/reverse 2, 3 or 4 operand match here:
6130 slip through to break. */
6131 }
6132
6133 /* Check if vector and VEX operands are valid. */
6134 if (check_VecOperands (t) || VEX_check_operands (t))
6135 {
6136 specific_error = i.error;
6137 continue;
6138 }
6139
6140 /* We've found a match; break out of loop. */
6141 break;
6142 }
6143
6144 if (t == current_templates->end)
6145 {
6146 /* We found no match. */
6147 const char *err_msg;
6148 switch (specific_error ? specific_error : i.error)
6149 {
6150 default:
6151 abort ();
6152 case operand_size_mismatch:
6153 err_msg = _("operand size mismatch");
6154 break;
6155 case operand_type_mismatch:
6156 err_msg = _("operand type mismatch");
6157 break;
6158 case register_type_mismatch:
6159 err_msg = _("register type mismatch");
6160 break;
6161 case number_of_operands_mismatch:
6162 err_msg = _("number of operands mismatch");
6163 break;
6164 case invalid_instruction_suffix:
6165 err_msg = _("invalid instruction suffix");
6166 break;
6167 case bad_imm4:
6168 err_msg = _("constant doesn't fit in 4 bits");
6169 break;
6170 case unsupported_with_intel_mnemonic:
6171 err_msg = _("unsupported with Intel mnemonic");
6172 break;
6173 case unsupported_syntax:
6174 err_msg = _("unsupported syntax");
6175 break;
6176 case unsupported:
6177 as_bad (_("unsupported instruction `%s'"),
6178 current_templates->start->name);
6179 return NULL;
6180 case invalid_vsib_address:
6181 err_msg = _("invalid VSIB address");
6182 break;
6183 case invalid_vector_register_set:
6184 err_msg = _("mask, index, and destination registers must be distinct");
6185 break;
6186 case unsupported_vector_index_register:
6187 err_msg = _("unsupported vector index register");
6188 break;
6189 case unsupported_broadcast:
6190 err_msg = _("unsupported broadcast");
6191 break;
6192 case broadcast_needed:
6193 err_msg = _("broadcast is needed for operand of such type");
6194 break;
6195 case unsupported_masking:
6196 err_msg = _("unsupported masking");
6197 break;
6198 case mask_not_on_destination:
6199 err_msg = _("mask not on destination operand");
6200 break;
6201 case no_default_mask:
6202 err_msg = _("default mask isn't allowed");
6203 break;
6204 case unsupported_rc_sae:
6205 err_msg = _("unsupported static rounding/sae");
6206 break;
6207 case rc_sae_operand_not_last_imm:
6208 if (intel_syntax)
6209 err_msg = _("RC/SAE operand must precede immediate operands");
6210 else
6211 err_msg = _("RC/SAE operand must follow immediate operands");
6212 break;
6213 case invalid_register_operand:
6214 err_msg = _("invalid register operand");
6215 break;
6216 }
6217 as_bad (_("%s for `%s'"), err_msg,
6218 current_templates->start->name);
6219 return NULL;
6220 }
6221
6222 if (!quiet_warnings)
6223 {
6224 if (!intel_syntax
6225 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6226 as_warn (_("indirect %s without `*'"), t->name);
6227
6228 if (t->opcode_modifier.isprefix
6229 && t->opcode_modifier.ignoresize)
6230 {
6231 /* Warn them that a data or address size prefix doesn't
6232 affect assembly of the next line of code. */
6233 as_warn (_("stand-alone `%s' prefix"), t->name);
6234 }
6235 }
6236
6237 /* Copy the template we found. */
6238 i.tm = *t;
6239
6240 if (addr_prefix_disp != -1)
6241 i.tm.operand_types[addr_prefix_disp]
6242 = operand_types[addr_prefix_disp];
6243
6244 if (found_reverse_match)
6245 {
6246 /* If we found a reverse match we must alter the opcode direction
6247 bit and clear/flip the regmem modifier one. found_reverse_match
6248 holds bits to change (different for int & float insns). */
6249
6250 i.tm.base_opcode ^= found_reverse_match;
6251
6252 i.tm.operand_types[0] = operand_types[i.operands - 1];
6253 i.tm.operand_types[i.operands - 1] = operand_types[0];
6254
6255 /* Certain SIMD insns have their load forms specified in the opcode
6256 table, and hence we need to _set_ RegMem instead of clearing it.
6257 We need to avoid setting the bit though on insns like KMOVW. */
6258 i.tm.opcode_modifier.regmem
6259 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6260 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6261 && !i.tm.opcode_modifier.regmem;
6262 }
6263
6264 return t;
6265 }
6266
6267 static int
6268 check_string (void)
6269 {
6270 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6271 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6272
6273 if (i.seg[op] != NULL && i.seg[op] != &es)
6274 {
6275 as_bad (_("`%s' operand %u must use `%ses' segment"),
6276 i.tm.name,
6277 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6278 register_prefix);
6279 return 0;
6280 }
6281
6282 /* There's only ever one segment override allowed per instruction.
6283 This instruction possibly has a legal segment override on the
6284 second operand, so copy the segment to where non-string
6285 instructions store it, allowing common code. */
6286 i.seg[op] = i.seg[1];
6287
6288 return 1;
6289 }
6290
6291 static int
6292 process_suffix (void)
6293 {
6294 /* If matched instruction specifies an explicit instruction mnemonic
6295 suffix, use it. */
6296 if (i.tm.opcode_modifier.size == SIZE16)
6297 i.suffix = WORD_MNEM_SUFFIX;
6298 else if (i.tm.opcode_modifier.size == SIZE32)
6299 i.suffix = LONG_MNEM_SUFFIX;
6300 else if (i.tm.opcode_modifier.size == SIZE64)
6301 i.suffix = QWORD_MNEM_SUFFIX;
6302 else if (i.reg_operands
6303 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6304 && !i.tm.opcode_modifier.addrprefixopreg)
6305 {
6306 unsigned int numop = i.operands;
6307
6308 /* movsx/movzx want only their source operand considered here, for the
6309 ambiguity checking below. The suffix will be replaced afterwards
6310 to represent the destination (register). */
6311 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6312 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6313 --i.operands;
6314
6315 /* If there's no instruction mnemonic suffix we try to invent one
6316 based on GPR operands. */
6317 if (!i.suffix)
6318 {
6319 /* We take i.suffix from the last register operand specified,
6320 Destination register type is more significant than source
6321 register type. crc32 in SSE4.2 prefers source register
6322 type. */
6323 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6324
6325 while (op--)
6326 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6327 || i.tm.operand_types[op].bitfield.instance == Accum)
6328 {
6329 if (i.types[op].bitfield.class != Reg)
6330 continue;
6331 if (i.types[op].bitfield.byte)
6332 i.suffix = BYTE_MNEM_SUFFIX;
6333 else if (i.types[op].bitfield.word)
6334 i.suffix = WORD_MNEM_SUFFIX;
6335 else if (i.types[op].bitfield.dword)
6336 i.suffix = LONG_MNEM_SUFFIX;
6337 else if (i.types[op].bitfield.qword)
6338 i.suffix = QWORD_MNEM_SUFFIX;
6339 else
6340 continue;
6341 break;
6342 }
6343
6344 /* As an exception, movsx/movzx silently default to a byte source
6345 in AT&T mode. */
6346 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6347 && !i.suffix && !intel_syntax)
6348 i.suffix = BYTE_MNEM_SUFFIX;
6349 }
6350 else if (i.suffix == BYTE_MNEM_SUFFIX)
6351 {
6352 if (intel_syntax
6353 && i.tm.opcode_modifier.ignoresize
6354 && i.tm.opcode_modifier.no_bsuf)
6355 i.suffix = 0;
6356 else if (!check_byte_reg ())
6357 return 0;
6358 }
6359 else if (i.suffix == LONG_MNEM_SUFFIX)
6360 {
6361 if (intel_syntax
6362 && i.tm.opcode_modifier.ignoresize
6363 && i.tm.opcode_modifier.no_lsuf
6364 && !i.tm.opcode_modifier.todword
6365 && !i.tm.opcode_modifier.toqword)
6366 i.suffix = 0;
6367 else if (!check_long_reg ())
6368 return 0;
6369 }
6370 else if (i.suffix == QWORD_MNEM_SUFFIX)
6371 {
6372 if (intel_syntax
6373 && i.tm.opcode_modifier.ignoresize
6374 && i.tm.opcode_modifier.no_qsuf
6375 && !i.tm.opcode_modifier.todword
6376 && !i.tm.opcode_modifier.toqword)
6377 i.suffix = 0;
6378 else if (!check_qword_reg ())
6379 return 0;
6380 }
6381 else if (i.suffix == WORD_MNEM_SUFFIX)
6382 {
6383 if (intel_syntax
6384 && i.tm.opcode_modifier.ignoresize
6385 && i.tm.opcode_modifier.no_wsuf)
6386 i.suffix = 0;
6387 else if (!check_word_reg ())
6388 return 0;
6389 }
6390 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6391 /* Do nothing if the instruction is going to ignore the prefix. */
6392 ;
6393 else
6394 abort ();
6395
6396 /* Undo the movsx/movzx change done above. */
6397 i.operands = numop;
6398 }
6399 else if (i.tm.opcode_modifier.defaultsize && !i.suffix)
6400 {
6401 i.suffix = stackop_size;
6402 if (stackop_size == LONG_MNEM_SUFFIX)
6403 {
6404 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6405 .code16gcc directive to support 16-bit mode with
6406 32-bit address. For IRET without a suffix, generate
6407 16-bit IRET (opcode 0xcf) to return from an interrupt
6408 handler. */
6409 if (i.tm.base_opcode == 0xcf)
6410 {
6411 i.suffix = WORD_MNEM_SUFFIX;
6412 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6413 }
6414 /* Warn about changed behavior for segment register push/pop. */
6415 else if ((i.tm.base_opcode | 1) == 0x07)
6416 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6417 i.tm.name);
6418 }
6419 }
6420 else if (!i.suffix
6421 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6422 || i.tm.opcode_modifier.jump == JUMP_BYTE
6423 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6424 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6425 && i.tm.extension_opcode <= 3)))
6426 {
6427 switch (flag_code)
6428 {
6429 case CODE_64BIT:
6430 if (!i.tm.opcode_modifier.no_qsuf)
6431 {
6432 i.suffix = QWORD_MNEM_SUFFIX;
6433 break;
6434 }
6435 /* Fall through. */
6436 case CODE_32BIT:
6437 if (!i.tm.opcode_modifier.no_lsuf)
6438 i.suffix = LONG_MNEM_SUFFIX;
6439 break;
6440 case CODE_16BIT:
6441 if (!i.tm.opcode_modifier.no_wsuf)
6442 i.suffix = WORD_MNEM_SUFFIX;
6443 break;
6444 }
6445 }
6446
6447 if (!i.suffix
6448 && (!i.tm.opcode_modifier.defaultsize
6449 /* Also cover lret/retf/iret in 64-bit mode. */
6450 || (flag_code == CODE_64BIT
6451 && !i.tm.opcode_modifier.no_lsuf
6452 && !i.tm.opcode_modifier.no_qsuf))
6453 && !i.tm.opcode_modifier.ignoresize
6454 /* Accept FLDENV et al without suffix. */
6455 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6456 {
6457 unsigned int suffixes, evex = 0;
6458
6459 suffixes = !i.tm.opcode_modifier.no_bsuf;
6460 if (!i.tm.opcode_modifier.no_wsuf)
6461 suffixes |= 1 << 1;
6462 if (!i.tm.opcode_modifier.no_lsuf)
6463 suffixes |= 1 << 2;
6464 if (!i.tm.opcode_modifier.no_ldsuf)
6465 suffixes |= 1 << 3;
6466 if (!i.tm.opcode_modifier.no_ssuf)
6467 suffixes |= 1 << 4;
6468 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6469 suffixes |= 1 << 5;
6470
6471 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6472 also suitable for AT&T syntax mode, it was requested that this be
6473 restricted to just Intel syntax. */
6474 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6475 {
6476 unsigned int op;
6477
6478 for (op = 0; op < i.tm.operands; ++op)
6479 {
6480 if (is_evex_encoding (&i.tm)
6481 && !cpu_arch_flags.bitfield.cpuavx512vl)
6482 {
6483 if (i.tm.operand_types[op].bitfield.ymmword)
6484 i.tm.operand_types[op].bitfield.xmmword = 0;
6485 if (i.tm.operand_types[op].bitfield.zmmword)
6486 i.tm.operand_types[op].bitfield.ymmword = 0;
6487 if (!i.tm.opcode_modifier.evex
6488 || i.tm.opcode_modifier.evex == EVEXDYN)
6489 i.tm.opcode_modifier.evex = EVEX512;
6490 }
6491
6492 if (i.tm.operand_types[op].bitfield.xmmword
6493 + i.tm.operand_types[op].bitfield.ymmword
6494 + i.tm.operand_types[op].bitfield.zmmword < 2)
6495 continue;
6496
6497 /* Any properly sized operand disambiguates the insn. */
6498 if (i.types[op].bitfield.xmmword
6499 || i.types[op].bitfield.ymmword
6500 || i.types[op].bitfield.zmmword)
6501 {
6502 suffixes &= ~(7 << 6);
6503 evex = 0;
6504 break;
6505 }
6506
6507 if ((i.flags[op] & Operand_Mem)
6508 && i.tm.operand_types[op].bitfield.unspecified)
6509 {
6510 if (i.tm.operand_types[op].bitfield.xmmword)
6511 suffixes |= 1 << 6;
6512 if (i.tm.operand_types[op].bitfield.ymmword)
6513 suffixes |= 1 << 7;
6514 if (i.tm.operand_types[op].bitfield.zmmword)
6515 suffixes |= 1 << 8;
6516 if (is_evex_encoding (&i.tm))
6517 evex = EVEX512;
6518 }
6519 }
6520 }
6521
6522 /* Are multiple suffixes / operand sizes allowed? */
6523 if (suffixes & (suffixes - 1))
6524 {
6525 if (intel_syntax
6526 && (!i.tm.opcode_modifier.defaultsize
6527 || operand_check == check_error))
6528 {
6529 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6530 return 0;
6531 }
6532 if (operand_check == check_error)
6533 {
6534 as_bad (_("no instruction mnemonic suffix given and "
6535 "no register operands; can't size `%s'"), i.tm.name);
6536 return 0;
6537 }
6538 if (operand_check == check_warning)
6539 as_warn (_("%s; using default for `%s'"),
6540 intel_syntax
6541 ? _("ambiguous operand size")
6542 : _("no instruction mnemonic suffix given and "
6543 "no register operands"),
6544 i.tm.name);
6545
6546 if (i.tm.opcode_modifier.floatmf)
6547 i.suffix = SHORT_MNEM_SUFFIX;
6548 else if ((i.tm.base_opcode | 8) == 0xfbe
6549 || (i.tm.base_opcode == 0x63
6550 && i.tm.cpu_flags.bitfield.cpu64))
6551 /* handled below */;
6552 else if (evex)
6553 i.tm.opcode_modifier.evex = evex;
6554 else if (flag_code == CODE_16BIT)
6555 i.suffix = WORD_MNEM_SUFFIX;
6556 else if (!i.tm.opcode_modifier.no_lsuf)
6557 i.suffix = LONG_MNEM_SUFFIX;
6558 else
6559 i.suffix = QWORD_MNEM_SUFFIX;
6560 }
6561 }
6562
6563 if ((i.tm.base_opcode | 8) == 0xfbe
6564 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6565 {
6566 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6567 In AT&T syntax, if there is no suffix (warned about above), the default
6568 will be byte extension. */
6569 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6570 i.tm.base_opcode |= 1;
6571
6572 /* For further processing, the suffix should represent the destination
6573 (register). This is already the case when one was used with
6574 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6575 no suffix to begin with. */
6576 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
6577 {
6578 if (i.types[1].bitfield.word)
6579 i.suffix = WORD_MNEM_SUFFIX;
6580 else if (i.types[1].bitfield.qword)
6581 i.suffix = QWORD_MNEM_SUFFIX;
6582 else
6583 i.suffix = LONG_MNEM_SUFFIX;
6584
6585 i.tm.opcode_modifier.w = 0;
6586 }
6587 }
6588
6589 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
6590 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
6591 != (i.tm.operand_types[1].bitfield.class == Reg);
6592
6593 /* Change the opcode based on the operand size given by i.suffix. */
6594 switch (i.suffix)
6595 {
6596 /* Size floating point instruction. */
6597 case LONG_MNEM_SUFFIX:
6598 if (i.tm.opcode_modifier.floatmf)
6599 {
6600 i.tm.base_opcode ^= 4;
6601 break;
6602 }
6603 /* fall through */
6604 case WORD_MNEM_SUFFIX:
6605 case QWORD_MNEM_SUFFIX:
6606 /* It's not a byte, select word/dword operation. */
6607 if (i.tm.opcode_modifier.w)
6608 {
6609 if (i.short_form)
6610 i.tm.base_opcode |= 8;
6611 else
6612 i.tm.base_opcode |= 1;
6613 }
6614 /* fall through */
6615 case SHORT_MNEM_SUFFIX:
6616 /* Now select between word & dword operations via the operand
6617 size prefix, except for instructions that will ignore this
6618 prefix anyway. */
6619 if (i.suffix != QWORD_MNEM_SUFFIX
6620 && !i.tm.opcode_modifier.ignoresize
6621 && !i.tm.opcode_modifier.floatmf
6622 && !is_any_vex_encoding (&i.tm)
6623 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6624 || (flag_code == CODE_64BIT
6625 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
6626 {
6627 unsigned int prefix = DATA_PREFIX_OPCODE;
6628
6629 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
6630 prefix = ADDR_PREFIX_OPCODE;
6631
6632 if (!add_prefix (prefix))
6633 return 0;
6634 }
6635
6636 /* Set mode64 for an operand. */
6637 if (i.suffix == QWORD_MNEM_SUFFIX
6638 && flag_code == CODE_64BIT
6639 && !i.tm.opcode_modifier.norex64
6640 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6641 need rex64. */
6642 && ! (i.operands == 2
6643 && i.tm.base_opcode == 0x90
6644 && i.tm.extension_opcode == None
6645 && i.types[0].bitfield.instance == Accum
6646 && i.types[0].bitfield.qword
6647 && i.types[1].bitfield.instance == Accum
6648 && i.types[1].bitfield.qword))
6649 i.rex |= REX_W;
6650
6651 break;
6652 }
6653
6654 if (i.tm.opcode_modifier.addrprefixopreg)
6655 {
6656 gas_assert (!i.suffix);
6657 gas_assert (i.reg_operands);
6658
6659 if (i.tm.operand_types[0].bitfield.instance == Accum
6660 || i.operands == 1)
6661 {
6662 /* The address size override prefix changes the size of the
6663 first operand. */
6664 if (flag_code == CODE_64BIT
6665 && i.op[0].regs->reg_type.bitfield.word)
6666 {
6667 as_bad (_("16-bit addressing unavailable for `%s'"),
6668 i.tm.name);
6669 return 0;
6670 }
6671
6672 if ((flag_code == CODE_32BIT
6673 ? i.op[0].regs->reg_type.bitfield.word
6674 : i.op[0].regs->reg_type.bitfield.dword)
6675 && !add_prefix (ADDR_PREFIX_OPCODE))
6676 return 0;
6677 }
6678 else
6679 {
6680 /* Check invalid register operand when the address size override
6681 prefix changes the size of register operands. */
6682 unsigned int op;
6683 enum { need_word, need_dword, need_qword } need;
6684
6685 if (flag_code == CODE_32BIT)
6686 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6687 else if (i.prefix[ADDR_PREFIX])
6688 need = need_dword;
6689 else
6690 need = flag_code == CODE_64BIT ? need_qword : need_word;
6691
6692 for (op = 0; op < i.operands; op++)
6693 {
6694 if (i.types[op].bitfield.class != Reg)
6695 continue;
6696
6697 switch (need)
6698 {
6699 case need_word:
6700 if (i.op[op].regs->reg_type.bitfield.word)
6701 continue;
6702 break;
6703 case need_dword:
6704 if (i.op[op].regs->reg_type.bitfield.dword)
6705 continue;
6706 break;
6707 case need_qword:
6708 if (i.op[op].regs->reg_type.bitfield.qword)
6709 continue;
6710 break;
6711 }
6712
6713 as_bad (_("invalid register operand size for `%s'"),
6714 i.tm.name);
6715 return 0;
6716 }
6717 }
6718 }
6719
6720 return 1;
6721 }
6722
6723 static int
6724 check_byte_reg (void)
6725 {
6726 int op;
6727
6728 for (op = i.operands; --op >= 0;)
6729 {
6730 /* Skip non-register operands. */
6731 if (i.types[op].bitfield.class != Reg)
6732 continue;
6733
6734 /* If this is an eight bit register, it's OK. If it's the 16 or
6735 32 bit version of an eight bit register, we will just use the
6736 low portion, and that's OK too. */
6737 if (i.types[op].bitfield.byte)
6738 continue;
6739
6740 /* I/O port address operands are OK too. */
6741 if (i.tm.operand_types[op].bitfield.instance == RegD
6742 && i.tm.operand_types[op].bitfield.word)
6743 continue;
6744
6745 /* crc32 only wants its source operand checked here. */
6746 if (i.tm.base_opcode == 0xf20f38f0 && op)
6747 continue;
6748
6749 /* Any other register is bad. */
6750 if (i.types[op].bitfield.class == Reg
6751 || i.types[op].bitfield.class == RegMMX
6752 || i.types[op].bitfield.class == RegSIMD
6753 || i.types[op].bitfield.class == SReg
6754 || i.types[op].bitfield.class == RegCR
6755 || i.types[op].bitfield.class == RegDR
6756 || i.types[op].bitfield.class == RegTR)
6757 {
6758 as_bad (_("`%s%s' not allowed with `%s%c'"),
6759 register_prefix,
6760 i.op[op].regs->reg_name,
6761 i.tm.name,
6762 i.suffix);
6763 return 0;
6764 }
6765 }
6766 return 1;
6767 }
6768
6769 static int
6770 check_long_reg (void)
6771 {
6772 int op;
6773
6774 for (op = i.operands; --op >= 0;)
6775 /* Skip non-register operands. */
6776 if (i.types[op].bitfield.class != Reg)
6777 continue;
6778 /* Reject eight bit registers, except where the template requires
6779 them. (eg. movzb) */
6780 else if (i.types[op].bitfield.byte
6781 && (i.tm.operand_types[op].bitfield.class == Reg
6782 || i.tm.operand_types[op].bitfield.instance == Accum)
6783 && (i.tm.operand_types[op].bitfield.word
6784 || i.tm.operand_types[op].bitfield.dword))
6785 {
6786 as_bad (_("`%s%s' not allowed with `%s%c'"),
6787 register_prefix,
6788 i.op[op].regs->reg_name,
6789 i.tm.name,
6790 i.suffix);
6791 return 0;
6792 }
6793 /* Error if the e prefix on a general reg is missing. */
6794 else if (i.types[op].bitfield.word
6795 && (i.tm.operand_types[op].bitfield.class == Reg
6796 || i.tm.operand_types[op].bitfield.instance == Accum)
6797 && i.tm.operand_types[op].bitfield.dword)
6798 {
6799 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6800 register_prefix, i.op[op].regs->reg_name,
6801 i.suffix);
6802 return 0;
6803 }
6804 /* Warn if the r prefix on a general reg is present. */
6805 else if (i.types[op].bitfield.qword
6806 && (i.tm.operand_types[op].bitfield.class == Reg
6807 || i.tm.operand_types[op].bitfield.instance == Accum)
6808 && i.tm.operand_types[op].bitfield.dword)
6809 {
6810 if (intel_syntax
6811 && i.tm.opcode_modifier.toqword
6812 && i.types[0].bitfield.class != RegSIMD)
6813 {
6814 /* Convert to QWORD. We want REX byte. */
6815 i.suffix = QWORD_MNEM_SUFFIX;
6816 }
6817 else
6818 {
6819 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6820 register_prefix, i.op[op].regs->reg_name,
6821 i.suffix);
6822 return 0;
6823 }
6824 }
6825 return 1;
6826 }
6827
6828 static int
6829 check_qword_reg (void)
6830 {
6831 int op;
6832
6833 for (op = i.operands; --op >= 0; )
6834 /* Skip non-register operands. */
6835 if (i.types[op].bitfield.class != Reg)
6836 continue;
6837 /* Reject eight bit registers, except where the template requires
6838 them. (eg. movzb) */
6839 else if (i.types[op].bitfield.byte
6840 && (i.tm.operand_types[op].bitfield.class == Reg
6841 || i.tm.operand_types[op].bitfield.instance == Accum)
6842 && (i.tm.operand_types[op].bitfield.word
6843 || i.tm.operand_types[op].bitfield.dword))
6844 {
6845 as_bad (_("`%s%s' not allowed with `%s%c'"),
6846 register_prefix,
6847 i.op[op].regs->reg_name,
6848 i.tm.name,
6849 i.suffix);
6850 return 0;
6851 }
6852 /* Warn if the r prefix on a general reg is missing. */
6853 else if ((i.types[op].bitfield.word
6854 || i.types[op].bitfield.dword)
6855 && (i.tm.operand_types[op].bitfield.class == Reg
6856 || i.tm.operand_types[op].bitfield.instance == Accum)
6857 && i.tm.operand_types[op].bitfield.qword)
6858 {
6859 /* Prohibit these changes in the 64bit mode, since the
6860 lowering is more complicated. */
6861 if (intel_syntax
6862 && i.tm.opcode_modifier.todword
6863 && i.types[0].bitfield.class != RegSIMD)
6864 {
6865 /* Convert to DWORD. We don't want REX byte. */
6866 i.suffix = LONG_MNEM_SUFFIX;
6867 }
6868 else
6869 {
6870 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6871 register_prefix, i.op[op].regs->reg_name,
6872 i.suffix);
6873 return 0;
6874 }
6875 }
6876 return 1;
6877 }
6878
6879 static int
6880 check_word_reg (void)
6881 {
6882 int op;
6883 for (op = i.operands; --op >= 0;)
6884 /* Skip non-register operands. */
6885 if (i.types[op].bitfield.class != Reg)
6886 continue;
6887 /* Reject eight bit registers, except where the template requires
6888 them. (eg. movzb) */
6889 else if (i.types[op].bitfield.byte
6890 && (i.tm.operand_types[op].bitfield.class == Reg
6891 || i.tm.operand_types[op].bitfield.instance == Accum)
6892 && (i.tm.operand_types[op].bitfield.word
6893 || i.tm.operand_types[op].bitfield.dword))
6894 {
6895 as_bad (_("`%s%s' not allowed with `%s%c'"),
6896 register_prefix,
6897 i.op[op].regs->reg_name,
6898 i.tm.name,
6899 i.suffix);
6900 return 0;
6901 }
6902 /* Error if the e or r prefix on a general reg is present. */
6903 else if ((i.types[op].bitfield.dword
6904 || i.types[op].bitfield.qword)
6905 && (i.tm.operand_types[op].bitfield.class == Reg
6906 || i.tm.operand_types[op].bitfield.instance == Accum)
6907 && i.tm.operand_types[op].bitfield.word)
6908 {
6909 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6910 register_prefix, i.op[op].regs->reg_name,
6911 i.suffix);
6912 return 0;
6913 }
6914 return 1;
6915 }
6916
6917 static int
6918 update_imm (unsigned int j)
6919 {
6920 i386_operand_type overlap = i.types[j];
6921 if ((overlap.bitfield.imm8
6922 || overlap.bitfield.imm8s
6923 || overlap.bitfield.imm16
6924 || overlap.bitfield.imm32
6925 || overlap.bitfield.imm32s
6926 || overlap.bitfield.imm64)
6927 && !operand_type_equal (&overlap, &imm8)
6928 && !operand_type_equal (&overlap, &imm8s)
6929 && !operand_type_equal (&overlap, &imm16)
6930 && !operand_type_equal (&overlap, &imm32)
6931 && !operand_type_equal (&overlap, &imm32s)
6932 && !operand_type_equal (&overlap, &imm64))
6933 {
6934 if (i.suffix)
6935 {
6936 i386_operand_type temp;
6937
6938 operand_type_set (&temp, 0);
6939 if (i.suffix == BYTE_MNEM_SUFFIX)
6940 {
6941 temp.bitfield.imm8 = overlap.bitfield.imm8;
6942 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6943 }
6944 else if (i.suffix == WORD_MNEM_SUFFIX)
6945 temp.bitfield.imm16 = overlap.bitfield.imm16;
6946 else if (i.suffix == QWORD_MNEM_SUFFIX)
6947 {
6948 temp.bitfield.imm64 = overlap.bitfield.imm64;
6949 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6950 }
6951 else
6952 temp.bitfield.imm32 = overlap.bitfield.imm32;
6953 overlap = temp;
6954 }
6955 else if (operand_type_equal (&overlap, &imm16_32_32s)
6956 || operand_type_equal (&overlap, &imm16_32)
6957 || operand_type_equal (&overlap, &imm16_32s))
6958 {
6959 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6960 overlap = imm16;
6961 else
6962 overlap = imm32s;
6963 }
6964 if (!operand_type_equal (&overlap, &imm8)
6965 && !operand_type_equal (&overlap, &imm8s)
6966 && !operand_type_equal (&overlap, &imm16)
6967 && !operand_type_equal (&overlap, &imm32)
6968 && !operand_type_equal (&overlap, &imm32s)
6969 && !operand_type_equal (&overlap, &imm64))
6970 {
6971 as_bad (_("no instruction mnemonic suffix given; "
6972 "can't determine immediate size"));
6973 return 0;
6974 }
6975 }
6976 i.types[j] = overlap;
6977
6978 return 1;
6979 }
6980
6981 static int
6982 finalize_imm (void)
6983 {
6984 unsigned int j, n;
6985
6986 /* Update the first 2 immediate operands. */
6987 n = i.operands > 2 ? 2 : i.operands;
6988 if (n)
6989 {
6990 for (j = 0; j < n; j++)
6991 if (update_imm (j) == 0)
6992 return 0;
6993
6994 /* The 3rd operand can't be immediate operand. */
6995 gas_assert (operand_type_check (i.types[2], imm) == 0);
6996 }
6997
6998 return 1;
6999 }
7000
7001 static int
7002 process_operands (void)
7003 {
7004 /* Default segment register this instruction will use for memory
7005 accesses. 0 means unknown. This is only for optimizing out
7006 unnecessary segment overrides. */
7007 const seg_entry *default_seg = 0;
7008
7009 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7010 {
7011 unsigned int dupl = i.operands;
7012 unsigned int dest = dupl - 1;
7013 unsigned int j;
7014
7015 /* The destination must be an xmm register. */
7016 gas_assert (i.reg_operands
7017 && MAX_OPERANDS > dupl
7018 && operand_type_equal (&i.types[dest], &regxmm));
7019
7020 if (i.tm.operand_types[0].bitfield.instance == Accum
7021 && i.tm.operand_types[0].bitfield.xmmword)
7022 {
7023 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7024 {
7025 /* Keep xmm0 for instructions with VEX prefix and 3
7026 sources. */
7027 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7028 i.tm.operand_types[0].bitfield.class = RegSIMD;
7029 goto duplicate;
7030 }
7031 else
7032 {
7033 /* We remove the first xmm0 and keep the number of
7034 operands unchanged, which in fact duplicates the
7035 destination. */
7036 for (j = 1; j < i.operands; j++)
7037 {
7038 i.op[j - 1] = i.op[j];
7039 i.types[j - 1] = i.types[j];
7040 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7041 i.flags[j - 1] = i.flags[j];
7042 }
7043 }
7044 }
7045 else if (i.tm.opcode_modifier.implicit1stxmm0)
7046 {
7047 gas_assert ((MAX_OPERANDS - 1) > dupl
7048 && (i.tm.opcode_modifier.vexsources
7049 == VEX3SOURCES));
7050
7051 /* Add the implicit xmm0 for instructions with VEX prefix
7052 and 3 sources. */
7053 for (j = i.operands; j > 0; j--)
7054 {
7055 i.op[j] = i.op[j - 1];
7056 i.types[j] = i.types[j - 1];
7057 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7058 i.flags[j] = i.flags[j - 1];
7059 }
7060 i.op[0].regs
7061 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7062 i.types[0] = regxmm;
7063 i.tm.operand_types[0] = regxmm;
7064
7065 i.operands += 2;
7066 i.reg_operands += 2;
7067 i.tm.operands += 2;
7068
7069 dupl++;
7070 dest++;
7071 i.op[dupl] = i.op[dest];
7072 i.types[dupl] = i.types[dest];
7073 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7074 i.flags[dupl] = i.flags[dest];
7075 }
7076 else
7077 {
7078 duplicate:
7079 i.operands++;
7080 i.reg_operands++;
7081 i.tm.operands++;
7082
7083 i.op[dupl] = i.op[dest];
7084 i.types[dupl] = i.types[dest];
7085 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7086 i.flags[dupl] = i.flags[dest];
7087 }
7088
7089 if (i.tm.opcode_modifier.immext)
7090 process_immext ();
7091 }
7092 else if (i.tm.operand_types[0].bitfield.instance == Accum
7093 && i.tm.operand_types[0].bitfield.xmmword)
7094 {
7095 unsigned int j;
7096
7097 for (j = 1; j < i.operands; j++)
7098 {
7099 i.op[j - 1] = i.op[j];
7100 i.types[j - 1] = i.types[j];
7101
7102 /* We need to adjust fields in i.tm since they are used by
7103 build_modrm_byte. */
7104 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7105
7106 i.flags[j - 1] = i.flags[j];
7107 }
7108
7109 i.operands--;
7110 i.reg_operands--;
7111 i.tm.operands--;
7112 }
7113 else if (i.tm.opcode_modifier.implicitquadgroup)
7114 {
7115 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7116
7117 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7118 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7119 regnum = register_number (i.op[1].regs);
7120 first_reg_in_group = regnum & ~3;
7121 last_reg_in_group = first_reg_in_group + 3;
7122 if (regnum != first_reg_in_group)
7123 as_warn (_("source register `%s%s' implicitly denotes"
7124 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7125 register_prefix, i.op[1].regs->reg_name,
7126 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7127 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7128 i.tm.name);
7129 }
7130 else if (i.tm.opcode_modifier.regkludge)
7131 {
7132 /* The imul $imm, %reg instruction is converted into
7133 imul $imm, %reg, %reg, and the clr %reg instruction
7134 is converted into xor %reg, %reg. */
7135
7136 unsigned int first_reg_op;
7137
7138 if (operand_type_check (i.types[0], reg))
7139 first_reg_op = 0;
7140 else
7141 first_reg_op = 1;
7142 /* Pretend we saw the extra register operand. */
7143 gas_assert (i.reg_operands == 1
7144 && i.op[first_reg_op + 1].regs == 0);
7145 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7146 i.types[first_reg_op + 1] = i.types[first_reg_op];
7147 i.operands++;
7148 i.reg_operands++;
7149 }
7150
7151 if (i.tm.opcode_modifier.modrm)
7152 {
7153 /* The opcode is completed (modulo i.tm.extension_opcode which
7154 must be put into the modrm byte). Now, we make the modrm and
7155 index base bytes based on all the info we've collected. */
7156
7157 default_seg = build_modrm_byte ();
7158 }
7159 else if (i.types[0].bitfield.class == SReg)
7160 {
7161 if (flag_code != CODE_64BIT
7162 ? i.tm.base_opcode == POP_SEG_SHORT
7163 && i.op[0].regs->reg_num == 1
7164 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7165 && i.op[0].regs->reg_num < 4)
7166 {
7167 as_bad (_("you can't `%s %s%s'"),
7168 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7169 return 0;
7170 }
7171 if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7172 {
7173 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7174 i.tm.opcode_length = 2;
7175 }
7176 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7177 }
7178 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7179 {
7180 default_seg = &ds;
7181 }
7182 else if (i.tm.opcode_modifier.isstring)
7183 {
7184 /* For the string instructions that allow a segment override
7185 on one of their operands, the default segment is ds. */
7186 default_seg = &ds;
7187 }
7188 else if (i.short_form)
7189 {
7190 /* The register or float register operand is in operand
7191 0 or 1. */
7192 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7193
7194 /* Register goes in low 3 bits of opcode. */
7195 i.tm.base_opcode |= i.op[op].regs->reg_num;
7196 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7197 i.rex |= REX_B;
7198 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7199 {
7200 /* Warn about some common errors, but press on regardless.
7201 The first case can be generated by gcc (<= 2.8.1). */
7202 if (i.operands == 2)
7203 {
7204 /* Reversed arguments on faddp, fsubp, etc. */
7205 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7206 register_prefix, i.op[!intel_syntax].regs->reg_name,
7207 register_prefix, i.op[intel_syntax].regs->reg_name);
7208 }
7209 else
7210 {
7211 /* Extraneous `l' suffix on fp insn. */
7212 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7213 register_prefix, i.op[0].regs->reg_name);
7214 }
7215 }
7216 }
7217
7218 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7219 && i.tm.base_opcode == 0x8d /* lea */
7220 && !is_any_vex_encoding(&i.tm))
7221 {
7222 if (!quiet_warnings)
7223 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7224 if (optimize)
7225 {
7226 i.seg[0] = NULL;
7227 i.prefix[SEG_PREFIX] = 0;
7228 }
7229 }
7230
7231 /* If a segment was explicitly specified, and the specified segment
7232 is neither the default nor the one already recorded from a prefix,
7233 use an opcode prefix to select it. If we never figured out what
7234 the default segment is, then default_seg will be zero at this
7235 point, and the specified segment prefix will always be used. */
7236 if (i.seg[0]
7237 && i.seg[0] != default_seg
7238 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7239 {
7240 if (!add_prefix (i.seg[0]->seg_prefix))
7241 return 0;
7242 }
7243 return 1;
7244 }
7245
7246 static const seg_entry *
7247 build_modrm_byte (void)
7248 {
7249 const seg_entry *default_seg = 0;
7250 unsigned int source, dest;
7251 int vex_3_sources;
7252
7253 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7254 if (vex_3_sources)
7255 {
7256 unsigned int nds, reg_slot;
7257 expressionS *exp;
7258
7259 dest = i.operands - 1;
7260 nds = dest - 1;
7261
7262 /* There are 2 kinds of instructions:
7263 1. 5 operands: 4 register operands or 3 register operands
7264 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7265 VexW0 or VexW1. The destination must be either XMM, YMM or
7266 ZMM register.
7267 2. 4 operands: 4 register operands or 3 register operands
7268 plus 1 memory operand, with VexXDS. */
7269 gas_assert ((i.reg_operands == 4
7270 || (i.reg_operands == 3 && i.mem_operands == 1))
7271 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7272 && i.tm.opcode_modifier.vexw
7273 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7274
7275 /* If VexW1 is set, the first non-immediate operand is the source and
7276 the second non-immediate one is encoded in the immediate operand. */
7277 if (i.tm.opcode_modifier.vexw == VEXW1)
7278 {
7279 source = i.imm_operands;
7280 reg_slot = i.imm_operands + 1;
7281 }
7282 else
7283 {
7284 source = i.imm_operands + 1;
7285 reg_slot = i.imm_operands;
7286 }
7287
7288 if (i.imm_operands == 0)
7289 {
7290 /* When there is no immediate operand, generate an 8bit
7291 immediate operand to encode the first operand. */
7292 exp = &im_expressions[i.imm_operands++];
7293 i.op[i.operands].imms = exp;
7294 i.types[i.operands] = imm8;
7295 i.operands++;
7296
7297 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7298 exp->X_op = O_constant;
7299 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7300 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7301 }
7302 else
7303 {
7304 gas_assert (i.imm_operands == 1);
7305 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7306 gas_assert (!i.tm.opcode_modifier.immext);
7307
7308 /* Turn on Imm8 again so that output_imm will generate it. */
7309 i.types[0].bitfield.imm8 = 1;
7310
7311 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7312 i.op[0].imms->X_add_number
7313 |= register_number (i.op[reg_slot].regs) << 4;
7314 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7315 }
7316
7317 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7318 i.vex.register_specifier = i.op[nds].regs;
7319 }
7320 else
7321 source = dest = 0;
7322
7323 /* i.reg_operands MUST be the number of real register operands;
7324 implicit registers do not count. If there are 3 register
7325 operands, it must be a instruction with VexNDS. For a
7326 instruction with VexNDD, the destination register is encoded
7327 in VEX prefix. If there are 4 register operands, it must be
7328 a instruction with VEX prefix and 3 sources. */
7329 if (i.mem_operands == 0
7330 && ((i.reg_operands == 2
7331 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7332 || (i.reg_operands == 3
7333 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7334 || (i.reg_operands == 4 && vex_3_sources)))
7335 {
7336 switch (i.operands)
7337 {
7338 case 2:
7339 source = 0;
7340 break;
7341 case 3:
7342 /* When there are 3 operands, one of them may be immediate,
7343 which may be the first or the last operand. Otherwise,
7344 the first operand must be shift count register (cl) or it
7345 is an instruction with VexNDS. */
7346 gas_assert (i.imm_operands == 1
7347 || (i.imm_operands == 0
7348 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7349 || (i.types[0].bitfield.instance == RegC
7350 && i.types[0].bitfield.byte))));
7351 if (operand_type_check (i.types[0], imm)
7352 || (i.types[0].bitfield.instance == RegC
7353 && i.types[0].bitfield.byte))
7354 source = 1;
7355 else
7356 source = 0;
7357 break;
7358 case 4:
7359 /* When there are 4 operands, the first two must be 8bit
7360 immediate operands. The source operand will be the 3rd
7361 one.
7362
7363 For instructions with VexNDS, if the first operand
7364 an imm8, the source operand is the 2nd one. If the last
7365 operand is imm8, the source operand is the first one. */
7366 gas_assert ((i.imm_operands == 2
7367 && i.types[0].bitfield.imm8
7368 && i.types[1].bitfield.imm8)
7369 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7370 && i.imm_operands == 1
7371 && (i.types[0].bitfield.imm8
7372 || i.types[i.operands - 1].bitfield.imm8
7373 || i.rounding)));
7374 if (i.imm_operands == 2)
7375 source = 2;
7376 else
7377 {
7378 if (i.types[0].bitfield.imm8)
7379 source = 1;
7380 else
7381 source = 0;
7382 }
7383 break;
7384 case 5:
7385 if (is_evex_encoding (&i.tm))
7386 {
7387 /* For EVEX instructions, when there are 5 operands, the
7388 first one must be immediate operand. If the second one
7389 is immediate operand, the source operand is the 3th
7390 one. If the last one is immediate operand, the source
7391 operand is the 2nd one. */
7392 gas_assert (i.imm_operands == 2
7393 && i.tm.opcode_modifier.sae
7394 && operand_type_check (i.types[0], imm));
7395 if (operand_type_check (i.types[1], imm))
7396 source = 2;
7397 else if (operand_type_check (i.types[4], imm))
7398 source = 1;
7399 else
7400 abort ();
7401 }
7402 break;
7403 default:
7404 abort ();
7405 }
7406
7407 if (!vex_3_sources)
7408 {
7409 dest = source + 1;
7410
7411 /* RC/SAE operand could be between DEST and SRC. That happens
7412 when one operand is GPR and the other one is XMM/YMM/ZMM
7413 register. */
7414 if (i.rounding && i.rounding->operand == (int) dest)
7415 dest++;
7416
7417 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7418 {
7419 /* For instructions with VexNDS, the register-only source
7420 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7421 register. It is encoded in VEX prefix. */
7422
7423 i386_operand_type op;
7424 unsigned int vvvv;
7425
7426 /* Check register-only source operand when two source
7427 operands are swapped. */
7428 if (!i.tm.operand_types[source].bitfield.baseindex
7429 && i.tm.operand_types[dest].bitfield.baseindex)
7430 {
7431 vvvv = source;
7432 source = dest;
7433 }
7434 else
7435 vvvv = dest;
7436
7437 op = i.tm.operand_types[vvvv];
7438 if ((dest + 1) >= i.operands
7439 || ((op.bitfield.class != Reg
7440 || (!op.bitfield.dword && !op.bitfield.qword))
7441 && op.bitfield.class != RegSIMD
7442 && !operand_type_equal (&op, &regmask)))
7443 abort ();
7444 i.vex.register_specifier = i.op[vvvv].regs;
7445 dest++;
7446 }
7447 }
7448
7449 i.rm.mode = 3;
7450 /* One of the register operands will be encoded in the i.rm.reg
7451 field, the other in the combined i.rm.mode and i.rm.regmem
7452 fields. If no form of this instruction supports a memory
7453 destination operand, then we assume the source operand may
7454 sometimes be a memory operand and so we need to store the
7455 destination in the i.rm.reg field. */
7456 if (!i.tm.opcode_modifier.regmem
7457 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7458 {
7459 i.rm.reg = i.op[dest].regs->reg_num;
7460 i.rm.regmem = i.op[source].regs->reg_num;
7461 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7462 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7463 i.has_regmmx = TRUE;
7464 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7465 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7466 {
7467 if (i.types[dest].bitfield.zmmword
7468 || i.types[source].bitfield.zmmword)
7469 i.has_regzmm = TRUE;
7470 else if (i.types[dest].bitfield.ymmword
7471 || i.types[source].bitfield.ymmword)
7472 i.has_regymm = TRUE;
7473 else
7474 i.has_regxmm = TRUE;
7475 }
7476 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7477 i.rex |= REX_R;
7478 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7479 i.vrex |= REX_R;
7480 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7481 i.rex |= REX_B;
7482 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7483 i.vrex |= REX_B;
7484 }
7485 else
7486 {
7487 i.rm.reg = i.op[source].regs->reg_num;
7488 i.rm.regmem = i.op[dest].regs->reg_num;
7489 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7490 i.rex |= REX_B;
7491 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7492 i.vrex |= REX_B;
7493 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7494 i.rex |= REX_R;
7495 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7496 i.vrex |= REX_R;
7497 }
7498 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7499 {
7500 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7501 abort ();
7502 i.rex &= ~REX_R;
7503 add_prefix (LOCK_PREFIX_OPCODE);
7504 }
7505 }
7506 else
7507 { /* If it's not 2 reg operands... */
7508 unsigned int mem;
7509
7510 if (i.mem_operands)
7511 {
7512 unsigned int fake_zero_displacement = 0;
7513 unsigned int op;
7514
7515 for (op = 0; op < i.operands; op++)
7516 if (i.flags[op] & Operand_Mem)
7517 break;
7518 gas_assert (op < i.operands);
7519
7520 if (i.tm.opcode_modifier.vecsib)
7521 {
7522 if (i.index_reg->reg_num == RegIZ)
7523 abort ();
7524
7525 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7526 if (!i.base_reg)
7527 {
7528 i.sib.base = NO_BASE_REGISTER;
7529 i.sib.scale = i.log2_scale_factor;
7530 i.types[op].bitfield.disp8 = 0;
7531 i.types[op].bitfield.disp16 = 0;
7532 i.types[op].bitfield.disp64 = 0;
7533 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7534 {
7535 /* Must be 32 bit */
7536 i.types[op].bitfield.disp32 = 1;
7537 i.types[op].bitfield.disp32s = 0;
7538 }
7539 else
7540 {
7541 i.types[op].bitfield.disp32 = 0;
7542 i.types[op].bitfield.disp32s = 1;
7543 }
7544 }
7545 i.sib.index = i.index_reg->reg_num;
7546 if ((i.index_reg->reg_flags & RegRex) != 0)
7547 i.rex |= REX_X;
7548 if ((i.index_reg->reg_flags & RegVRex) != 0)
7549 i.vrex |= REX_X;
7550 }
7551
7552 default_seg = &ds;
7553
7554 if (i.base_reg == 0)
7555 {
7556 i.rm.mode = 0;
7557 if (!i.disp_operands)
7558 fake_zero_displacement = 1;
7559 if (i.index_reg == 0)
7560 {
7561 i386_operand_type newdisp;
7562
7563 gas_assert (!i.tm.opcode_modifier.vecsib);
7564 /* Operand is just <disp> */
7565 if (flag_code == CODE_64BIT)
7566 {
7567 /* 64bit mode overwrites the 32bit absolute
7568 addressing by RIP relative addressing and
7569 absolute addressing is encoded by one of the
7570 redundant SIB forms. */
7571 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7572 i.sib.base = NO_BASE_REGISTER;
7573 i.sib.index = NO_INDEX_REGISTER;
7574 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7575 }
7576 else if ((flag_code == CODE_16BIT)
7577 ^ (i.prefix[ADDR_PREFIX] != 0))
7578 {
7579 i.rm.regmem = NO_BASE_REGISTER_16;
7580 newdisp = disp16;
7581 }
7582 else
7583 {
7584 i.rm.regmem = NO_BASE_REGISTER;
7585 newdisp = disp32;
7586 }
7587 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7588 i.types[op] = operand_type_or (i.types[op], newdisp);
7589 }
7590 else if (!i.tm.opcode_modifier.vecsib)
7591 {
7592 /* !i.base_reg && i.index_reg */
7593 if (i.index_reg->reg_num == RegIZ)
7594 i.sib.index = NO_INDEX_REGISTER;
7595 else
7596 i.sib.index = i.index_reg->reg_num;
7597 i.sib.base = NO_BASE_REGISTER;
7598 i.sib.scale = i.log2_scale_factor;
7599 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7600 i.types[op].bitfield.disp8 = 0;
7601 i.types[op].bitfield.disp16 = 0;
7602 i.types[op].bitfield.disp64 = 0;
7603 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7604 {
7605 /* Must be 32 bit */
7606 i.types[op].bitfield.disp32 = 1;
7607 i.types[op].bitfield.disp32s = 0;
7608 }
7609 else
7610 {
7611 i.types[op].bitfield.disp32 = 0;
7612 i.types[op].bitfield.disp32s = 1;
7613 }
7614 if ((i.index_reg->reg_flags & RegRex) != 0)
7615 i.rex |= REX_X;
7616 }
7617 }
7618 /* RIP addressing for 64bit mode. */
7619 else if (i.base_reg->reg_num == RegIP)
7620 {
7621 gas_assert (!i.tm.opcode_modifier.vecsib);
7622 i.rm.regmem = NO_BASE_REGISTER;
7623 i.types[op].bitfield.disp8 = 0;
7624 i.types[op].bitfield.disp16 = 0;
7625 i.types[op].bitfield.disp32 = 0;
7626 i.types[op].bitfield.disp32s = 1;
7627 i.types[op].bitfield.disp64 = 0;
7628 i.flags[op] |= Operand_PCrel;
7629 if (! i.disp_operands)
7630 fake_zero_displacement = 1;
7631 }
7632 else if (i.base_reg->reg_type.bitfield.word)
7633 {
7634 gas_assert (!i.tm.opcode_modifier.vecsib);
7635 switch (i.base_reg->reg_num)
7636 {
7637 case 3: /* (%bx) */
7638 if (i.index_reg == 0)
7639 i.rm.regmem = 7;
7640 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7641 i.rm.regmem = i.index_reg->reg_num - 6;
7642 break;
7643 case 5: /* (%bp) */
7644 default_seg = &ss;
7645 if (i.index_reg == 0)
7646 {
7647 i.rm.regmem = 6;
7648 if (operand_type_check (i.types[op], disp) == 0)
7649 {
7650 /* fake (%bp) into 0(%bp) */
7651 i.types[op].bitfield.disp8 = 1;
7652 fake_zero_displacement = 1;
7653 }
7654 }
7655 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7656 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7657 break;
7658 default: /* (%si) -> 4 or (%di) -> 5 */
7659 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7660 }
7661 i.rm.mode = mode_from_disp_size (i.types[op]);
7662 }
7663 else /* i.base_reg and 32/64 bit mode */
7664 {
7665 if (flag_code == CODE_64BIT
7666 && operand_type_check (i.types[op], disp))
7667 {
7668 i.types[op].bitfield.disp16 = 0;
7669 i.types[op].bitfield.disp64 = 0;
7670 if (i.prefix[ADDR_PREFIX] == 0)
7671 {
7672 i.types[op].bitfield.disp32 = 0;
7673 i.types[op].bitfield.disp32s = 1;
7674 }
7675 else
7676 {
7677 i.types[op].bitfield.disp32 = 1;
7678 i.types[op].bitfield.disp32s = 0;
7679 }
7680 }
7681
7682 if (!i.tm.opcode_modifier.vecsib)
7683 i.rm.regmem = i.base_reg->reg_num;
7684 if ((i.base_reg->reg_flags & RegRex) != 0)
7685 i.rex |= REX_B;
7686 i.sib.base = i.base_reg->reg_num;
7687 /* x86-64 ignores REX prefix bit here to avoid decoder
7688 complications. */
7689 if (!(i.base_reg->reg_flags & RegRex)
7690 && (i.base_reg->reg_num == EBP_REG_NUM
7691 || i.base_reg->reg_num == ESP_REG_NUM))
7692 default_seg = &ss;
7693 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7694 {
7695 fake_zero_displacement = 1;
7696 i.types[op].bitfield.disp8 = 1;
7697 }
7698 i.sib.scale = i.log2_scale_factor;
7699 if (i.index_reg == 0)
7700 {
7701 gas_assert (!i.tm.opcode_modifier.vecsib);
7702 /* <disp>(%esp) becomes two byte modrm with no index
7703 register. We've already stored the code for esp
7704 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7705 Any base register besides %esp will not use the
7706 extra modrm byte. */
7707 i.sib.index = NO_INDEX_REGISTER;
7708 }
7709 else if (!i.tm.opcode_modifier.vecsib)
7710 {
7711 if (i.index_reg->reg_num == RegIZ)
7712 i.sib.index = NO_INDEX_REGISTER;
7713 else
7714 i.sib.index = i.index_reg->reg_num;
7715 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7716 if ((i.index_reg->reg_flags & RegRex) != 0)
7717 i.rex |= REX_X;
7718 }
7719
7720 if (i.disp_operands
7721 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7722 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7723 i.rm.mode = 0;
7724 else
7725 {
7726 if (!fake_zero_displacement
7727 && !i.disp_operands
7728 && i.disp_encoding)
7729 {
7730 fake_zero_displacement = 1;
7731 if (i.disp_encoding == disp_encoding_8bit)
7732 i.types[op].bitfield.disp8 = 1;
7733 else
7734 i.types[op].bitfield.disp32 = 1;
7735 }
7736 i.rm.mode = mode_from_disp_size (i.types[op]);
7737 }
7738 }
7739
7740 if (fake_zero_displacement)
7741 {
7742 /* Fakes a zero displacement assuming that i.types[op]
7743 holds the correct displacement size. */
7744 expressionS *exp;
7745
7746 gas_assert (i.op[op].disps == 0);
7747 exp = &disp_expressions[i.disp_operands++];
7748 i.op[op].disps = exp;
7749 exp->X_op = O_constant;
7750 exp->X_add_number = 0;
7751 exp->X_add_symbol = (symbolS *) 0;
7752 exp->X_op_symbol = (symbolS *) 0;
7753 }
7754
7755 mem = op;
7756 }
7757 else
7758 mem = ~0;
7759
7760 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7761 {
7762 if (operand_type_check (i.types[0], imm))
7763 i.vex.register_specifier = NULL;
7764 else
7765 {
7766 /* VEX.vvvv encodes one of the sources when the first
7767 operand is not an immediate. */
7768 if (i.tm.opcode_modifier.vexw == VEXW0)
7769 i.vex.register_specifier = i.op[0].regs;
7770 else
7771 i.vex.register_specifier = i.op[1].regs;
7772 }
7773
7774 /* Destination is a XMM register encoded in the ModRM.reg
7775 and VEX.R bit. */
7776 i.rm.reg = i.op[2].regs->reg_num;
7777 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7778 i.rex |= REX_R;
7779
7780 /* ModRM.rm and VEX.B encodes the other source. */
7781 if (!i.mem_operands)
7782 {
7783 i.rm.mode = 3;
7784
7785 if (i.tm.opcode_modifier.vexw == VEXW0)
7786 i.rm.regmem = i.op[1].regs->reg_num;
7787 else
7788 i.rm.regmem = i.op[0].regs->reg_num;
7789
7790 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7791 i.rex |= REX_B;
7792 }
7793 }
7794 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7795 {
7796 i.vex.register_specifier = i.op[2].regs;
7797 if (!i.mem_operands)
7798 {
7799 i.rm.mode = 3;
7800 i.rm.regmem = i.op[1].regs->reg_num;
7801 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7802 i.rex |= REX_B;
7803 }
7804 }
7805 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7806 (if any) based on i.tm.extension_opcode. Again, we must be
7807 careful to make sure that segment/control/debug/test/MMX
7808 registers are coded into the i.rm.reg field. */
7809 else if (i.reg_operands)
7810 {
7811 unsigned int op;
7812 unsigned int vex_reg = ~0;
7813
7814 for (op = 0; op < i.operands; op++)
7815 {
7816 if (i.types[op].bitfield.class == Reg
7817 || i.types[op].bitfield.class == RegBND
7818 || i.types[op].bitfield.class == RegMask
7819 || i.types[op].bitfield.class == SReg
7820 || i.types[op].bitfield.class == RegCR
7821 || i.types[op].bitfield.class == RegDR
7822 || i.types[op].bitfield.class == RegTR)
7823 break;
7824 if (i.types[op].bitfield.class == RegSIMD)
7825 {
7826 if (i.types[op].bitfield.zmmword)
7827 i.has_regzmm = TRUE;
7828 else if (i.types[op].bitfield.ymmword)
7829 i.has_regymm = TRUE;
7830 else
7831 i.has_regxmm = TRUE;
7832 break;
7833 }
7834 if (i.types[op].bitfield.class == RegMMX)
7835 {
7836 i.has_regmmx = TRUE;
7837 break;
7838 }
7839 }
7840
7841 if (vex_3_sources)
7842 op = dest;
7843 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7844 {
7845 /* For instructions with VexNDS, the register-only
7846 source operand is encoded in VEX prefix. */
7847 gas_assert (mem != (unsigned int) ~0);
7848
7849 if (op > mem)
7850 {
7851 vex_reg = op++;
7852 gas_assert (op < i.operands);
7853 }
7854 else
7855 {
7856 /* Check register-only source operand when two source
7857 operands are swapped. */
7858 if (!i.tm.operand_types[op].bitfield.baseindex
7859 && i.tm.operand_types[op + 1].bitfield.baseindex)
7860 {
7861 vex_reg = op;
7862 op += 2;
7863 gas_assert (mem == (vex_reg + 1)
7864 && op < i.operands);
7865 }
7866 else
7867 {
7868 vex_reg = op + 1;
7869 gas_assert (vex_reg < i.operands);
7870 }
7871 }
7872 }
7873 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7874 {
7875 /* For instructions with VexNDD, the register destination
7876 is encoded in VEX prefix. */
7877 if (i.mem_operands == 0)
7878 {
7879 /* There is no memory operand. */
7880 gas_assert ((op + 2) == i.operands);
7881 vex_reg = op + 1;
7882 }
7883 else
7884 {
7885 /* There are only 2 non-immediate operands. */
7886 gas_assert (op < i.imm_operands + 2
7887 && i.operands == i.imm_operands + 2);
7888 vex_reg = i.imm_operands + 1;
7889 }
7890 }
7891 else
7892 gas_assert (op < i.operands);
7893
7894 if (vex_reg != (unsigned int) ~0)
7895 {
7896 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7897
7898 if ((type->bitfield.class != Reg
7899 || (!type->bitfield.dword && !type->bitfield.qword))
7900 && type->bitfield.class != RegSIMD
7901 && !operand_type_equal (type, &regmask))
7902 abort ();
7903
7904 i.vex.register_specifier = i.op[vex_reg].regs;
7905 }
7906
7907 /* Don't set OP operand twice. */
7908 if (vex_reg != op)
7909 {
7910 /* If there is an extension opcode to put here, the
7911 register number must be put into the regmem field. */
7912 if (i.tm.extension_opcode != None)
7913 {
7914 i.rm.regmem = i.op[op].regs->reg_num;
7915 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7916 i.rex |= REX_B;
7917 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7918 i.vrex |= REX_B;
7919 }
7920 else
7921 {
7922 i.rm.reg = i.op[op].regs->reg_num;
7923 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7924 i.rex |= REX_R;
7925 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7926 i.vrex |= REX_R;
7927 }
7928 }
7929
7930 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7931 must set it to 3 to indicate this is a register operand
7932 in the regmem field. */
7933 if (!i.mem_operands)
7934 i.rm.mode = 3;
7935 }
7936
7937 /* Fill in i.rm.reg field with extension opcode (if any). */
7938 if (i.tm.extension_opcode != None)
7939 i.rm.reg = i.tm.extension_opcode;
7940 }
7941 return default_seg;
7942 }
7943
7944 static unsigned int
7945 flip_code16 (unsigned int code16)
7946 {
7947 gas_assert (i.tm.operands == 1);
7948
7949 return !(i.prefix[REX_PREFIX] & REX_W)
7950 && (code16 ? i.tm.operand_types[0].bitfield.disp32
7951 || i.tm.operand_types[0].bitfield.disp32s
7952 : i.tm.operand_types[0].bitfield.disp16)
7953 ? CODE16 : 0;
7954 }
7955
7956 static void
7957 output_branch (void)
7958 {
7959 char *p;
7960 int size;
7961 int code16;
7962 int prefix;
7963 relax_substateT subtype;
7964 symbolS *sym;
7965 offsetT off;
7966
7967 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7968 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7969
7970 prefix = 0;
7971 if (i.prefix[DATA_PREFIX] != 0)
7972 {
7973 prefix = 1;
7974 i.prefixes -= 1;
7975 code16 ^= flip_code16(code16);
7976 }
7977 /* Pentium4 branch hints. */
7978 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7979 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7980 {
7981 prefix++;
7982 i.prefixes--;
7983 }
7984 if (i.prefix[REX_PREFIX] != 0)
7985 {
7986 prefix++;
7987 i.prefixes--;
7988 }
7989
7990 /* BND prefixed jump. */
7991 if (i.prefix[BND_PREFIX] != 0)
7992 {
7993 prefix++;
7994 i.prefixes--;
7995 }
7996
7997 if (i.prefixes != 0)
7998 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
7999
8000 /* It's always a symbol; End frag & setup for relax.
8001 Make sure there is enough room in this frag for the largest
8002 instruction we may generate in md_convert_frag. This is 2
8003 bytes for the opcode and room for the prefix and largest
8004 displacement. */
8005 frag_grow (prefix + 2 + 4);
8006 /* Prefix and 1 opcode byte go in fr_fix. */
8007 p = frag_more (prefix + 1);
8008 if (i.prefix[DATA_PREFIX] != 0)
8009 *p++ = DATA_PREFIX_OPCODE;
8010 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8011 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8012 *p++ = i.prefix[SEG_PREFIX];
8013 if (i.prefix[BND_PREFIX] != 0)
8014 *p++ = BND_PREFIX_OPCODE;
8015 if (i.prefix[REX_PREFIX] != 0)
8016 *p++ = i.prefix[REX_PREFIX];
8017 *p = i.tm.base_opcode;
8018
8019 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8020 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8021 else if (cpu_arch_flags.bitfield.cpui386)
8022 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8023 else
8024 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8025 subtype |= code16;
8026
8027 sym = i.op[0].disps->X_add_symbol;
8028 off = i.op[0].disps->X_add_number;
8029
8030 if (i.op[0].disps->X_op != O_constant
8031 && i.op[0].disps->X_op != O_symbol)
8032 {
8033 /* Handle complex expressions. */
8034 sym = make_expr_symbol (i.op[0].disps);
8035 off = 0;
8036 }
8037
8038 /* 1 possible extra opcode + 4 byte displacement go in var part.
8039 Pass reloc in fr_var. */
8040 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8041 }
8042
8043 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8044 /* Return TRUE iff PLT32 relocation should be used for branching to
8045 symbol S. */
8046
8047 static bfd_boolean
8048 need_plt32_p (symbolS *s)
8049 {
8050 /* PLT32 relocation is ELF only. */
8051 if (!IS_ELF)
8052 return FALSE;
8053
8054 #ifdef TE_SOLARIS
8055 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8056 krtld support it. */
8057 return FALSE;
8058 #endif
8059
8060 /* Since there is no need to prepare for PLT branch on x86-64, we
8061 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8062 be used as a marker for 32-bit PC-relative branches. */
8063 if (!object_64bit)
8064 return FALSE;
8065
8066 /* Weak or undefined symbol need PLT32 relocation. */
8067 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8068 return TRUE;
8069
8070 /* Non-global symbol doesn't need PLT32 relocation. */
8071 if (! S_IS_EXTERNAL (s))
8072 return FALSE;
8073
8074 /* Other global symbols need PLT32 relocation. NB: Symbol with
8075 non-default visibilities are treated as normal global symbol
8076 so that PLT32 relocation can be used as a marker for 32-bit
8077 PC-relative branches. It is useful for linker relaxation. */
8078 return TRUE;
8079 }
8080 #endif
8081
8082 static void
8083 output_jump (void)
8084 {
8085 char *p;
8086 int size;
8087 fixS *fixP;
8088 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8089
8090 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8091 {
8092 /* This is a loop or jecxz type instruction. */
8093 size = 1;
8094 if (i.prefix[ADDR_PREFIX] != 0)
8095 {
8096 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8097 i.prefixes -= 1;
8098 }
8099 /* Pentium4 branch hints. */
8100 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8101 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8102 {
8103 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8104 i.prefixes--;
8105 }
8106 }
8107 else
8108 {
8109 int code16;
8110
8111 code16 = 0;
8112 if (flag_code == CODE_16BIT)
8113 code16 = CODE16;
8114
8115 if (i.prefix[DATA_PREFIX] != 0)
8116 {
8117 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8118 i.prefixes -= 1;
8119 code16 ^= flip_code16(code16);
8120 }
8121
8122 size = 4;
8123 if (code16)
8124 size = 2;
8125 }
8126
8127 /* BND prefixed jump. */
8128 if (i.prefix[BND_PREFIX] != 0)
8129 {
8130 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8131 i.prefixes -= 1;
8132 }
8133
8134 if (i.prefix[REX_PREFIX] != 0)
8135 {
8136 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8137 i.prefixes -= 1;
8138 }
8139
8140 if (i.prefixes != 0)
8141 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8142
8143 p = frag_more (i.tm.opcode_length + size);
8144 switch (i.tm.opcode_length)
8145 {
8146 case 2:
8147 *p++ = i.tm.base_opcode >> 8;
8148 /* Fall through. */
8149 case 1:
8150 *p++ = i.tm.base_opcode;
8151 break;
8152 default:
8153 abort ();
8154 }
8155
8156 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8157 if (size == 4
8158 && jump_reloc == NO_RELOC
8159 && need_plt32_p (i.op[0].disps->X_add_symbol))
8160 jump_reloc = BFD_RELOC_X86_64_PLT32;
8161 #endif
8162
8163 jump_reloc = reloc (size, 1, 1, jump_reloc);
8164
8165 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8166 i.op[0].disps, 1, jump_reloc);
8167
8168 /* All jumps handled here are signed, but don't use a signed limit
8169 check for 32 and 16 bit jumps as we want to allow wrap around at
8170 4G and 64k respectively. */
8171 if (size == 1)
8172 fixP->fx_signed = 1;
8173 }
8174
8175 static void
8176 output_interseg_jump (void)
8177 {
8178 char *p;
8179 int size;
8180 int prefix;
8181 int code16;
8182
8183 code16 = 0;
8184 if (flag_code == CODE_16BIT)
8185 code16 = CODE16;
8186
8187 prefix = 0;
8188 if (i.prefix[DATA_PREFIX] != 0)
8189 {
8190 prefix = 1;
8191 i.prefixes -= 1;
8192 code16 ^= CODE16;
8193 }
8194
8195 gas_assert (!i.prefix[REX_PREFIX]);
8196
8197 size = 4;
8198 if (code16)
8199 size = 2;
8200
8201 if (i.prefixes != 0)
8202 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8203
8204 /* 1 opcode; 2 segment; offset */
8205 p = frag_more (prefix + 1 + 2 + size);
8206
8207 if (i.prefix[DATA_PREFIX] != 0)
8208 *p++ = DATA_PREFIX_OPCODE;
8209
8210 if (i.prefix[REX_PREFIX] != 0)
8211 *p++ = i.prefix[REX_PREFIX];
8212
8213 *p++ = i.tm.base_opcode;
8214 if (i.op[1].imms->X_op == O_constant)
8215 {
8216 offsetT n = i.op[1].imms->X_add_number;
8217
8218 if (size == 2
8219 && !fits_in_unsigned_word (n)
8220 && !fits_in_signed_word (n))
8221 {
8222 as_bad (_("16-bit jump out of range"));
8223 return;
8224 }
8225 md_number_to_chars (p, n, size);
8226 }
8227 else
8228 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8229 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8230 if (i.op[0].imms->X_op != O_constant)
8231 as_bad (_("can't handle non absolute segment in `%s'"),
8232 i.tm.name);
8233 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8234 }
8235
8236 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8237 void
8238 x86_cleanup (void)
8239 {
8240 char *p;
8241 asection *seg = now_seg;
8242 subsegT subseg = now_subseg;
8243 asection *sec;
8244 unsigned int alignment, align_size_1;
8245 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8246 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8247 unsigned int padding;
8248
8249 if (!IS_ELF || !x86_used_note)
8250 return;
8251
8252 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8253
8254 /* The .note.gnu.property section layout:
8255
8256 Field Length Contents
8257 ---- ---- ----
8258 n_namsz 4 4
8259 n_descsz 4 The note descriptor size
8260 n_type 4 NT_GNU_PROPERTY_TYPE_0
8261 n_name 4 "GNU"
8262 n_desc n_descsz The program property array
8263 .... .... ....
8264 */
8265
8266 /* Create the .note.gnu.property section. */
8267 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8268 bfd_set_section_flags (sec,
8269 (SEC_ALLOC
8270 | SEC_LOAD
8271 | SEC_DATA
8272 | SEC_HAS_CONTENTS
8273 | SEC_READONLY));
8274
8275 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8276 {
8277 align_size_1 = 7;
8278 alignment = 3;
8279 }
8280 else
8281 {
8282 align_size_1 = 3;
8283 alignment = 2;
8284 }
8285
8286 bfd_set_section_alignment (sec, alignment);
8287 elf_section_type (sec) = SHT_NOTE;
8288
8289 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8290 + 4-byte data */
8291 isa_1_descsz_raw = 4 + 4 + 4;
8292 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8293 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8294
8295 feature_2_descsz_raw = isa_1_descsz;
8296 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8297 + 4-byte data */
8298 feature_2_descsz_raw += 4 + 4 + 4;
8299 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8300 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8301 & ~align_size_1);
8302
8303 descsz = feature_2_descsz;
8304 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8305 p = frag_more (4 + 4 + 4 + 4 + descsz);
8306
8307 /* Write n_namsz. */
8308 md_number_to_chars (p, (valueT) 4, 4);
8309
8310 /* Write n_descsz. */
8311 md_number_to_chars (p + 4, (valueT) descsz, 4);
8312
8313 /* Write n_type. */
8314 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8315
8316 /* Write n_name. */
8317 memcpy (p + 4 * 3, "GNU", 4);
8318
8319 /* Write 4-byte type. */
8320 md_number_to_chars (p + 4 * 4,
8321 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8322
8323 /* Write 4-byte data size. */
8324 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8325
8326 /* Write 4-byte data. */
8327 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8328
8329 /* Zero out paddings. */
8330 padding = isa_1_descsz - isa_1_descsz_raw;
8331 if (padding)
8332 memset (p + 4 * 7, 0, padding);
8333
8334 /* Write 4-byte type. */
8335 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8336 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8337
8338 /* Write 4-byte data size. */
8339 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8340
8341 /* Write 4-byte data. */
8342 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8343 (valueT) x86_feature_2_used, 4);
8344
8345 /* Zero out paddings. */
8346 padding = feature_2_descsz - feature_2_descsz_raw;
8347 if (padding)
8348 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8349
8350 /* We probably can't restore the current segment, for there likely
8351 isn't one yet... */
8352 if (seg && subseg)
8353 subseg_set (seg, subseg);
8354 }
8355 #endif
8356
8357 static unsigned int
8358 encoding_length (const fragS *start_frag, offsetT start_off,
8359 const char *frag_now_ptr)
8360 {
8361 unsigned int len = 0;
8362
8363 if (start_frag != frag_now)
8364 {
8365 const fragS *fr = start_frag;
8366
8367 do {
8368 len += fr->fr_fix;
8369 fr = fr->fr_next;
8370 } while (fr && fr != frag_now);
8371 }
8372
8373 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8374 }
8375
8376 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8377 be macro-fused with conditional jumps. */
8378
8379 static int
8380 maybe_fused_with_jcc_p (void)
8381 {
8382 /* No RIP address. */
8383 if (i.base_reg && i.base_reg->reg_num == RegIP)
8384 return 0;
8385
8386 /* No VEX/EVEX encoding. */
8387 if (is_any_vex_encoding (&i.tm))
8388 return 0;
8389
8390 /* and, add, sub with destination register. */
8391 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8392 || i.tm.base_opcode <= 5
8393 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8394 || ((i.tm.base_opcode | 3) == 0x83
8395 && ((i.tm.extension_opcode | 1) == 0x5
8396 || i.tm.extension_opcode == 0x0)))
8397 return (i.types[1].bitfield.class == Reg
8398 || i.types[1].bitfield.instance == Accum);
8399
8400 /* test, cmp with any register. */
8401 if ((i.tm.base_opcode | 1) == 0x85
8402 || (i.tm.base_opcode | 1) == 0xa9
8403 || ((i.tm.base_opcode | 1) == 0xf7
8404 && i.tm.extension_opcode == 0)
8405 || (i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8406 || ((i.tm.base_opcode | 3) == 0x83
8407 && (i.tm.extension_opcode == 0x7)))
8408 return (i.types[0].bitfield.class == Reg
8409 || i.types[0].bitfield.instance == Accum
8410 || i.types[1].bitfield.class == Reg
8411 || i.types[1].bitfield.instance == Accum);
8412
8413 /* inc, dec with any register. */
8414 if ((i.tm.cpu_flags.bitfield.cpuno64
8415 && (i.tm.base_opcode | 0xf) == 0x4f)
8416 || ((i.tm.base_opcode | 1) == 0xff
8417 && i.tm.extension_opcode <= 0x1))
8418 return (i.types[0].bitfield.class == Reg
8419 || i.types[0].bitfield.instance == Accum);
8420
8421 return 0;
8422 }
8423
8424 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8425
8426 static int
8427 add_fused_jcc_padding_frag_p (void)
8428 {
8429 /* NB: Don't work with COND_JUMP86 without i386. */
8430 if (!align_branch_power
8431 || now_seg == absolute_section
8432 || !cpu_arch_flags.bitfield.cpui386
8433 || !(align_branch & align_branch_fused_bit))
8434 return 0;
8435
8436 if (maybe_fused_with_jcc_p ())
8437 {
8438 if (last_insn.kind == last_insn_other
8439 || last_insn.seg != now_seg)
8440 return 1;
8441 if (flag_debug)
8442 as_warn_where (last_insn.file, last_insn.line,
8443 _("`%s` skips -malign-branch-boundary on `%s`"),
8444 last_insn.name, i.tm.name);
8445 }
8446
8447 return 0;
8448 }
8449
8450 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8451
8452 static int
8453 add_branch_prefix_frag_p (void)
8454 {
8455 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
8456 to PadLock instructions since they include prefixes in opcode. */
8457 if (!align_branch_power
8458 || !align_branch_prefix_size
8459 || now_seg == absolute_section
8460 || i.tm.cpu_flags.bitfield.cpupadlock
8461 || !cpu_arch_flags.bitfield.cpui386)
8462 return 0;
8463
8464 /* Don't add prefix if it is a prefix or there is no operand in case
8465 that segment prefix is special. */
8466 if (!i.operands || i.tm.opcode_modifier.isprefix)
8467 return 0;
8468
8469 if (last_insn.kind == last_insn_other
8470 || last_insn.seg != now_seg)
8471 return 1;
8472
8473 if (flag_debug)
8474 as_warn_where (last_insn.file, last_insn.line,
8475 _("`%s` skips -malign-branch-boundary on `%s`"),
8476 last_insn.name, i.tm.name);
8477
8478 return 0;
8479 }
8480
8481 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8482
8483 static int
8484 add_branch_padding_frag_p (enum align_branch_kind *branch_p)
8485 {
8486 int add_padding;
8487
8488 /* NB: Don't work with COND_JUMP86 without i386. */
8489 if (!align_branch_power
8490 || now_seg == absolute_section
8491 || !cpu_arch_flags.bitfield.cpui386)
8492 return 0;
8493
8494 add_padding = 0;
8495
8496 /* Check for jcc and direct jmp. */
8497 if (i.tm.opcode_modifier.jump == JUMP)
8498 {
8499 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8500 {
8501 *branch_p = align_branch_jmp;
8502 add_padding = align_branch & align_branch_jmp_bit;
8503 }
8504 else
8505 {
8506 *branch_p = align_branch_jcc;
8507 if ((align_branch & align_branch_jcc_bit))
8508 add_padding = 1;
8509 }
8510 }
8511 else if (is_any_vex_encoding (&i.tm))
8512 return 0;
8513 else if ((i.tm.base_opcode | 1) == 0xc3)
8514 {
8515 /* Near ret. */
8516 *branch_p = align_branch_ret;
8517 if ((align_branch & align_branch_ret_bit))
8518 add_padding = 1;
8519 }
8520 else
8521 {
8522 /* Check for indirect jmp, direct and indirect calls. */
8523 if (i.tm.base_opcode == 0xe8)
8524 {
8525 /* Direct call. */
8526 *branch_p = align_branch_call;
8527 if ((align_branch & align_branch_call_bit))
8528 add_padding = 1;
8529 }
8530 else if (i.tm.base_opcode == 0xff
8531 && (i.tm.extension_opcode == 2
8532 || i.tm.extension_opcode == 4))
8533 {
8534 /* Indirect call and jmp. */
8535 *branch_p = align_branch_indirect;
8536 if ((align_branch & align_branch_indirect_bit))
8537 add_padding = 1;
8538 }
8539
8540 if (add_padding
8541 && i.disp_operands
8542 && tls_get_addr
8543 && (i.op[0].disps->X_op == O_symbol
8544 || (i.op[0].disps->X_op == O_subtract
8545 && i.op[0].disps->X_op_symbol == GOT_symbol)))
8546 {
8547 symbolS *s = i.op[0].disps->X_add_symbol;
8548 /* No padding to call to global or undefined tls_get_addr. */
8549 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8550 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8551 return 0;
8552 }
8553 }
8554
8555 if (add_padding
8556 && last_insn.kind != last_insn_other
8557 && last_insn.seg == now_seg)
8558 {
8559 if (flag_debug)
8560 as_warn_where (last_insn.file, last_insn.line,
8561 _("`%s` skips -malign-branch-boundary on `%s`"),
8562 last_insn.name, i.tm.name);
8563 return 0;
8564 }
8565
8566 return add_padding;
8567 }
8568
8569 static void
8570 output_insn (void)
8571 {
8572 fragS *insn_start_frag;
8573 offsetT insn_start_off;
8574 fragS *fragP = NULL;
8575 enum align_branch_kind branch = align_branch_none;
8576
8577 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8578 if (IS_ELF && x86_used_note)
8579 {
8580 if (i.tm.cpu_flags.bitfield.cpucmov)
8581 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8582 if (i.tm.cpu_flags.bitfield.cpusse)
8583 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8584 if (i.tm.cpu_flags.bitfield.cpusse2)
8585 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8586 if (i.tm.cpu_flags.bitfield.cpusse3)
8587 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8588 if (i.tm.cpu_flags.bitfield.cpussse3)
8589 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8590 if (i.tm.cpu_flags.bitfield.cpusse4_1)
8591 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8592 if (i.tm.cpu_flags.bitfield.cpusse4_2)
8593 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8594 if (i.tm.cpu_flags.bitfield.cpuavx)
8595 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8596 if (i.tm.cpu_flags.bitfield.cpuavx2)
8597 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8598 if (i.tm.cpu_flags.bitfield.cpufma)
8599 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8600 if (i.tm.cpu_flags.bitfield.cpuavx512f)
8601 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8602 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8603 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8604 if (i.tm.cpu_flags.bitfield.cpuavx512er)
8605 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8606 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8607 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8608 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8609 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8610 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8611 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8612 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8613 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8614 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8615 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8616 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8617 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8618 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8619 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8620 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8621 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8622 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8623 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8624 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8625 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8626 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8627 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8628 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8629 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8630
8631 if (i.tm.cpu_flags.bitfield.cpu8087
8632 || i.tm.cpu_flags.bitfield.cpu287
8633 || i.tm.cpu_flags.bitfield.cpu387
8634 || i.tm.cpu_flags.bitfield.cpu687
8635 || i.tm.cpu_flags.bitfield.cpufisttp)
8636 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8637 if (i.has_regmmx
8638 || i.tm.base_opcode == 0xf77 /* emms */
8639 || i.tm.base_opcode == 0xf0e /* femms */
8640 || i.tm.base_opcode == 0xf2a /* cvtpi2ps */
8641 || i.tm.base_opcode == 0x660f2a /* cvtpi2pd */)
8642 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8643 if (i.has_regxmm)
8644 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8645 if (i.has_regymm)
8646 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8647 if (i.has_regzmm)
8648 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8649 if (i.tm.cpu_flags.bitfield.cpufxsr)
8650 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8651 if (i.tm.cpu_flags.bitfield.cpuxsave)
8652 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8653 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8654 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8655 if (i.tm.cpu_flags.bitfield.cpuxsavec)
8656 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8657 }
8658 #endif
8659
8660 /* Tie dwarf2 debug info to the address at the start of the insn.
8661 We can't do this after the insn has been output as the current
8662 frag may have been closed off. eg. by frag_var. */
8663 dwarf2_emit_insn (0);
8664
8665 insn_start_frag = frag_now;
8666 insn_start_off = frag_now_fix ();
8667
8668 if (add_branch_padding_frag_p (&branch))
8669 {
8670 char *p;
8671 /* Branch can be 8 bytes. Leave some room for prefixes. */
8672 unsigned int max_branch_padding_size = 14;
8673
8674 /* Align section to boundary. */
8675 record_alignment (now_seg, align_branch_power);
8676
8677 /* Make room for padding. */
8678 frag_grow (max_branch_padding_size);
8679
8680 /* Start of the padding. */
8681 p = frag_more (0);
8682
8683 fragP = frag_now;
8684
8685 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
8686 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
8687 NULL, 0, p);
8688
8689 fragP->tc_frag_data.branch_type = branch;
8690 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
8691 }
8692
8693 /* Output jumps. */
8694 if (i.tm.opcode_modifier.jump == JUMP)
8695 output_branch ();
8696 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
8697 || i.tm.opcode_modifier.jump == JUMP_DWORD)
8698 output_jump ();
8699 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
8700 output_interseg_jump ();
8701 else
8702 {
8703 /* Output normal instructions here. */
8704 char *p;
8705 unsigned char *q;
8706 unsigned int j;
8707 unsigned int prefix;
8708
8709 if (avoid_fence
8710 && (i.tm.base_opcode == 0xfaee8
8711 || i.tm.base_opcode == 0xfaef0
8712 || i.tm.base_opcode == 0xfaef8))
8713 {
8714 /* Encode lfence, mfence, and sfence as
8715 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
8716 offsetT val = 0x240483f0ULL;
8717 p = frag_more (5);
8718 md_number_to_chars (p, val, 5);
8719 return;
8720 }
8721
8722 /* Some processors fail on LOCK prefix. This options makes
8723 assembler ignore LOCK prefix and serves as a workaround. */
8724 if (omit_lock_prefix)
8725 {
8726 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8727 return;
8728 i.prefix[LOCK_PREFIX] = 0;
8729 }
8730
8731 if (branch)
8732 /* Skip if this is a branch. */
8733 ;
8734 else if (add_fused_jcc_padding_frag_p ())
8735 {
8736 /* Make room for padding. */
8737 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
8738 p = frag_more (0);
8739
8740 fragP = frag_now;
8741
8742 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
8743 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
8744 NULL, 0, p);
8745
8746 fragP->tc_frag_data.branch_type = align_branch_fused;
8747 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
8748 }
8749 else if (add_branch_prefix_frag_p ())
8750 {
8751 unsigned int max_prefix_size = align_branch_prefix_size;
8752
8753 /* Make room for padding. */
8754 frag_grow (max_prefix_size);
8755 p = frag_more (0);
8756
8757 fragP = frag_now;
8758
8759 frag_var (rs_machine_dependent, max_prefix_size, 0,
8760 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
8761 NULL, 0, p);
8762
8763 fragP->tc_frag_data.max_bytes = max_prefix_size;
8764 }
8765
8766 /* Since the VEX/EVEX prefix contains the implicit prefix, we
8767 don't need the explicit prefix. */
8768 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8769 {
8770 switch (i.tm.opcode_length)
8771 {
8772 case 3:
8773 if (i.tm.base_opcode & 0xff000000)
8774 {
8775 prefix = (i.tm.base_opcode >> 24) & 0xff;
8776 if (!i.tm.cpu_flags.bitfield.cpupadlock
8777 || prefix != REPE_PREFIX_OPCODE
8778 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8779 add_prefix (prefix);
8780 }
8781 break;
8782 case 2:
8783 if ((i.tm.base_opcode & 0xff0000) != 0)
8784 {
8785 prefix = (i.tm.base_opcode >> 16) & 0xff;
8786 add_prefix (prefix);
8787 }
8788 break;
8789 case 1:
8790 break;
8791 case 0:
8792 /* Check for pseudo prefixes. */
8793 as_bad_where (insn_start_frag->fr_file,
8794 insn_start_frag->fr_line,
8795 _("pseudo prefix without instruction"));
8796 return;
8797 default:
8798 abort ();
8799 }
8800
8801 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8802 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8803 R_X86_64_GOTTPOFF relocation so that linker can safely
8804 perform IE->LE optimization. A dummy REX_OPCODE prefix
8805 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
8806 relocation for GDesc -> IE/LE optimization. */
8807 if (x86_elf_abi == X86_64_X32_ABI
8808 && i.operands == 2
8809 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8810 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
8811 && i.prefix[REX_PREFIX] == 0)
8812 add_prefix (REX_OPCODE);
8813 #endif
8814
8815 /* The prefix bytes. */
8816 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8817 if (*q)
8818 FRAG_APPEND_1_CHAR (*q);
8819 }
8820 else
8821 {
8822 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8823 if (*q)
8824 switch (j)
8825 {
8826 case REX_PREFIX:
8827 /* REX byte is encoded in VEX prefix. */
8828 break;
8829 case SEG_PREFIX:
8830 case ADDR_PREFIX:
8831 FRAG_APPEND_1_CHAR (*q);
8832 break;
8833 default:
8834 /* There should be no other prefixes for instructions
8835 with VEX prefix. */
8836 abort ();
8837 }
8838
8839 /* For EVEX instructions i.vrex should become 0 after
8840 build_evex_prefix. For VEX instructions upper 16 registers
8841 aren't available, so VREX should be 0. */
8842 if (i.vrex)
8843 abort ();
8844 /* Now the VEX prefix. */
8845 p = frag_more (i.vex.length);
8846 for (j = 0; j < i.vex.length; j++)
8847 p[j] = i.vex.bytes[j];
8848 }
8849
8850 /* Now the opcode; be careful about word order here! */
8851 if (i.tm.opcode_length == 1)
8852 {
8853 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8854 }
8855 else
8856 {
8857 switch (i.tm.opcode_length)
8858 {
8859 case 4:
8860 p = frag_more (4);
8861 *p++ = (i.tm.base_opcode >> 24) & 0xff;
8862 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8863 break;
8864 case 3:
8865 p = frag_more (3);
8866 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8867 break;
8868 case 2:
8869 p = frag_more (2);
8870 break;
8871 default:
8872 abort ();
8873 break;
8874 }
8875
8876 /* Put out high byte first: can't use md_number_to_chars! */
8877 *p++ = (i.tm.base_opcode >> 8) & 0xff;
8878 *p = i.tm.base_opcode & 0xff;
8879 }
8880
8881 /* Now the modrm byte and sib byte (if present). */
8882 if (i.tm.opcode_modifier.modrm)
8883 {
8884 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8885 | i.rm.reg << 3
8886 | i.rm.mode << 6));
8887 /* If i.rm.regmem == ESP (4)
8888 && i.rm.mode != (Register mode)
8889 && not 16 bit
8890 ==> need second modrm byte. */
8891 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8892 && i.rm.mode != 3
8893 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8894 FRAG_APPEND_1_CHAR ((i.sib.base << 0
8895 | i.sib.index << 3
8896 | i.sib.scale << 6));
8897 }
8898
8899 if (i.disp_operands)
8900 output_disp (insn_start_frag, insn_start_off);
8901
8902 if (i.imm_operands)
8903 output_imm (insn_start_frag, insn_start_off);
8904
8905 /*
8906 * frag_now_fix () returning plain abs_section_offset when we're in the
8907 * absolute section, and abs_section_offset not getting updated as data
8908 * gets added to the frag breaks the logic below.
8909 */
8910 if (now_seg != absolute_section)
8911 {
8912 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8913 if (j > 15)
8914 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8915 j);
8916 else if (fragP)
8917 {
8918 /* NB: Don't add prefix with GOTPC relocation since
8919 output_disp() above depends on the fixed encoding
8920 length. Can't add prefix with TLS relocation since
8921 it breaks TLS linker optimization. */
8922 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
8923 /* Prefix count on the current instruction. */
8924 unsigned int count = i.vex.length;
8925 unsigned int k;
8926 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
8927 /* REX byte is encoded in VEX/EVEX prefix. */
8928 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
8929 count++;
8930
8931 /* Count prefixes for extended opcode maps. */
8932 if (!i.vex.length)
8933 switch (i.tm.opcode_length)
8934 {
8935 case 3:
8936 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
8937 {
8938 count++;
8939 switch ((i.tm.base_opcode >> 8) & 0xff)
8940 {
8941 case 0x38:
8942 case 0x3a:
8943 count++;
8944 break;
8945 default:
8946 break;
8947 }
8948 }
8949 break;
8950 case 2:
8951 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
8952 count++;
8953 break;
8954 case 1:
8955 break;
8956 default:
8957 abort ();
8958 }
8959
8960 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
8961 == BRANCH_PREFIX)
8962 {
8963 /* Set the maximum prefix size in BRANCH_PREFIX
8964 frag. */
8965 if (fragP->tc_frag_data.max_bytes > max)
8966 fragP->tc_frag_data.max_bytes = max;
8967 if (fragP->tc_frag_data.max_bytes > count)
8968 fragP->tc_frag_data.max_bytes -= count;
8969 else
8970 fragP->tc_frag_data.max_bytes = 0;
8971 }
8972 else
8973 {
8974 /* Remember the maximum prefix size in FUSED_JCC_PADDING
8975 frag. */
8976 unsigned int max_prefix_size;
8977 if (align_branch_prefix_size > max)
8978 max_prefix_size = max;
8979 else
8980 max_prefix_size = align_branch_prefix_size;
8981 if (max_prefix_size > count)
8982 fragP->tc_frag_data.max_prefix_length
8983 = max_prefix_size - count;
8984 }
8985
8986 /* Use existing segment prefix if possible. Use CS
8987 segment prefix in 64-bit mode. In 32-bit mode, use SS
8988 segment prefix with ESP/EBP base register and use DS
8989 segment prefix without ESP/EBP base register. */
8990 if (i.prefix[SEG_PREFIX])
8991 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
8992 else if (flag_code == CODE_64BIT)
8993 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
8994 else if (i.base_reg
8995 && (i.base_reg->reg_num == 4
8996 || i.base_reg->reg_num == 5))
8997 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
8998 else
8999 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9000 }
9001 }
9002 }
9003
9004 /* NB: Don't work with COND_JUMP86 without i386. */
9005 if (align_branch_power
9006 && now_seg != absolute_section
9007 && cpu_arch_flags.bitfield.cpui386)
9008 {
9009 /* Terminate each frag so that we can add prefix and check for
9010 fused jcc. */
9011 frag_wane (frag_now);
9012 frag_new (0);
9013 }
9014
9015 #ifdef DEBUG386
9016 if (flag_debug)
9017 {
9018 pi ("" /*line*/, &i);
9019 }
9020 #endif /* DEBUG386 */
9021 }
9022
9023 /* Return the size of the displacement operand N. */
9024
9025 static int
9026 disp_size (unsigned int n)
9027 {
9028 int size = 4;
9029
9030 if (i.types[n].bitfield.disp64)
9031 size = 8;
9032 else if (i.types[n].bitfield.disp8)
9033 size = 1;
9034 else if (i.types[n].bitfield.disp16)
9035 size = 2;
9036 return size;
9037 }
9038
9039 /* Return the size of the immediate operand N. */
9040
9041 static int
9042 imm_size (unsigned int n)
9043 {
9044 int size = 4;
9045 if (i.types[n].bitfield.imm64)
9046 size = 8;
9047 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9048 size = 1;
9049 else if (i.types[n].bitfield.imm16)
9050 size = 2;
9051 return size;
9052 }
9053
9054 static void
9055 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9056 {
9057 char *p;
9058 unsigned int n;
9059
9060 for (n = 0; n < i.operands; n++)
9061 {
9062 if (operand_type_check (i.types[n], disp))
9063 {
9064 if (i.op[n].disps->X_op == O_constant)
9065 {
9066 int size = disp_size (n);
9067 offsetT val = i.op[n].disps->X_add_number;
9068
9069 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9070 size);
9071 p = frag_more (size);
9072 md_number_to_chars (p, val, size);
9073 }
9074 else
9075 {
9076 enum bfd_reloc_code_real reloc_type;
9077 int size = disp_size (n);
9078 int sign = i.types[n].bitfield.disp32s;
9079 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9080 fixS *fixP;
9081
9082 /* We can't have 8 bit displacement here. */
9083 gas_assert (!i.types[n].bitfield.disp8);
9084
9085 /* The PC relative address is computed relative
9086 to the instruction boundary, so in case immediate
9087 fields follows, we need to adjust the value. */
9088 if (pcrel && i.imm_operands)
9089 {
9090 unsigned int n1;
9091 int sz = 0;
9092
9093 for (n1 = 0; n1 < i.operands; n1++)
9094 if (operand_type_check (i.types[n1], imm))
9095 {
9096 /* Only one immediate is allowed for PC
9097 relative address. */
9098 gas_assert (sz == 0);
9099 sz = imm_size (n1);
9100 i.op[n].disps->X_add_number -= sz;
9101 }
9102 /* We should find the immediate. */
9103 gas_assert (sz != 0);
9104 }
9105
9106 p = frag_more (size);
9107 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9108 if (GOT_symbol
9109 && GOT_symbol == i.op[n].disps->X_add_symbol
9110 && (((reloc_type == BFD_RELOC_32
9111 || reloc_type == BFD_RELOC_X86_64_32S
9112 || (reloc_type == BFD_RELOC_64
9113 && object_64bit))
9114 && (i.op[n].disps->X_op == O_symbol
9115 || (i.op[n].disps->X_op == O_add
9116 && ((symbol_get_value_expression
9117 (i.op[n].disps->X_op_symbol)->X_op)
9118 == O_subtract))))
9119 || reloc_type == BFD_RELOC_32_PCREL))
9120 {
9121 if (!object_64bit)
9122 {
9123 reloc_type = BFD_RELOC_386_GOTPC;
9124 i.has_gotpc_tls_reloc = TRUE;
9125 i.op[n].imms->X_add_number +=
9126 encoding_length (insn_start_frag, insn_start_off, p);
9127 }
9128 else if (reloc_type == BFD_RELOC_64)
9129 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9130 else
9131 /* Don't do the adjustment for x86-64, as there
9132 the pcrel addressing is relative to the _next_
9133 insn, and that is taken care of in other code. */
9134 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9135 }
9136 else if (align_branch_power)
9137 {
9138 switch (reloc_type)
9139 {
9140 case BFD_RELOC_386_TLS_GD:
9141 case BFD_RELOC_386_TLS_LDM:
9142 case BFD_RELOC_386_TLS_IE:
9143 case BFD_RELOC_386_TLS_IE_32:
9144 case BFD_RELOC_386_TLS_GOTIE:
9145 case BFD_RELOC_386_TLS_GOTDESC:
9146 case BFD_RELOC_386_TLS_DESC_CALL:
9147 case BFD_RELOC_X86_64_TLSGD:
9148 case BFD_RELOC_X86_64_TLSLD:
9149 case BFD_RELOC_X86_64_GOTTPOFF:
9150 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9151 case BFD_RELOC_X86_64_TLSDESC_CALL:
9152 i.has_gotpc_tls_reloc = TRUE;
9153 default:
9154 break;
9155 }
9156 }
9157 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9158 size, i.op[n].disps, pcrel,
9159 reloc_type);
9160 /* Check for "call/jmp *mem", "mov mem, %reg",
9161 "test %reg, mem" and "binop mem, %reg" where binop
9162 is one of adc, add, and, cmp, or, sbb, sub, xor
9163 instructions without data prefix. Always generate
9164 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9165 if (i.prefix[DATA_PREFIX] == 0
9166 && (generate_relax_relocations
9167 || (!object_64bit
9168 && i.rm.mode == 0
9169 && i.rm.regmem == 5))
9170 && (i.rm.mode == 2
9171 || (i.rm.mode == 0 && i.rm.regmem == 5))
9172 && !is_any_vex_encoding(&i.tm)
9173 && ((i.operands == 1
9174 && i.tm.base_opcode == 0xff
9175 && (i.rm.reg == 2 || i.rm.reg == 4))
9176 || (i.operands == 2
9177 && (i.tm.base_opcode == 0x8b
9178 || i.tm.base_opcode == 0x85
9179 || (i.tm.base_opcode & ~0x38) == 0x03))))
9180 {
9181 if (object_64bit)
9182 {
9183 fixP->fx_tcbit = i.rex != 0;
9184 if (i.base_reg
9185 && (i.base_reg->reg_num == RegIP))
9186 fixP->fx_tcbit2 = 1;
9187 }
9188 else
9189 fixP->fx_tcbit2 = 1;
9190 }
9191 }
9192 }
9193 }
9194 }
9195
9196 static void
9197 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9198 {
9199 char *p;
9200 unsigned int n;
9201
9202 for (n = 0; n < i.operands; n++)
9203 {
9204 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9205 if (i.rounding && (int) n == i.rounding->operand)
9206 continue;
9207
9208 if (operand_type_check (i.types[n], imm))
9209 {
9210 if (i.op[n].imms->X_op == O_constant)
9211 {
9212 int size = imm_size (n);
9213 offsetT val;
9214
9215 val = offset_in_range (i.op[n].imms->X_add_number,
9216 size);
9217 p = frag_more (size);
9218 md_number_to_chars (p, val, size);
9219 }
9220 else
9221 {
9222 /* Not absolute_section.
9223 Need a 32-bit fixup (don't support 8bit
9224 non-absolute imms). Try to support other
9225 sizes ... */
9226 enum bfd_reloc_code_real reloc_type;
9227 int size = imm_size (n);
9228 int sign;
9229
9230 if (i.types[n].bitfield.imm32s
9231 && (i.suffix == QWORD_MNEM_SUFFIX
9232 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9233 sign = 1;
9234 else
9235 sign = 0;
9236
9237 p = frag_more (size);
9238 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9239
9240 /* This is tough to explain. We end up with this one if we
9241 * have operands that look like
9242 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9243 * obtain the absolute address of the GOT, and it is strongly
9244 * preferable from a performance point of view to avoid using
9245 * a runtime relocation for this. The actual sequence of
9246 * instructions often look something like:
9247 *
9248 * call .L66
9249 * .L66:
9250 * popl %ebx
9251 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9252 *
9253 * The call and pop essentially return the absolute address
9254 * of the label .L66 and store it in %ebx. The linker itself
9255 * will ultimately change the first operand of the addl so
9256 * that %ebx points to the GOT, but to keep things simple, the
9257 * .o file must have this operand set so that it generates not
9258 * the absolute address of .L66, but the absolute address of
9259 * itself. This allows the linker itself simply treat a GOTPC
9260 * relocation as asking for a pcrel offset to the GOT to be
9261 * added in, and the addend of the relocation is stored in the
9262 * operand field for the instruction itself.
9263 *
9264 * Our job here is to fix the operand so that it would add
9265 * the correct offset so that %ebx would point to itself. The
9266 * thing that is tricky is that .-.L66 will point to the
9267 * beginning of the instruction, so we need to further modify
9268 * the operand so that it will point to itself. There are
9269 * other cases where you have something like:
9270 *
9271 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9272 *
9273 * and here no correction would be required. Internally in
9274 * the assembler we treat operands of this form as not being
9275 * pcrel since the '.' is explicitly mentioned, and I wonder
9276 * whether it would simplify matters to do it this way. Who
9277 * knows. In earlier versions of the PIC patches, the
9278 * pcrel_adjust field was used to store the correction, but
9279 * since the expression is not pcrel, I felt it would be
9280 * confusing to do it this way. */
9281
9282 if ((reloc_type == BFD_RELOC_32
9283 || reloc_type == BFD_RELOC_X86_64_32S
9284 || reloc_type == BFD_RELOC_64)
9285 && GOT_symbol
9286 && GOT_symbol == i.op[n].imms->X_add_symbol
9287 && (i.op[n].imms->X_op == O_symbol
9288 || (i.op[n].imms->X_op == O_add
9289 && ((symbol_get_value_expression
9290 (i.op[n].imms->X_op_symbol)->X_op)
9291 == O_subtract))))
9292 {
9293 if (!object_64bit)
9294 reloc_type = BFD_RELOC_386_GOTPC;
9295 else if (size == 4)
9296 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9297 else if (size == 8)
9298 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9299 i.has_gotpc_tls_reloc = TRUE;
9300 i.op[n].imms->X_add_number +=
9301 encoding_length (insn_start_frag, insn_start_off, p);
9302 }
9303 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9304 i.op[n].imms, 0, reloc_type);
9305 }
9306 }
9307 }
9308 }
9309 \f
9310 /* x86_cons_fix_new is called via the expression parsing code when a
9311 reloc is needed. We use this hook to get the correct .got reloc. */
9312 static int cons_sign = -1;
9313
9314 void
9315 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9316 expressionS *exp, bfd_reloc_code_real_type r)
9317 {
9318 r = reloc (len, 0, cons_sign, r);
9319
9320 #ifdef TE_PE
9321 if (exp->X_op == O_secrel)
9322 {
9323 exp->X_op = O_symbol;
9324 r = BFD_RELOC_32_SECREL;
9325 }
9326 #endif
9327
9328 fix_new_exp (frag, off, len, exp, 0, r);
9329 }
9330
9331 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9332 purpose of the `.dc.a' internal pseudo-op. */
9333
9334 int
9335 x86_address_bytes (void)
9336 {
9337 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9338 return 4;
9339 return stdoutput->arch_info->bits_per_address / 8;
9340 }
9341
9342 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9343 || defined (LEX_AT)
9344 # define lex_got(reloc, adjust, types) NULL
9345 #else
9346 /* Parse operands of the form
9347 <symbol>@GOTOFF+<nnn>
9348 and similar .plt or .got references.
9349
9350 If we find one, set up the correct relocation in RELOC and copy the
9351 input string, minus the `@GOTOFF' into a malloc'd buffer for
9352 parsing by the calling routine. Return this buffer, and if ADJUST
9353 is non-null set it to the length of the string we removed from the
9354 input line. Otherwise return NULL. */
9355 static char *
9356 lex_got (enum bfd_reloc_code_real *rel,
9357 int *adjust,
9358 i386_operand_type *types)
9359 {
9360 /* Some of the relocations depend on the size of what field is to
9361 be relocated. But in our callers i386_immediate and i386_displacement
9362 we don't yet know the operand size (this will be set by insn
9363 matching). Hence we record the word32 relocation here,
9364 and adjust the reloc according to the real size in reloc(). */
9365 static const struct {
9366 const char *str;
9367 int len;
9368 const enum bfd_reloc_code_real rel[2];
9369 const i386_operand_type types64;
9370 } gotrel[] = {
9371 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9372 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9373 BFD_RELOC_SIZE32 },
9374 OPERAND_TYPE_IMM32_64 },
9375 #endif
9376 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9377 BFD_RELOC_X86_64_PLTOFF64 },
9378 OPERAND_TYPE_IMM64 },
9379 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9380 BFD_RELOC_X86_64_PLT32 },
9381 OPERAND_TYPE_IMM32_32S_DISP32 },
9382 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9383 BFD_RELOC_X86_64_GOTPLT64 },
9384 OPERAND_TYPE_IMM64_DISP64 },
9385 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9386 BFD_RELOC_X86_64_GOTOFF64 },
9387 OPERAND_TYPE_IMM64_DISP64 },
9388 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9389 BFD_RELOC_X86_64_GOTPCREL },
9390 OPERAND_TYPE_IMM32_32S_DISP32 },
9391 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9392 BFD_RELOC_X86_64_TLSGD },
9393 OPERAND_TYPE_IMM32_32S_DISP32 },
9394 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9395 _dummy_first_bfd_reloc_code_real },
9396 OPERAND_TYPE_NONE },
9397 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9398 BFD_RELOC_X86_64_TLSLD },
9399 OPERAND_TYPE_IMM32_32S_DISP32 },
9400 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9401 BFD_RELOC_X86_64_GOTTPOFF },
9402 OPERAND_TYPE_IMM32_32S_DISP32 },
9403 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9404 BFD_RELOC_X86_64_TPOFF32 },
9405 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9406 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9407 _dummy_first_bfd_reloc_code_real },
9408 OPERAND_TYPE_NONE },
9409 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9410 BFD_RELOC_X86_64_DTPOFF32 },
9411 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9412 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9413 _dummy_first_bfd_reloc_code_real },
9414 OPERAND_TYPE_NONE },
9415 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9416 _dummy_first_bfd_reloc_code_real },
9417 OPERAND_TYPE_NONE },
9418 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9419 BFD_RELOC_X86_64_GOT32 },
9420 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9421 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9422 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9423 OPERAND_TYPE_IMM32_32S_DISP32 },
9424 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9425 BFD_RELOC_X86_64_TLSDESC_CALL },
9426 OPERAND_TYPE_IMM32_32S_DISP32 },
9427 };
9428 char *cp;
9429 unsigned int j;
9430
9431 #if defined (OBJ_MAYBE_ELF)
9432 if (!IS_ELF)
9433 return NULL;
9434 #endif
9435
9436 for (cp = input_line_pointer; *cp != '@'; cp++)
9437 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9438 return NULL;
9439
9440 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9441 {
9442 int len = gotrel[j].len;
9443 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9444 {
9445 if (gotrel[j].rel[object_64bit] != 0)
9446 {
9447 int first, second;
9448 char *tmpbuf, *past_reloc;
9449
9450 *rel = gotrel[j].rel[object_64bit];
9451
9452 if (types)
9453 {
9454 if (flag_code != CODE_64BIT)
9455 {
9456 types->bitfield.imm32 = 1;
9457 types->bitfield.disp32 = 1;
9458 }
9459 else
9460 *types = gotrel[j].types64;
9461 }
9462
9463 if (j != 0 && GOT_symbol == NULL)
9464 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9465
9466 /* The length of the first part of our input line. */
9467 first = cp - input_line_pointer;
9468
9469 /* The second part goes from after the reloc token until
9470 (and including) an end_of_line char or comma. */
9471 past_reloc = cp + 1 + len;
9472 cp = past_reloc;
9473 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9474 ++cp;
9475 second = cp + 1 - past_reloc;
9476
9477 /* Allocate and copy string. The trailing NUL shouldn't
9478 be necessary, but be safe. */
9479 tmpbuf = XNEWVEC (char, first + second + 2);
9480 memcpy (tmpbuf, input_line_pointer, first);
9481 if (second != 0 && *past_reloc != ' ')
9482 /* Replace the relocation token with ' ', so that
9483 errors like foo@GOTOFF1 will be detected. */
9484 tmpbuf[first++] = ' ';
9485 else
9486 /* Increment length by 1 if the relocation token is
9487 removed. */
9488 len++;
9489 if (adjust)
9490 *adjust = len;
9491 memcpy (tmpbuf + first, past_reloc, second);
9492 tmpbuf[first + second] = '\0';
9493 return tmpbuf;
9494 }
9495
9496 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9497 gotrel[j].str, 1 << (5 + object_64bit));
9498 return NULL;
9499 }
9500 }
9501
9502 /* Might be a symbol version string. Don't as_bad here. */
9503 return NULL;
9504 }
9505 #endif
9506
9507 #ifdef TE_PE
9508 #ifdef lex_got
9509 #undef lex_got
9510 #endif
9511 /* Parse operands of the form
9512 <symbol>@SECREL32+<nnn>
9513
9514 If we find one, set up the correct relocation in RELOC and copy the
9515 input string, minus the `@SECREL32' into a malloc'd buffer for
9516 parsing by the calling routine. Return this buffer, and if ADJUST
9517 is non-null set it to the length of the string we removed from the
9518 input line. Otherwise return NULL.
9519
9520 This function is copied from the ELF version above adjusted for PE targets. */
9521
9522 static char *
9523 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9524 int *adjust ATTRIBUTE_UNUSED,
9525 i386_operand_type *types)
9526 {
9527 static const struct
9528 {
9529 const char *str;
9530 int len;
9531 const enum bfd_reloc_code_real rel[2];
9532 const i386_operand_type types64;
9533 }
9534 gotrel[] =
9535 {
9536 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
9537 BFD_RELOC_32_SECREL },
9538 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9539 };
9540
9541 char *cp;
9542 unsigned j;
9543
9544 for (cp = input_line_pointer; *cp != '@'; cp++)
9545 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9546 return NULL;
9547
9548 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9549 {
9550 int len = gotrel[j].len;
9551
9552 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9553 {
9554 if (gotrel[j].rel[object_64bit] != 0)
9555 {
9556 int first, second;
9557 char *tmpbuf, *past_reloc;
9558
9559 *rel = gotrel[j].rel[object_64bit];
9560 if (adjust)
9561 *adjust = len;
9562
9563 if (types)
9564 {
9565 if (flag_code != CODE_64BIT)
9566 {
9567 types->bitfield.imm32 = 1;
9568 types->bitfield.disp32 = 1;
9569 }
9570 else
9571 *types = gotrel[j].types64;
9572 }
9573
9574 /* The length of the first part of our input line. */
9575 first = cp - input_line_pointer;
9576
9577 /* The second part goes from after the reloc token until
9578 (and including) an end_of_line char or comma. */
9579 past_reloc = cp + 1 + len;
9580 cp = past_reloc;
9581 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9582 ++cp;
9583 second = cp + 1 - past_reloc;
9584
9585 /* Allocate and copy string. The trailing NUL shouldn't
9586 be necessary, but be safe. */
9587 tmpbuf = XNEWVEC (char, first + second + 2);
9588 memcpy (tmpbuf, input_line_pointer, first);
9589 if (second != 0 && *past_reloc != ' ')
9590 /* Replace the relocation token with ' ', so that
9591 errors like foo@SECLREL321 will be detected. */
9592 tmpbuf[first++] = ' ';
9593 memcpy (tmpbuf + first, past_reloc, second);
9594 tmpbuf[first + second] = '\0';
9595 return tmpbuf;
9596 }
9597
9598 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9599 gotrel[j].str, 1 << (5 + object_64bit));
9600 return NULL;
9601 }
9602 }
9603
9604 /* Might be a symbol version string. Don't as_bad here. */
9605 return NULL;
9606 }
9607
9608 #endif /* TE_PE */
9609
9610 bfd_reloc_code_real_type
9611 x86_cons (expressionS *exp, int size)
9612 {
9613 bfd_reloc_code_real_type got_reloc = NO_RELOC;
9614
9615 intel_syntax = -intel_syntax;
9616
9617 exp->X_md = 0;
9618 if (size == 4 || (object_64bit && size == 8))
9619 {
9620 /* Handle @GOTOFF and the like in an expression. */
9621 char *save;
9622 char *gotfree_input_line;
9623 int adjust = 0;
9624
9625 save = input_line_pointer;
9626 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9627 if (gotfree_input_line)
9628 input_line_pointer = gotfree_input_line;
9629
9630 expression (exp);
9631
9632 if (gotfree_input_line)
9633 {
9634 /* expression () has merrily parsed up to the end of line,
9635 or a comma - in the wrong buffer. Transfer how far
9636 input_line_pointer has moved to the right buffer. */
9637 input_line_pointer = (save
9638 + (input_line_pointer - gotfree_input_line)
9639 + adjust);
9640 free (gotfree_input_line);
9641 if (exp->X_op == O_constant
9642 || exp->X_op == O_absent
9643 || exp->X_op == O_illegal
9644 || exp->X_op == O_register
9645 || exp->X_op == O_big)
9646 {
9647 char c = *input_line_pointer;
9648 *input_line_pointer = 0;
9649 as_bad (_("missing or invalid expression `%s'"), save);
9650 *input_line_pointer = c;
9651 }
9652 else if ((got_reloc == BFD_RELOC_386_PLT32
9653 || got_reloc == BFD_RELOC_X86_64_PLT32)
9654 && exp->X_op != O_symbol)
9655 {
9656 char c = *input_line_pointer;
9657 *input_line_pointer = 0;
9658 as_bad (_("invalid PLT expression `%s'"), save);
9659 *input_line_pointer = c;
9660 }
9661 }
9662 }
9663 else
9664 expression (exp);
9665
9666 intel_syntax = -intel_syntax;
9667
9668 if (intel_syntax)
9669 i386_intel_simplify (exp);
9670
9671 return got_reloc;
9672 }
9673
9674 static void
9675 signed_cons (int size)
9676 {
9677 if (flag_code == CODE_64BIT)
9678 cons_sign = 1;
9679 cons (size);
9680 cons_sign = -1;
9681 }
9682
9683 #ifdef TE_PE
9684 static void
9685 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9686 {
9687 expressionS exp;
9688
9689 do
9690 {
9691 expression (&exp);
9692 if (exp.X_op == O_symbol)
9693 exp.X_op = O_secrel;
9694
9695 emit_expr (&exp, 4);
9696 }
9697 while (*input_line_pointer++ == ',');
9698
9699 input_line_pointer--;
9700 demand_empty_rest_of_line ();
9701 }
9702 #endif
9703
9704 /* Handle Vector operations. */
9705
9706 static char *
9707 check_VecOperations (char *op_string, char *op_end)
9708 {
9709 const reg_entry *mask;
9710 const char *saved;
9711 char *end_op;
9712
9713 while (*op_string
9714 && (op_end == NULL || op_string < op_end))
9715 {
9716 saved = op_string;
9717 if (*op_string == '{')
9718 {
9719 op_string++;
9720
9721 /* Check broadcasts. */
9722 if (strncmp (op_string, "1to", 3) == 0)
9723 {
9724 int bcst_type;
9725
9726 if (i.broadcast)
9727 goto duplicated_vec_op;
9728
9729 op_string += 3;
9730 if (*op_string == '8')
9731 bcst_type = 8;
9732 else if (*op_string == '4')
9733 bcst_type = 4;
9734 else if (*op_string == '2')
9735 bcst_type = 2;
9736 else if (*op_string == '1'
9737 && *(op_string+1) == '6')
9738 {
9739 bcst_type = 16;
9740 op_string++;
9741 }
9742 else
9743 {
9744 as_bad (_("Unsupported broadcast: `%s'"), saved);
9745 return NULL;
9746 }
9747 op_string++;
9748
9749 broadcast_op.type = bcst_type;
9750 broadcast_op.operand = this_operand;
9751 broadcast_op.bytes = 0;
9752 i.broadcast = &broadcast_op;
9753 }
9754 /* Check masking operation. */
9755 else if ((mask = parse_register (op_string, &end_op)) != NULL)
9756 {
9757 /* k0 can't be used for write mask. */
9758 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9759 {
9760 as_bad (_("`%s%s' can't be used for write mask"),
9761 register_prefix, mask->reg_name);
9762 return NULL;
9763 }
9764
9765 if (!i.mask)
9766 {
9767 mask_op.mask = mask;
9768 mask_op.zeroing = 0;
9769 mask_op.operand = this_operand;
9770 i.mask = &mask_op;
9771 }
9772 else
9773 {
9774 if (i.mask->mask)
9775 goto duplicated_vec_op;
9776
9777 i.mask->mask = mask;
9778
9779 /* Only "{z}" is allowed here. No need to check
9780 zeroing mask explicitly. */
9781 if (i.mask->operand != this_operand)
9782 {
9783 as_bad (_("invalid write mask `%s'"), saved);
9784 return NULL;
9785 }
9786 }
9787
9788 op_string = end_op;
9789 }
9790 /* Check zeroing-flag for masking operation. */
9791 else if (*op_string == 'z')
9792 {
9793 if (!i.mask)
9794 {
9795 mask_op.mask = NULL;
9796 mask_op.zeroing = 1;
9797 mask_op.operand = this_operand;
9798 i.mask = &mask_op;
9799 }
9800 else
9801 {
9802 if (i.mask->zeroing)
9803 {
9804 duplicated_vec_op:
9805 as_bad (_("duplicated `%s'"), saved);
9806 return NULL;
9807 }
9808
9809 i.mask->zeroing = 1;
9810
9811 /* Only "{%k}" is allowed here. No need to check mask
9812 register explicitly. */
9813 if (i.mask->operand != this_operand)
9814 {
9815 as_bad (_("invalid zeroing-masking `%s'"),
9816 saved);
9817 return NULL;
9818 }
9819 }
9820
9821 op_string++;
9822 }
9823 else
9824 goto unknown_vec_op;
9825
9826 if (*op_string != '}')
9827 {
9828 as_bad (_("missing `}' in `%s'"), saved);
9829 return NULL;
9830 }
9831 op_string++;
9832
9833 /* Strip whitespace since the addition of pseudo prefixes
9834 changed how the scrubber treats '{'. */
9835 if (is_space_char (*op_string))
9836 ++op_string;
9837
9838 continue;
9839 }
9840 unknown_vec_op:
9841 /* We don't know this one. */
9842 as_bad (_("unknown vector operation: `%s'"), saved);
9843 return NULL;
9844 }
9845
9846 if (i.mask && i.mask->zeroing && !i.mask->mask)
9847 {
9848 as_bad (_("zeroing-masking only allowed with write mask"));
9849 return NULL;
9850 }
9851
9852 return op_string;
9853 }
9854
9855 static int
9856 i386_immediate (char *imm_start)
9857 {
9858 char *save_input_line_pointer;
9859 char *gotfree_input_line;
9860 segT exp_seg = 0;
9861 expressionS *exp;
9862 i386_operand_type types;
9863
9864 operand_type_set (&types, ~0);
9865
9866 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9867 {
9868 as_bad (_("at most %d immediate operands are allowed"),
9869 MAX_IMMEDIATE_OPERANDS);
9870 return 0;
9871 }
9872
9873 exp = &im_expressions[i.imm_operands++];
9874 i.op[this_operand].imms = exp;
9875
9876 if (is_space_char (*imm_start))
9877 ++imm_start;
9878
9879 save_input_line_pointer = input_line_pointer;
9880 input_line_pointer = imm_start;
9881
9882 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9883 if (gotfree_input_line)
9884 input_line_pointer = gotfree_input_line;
9885
9886 exp_seg = expression (exp);
9887
9888 SKIP_WHITESPACE ();
9889
9890 /* Handle vector operations. */
9891 if (*input_line_pointer == '{')
9892 {
9893 input_line_pointer = check_VecOperations (input_line_pointer,
9894 NULL);
9895 if (input_line_pointer == NULL)
9896 return 0;
9897 }
9898
9899 if (*input_line_pointer)
9900 as_bad (_("junk `%s' after expression"), input_line_pointer);
9901
9902 input_line_pointer = save_input_line_pointer;
9903 if (gotfree_input_line)
9904 {
9905 free (gotfree_input_line);
9906
9907 if (exp->X_op == O_constant || exp->X_op == O_register)
9908 exp->X_op = O_illegal;
9909 }
9910
9911 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9912 }
9913
9914 static int
9915 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9916 i386_operand_type types, const char *imm_start)
9917 {
9918 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9919 {
9920 if (imm_start)
9921 as_bad (_("missing or invalid immediate expression `%s'"),
9922 imm_start);
9923 return 0;
9924 }
9925 else if (exp->X_op == O_constant)
9926 {
9927 /* Size it properly later. */
9928 i.types[this_operand].bitfield.imm64 = 1;
9929 /* If not 64bit, sign extend val. */
9930 if (flag_code != CODE_64BIT
9931 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9932 exp->X_add_number
9933 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9934 }
9935 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9936 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9937 && exp_seg != absolute_section
9938 && exp_seg != text_section
9939 && exp_seg != data_section
9940 && exp_seg != bss_section
9941 && exp_seg != undefined_section
9942 && !bfd_is_com_section (exp_seg))
9943 {
9944 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9945 return 0;
9946 }
9947 #endif
9948 else if (!intel_syntax && exp_seg == reg_section)
9949 {
9950 if (imm_start)
9951 as_bad (_("illegal immediate register operand %s"), imm_start);
9952 return 0;
9953 }
9954 else
9955 {
9956 /* This is an address. The size of the address will be
9957 determined later, depending on destination register,
9958 suffix, or the default for the section. */
9959 i.types[this_operand].bitfield.imm8 = 1;
9960 i.types[this_operand].bitfield.imm16 = 1;
9961 i.types[this_operand].bitfield.imm32 = 1;
9962 i.types[this_operand].bitfield.imm32s = 1;
9963 i.types[this_operand].bitfield.imm64 = 1;
9964 i.types[this_operand] = operand_type_and (i.types[this_operand],
9965 types);
9966 }
9967
9968 return 1;
9969 }
9970
9971 static char *
9972 i386_scale (char *scale)
9973 {
9974 offsetT val;
9975 char *save = input_line_pointer;
9976
9977 input_line_pointer = scale;
9978 val = get_absolute_expression ();
9979
9980 switch (val)
9981 {
9982 case 1:
9983 i.log2_scale_factor = 0;
9984 break;
9985 case 2:
9986 i.log2_scale_factor = 1;
9987 break;
9988 case 4:
9989 i.log2_scale_factor = 2;
9990 break;
9991 case 8:
9992 i.log2_scale_factor = 3;
9993 break;
9994 default:
9995 {
9996 char sep = *input_line_pointer;
9997
9998 *input_line_pointer = '\0';
9999 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10000 scale);
10001 *input_line_pointer = sep;
10002 input_line_pointer = save;
10003 return NULL;
10004 }
10005 }
10006 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10007 {
10008 as_warn (_("scale factor of %d without an index register"),
10009 1 << i.log2_scale_factor);
10010 i.log2_scale_factor = 0;
10011 }
10012 scale = input_line_pointer;
10013 input_line_pointer = save;
10014 return scale;
10015 }
10016
10017 static int
10018 i386_displacement (char *disp_start, char *disp_end)
10019 {
10020 expressionS *exp;
10021 segT exp_seg = 0;
10022 char *save_input_line_pointer;
10023 char *gotfree_input_line;
10024 int override;
10025 i386_operand_type bigdisp, types = anydisp;
10026 int ret;
10027
10028 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10029 {
10030 as_bad (_("at most %d displacement operands are allowed"),
10031 MAX_MEMORY_OPERANDS);
10032 return 0;
10033 }
10034
10035 operand_type_set (&bigdisp, 0);
10036 if (i.jumpabsolute
10037 || i.types[this_operand].bitfield.baseindex
10038 || (current_templates->start->opcode_modifier.jump != JUMP
10039 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10040 {
10041 i386_addressing_mode ();
10042 override = (i.prefix[ADDR_PREFIX] != 0);
10043 if (flag_code == CODE_64BIT)
10044 {
10045 if (!override)
10046 {
10047 bigdisp.bitfield.disp32s = 1;
10048 bigdisp.bitfield.disp64 = 1;
10049 }
10050 else
10051 bigdisp.bitfield.disp32 = 1;
10052 }
10053 else if ((flag_code == CODE_16BIT) ^ override)
10054 bigdisp.bitfield.disp16 = 1;
10055 else
10056 bigdisp.bitfield.disp32 = 1;
10057 }
10058 else
10059 {
10060 /* For PC-relative branches, the width of the displacement may be
10061 dependent upon data size, but is never dependent upon address size.
10062 Also make sure to not unintentionally match against a non-PC-relative
10063 branch template. */
10064 static templates aux_templates;
10065 const insn_template *t = current_templates->start;
10066 bfd_boolean has_intel64 = FALSE;
10067
10068 aux_templates.start = t;
10069 while (++t < current_templates->end)
10070 {
10071 if (t->opcode_modifier.jump
10072 != current_templates->start->opcode_modifier.jump)
10073 break;
10074 if ((t->opcode_modifier.isa64 >= INTEL64))
10075 has_intel64 = TRUE;
10076 }
10077 if (t < current_templates->end)
10078 {
10079 aux_templates.end = t;
10080 current_templates = &aux_templates;
10081 }
10082
10083 override = (i.prefix[DATA_PREFIX] != 0);
10084 if (flag_code == CODE_64BIT)
10085 {
10086 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10087 && (!intel64 || !has_intel64))
10088 bigdisp.bitfield.disp16 = 1;
10089 else
10090 bigdisp.bitfield.disp32s = 1;
10091 }
10092 else
10093 {
10094 if (!override)
10095 override = (i.suffix == (flag_code != CODE_16BIT
10096 ? WORD_MNEM_SUFFIX
10097 : LONG_MNEM_SUFFIX));
10098 bigdisp.bitfield.disp32 = 1;
10099 if ((flag_code == CODE_16BIT) ^ override)
10100 {
10101 bigdisp.bitfield.disp32 = 0;
10102 bigdisp.bitfield.disp16 = 1;
10103 }
10104 }
10105 }
10106 i.types[this_operand] = operand_type_or (i.types[this_operand],
10107 bigdisp);
10108
10109 exp = &disp_expressions[i.disp_operands];
10110 i.op[this_operand].disps = exp;
10111 i.disp_operands++;
10112 save_input_line_pointer = input_line_pointer;
10113 input_line_pointer = disp_start;
10114 END_STRING_AND_SAVE (disp_end);
10115
10116 #ifndef GCC_ASM_O_HACK
10117 #define GCC_ASM_O_HACK 0
10118 #endif
10119 #if GCC_ASM_O_HACK
10120 END_STRING_AND_SAVE (disp_end + 1);
10121 if (i.types[this_operand].bitfield.baseIndex
10122 && displacement_string_end[-1] == '+')
10123 {
10124 /* This hack is to avoid a warning when using the "o"
10125 constraint within gcc asm statements.
10126 For instance:
10127
10128 #define _set_tssldt_desc(n,addr,limit,type) \
10129 __asm__ __volatile__ ( \
10130 "movw %w2,%0\n\t" \
10131 "movw %w1,2+%0\n\t" \
10132 "rorl $16,%1\n\t" \
10133 "movb %b1,4+%0\n\t" \
10134 "movb %4,5+%0\n\t" \
10135 "movb $0,6+%0\n\t" \
10136 "movb %h1,7+%0\n\t" \
10137 "rorl $16,%1" \
10138 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10139
10140 This works great except that the output assembler ends
10141 up looking a bit weird if it turns out that there is
10142 no offset. You end up producing code that looks like:
10143
10144 #APP
10145 movw $235,(%eax)
10146 movw %dx,2+(%eax)
10147 rorl $16,%edx
10148 movb %dl,4+(%eax)
10149 movb $137,5+(%eax)
10150 movb $0,6+(%eax)
10151 movb %dh,7+(%eax)
10152 rorl $16,%edx
10153 #NO_APP
10154
10155 So here we provide the missing zero. */
10156
10157 *displacement_string_end = '0';
10158 }
10159 #endif
10160 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10161 if (gotfree_input_line)
10162 input_line_pointer = gotfree_input_line;
10163
10164 exp_seg = expression (exp);
10165
10166 SKIP_WHITESPACE ();
10167 if (*input_line_pointer)
10168 as_bad (_("junk `%s' after expression"), input_line_pointer);
10169 #if GCC_ASM_O_HACK
10170 RESTORE_END_STRING (disp_end + 1);
10171 #endif
10172 input_line_pointer = save_input_line_pointer;
10173 if (gotfree_input_line)
10174 {
10175 free (gotfree_input_line);
10176
10177 if (exp->X_op == O_constant || exp->X_op == O_register)
10178 exp->X_op = O_illegal;
10179 }
10180
10181 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10182
10183 RESTORE_END_STRING (disp_end);
10184
10185 return ret;
10186 }
10187
10188 static int
10189 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10190 i386_operand_type types, const char *disp_start)
10191 {
10192 i386_operand_type bigdisp;
10193 int ret = 1;
10194
10195 /* We do this to make sure that the section symbol is in
10196 the symbol table. We will ultimately change the relocation
10197 to be relative to the beginning of the section. */
10198 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10199 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10200 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10201 {
10202 if (exp->X_op != O_symbol)
10203 goto inv_disp;
10204
10205 if (S_IS_LOCAL (exp->X_add_symbol)
10206 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10207 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10208 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10209 exp->X_op = O_subtract;
10210 exp->X_op_symbol = GOT_symbol;
10211 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10212 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10213 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10214 i.reloc[this_operand] = BFD_RELOC_64;
10215 else
10216 i.reloc[this_operand] = BFD_RELOC_32;
10217 }
10218
10219 else if (exp->X_op == O_absent
10220 || exp->X_op == O_illegal
10221 || exp->X_op == O_big)
10222 {
10223 inv_disp:
10224 as_bad (_("missing or invalid displacement expression `%s'"),
10225 disp_start);
10226 ret = 0;
10227 }
10228
10229 else if (flag_code == CODE_64BIT
10230 && !i.prefix[ADDR_PREFIX]
10231 && exp->X_op == O_constant)
10232 {
10233 /* Since displacement is signed extended to 64bit, don't allow
10234 disp32 and turn off disp32s if they are out of range. */
10235 i.types[this_operand].bitfield.disp32 = 0;
10236 if (!fits_in_signed_long (exp->X_add_number))
10237 {
10238 i.types[this_operand].bitfield.disp32s = 0;
10239 if (i.types[this_operand].bitfield.baseindex)
10240 {
10241 as_bad (_("0x%lx out range of signed 32bit displacement"),
10242 (long) exp->X_add_number);
10243 ret = 0;
10244 }
10245 }
10246 }
10247
10248 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10249 else if (exp->X_op != O_constant
10250 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10251 && exp_seg != absolute_section
10252 && exp_seg != text_section
10253 && exp_seg != data_section
10254 && exp_seg != bss_section
10255 && exp_seg != undefined_section
10256 && !bfd_is_com_section (exp_seg))
10257 {
10258 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10259 ret = 0;
10260 }
10261 #endif
10262
10263 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10264 /* Constants get taken care of by optimize_disp(). */
10265 && exp->X_op != O_constant)
10266 i.types[this_operand].bitfield.disp8 = 1;
10267
10268 /* Check if this is a displacement only operand. */
10269 bigdisp = i.types[this_operand];
10270 bigdisp.bitfield.disp8 = 0;
10271 bigdisp.bitfield.disp16 = 0;
10272 bigdisp.bitfield.disp32 = 0;
10273 bigdisp.bitfield.disp32s = 0;
10274 bigdisp.bitfield.disp64 = 0;
10275 if (operand_type_all_zero (&bigdisp))
10276 i.types[this_operand] = operand_type_and (i.types[this_operand],
10277 types);
10278
10279 return ret;
10280 }
10281
10282 /* Return the active addressing mode, taking address override and
10283 registers forming the address into consideration. Update the
10284 address override prefix if necessary. */
10285
10286 static enum flag_code
10287 i386_addressing_mode (void)
10288 {
10289 enum flag_code addr_mode;
10290
10291 if (i.prefix[ADDR_PREFIX])
10292 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10293 else
10294 {
10295 addr_mode = flag_code;
10296
10297 #if INFER_ADDR_PREFIX
10298 if (i.mem_operands == 0)
10299 {
10300 /* Infer address prefix from the first memory operand. */
10301 const reg_entry *addr_reg = i.base_reg;
10302
10303 if (addr_reg == NULL)
10304 addr_reg = i.index_reg;
10305
10306 if (addr_reg)
10307 {
10308 if (addr_reg->reg_type.bitfield.dword)
10309 addr_mode = CODE_32BIT;
10310 else if (flag_code != CODE_64BIT
10311 && addr_reg->reg_type.bitfield.word)
10312 addr_mode = CODE_16BIT;
10313
10314 if (addr_mode != flag_code)
10315 {
10316 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10317 i.prefixes += 1;
10318 /* Change the size of any displacement too. At most one
10319 of Disp16 or Disp32 is set.
10320 FIXME. There doesn't seem to be any real need for
10321 separate Disp16 and Disp32 flags. The same goes for
10322 Imm16 and Imm32. Removing them would probably clean
10323 up the code quite a lot. */
10324 if (flag_code != CODE_64BIT
10325 && (i.types[this_operand].bitfield.disp16
10326 || i.types[this_operand].bitfield.disp32))
10327 i.types[this_operand]
10328 = operand_type_xor (i.types[this_operand], disp16_32);
10329 }
10330 }
10331 }
10332 #endif
10333 }
10334
10335 return addr_mode;
10336 }
10337
10338 /* Make sure the memory operand we've been dealt is valid.
10339 Return 1 on success, 0 on a failure. */
10340
10341 static int
10342 i386_index_check (const char *operand_string)
10343 {
10344 const char *kind = "base/index";
10345 enum flag_code addr_mode = i386_addressing_mode ();
10346
10347 if (current_templates->start->opcode_modifier.isstring
10348 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10349 && (current_templates->end[-1].opcode_modifier.isstring
10350 || i.mem_operands))
10351 {
10352 /* Memory operands of string insns are special in that they only allow
10353 a single register (rDI, rSI, or rBX) as their memory address. */
10354 const reg_entry *expected_reg;
10355 static const char *di_si[][2] =
10356 {
10357 { "esi", "edi" },
10358 { "si", "di" },
10359 { "rsi", "rdi" }
10360 };
10361 static const char *bx[] = { "ebx", "bx", "rbx" };
10362
10363 kind = "string address";
10364
10365 if (current_templates->start->opcode_modifier.repprefixok)
10366 {
10367 int es_op = current_templates->end[-1].opcode_modifier.isstring
10368 - IS_STRING_ES_OP0;
10369 int op = 0;
10370
10371 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10372 || ((!i.mem_operands != !intel_syntax)
10373 && current_templates->end[-1].operand_types[1]
10374 .bitfield.baseindex))
10375 op = 1;
10376 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10377 }
10378 else
10379 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10380
10381 if (i.base_reg != expected_reg
10382 || i.index_reg
10383 || operand_type_check (i.types[this_operand], disp))
10384 {
10385 /* The second memory operand must have the same size as
10386 the first one. */
10387 if (i.mem_operands
10388 && i.base_reg
10389 && !((addr_mode == CODE_64BIT
10390 && i.base_reg->reg_type.bitfield.qword)
10391 || (addr_mode == CODE_32BIT
10392 ? i.base_reg->reg_type.bitfield.dword
10393 : i.base_reg->reg_type.bitfield.word)))
10394 goto bad_address;
10395
10396 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10397 operand_string,
10398 intel_syntax ? '[' : '(',
10399 register_prefix,
10400 expected_reg->reg_name,
10401 intel_syntax ? ']' : ')');
10402 return 1;
10403 }
10404 else
10405 return 1;
10406
10407 bad_address:
10408 as_bad (_("`%s' is not a valid %s expression"),
10409 operand_string, kind);
10410 return 0;
10411 }
10412 else
10413 {
10414 if (addr_mode != CODE_16BIT)
10415 {
10416 /* 32-bit/64-bit checks. */
10417 if ((i.base_reg
10418 && ((addr_mode == CODE_64BIT
10419 ? !i.base_reg->reg_type.bitfield.qword
10420 : !i.base_reg->reg_type.bitfield.dword)
10421 || (i.index_reg && i.base_reg->reg_num == RegIP)
10422 || i.base_reg->reg_num == RegIZ))
10423 || (i.index_reg
10424 && !i.index_reg->reg_type.bitfield.xmmword
10425 && !i.index_reg->reg_type.bitfield.ymmword
10426 && !i.index_reg->reg_type.bitfield.zmmword
10427 && ((addr_mode == CODE_64BIT
10428 ? !i.index_reg->reg_type.bitfield.qword
10429 : !i.index_reg->reg_type.bitfield.dword)
10430 || !i.index_reg->reg_type.bitfield.baseindex)))
10431 goto bad_address;
10432
10433 /* bndmk, bndldx, and bndstx have special restrictions. */
10434 if (current_templates->start->base_opcode == 0xf30f1b
10435 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10436 {
10437 /* They cannot use RIP-relative addressing. */
10438 if (i.base_reg && i.base_reg->reg_num == RegIP)
10439 {
10440 as_bad (_("`%s' cannot be used here"), operand_string);
10441 return 0;
10442 }
10443
10444 /* bndldx and bndstx ignore their scale factor. */
10445 if (current_templates->start->base_opcode != 0xf30f1b
10446 && i.log2_scale_factor)
10447 as_warn (_("register scaling is being ignored here"));
10448 }
10449 }
10450 else
10451 {
10452 /* 16-bit checks. */
10453 if ((i.base_reg
10454 && (!i.base_reg->reg_type.bitfield.word
10455 || !i.base_reg->reg_type.bitfield.baseindex))
10456 || (i.index_reg
10457 && (!i.index_reg->reg_type.bitfield.word
10458 || !i.index_reg->reg_type.bitfield.baseindex
10459 || !(i.base_reg
10460 && i.base_reg->reg_num < 6
10461 && i.index_reg->reg_num >= 6
10462 && i.log2_scale_factor == 0))))
10463 goto bad_address;
10464 }
10465 }
10466 return 1;
10467 }
10468
10469 /* Handle vector immediates. */
10470
10471 static int
10472 RC_SAE_immediate (const char *imm_start)
10473 {
10474 unsigned int match_found, j;
10475 const char *pstr = imm_start;
10476 expressionS *exp;
10477
10478 if (*pstr != '{')
10479 return 0;
10480
10481 pstr++;
10482 match_found = 0;
10483 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10484 {
10485 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10486 {
10487 if (!i.rounding)
10488 {
10489 rc_op.type = RC_NamesTable[j].type;
10490 rc_op.operand = this_operand;
10491 i.rounding = &rc_op;
10492 }
10493 else
10494 {
10495 as_bad (_("duplicated `%s'"), imm_start);
10496 return 0;
10497 }
10498 pstr += RC_NamesTable[j].len;
10499 match_found = 1;
10500 break;
10501 }
10502 }
10503 if (!match_found)
10504 return 0;
10505
10506 if (*pstr++ != '}')
10507 {
10508 as_bad (_("Missing '}': '%s'"), imm_start);
10509 return 0;
10510 }
10511 /* RC/SAE immediate string should contain nothing more. */;
10512 if (*pstr != 0)
10513 {
10514 as_bad (_("Junk after '}': '%s'"), imm_start);
10515 return 0;
10516 }
10517
10518 exp = &im_expressions[i.imm_operands++];
10519 i.op[this_operand].imms = exp;
10520
10521 exp->X_op = O_constant;
10522 exp->X_add_number = 0;
10523 exp->X_add_symbol = (symbolS *) 0;
10524 exp->X_op_symbol = (symbolS *) 0;
10525
10526 i.types[this_operand].bitfield.imm8 = 1;
10527 return 1;
10528 }
10529
10530 /* Only string instructions can have a second memory operand, so
10531 reduce current_templates to just those if it contains any. */
10532 static int
10533 maybe_adjust_templates (void)
10534 {
10535 const insn_template *t;
10536
10537 gas_assert (i.mem_operands == 1);
10538
10539 for (t = current_templates->start; t < current_templates->end; ++t)
10540 if (t->opcode_modifier.isstring)
10541 break;
10542
10543 if (t < current_templates->end)
10544 {
10545 static templates aux_templates;
10546 bfd_boolean recheck;
10547
10548 aux_templates.start = t;
10549 for (; t < current_templates->end; ++t)
10550 if (!t->opcode_modifier.isstring)
10551 break;
10552 aux_templates.end = t;
10553
10554 /* Determine whether to re-check the first memory operand. */
10555 recheck = (aux_templates.start != current_templates->start
10556 || t != current_templates->end);
10557
10558 current_templates = &aux_templates;
10559
10560 if (recheck)
10561 {
10562 i.mem_operands = 0;
10563 if (i.memop1_string != NULL
10564 && i386_index_check (i.memop1_string) == 0)
10565 return 0;
10566 i.mem_operands = 1;
10567 }
10568 }
10569
10570 return 1;
10571 }
10572
10573 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
10574 on error. */
10575
10576 static int
10577 i386_att_operand (char *operand_string)
10578 {
10579 const reg_entry *r;
10580 char *end_op;
10581 char *op_string = operand_string;
10582
10583 if (is_space_char (*op_string))
10584 ++op_string;
10585
10586 /* We check for an absolute prefix (differentiating,
10587 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
10588 if (*op_string == ABSOLUTE_PREFIX)
10589 {
10590 ++op_string;
10591 if (is_space_char (*op_string))
10592 ++op_string;
10593 i.jumpabsolute = TRUE;
10594 }
10595
10596 /* Check if operand is a register. */
10597 if ((r = parse_register (op_string, &end_op)) != NULL)
10598 {
10599 i386_operand_type temp;
10600
10601 /* Check for a segment override by searching for ':' after a
10602 segment register. */
10603 op_string = end_op;
10604 if (is_space_char (*op_string))
10605 ++op_string;
10606 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10607 {
10608 switch (r->reg_num)
10609 {
10610 case 0:
10611 i.seg[i.mem_operands] = &es;
10612 break;
10613 case 1:
10614 i.seg[i.mem_operands] = &cs;
10615 break;
10616 case 2:
10617 i.seg[i.mem_operands] = &ss;
10618 break;
10619 case 3:
10620 i.seg[i.mem_operands] = &ds;
10621 break;
10622 case 4:
10623 i.seg[i.mem_operands] = &fs;
10624 break;
10625 case 5:
10626 i.seg[i.mem_operands] = &gs;
10627 break;
10628 }
10629
10630 /* Skip the ':' and whitespace. */
10631 ++op_string;
10632 if (is_space_char (*op_string))
10633 ++op_string;
10634
10635 if (!is_digit_char (*op_string)
10636 && !is_identifier_char (*op_string)
10637 && *op_string != '('
10638 && *op_string != ABSOLUTE_PREFIX)
10639 {
10640 as_bad (_("bad memory operand `%s'"), op_string);
10641 return 0;
10642 }
10643 /* Handle case of %es:*foo. */
10644 if (*op_string == ABSOLUTE_PREFIX)
10645 {
10646 ++op_string;
10647 if (is_space_char (*op_string))
10648 ++op_string;
10649 i.jumpabsolute = TRUE;
10650 }
10651 goto do_memory_reference;
10652 }
10653
10654 /* Handle vector operations. */
10655 if (*op_string == '{')
10656 {
10657 op_string = check_VecOperations (op_string, NULL);
10658 if (op_string == NULL)
10659 return 0;
10660 }
10661
10662 if (*op_string)
10663 {
10664 as_bad (_("junk `%s' after register"), op_string);
10665 return 0;
10666 }
10667 temp = r->reg_type;
10668 temp.bitfield.baseindex = 0;
10669 i.types[this_operand] = operand_type_or (i.types[this_operand],
10670 temp);
10671 i.types[this_operand].bitfield.unspecified = 0;
10672 i.op[this_operand].regs = r;
10673 i.reg_operands++;
10674 }
10675 else if (*op_string == REGISTER_PREFIX)
10676 {
10677 as_bad (_("bad register name `%s'"), op_string);
10678 return 0;
10679 }
10680 else if (*op_string == IMMEDIATE_PREFIX)
10681 {
10682 ++op_string;
10683 if (i.jumpabsolute)
10684 {
10685 as_bad (_("immediate operand illegal with absolute jump"));
10686 return 0;
10687 }
10688 if (!i386_immediate (op_string))
10689 return 0;
10690 }
10691 else if (RC_SAE_immediate (operand_string))
10692 {
10693 /* If it is a RC or SAE immediate, do nothing. */
10694 ;
10695 }
10696 else if (is_digit_char (*op_string)
10697 || is_identifier_char (*op_string)
10698 || *op_string == '"'
10699 || *op_string == '(')
10700 {
10701 /* This is a memory reference of some sort. */
10702 char *base_string;
10703
10704 /* Start and end of displacement string expression (if found). */
10705 char *displacement_string_start;
10706 char *displacement_string_end;
10707 char *vop_start;
10708
10709 do_memory_reference:
10710 if (i.mem_operands == 1 && !maybe_adjust_templates ())
10711 return 0;
10712 if ((i.mem_operands == 1
10713 && !current_templates->start->opcode_modifier.isstring)
10714 || i.mem_operands == 2)
10715 {
10716 as_bad (_("too many memory references for `%s'"),
10717 current_templates->start->name);
10718 return 0;
10719 }
10720
10721 /* Check for base index form. We detect the base index form by
10722 looking for an ')' at the end of the operand, searching
10723 for the '(' matching it, and finding a REGISTER_PREFIX or ','
10724 after the '('. */
10725 base_string = op_string + strlen (op_string);
10726
10727 /* Handle vector operations. */
10728 vop_start = strchr (op_string, '{');
10729 if (vop_start && vop_start < base_string)
10730 {
10731 if (check_VecOperations (vop_start, base_string) == NULL)
10732 return 0;
10733 base_string = vop_start;
10734 }
10735
10736 --base_string;
10737 if (is_space_char (*base_string))
10738 --base_string;
10739
10740 /* If we only have a displacement, set-up for it to be parsed later. */
10741 displacement_string_start = op_string;
10742 displacement_string_end = base_string + 1;
10743
10744 if (*base_string == ')')
10745 {
10746 char *temp_string;
10747 unsigned int parens_balanced = 1;
10748 /* We've already checked that the number of left & right ()'s are
10749 equal, so this loop will not be infinite. */
10750 do
10751 {
10752 base_string--;
10753 if (*base_string == ')')
10754 parens_balanced++;
10755 if (*base_string == '(')
10756 parens_balanced--;
10757 }
10758 while (parens_balanced);
10759
10760 temp_string = base_string;
10761
10762 /* Skip past '(' and whitespace. */
10763 ++base_string;
10764 if (is_space_char (*base_string))
10765 ++base_string;
10766
10767 if (*base_string == ','
10768 || ((i.base_reg = parse_register (base_string, &end_op))
10769 != NULL))
10770 {
10771 displacement_string_end = temp_string;
10772
10773 i.types[this_operand].bitfield.baseindex = 1;
10774
10775 if (i.base_reg)
10776 {
10777 base_string = end_op;
10778 if (is_space_char (*base_string))
10779 ++base_string;
10780 }
10781
10782 /* There may be an index reg or scale factor here. */
10783 if (*base_string == ',')
10784 {
10785 ++base_string;
10786 if (is_space_char (*base_string))
10787 ++base_string;
10788
10789 if ((i.index_reg = parse_register (base_string, &end_op))
10790 != NULL)
10791 {
10792 base_string = end_op;
10793 if (is_space_char (*base_string))
10794 ++base_string;
10795 if (*base_string == ',')
10796 {
10797 ++base_string;
10798 if (is_space_char (*base_string))
10799 ++base_string;
10800 }
10801 else if (*base_string != ')')
10802 {
10803 as_bad (_("expecting `,' or `)' "
10804 "after index register in `%s'"),
10805 operand_string);
10806 return 0;
10807 }
10808 }
10809 else if (*base_string == REGISTER_PREFIX)
10810 {
10811 end_op = strchr (base_string, ',');
10812 if (end_op)
10813 *end_op = '\0';
10814 as_bad (_("bad register name `%s'"), base_string);
10815 return 0;
10816 }
10817
10818 /* Check for scale factor. */
10819 if (*base_string != ')')
10820 {
10821 char *end_scale = i386_scale (base_string);
10822
10823 if (!end_scale)
10824 return 0;
10825
10826 base_string = end_scale;
10827 if (is_space_char (*base_string))
10828 ++base_string;
10829 if (*base_string != ')')
10830 {
10831 as_bad (_("expecting `)' "
10832 "after scale factor in `%s'"),
10833 operand_string);
10834 return 0;
10835 }
10836 }
10837 else if (!i.index_reg)
10838 {
10839 as_bad (_("expecting index register or scale factor "
10840 "after `,'; got '%c'"),
10841 *base_string);
10842 return 0;
10843 }
10844 }
10845 else if (*base_string != ')')
10846 {
10847 as_bad (_("expecting `,' or `)' "
10848 "after base register in `%s'"),
10849 operand_string);
10850 return 0;
10851 }
10852 }
10853 else if (*base_string == REGISTER_PREFIX)
10854 {
10855 end_op = strchr (base_string, ',');
10856 if (end_op)
10857 *end_op = '\0';
10858 as_bad (_("bad register name `%s'"), base_string);
10859 return 0;
10860 }
10861 }
10862
10863 /* If there's an expression beginning the operand, parse it,
10864 assuming displacement_string_start and
10865 displacement_string_end are meaningful. */
10866 if (displacement_string_start != displacement_string_end)
10867 {
10868 if (!i386_displacement (displacement_string_start,
10869 displacement_string_end))
10870 return 0;
10871 }
10872
10873 /* Special case for (%dx) while doing input/output op. */
10874 if (i.base_reg
10875 && i.base_reg->reg_type.bitfield.instance == RegD
10876 && i.base_reg->reg_type.bitfield.word
10877 && i.index_reg == 0
10878 && i.log2_scale_factor == 0
10879 && i.seg[i.mem_operands] == 0
10880 && !operand_type_check (i.types[this_operand], disp))
10881 {
10882 i.types[this_operand] = i.base_reg->reg_type;
10883 return 1;
10884 }
10885
10886 if (i386_index_check (operand_string) == 0)
10887 return 0;
10888 i.flags[this_operand] |= Operand_Mem;
10889 if (i.mem_operands == 0)
10890 i.memop1_string = xstrdup (operand_string);
10891 i.mem_operands++;
10892 }
10893 else
10894 {
10895 /* It's not a memory operand; argh! */
10896 as_bad (_("invalid char %s beginning operand %d `%s'"),
10897 output_invalid (*op_string),
10898 this_operand + 1,
10899 op_string);
10900 return 0;
10901 }
10902 return 1; /* Normal return. */
10903 }
10904 \f
10905 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10906 that an rs_machine_dependent frag may reach. */
10907
10908 unsigned int
10909 i386_frag_max_var (fragS *frag)
10910 {
10911 /* The only relaxable frags are for jumps.
10912 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
10913 gas_assert (frag->fr_type == rs_machine_dependent);
10914 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10915 }
10916
10917 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10918 static int
10919 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10920 {
10921 /* STT_GNU_IFUNC symbol must go through PLT. */
10922 if ((symbol_get_bfdsym (fr_symbol)->flags
10923 & BSF_GNU_INDIRECT_FUNCTION) != 0)
10924 return 0;
10925
10926 if (!S_IS_EXTERNAL (fr_symbol))
10927 /* Symbol may be weak or local. */
10928 return !S_IS_WEAK (fr_symbol);
10929
10930 /* Global symbols with non-default visibility can't be preempted. */
10931 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10932 return 1;
10933
10934 if (fr_var != NO_RELOC)
10935 switch ((enum bfd_reloc_code_real) fr_var)
10936 {
10937 case BFD_RELOC_386_PLT32:
10938 case BFD_RELOC_X86_64_PLT32:
10939 /* Symbol with PLT relocation may be preempted. */
10940 return 0;
10941 default:
10942 abort ();
10943 }
10944
10945 /* Global symbols with default visibility in a shared library may be
10946 preempted by another definition. */
10947 return !shared;
10948 }
10949 #endif
10950
10951 /* Return the next non-empty frag. */
10952
10953 static fragS *
10954 i386_next_non_empty_frag (fragS *fragP)
10955 {
10956 /* There may be a frag with a ".fill 0" when there is no room in
10957 the current frag for frag_grow in output_insn. */
10958 for (fragP = fragP->fr_next;
10959 (fragP != NULL
10960 && fragP->fr_type == rs_fill
10961 && fragP->fr_fix == 0);
10962 fragP = fragP->fr_next)
10963 ;
10964 return fragP;
10965 }
10966
10967 /* Return the next jcc frag after BRANCH_PADDING. */
10968
10969 static fragS *
10970 i386_next_jcc_frag (fragS *fragP)
10971 {
10972 if (!fragP)
10973 return NULL;
10974
10975 if (fragP->fr_type == rs_machine_dependent
10976 && (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10977 == BRANCH_PADDING))
10978 {
10979 fragP = i386_next_non_empty_frag (fragP);
10980 if (fragP->fr_type != rs_machine_dependent)
10981 return NULL;
10982 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == COND_JUMP)
10983 return fragP;
10984 }
10985
10986 return NULL;
10987 }
10988
10989 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
10990
10991 static void
10992 i386_classify_machine_dependent_frag (fragS *fragP)
10993 {
10994 fragS *cmp_fragP;
10995 fragS *pad_fragP;
10996 fragS *branch_fragP;
10997 fragS *next_fragP;
10998 unsigned int max_prefix_length;
10999
11000 if (fragP->tc_frag_data.classified)
11001 return;
11002
11003 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11004 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11005 for (next_fragP = fragP;
11006 next_fragP != NULL;
11007 next_fragP = next_fragP->fr_next)
11008 {
11009 next_fragP->tc_frag_data.classified = 1;
11010 if (next_fragP->fr_type == rs_machine_dependent)
11011 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11012 {
11013 case BRANCH_PADDING:
11014 /* The BRANCH_PADDING frag must be followed by a branch
11015 frag. */
11016 branch_fragP = i386_next_non_empty_frag (next_fragP);
11017 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11018 break;
11019 case FUSED_JCC_PADDING:
11020 /* Check if this is a fused jcc:
11021 FUSED_JCC_PADDING
11022 CMP like instruction
11023 BRANCH_PADDING
11024 COND_JUMP
11025 */
11026 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11027 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11028 branch_fragP = i386_next_jcc_frag (pad_fragP);
11029 if (branch_fragP)
11030 {
11031 /* The BRANCH_PADDING frag is merged with the
11032 FUSED_JCC_PADDING frag. */
11033 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11034 /* CMP like instruction size. */
11035 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11036 frag_wane (pad_fragP);
11037 /* Skip to branch_fragP. */
11038 next_fragP = branch_fragP;
11039 }
11040 else if (next_fragP->tc_frag_data.max_prefix_length)
11041 {
11042 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11043 a fused jcc. */
11044 next_fragP->fr_subtype
11045 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11046 next_fragP->tc_frag_data.max_bytes
11047 = next_fragP->tc_frag_data.max_prefix_length;
11048 /* This will be updated in the BRANCH_PREFIX scan. */
11049 next_fragP->tc_frag_data.max_prefix_length = 0;
11050 }
11051 else
11052 frag_wane (next_fragP);
11053 break;
11054 }
11055 }
11056
11057 /* Stop if there is no BRANCH_PREFIX. */
11058 if (!align_branch_prefix_size)
11059 return;
11060
11061 /* Scan for BRANCH_PREFIX. */
11062 for (; fragP != NULL; fragP = fragP->fr_next)
11063 {
11064 if (fragP->fr_type != rs_machine_dependent
11065 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11066 != BRANCH_PREFIX))
11067 continue;
11068
11069 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11070 COND_JUMP_PREFIX. */
11071 max_prefix_length = 0;
11072 for (next_fragP = fragP;
11073 next_fragP != NULL;
11074 next_fragP = next_fragP->fr_next)
11075 {
11076 if (next_fragP->fr_type == rs_fill)
11077 /* Skip rs_fill frags. */
11078 continue;
11079 else if (next_fragP->fr_type != rs_machine_dependent)
11080 /* Stop for all other frags. */
11081 break;
11082
11083 /* rs_machine_dependent frags. */
11084 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11085 == BRANCH_PREFIX)
11086 {
11087 /* Count BRANCH_PREFIX frags. */
11088 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11089 {
11090 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11091 frag_wane (next_fragP);
11092 }
11093 else
11094 max_prefix_length
11095 += next_fragP->tc_frag_data.max_bytes;
11096 }
11097 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11098 == BRANCH_PADDING)
11099 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11100 == FUSED_JCC_PADDING))
11101 {
11102 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11103 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11104 break;
11105 }
11106 else
11107 /* Stop for other rs_machine_dependent frags. */
11108 break;
11109 }
11110
11111 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11112
11113 /* Skip to the next frag. */
11114 fragP = next_fragP;
11115 }
11116 }
11117
11118 /* Compute padding size for
11119
11120 FUSED_JCC_PADDING
11121 CMP like instruction
11122 BRANCH_PADDING
11123 COND_JUMP/UNCOND_JUMP
11124
11125 or
11126
11127 BRANCH_PADDING
11128 COND_JUMP/UNCOND_JUMP
11129 */
11130
11131 static int
11132 i386_branch_padding_size (fragS *fragP, offsetT address)
11133 {
11134 unsigned int offset, size, padding_size;
11135 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11136
11137 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11138 if (!address)
11139 address = fragP->fr_address;
11140 address += fragP->fr_fix;
11141
11142 /* CMP like instrunction size. */
11143 size = fragP->tc_frag_data.cmp_size;
11144
11145 /* The base size of the branch frag. */
11146 size += branch_fragP->fr_fix;
11147
11148 /* Add opcode and displacement bytes for the rs_machine_dependent
11149 branch frag. */
11150 if (branch_fragP->fr_type == rs_machine_dependent)
11151 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11152
11153 /* Check if branch is within boundary and doesn't end at the last
11154 byte. */
11155 offset = address & ((1U << align_branch_power) - 1);
11156 if ((offset + size) >= (1U << align_branch_power))
11157 /* Padding needed to avoid crossing boundary. */
11158 padding_size = (1U << align_branch_power) - offset;
11159 else
11160 /* No padding needed. */
11161 padding_size = 0;
11162
11163 /* The return value may be saved in tc_frag_data.length which is
11164 unsigned byte. */
11165 if (!fits_in_unsigned_byte (padding_size))
11166 abort ();
11167
11168 return padding_size;
11169 }
11170
11171 /* i386_generic_table_relax_frag()
11172
11173 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11174 grow/shrink padding to align branch frags. Hand others to
11175 relax_frag(). */
11176
11177 long
11178 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11179 {
11180 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11181 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11182 {
11183 long padding_size = i386_branch_padding_size (fragP, 0);
11184 long grow = padding_size - fragP->tc_frag_data.length;
11185
11186 /* When the BRANCH_PREFIX frag is used, the computed address
11187 must match the actual address and there should be no padding. */
11188 if (fragP->tc_frag_data.padding_address
11189 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11190 || padding_size))
11191 abort ();
11192
11193 /* Update the padding size. */
11194 if (grow)
11195 fragP->tc_frag_data.length = padding_size;
11196
11197 return grow;
11198 }
11199 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11200 {
11201 fragS *padding_fragP, *next_fragP;
11202 long padding_size, left_size, last_size;
11203
11204 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11205 if (!padding_fragP)
11206 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11207 return (fragP->tc_frag_data.length
11208 - fragP->tc_frag_data.last_length);
11209
11210 /* Compute the relative address of the padding frag in the very
11211 first time where the BRANCH_PREFIX frag sizes are zero. */
11212 if (!fragP->tc_frag_data.padding_address)
11213 fragP->tc_frag_data.padding_address
11214 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11215
11216 /* First update the last length from the previous interation. */
11217 left_size = fragP->tc_frag_data.prefix_length;
11218 for (next_fragP = fragP;
11219 next_fragP != padding_fragP;
11220 next_fragP = next_fragP->fr_next)
11221 if (next_fragP->fr_type == rs_machine_dependent
11222 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11223 == BRANCH_PREFIX))
11224 {
11225 if (left_size)
11226 {
11227 int max = next_fragP->tc_frag_data.max_bytes;
11228 if (max)
11229 {
11230 int size;
11231 if (max > left_size)
11232 size = left_size;
11233 else
11234 size = max;
11235 left_size -= size;
11236 next_fragP->tc_frag_data.last_length = size;
11237 }
11238 }
11239 else
11240 next_fragP->tc_frag_data.last_length = 0;
11241 }
11242
11243 /* Check the padding size for the padding frag. */
11244 padding_size = i386_branch_padding_size
11245 (padding_fragP, (fragP->fr_address
11246 + fragP->tc_frag_data.padding_address));
11247
11248 last_size = fragP->tc_frag_data.prefix_length;
11249 /* Check if there is change from the last interation. */
11250 if (padding_size == last_size)
11251 {
11252 /* Update the expected address of the padding frag. */
11253 padding_fragP->tc_frag_data.padding_address
11254 = (fragP->fr_address + padding_size
11255 + fragP->tc_frag_data.padding_address);
11256 return 0;
11257 }
11258
11259 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11260 {
11261 /* No padding if there is no sufficient room. Clear the
11262 expected address of the padding frag. */
11263 padding_fragP->tc_frag_data.padding_address = 0;
11264 padding_size = 0;
11265 }
11266 else
11267 /* Store the expected address of the padding frag. */
11268 padding_fragP->tc_frag_data.padding_address
11269 = (fragP->fr_address + padding_size
11270 + fragP->tc_frag_data.padding_address);
11271
11272 fragP->tc_frag_data.prefix_length = padding_size;
11273
11274 /* Update the length for the current interation. */
11275 left_size = padding_size;
11276 for (next_fragP = fragP;
11277 next_fragP != padding_fragP;
11278 next_fragP = next_fragP->fr_next)
11279 if (next_fragP->fr_type == rs_machine_dependent
11280 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11281 == BRANCH_PREFIX))
11282 {
11283 if (left_size)
11284 {
11285 int max = next_fragP->tc_frag_data.max_bytes;
11286 if (max)
11287 {
11288 int size;
11289 if (max > left_size)
11290 size = left_size;
11291 else
11292 size = max;
11293 left_size -= size;
11294 next_fragP->tc_frag_data.length = size;
11295 }
11296 }
11297 else
11298 next_fragP->tc_frag_data.length = 0;
11299 }
11300
11301 return (fragP->tc_frag_data.length
11302 - fragP->tc_frag_data.last_length);
11303 }
11304 return relax_frag (segment, fragP, stretch);
11305 }
11306
11307 /* md_estimate_size_before_relax()
11308
11309 Called just before relax() for rs_machine_dependent frags. The x86
11310 assembler uses these frags to handle variable size jump
11311 instructions.
11312
11313 Any symbol that is now undefined will not become defined.
11314 Return the correct fr_subtype in the frag.
11315 Return the initial "guess for variable size of frag" to caller.
11316 The guess is actually the growth beyond the fixed part. Whatever
11317 we do to grow the fixed or variable part contributes to our
11318 returned value. */
11319
11320 int
11321 md_estimate_size_before_relax (fragS *fragP, segT segment)
11322 {
11323 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11324 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11325 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11326 {
11327 i386_classify_machine_dependent_frag (fragP);
11328 return fragP->tc_frag_data.length;
11329 }
11330
11331 /* We've already got fragP->fr_subtype right; all we have to do is
11332 check for un-relaxable symbols. On an ELF system, we can't relax
11333 an externally visible symbol, because it may be overridden by a
11334 shared library. */
11335 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11336 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11337 || (IS_ELF
11338 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11339 fragP->fr_var))
11340 #endif
11341 #if defined (OBJ_COFF) && defined (TE_PE)
11342 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11343 && S_IS_WEAK (fragP->fr_symbol))
11344 #endif
11345 )
11346 {
11347 /* Symbol is undefined in this segment, or we need to keep a
11348 reloc so that weak symbols can be overridden. */
11349 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11350 enum bfd_reloc_code_real reloc_type;
11351 unsigned char *opcode;
11352 int old_fr_fix;
11353
11354 if (fragP->fr_var != NO_RELOC)
11355 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11356 else if (size == 2)
11357 reloc_type = BFD_RELOC_16_PCREL;
11358 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11359 else if (need_plt32_p (fragP->fr_symbol))
11360 reloc_type = BFD_RELOC_X86_64_PLT32;
11361 #endif
11362 else
11363 reloc_type = BFD_RELOC_32_PCREL;
11364
11365 old_fr_fix = fragP->fr_fix;
11366 opcode = (unsigned char *) fragP->fr_opcode;
11367
11368 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11369 {
11370 case UNCOND_JUMP:
11371 /* Make jmp (0xeb) a (d)word displacement jump. */
11372 opcode[0] = 0xe9;
11373 fragP->fr_fix += size;
11374 fix_new (fragP, old_fr_fix, size,
11375 fragP->fr_symbol,
11376 fragP->fr_offset, 1,
11377 reloc_type);
11378 break;
11379
11380 case COND_JUMP86:
11381 if (size == 2
11382 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11383 {
11384 /* Negate the condition, and branch past an
11385 unconditional jump. */
11386 opcode[0] ^= 1;
11387 opcode[1] = 3;
11388 /* Insert an unconditional jump. */
11389 opcode[2] = 0xe9;
11390 /* We added two extra opcode bytes, and have a two byte
11391 offset. */
11392 fragP->fr_fix += 2 + 2;
11393 fix_new (fragP, old_fr_fix + 2, 2,
11394 fragP->fr_symbol,
11395 fragP->fr_offset, 1,
11396 reloc_type);
11397 break;
11398 }
11399 /* Fall through. */
11400
11401 case COND_JUMP:
11402 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11403 {
11404 fixS *fixP;
11405
11406 fragP->fr_fix += 1;
11407 fixP = fix_new (fragP, old_fr_fix, 1,
11408 fragP->fr_symbol,
11409 fragP->fr_offset, 1,
11410 BFD_RELOC_8_PCREL);
11411 fixP->fx_signed = 1;
11412 break;
11413 }
11414
11415 /* This changes the byte-displacement jump 0x7N
11416 to the (d)word-displacement jump 0x0f,0x8N. */
11417 opcode[1] = opcode[0] + 0x10;
11418 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11419 /* We've added an opcode byte. */
11420 fragP->fr_fix += 1 + size;
11421 fix_new (fragP, old_fr_fix + 1, size,
11422 fragP->fr_symbol,
11423 fragP->fr_offset, 1,
11424 reloc_type);
11425 break;
11426
11427 default:
11428 BAD_CASE (fragP->fr_subtype);
11429 break;
11430 }
11431 frag_wane (fragP);
11432 return fragP->fr_fix - old_fr_fix;
11433 }
11434
11435 /* Guess size depending on current relax state. Initially the relax
11436 state will correspond to a short jump and we return 1, because
11437 the variable part of the frag (the branch offset) is one byte
11438 long. However, we can relax a section more than once and in that
11439 case we must either set fr_subtype back to the unrelaxed state,
11440 or return the value for the appropriate branch. */
11441 return md_relax_table[fragP->fr_subtype].rlx_length;
11442 }
11443
11444 /* Called after relax() is finished.
11445
11446 In: Address of frag.
11447 fr_type == rs_machine_dependent.
11448 fr_subtype is what the address relaxed to.
11449
11450 Out: Any fixSs and constants are set up.
11451 Caller will turn frag into a ".space 0". */
11452
11453 void
11454 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11455 fragS *fragP)
11456 {
11457 unsigned char *opcode;
11458 unsigned char *where_to_put_displacement = NULL;
11459 offsetT target_address;
11460 offsetT opcode_address;
11461 unsigned int extension = 0;
11462 offsetT displacement_from_opcode_start;
11463
11464 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11465 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11466 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11467 {
11468 /* Generate nop padding. */
11469 unsigned int size = fragP->tc_frag_data.length;
11470 if (size)
11471 {
11472 if (size > fragP->tc_frag_data.max_bytes)
11473 abort ();
11474
11475 if (flag_debug)
11476 {
11477 const char *msg;
11478 const char *branch = "branch";
11479 const char *prefix = "";
11480 fragS *padding_fragP;
11481 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11482 == BRANCH_PREFIX)
11483 {
11484 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11485 switch (fragP->tc_frag_data.default_prefix)
11486 {
11487 default:
11488 abort ();
11489 break;
11490 case CS_PREFIX_OPCODE:
11491 prefix = " cs";
11492 break;
11493 case DS_PREFIX_OPCODE:
11494 prefix = " ds";
11495 break;
11496 case ES_PREFIX_OPCODE:
11497 prefix = " es";
11498 break;
11499 case FS_PREFIX_OPCODE:
11500 prefix = " fs";
11501 break;
11502 case GS_PREFIX_OPCODE:
11503 prefix = " gs";
11504 break;
11505 case SS_PREFIX_OPCODE:
11506 prefix = " ss";
11507 break;
11508 }
11509 if (padding_fragP)
11510 msg = _("%s:%u: add %d%s at 0x%llx to align "
11511 "%s within %d-byte boundary\n");
11512 else
11513 msg = _("%s:%u: add additional %d%s at 0x%llx to "
11514 "align %s within %d-byte boundary\n");
11515 }
11516 else
11517 {
11518 padding_fragP = fragP;
11519 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11520 "%s within %d-byte boundary\n");
11521 }
11522
11523 if (padding_fragP)
11524 switch (padding_fragP->tc_frag_data.branch_type)
11525 {
11526 case align_branch_jcc:
11527 branch = "jcc";
11528 break;
11529 case align_branch_fused:
11530 branch = "fused jcc";
11531 break;
11532 case align_branch_jmp:
11533 branch = "jmp";
11534 break;
11535 case align_branch_call:
11536 branch = "call";
11537 break;
11538 case align_branch_indirect:
11539 branch = "indiret branch";
11540 break;
11541 case align_branch_ret:
11542 branch = "ret";
11543 break;
11544 default:
11545 break;
11546 }
11547
11548 fprintf (stdout, msg,
11549 fragP->fr_file, fragP->fr_line, size, prefix,
11550 (long long) fragP->fr_address, branch,
11551 1 << align_branch_power);
11552 }
11553 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11554 memset (fragP->fr_opcode,
11555 fragP->tc_frag_data.default_prefix, size);
11556 else
11557 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
11558 size, 0);
11559 fragP->fr_fix += size;
11560 }
11561 return;
11562 }
11563
11564 opcode = (unsigned char *) fragP->fr_opcode;
11565
11566 /* Address we want to reach in file space. */
11567 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
11568
11569 /* Address opcode resides at in file space. */
11570 opcode_address = fragP->fr_address + fragP->fr_fix;
11571
11572 /* Displacement from opcode start to fill into instruction. */
11573 displacement_from_opcode_start = target_address - opcode_address;
11574
11575 if ((fragP->fr_subtype & BIG) == 0)
11576 {
11577 /* Don't have to change opcode. */
11578 extension = 1; /* 1 opcode + 1 displacement */
11579 where_to_put_displacement = &opcode[1];
11580 }
11581 else
11582 {
11583 if (no_cond_jump_promotion
11584 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
11585 as_warn_where (fragP->fr_file, fragP->fr_line,
11586 _("long jump required"));
11587
11588 switch (fragP->fr_subtype)
11589 {
11590 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
11591 extension = 4; /* 1 opcode + 4 displacement */
11592 opcode[0] = 0xe9;
11593 where_to_put_displacement = &opcode[1];
11594 break;
11595
11596 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
11597 extension = 2; /* 1 opcode + 2 displacement */
11598 opcode[0] = 0xe9;
11599 where_to_put_displacement = &opcode[1];
11600 break;
11601
11602 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
11603 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
11604 extension = 5; /* 2 opcode + 4 displacement */
11605 opcode[1] = opcode[0] + 0x10;
11606 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11607 where_to_put_displacement = &opcode[2];
11608 break;
11609
11610 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
11611 extension = 3; /* 2 opcode + 2 displacement */
11612 opcode[1] = opcode[0] + 0x10;
11613 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11614 where_to_put_displacement = &opcode[2];
11615 break;
11616
11617 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
11618 extension = 4;
11619 opcode[0] ^= 1;
11620 opcode[1] = 3;
11621 opcode[2] = 0xe9;
11622 where_to_put_displacement = &opcode[3];
11623 break;
11624
11625 default:
11626 BAD_CASE (fragP->fr_subtype);
11627 break;
11628 }
11629 }
11630
11631 /* If size if less then four we are sure that the operand fits,
11632 but if it's 4, then it could be that the displacement is larger
11633 then -/+ 2GB. */
11634 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
11635 && object_64bit
11636 && ((addressT) (displacement_from_opcode_start - extension
11637 + ((addressT) 1 << 31))
11638 > (((addressT) 2 << 31) - 1)))
11639 {
11640 as_bad_where (fragP->fr_file, fragP->fr_line,
11641 _("jump target out of range"));
11642 /* Make us emit 0. */
11643 displacement_from_opcode_start = extension;
11644 }
11645 /* Now put displacement after opcode. */
11646 md_number_to_chars ((char *) where_to_put_displacement,
11647 (valueT) (displacement_from_opcode_start - extension),
11648 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
11649 fragP->fr_fix += extension;
11650 }
11651 \f
11652 /* Apply a fixup (fixP) to segment data, once it has been determined
11653 by our caller that we have all the info we need to fix it up.
11654
11655 Parameter valP is the pointer to the value of the bits.
11656
11657 On the 386, immediates, displacements, and data pointers are all in
11658 the same (little-endian) format, so we don't need to care about which
11659 we are handling. */
11660
11661 void
11662 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
11663 {
11664 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
11665 valueT value = *valP;
11666
11667 #if !defined (TE_Mach)
11668 if (fixP->fx_pcrel)
11669 {
11670 switch (fixP->fx_r_type)
11671 {
11672 default:
11673 break;
11674
11675 case BFD_RELOC_64:
11676 fixP->fx_r_type = BFD_RELOC_64_PCREL;
11677 break;
11678 case BFD_RELOC_32:
11679 case BFD_RELOC_X86_64_32S:
11680 fixP->fx_r_type = BFD_RELOC_32_PCREL;
11681 break;
11682 case BFD_RELOC_16:
11683 fixP->fx_r_type = BFD_RELOC_16_PCREL;
11684 break;
11685 case BFD_RELOC_8:
11686 fixP->fx_r_type = BFD_RELOC_8_PCREL;
11687 break;
11688 }
11689 }
11690
11691 if (fixP->fx_addsy != NULL
11692 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
11693 || fixP->fx_r_type == BFD_RELOC_64_PCREL
11694 || fixP->fx_r_type == BFD_RELOC_16_PCREL
11695 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
11696 && !use_rela_relocations)
11697 {
11698 /* This is a hack. There should be a better way to handle this.
11699 This covers for the fact that bfd_install_relocation will
11700 subtract the current location (for partial_inplace, PC relative
11701 relocations); see more below. */
11702 #ifndef OBJ_AOUT
11703 if (IS_ELF
11704 #ifdef TE_PE
11705 || OUTPUT_FLAVOR == bfd_target_coff_flavour
11706 #endif
11707 )
11708 value += fixP->fx_where + fixP->fx_frag->fr_address;
11709 #endif
11710 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11711 if (IS_ELF)
11712 {
11713 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
11714
11715 if ((sym_seg == seg
11716 || (symbol_section_p (fixP->fx_addsy)
11717 && sym_seg != absolute_section))
11718 && !generic_force_reloc (fixP))
11719 {
11720 /* Yes, we add the values in twice. This is because
11721 bfd_install_relocation subtracts them out again. I think
11722 bfd_install_relocation is broken, but I don't dare change
11723 it. FIXME. */
11724 value += fixP->fx_where + fixP->fx_frag->fr_address;
11725 }
11726 }
11727 #endif
11728 #if defined (OBJ_COFF) && defined (TE_PE)
11729 /* For some reason, the PE format does not store a
11730 section address offset for a PC relative symbol. */
11731 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
11732 || S_IS_WEAK (fixP->fx_addsy))
11733 value += md_pcrel_from (fixP);
11734 #endif
11735 }
11736 #if defined (OBJ_COFF) && defined (TE_PE)
11737 if (fixP->fx_addsy != NULL
11738 && S_IS_WEAK (fixP->fx_addsy)
11739 /* PR 16858: Do not modify weak function references. */
11740 && ! fixP->fx_pcrel)
11741 {
11742 #if !defined (TE_PEP)
11743 /* For x86 PE weak function symbols are neither PC-relative
11744 nor do they set S_IS_FUNCTION. So the only reliable way
11745 to detect them is to check the flags of their containing
11746 section. */
11747 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
11748 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
11749 ;
11750 else
11751 #endif
11752 value -= S_GET_VALUE (fixP->fx_addsy);
11753 }
11754 #endif
11755
11756 /* Fix a few things - the dynamic linker expects certain values here,
11757 and we must not disappoint it. */
11758 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11759 if (IS_ELF && fixP->fx_addsy)
11760 switch (fixP->fx_r_type)
11761 {
11762 case BFD_RELOC_386_PLT32:
11763 case BFD_RELOC_X86_64_PLT32:
11764 /* Make the jump instruction point to the address of the operand.
11765 At runtime we merely add the offset to the actual PLT entry.
11766 NB: Subtract the offset size only for jump instructions. */
11767 if (fixP->fx_pcrel)
11768 value = -4;
11769 break;
11770
11771 case BFD_RELOC_386_TLS_GD:
11772 case BFD_RELOC_386_TLS_LDM:
11773 case BFD_RELOC_386_TLS_IE_32:
11774 case BFD_RELOC_386_TLS_IE:
11775 case BFD_RELOC_386_TLS_GOTIE:
11776 case BFD_RELOC_386_TLS_GOTDESC:
11777 case BFD_RELOC_X86_64_TLSGD:
11778 case BFD_RELOC_X86_64_TLSLD:
11779 case BFD_RELOC_X86_64_GOTTPOFF:
11780 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11781 value = 0; /* Fully resolved at runtime. No addend. */
11782 /* Fallthrough */
11783 case BFD_RELOC_386_TLS_LE:
11784 case BFD_RELOC_386_TLS_LDO_32:
11785 case BFD_RELOC_386_TLS_LE_32:
11786 case BFD_RELOC_X86_64_DTPOFF32:
11787 case BFD_RELOC_X86_64_DTPOFF64:
11788 case BFD_RELOC_X86_64_TPOFF32:
11789 case BFD_RELOC_X86_64_TPOFF64:
11790 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11791 break;
11792
11793 case BFD_RELOC_386_TLS_DESC_CALL:
11794 case BFD_RELOC_X86_64_TLSDESC_CALL:
11795 value = 0; /* Fully resolved at runtime. No addend. */
11796 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11797 fixP->fx_done = 0;
11798 return;
11799
11800 case BFD_RELOC_VTABLE_INHERIT:
11801 case BFD_RELOC_VTABLE_ENTRY:
11802 fixP->fx_done = 0;
11803 return;
11804
11805 default:
11806 break;
11807 }
11808 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
11809 *valP = value;
11810 #endif /* !defined (TE_Mach) */
11811
11812 /* Are we finished with this relocation now? */
11813 if (fixP->fx_addsy == NULL)
11814 fixP->fx_done = 1;
11815 #if defined (OBJ_COFF) && defined (TE_PE)
11816 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
11817 {
11818 fixP->fx_done = 0;
11819 /* Remember value for tc_gen_reloc. */
11820 fixP->fx_addnumber = value;
11821 /* Clear out the frag for now. */
11822 value = 0;
11823 }
11824 #endif
11825 else if (use_rela_relocations)
11826 {
11827 fixP->fx_no_overflow = 1;
11828 /* Remember value for tc_gen_reloc. */
11829 fixP->fx_addnumber = value;
11830 value = 0;
11831 }
11832
11833 md_number_to_chars (p, value, fixP->fx_size);
11834 }
11835 \f
11836 const char *
11837 md_atof (int type, char *litP, int *sizeP)
11838 {
11839 /* This outputs the LITTLENUMs in REVERSE order;
11840 in accord with the bigendian 386. */
11841 return ieee_md_atof (type, litP, sizeP, FALSE);
11842 }
11843 \f
11844 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
11845
11846 static char *
11847 output_invalid (int c)
11848 {
11849 if (ISPRINT (c))
11850 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11851 "'%c'", c);
11852 else
11853 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11854 "(0x%x)", (unsigned char) c);
11855 return output_invalid_buf;
11856 }
11857
11858 /* REG_STRING starts *before* REGISTER_PREFIX. */
11859
11860 static const reg_entry *
11861 parse_real_register (char *reg_string, char **end_op)
11862 {
11863 char *s = reg_string;
11864 char *p;
11865 char reg_name_given[MAX_REG_NAME_SIZE + 1];
11866 const reg_entry *r;
11867
11868 /* Skip possible REGISTER_PREFIX and possible whitespace. */
11869 if (*s == REGISTER_PREFIX)
11870 ++s;
11871
11872 if (is_space_char (*s))
11873 ++s;
11874
11875 p = reg_name_given;
11876 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
11877 {
11878 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
11879 return (const reg_entry *) NULL;
11880 s++;
11881 }
11882
11883 /* For naked regs, make sure that we are not dealing with an identifier.
11884 This prevents confusing an identifier like `eax_var' with register
11885 `eax'. */
11886 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
11887 return (const reg_entry *) NULL;
11888
11889 *end_op = s;
11890
11891 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
11892
11893 /* Handle floating point regs, allowing spaces in the (i) part. */
11894 if (r == i386_regtab /* %st is first entry of table */)
11895 {
11896 if (!cpu_arch_flags.bitfield.cpu8087
11897 && !cpu_arch_flags.bitfield.cpu287
11898 && !cpu_arch_flags.bitfield.cpu387)
11899 return (const reg_entry *) NULL;
11900
11901 if (is_space_char (*s))
11902 ++s;
11903 if (*s == '(')
11904 {
11905 ++s;
11906 if (is_space_char (*s))
11907 ++s;
11908 if (*s >= '0' && *s <= '7')
11909 {
11910 int fpr = *s - '0';
11911 ++s;
11912 if (is_space_char (*s))
11913 ++s;
11914 if (*s == ')')
11915 {
11916 *end_op = s + 1;
11917 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
11918 know (r);
11919 return r + fpr;
11920 }
11921 }
11922 /* We have "%st(" then garbage. */
11923 return (const reg_entry *) NULL;
11924 }
11925 }
11926
11927 if (r == NULL || allow_pseudo_reg)
11928 return r;
11929
11930 if (operand_type_all_zero (&r->reg_type))
11931 return (const reg_entry *) NULL;
11932
11933 if ((r->reg_type.bitfield.dword
11934 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
11935 || r->reg_type.bitfield.class == RegCR
11936 || r->reg_type.bitfield.class == RegDR
11937 || r->reg_type.bitfield.class == RegTR)
11938 && !cpu_arch_flags.bitfield.cpui386)
11939 return (const reg_entry *) NULL;
11940
11941 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
11942 return (const reg_entry *) NULL;
11943
11944 if (!cpu_arch_flags.bitfield.cpuavx512f)
11945 {
11946 if (r->reg_type.bitfield.zmmword
11947 || r->reg_type.bitfield.class == RegMask)
11948 return (const reg_entry *) NULL;
11949
11950 if (!cpu_arch_flags.bitfield.cpuavx)
11951 {
11952 if (r->reg_type.bitfield.ymmword)
11953 return (const reg_entry *) NULL;
11954
11955 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
11956 return (const reg_entry *) NULL;
11957 }
11958 }
11959
11960 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
11961 return (const reg_entry *) NULL;
11962
11963 /* Don't allow fake index register unless allow_index_reg isn't 0. */
11964 if (!allow_index_reg && r->reg_num == RegIZ)
11965 return (const reg_entry *) NULL;
11966
11967 /* Upper 16 vector registers are only available with VREX in 64bit
11968 mode, and require EVEX encoding. */
11969 if (r->reg_flags & RegVRex)
11970 {
11971 if (!cpu_arch_flags.bitfield.cpuavx512f
11972 || flag_code != CODE_64BIT)
11973 return (const reg_entry *) NULL;
11974
11975 i.vec_encoding = vex_encoding_evex;
11976 }
11977
11978 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
11979 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
11980 && flag_code != CODE_64BIT)
11981 return (const reg_entry *) NULL;
11982
11983 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
11984 && !intel_syntax)
11985 return (const reg_entry *) NULL;
11986
11987 return r;
11988 }
11989
11990 /* REG_STRING starts *before* REGISTER_PREFIX. */
11991
11992 static const reg_entry *
11993 parse_register (char *reg_string, char **end_op)
11994 {
11995 const reg_entry *r;
11996
11997 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
11998 r = parse_real_register (reg_string, end_op);
11999 else
12000 r = NULL;
12001 if (!r)
12002 {
12003 char *save = input_line_pointer;
12004 char c;
12005 symbolS *symbolP;
12006
12007 input_line_pointer = reg_string;
12008 c = get_symbol_name (&reg_string);
12009 symbolP = symbol_find (reg_string);
12010 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12011 {
12012 const expressionS *e = symbol_get_value_expression (symbolP);
12013
12014 know (e->X_op == O_register);
12015 know (e->X_add_number >= 0
12016 && (valueT) e->X_add_number < i386_regtab_size);
12017 r = i386_regtab + e->X_add_number;
12018 if ((r->reg_flags & RegVRex))
12019 i.vec_encoding = vex_encoding_evex;
12020 *end_op = input_line_pointer;
12021 }
12022 *input_line_pointer = c;
12023 input_line_pointer = save;
12024 }
12025 return r;
12026 }
12027
12028 int
12029 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12030 {
12031 const reg_entry *r;
12032 char *end = input_line_pointer;
12033
12034 *end = *nextcharP;
12035 r = parse_register (name, &input_line_pointer);
12036 if (r && end <= input_line_pointer)
12037 {
12038 *nextcharP = *input_line_pointer;
12039 *input_line_pointer = 0;
12040 e->X_op = O_register;
12041 e->X_add_number = r - i386_regtab;
12042 return 1;
12043 }
12044 input_line_pointer = end;
12045 *end = 0;
12046 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12047 }
12048
12049 void
12050 md_operand (expressionS *e)
12051 {
12052 char *end;
12053 const reg_entry *r;
12054
12055 switch (*input_line_pointer)
12056 {
12057 case REGISTER_PREFIX:
12058 r = parse_real_register (input_line_pointer, &end);
12059 if (r)
12060 {
12061 e->X_op = O_register;
12062 e->X_add_number = r - i386_regtab;
12063 input_line_pointer = end;
12064 }
12065 break;
12066
12067 case '[':
12068 gas_assert (intel_syntax);
12069 end = input_line_pointer++;
12070 expression (e);
12071 if (*input_line_pointer == ']')
12072 {
12073 ++input_line_pointer;
12074 e->X_op_symbol = make_expr_symbol (e);
12075 e->X_add_symbol = NULL;
12076 e->X_add_number = 0;
12077 e->X_op = O_index;
12078 }
12079 else
12080 {
12081 e->X_op = O_absent;
12082 input_line_pointer = end;
12083 }
12084 break;
12085 }
12086 }
12087
12088 \f
12089 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12090 const char *md_shortopts = "kVQ:sqnO::";
12091 #else
12092 const char *md_shortopts = "qnO::";
12093 #endif
12094
12095 #define OPTION_32 (OPTION_MD_BASE + 0)
12096 #define OPTION_64 (OPTION_MD_BASE + 1)
12097 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12098 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12099 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12100 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12101 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12102 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12103 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12104 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12105 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12106 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12107 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12108 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12109 #define OPTION_X32 (OPTION_MD_BASE + 14)
12110 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12111 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12112 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12113 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12114 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12115 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12116 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12117 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12118 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12119 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12120 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12121 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12122 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12123 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12124 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12125 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12126
12127 struct option md_longopts[] =
12128 {
12129 {"32", no_argument, NULL, OPTION_32},
12130 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12131 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12132 {"64", no_argument, NULL, OPTION_64},
12133 #endif
12134 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12135 {"x32", no_argument, NULL, OPTION_X32},
12136 {"mshared", no_argument, NULL, OPTION_MSHARED},
12137 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12138 #endif
12139 {"divide", no_argument, NULL, OPTION_DIVIDE},
12140 {"march", required_argument, NULL, OPTION_MARCH},
12141 {"mtune", required_argument, NULL, OPTION_MTUNE},
12142 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12143 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12144 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12145 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12146 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12147 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12148 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12149 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12150 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12151 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12152 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12153 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12154 # if defined (TE_PE) || defined (TE_PEP)
12155 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12156 #endif
12157 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12158 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12159 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12160 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12161 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12162 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12163 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12164 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12165 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12166 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12167 {NULL, no_argument, NULL, 0}
12168 };
12169 size_t md_longopts_size = sizeof (md_longopts);
12170
12171 int
12172 md_parse_option (int c, const char *arg)
12173 {
12174 unsigned int j;
12175 char *arch, *next, *saved, *type;
12176
12177 switch (c)
12178 {
12179 case 'n':
12180 optimize_align_code = 0;
12181 break;
12182
12183 case 'q':
12184 quiet_warnings = 1;
12185 break;
12186
12187 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12188 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12189 should be emitted or not. FIXME: Not implemented. */
12190 case 'Q':
12191 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12192 return 0;
12193 break;
12194
12195 /* -V: SVR4 argument to print version ID. */
12196 case 'V':
12197 print_version_id ();
12198 break;
12199
12200 /* -k: Ignore for FreeBSD compatibility. */
12201 case 'k':
12202 break;
12203
12204 case 's':
12205 /* -s: On i386 Solaris, this tells the native assembler to use
12206 .stab instead of .stab.excl. We always use .stab anyhow. */
12207 break;
12208
12209 case OPTION_MSHARED:
12210 shared = 1;
12211 break;
12212
12213 case OPTION_X86_USED_NOTE:
12214 if (strcasecmp (arg, "yes") == 0)
12215 x86_used_note = 1;
12216 else if (strcasecmp (arg, "no") == 0)
12217 x86_used_note = 0;
12218 else
12219 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12220 break;
12221
12222
12223 #endif
12224 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12225 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12226 case OPTION_64:
12227 {
12228 const char **list, **l;
12229
12230 list = bfd_target_list ();
12231 for (l = list; *l != NULL; l++)
12232 if (CONST_STRNEQ (*l, "elf64-x86-64")
12233 || strcmp (*l, "coff-x86-64") == 0
12234 || strcmp (*l, "pe-x86-64") == 0
12235 || strcmp (*l, "pei-x86-64") == 0
12236 || strcmp (*l, "mach-o-x86-64") == 0)
12237 {
12238 default_arch = "x86_64";
12239 break;
12240 }
12241 if (*l == NULL)
12242 as_fatal (_("no compiled in support for x86_64"));
12243 free (list);
12244 }
12245 break;
12246 #endif
12247
12248 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12249 case OPTION_X32:
12250 if (IS_ELF)
12251 {
12252 const char **list, **l;
12253
12254 list = bfd_target_list ();
12255 for (l = list; *l != NULL; l++)
12256 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12257 {
12258 default_arch = "x86_64:32";
12259 break;
12260 }
12261 if (*l == NULL)
12262 as_fatal (_("no compiled in support for 32bit x86_64"));
12263 free (list);
12264 }
12265 else
12266 as_fatal (_("32bit x86_64 is only supported for ELF"));
12267 break;
12268 #endif
12269
12270 case OPTION_32:
12271 default_arch = "i386";
12272 break;
12273
12274 case OPTION_DIVIDE:
12275 #ifdef SVR4_COMMENT_CHARS
12276 {
12277 char *n, *t;
12278 const char *s;
12279
12280 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12281 t = n;
12282 for (s = i386_comment_chars; *s != '\0'; s++)
12283 if (*s != '/')
12284 *t++ = *s;
12285 *t = '\0';
12286 i386_comment_chars = n;
12287 }
12288 #endif
12289 break;
12290
12291 case OPTION_MARCH:
12292 saved = xstrdup (arg);
12293 arch = saved;
12294 /* Allow -march=+nosse. */
12295 if (*arch == '+')
12296 arch++;
12297 do
12298 {
12299 if (*arch == '.')
12300 as_fatal (_("invalid -march= option: `%s'"), arg);
12301 next = strchr (arch, '+');
12302 if (next)
12303 *next++ = '\0';
12304 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12305 {
12306 if (strcmp (arch, cpu_arch [j].name) == 0)
12307 {
12308 /* Processor. */
12309 if (! cpu_arch[j].flags.bitfield.cpui386)
12310 continue;
12311
12312 cpu_arch_name = cpu_arch[j].name;
12313 cpu_sub_arch_name = NULL;
12314 cpu_arch_flags = cpu_arch[j].flags;
12315 cpu_arch_isa = cpu_arch[j].type;
12316 cpu_arch_isa_flags = cpu_arch[j].flags;
12317 if (!cpu_arch_tune_set)
12318 {
12319 cpu_arch_tune = cpu_arch_isa;
12320 cpu_arch_tune_flags = cpu_arch_isa_flags;
12321 }
12322 break;
12323 }
12324 else if (*cpu_arch [j].name == '.'
12325 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12326 {
12327 /* ISA extension. */
12328 i386_cpu_flags flags;
12329
12330 flags = cpu_flags_or (cpu_arch_flags,
12331 cpu_arch[j].flags);
12332
12333 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12334 {
12335 if (cpu_sub_arch_name)
12336 {
12337 char *name = cpu_sub_arch_name;
12338 cpu_sub_arch_name = concat (name,
12339 cpu_arch[j].name,
12340 (const char *) NULL);
12341 free (name);
12342 }
12343 else
12344 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12345 cpu_arch_flags = flags;
12346 cpu_arch_isa_flags = flags;
12347 }
12348 else
12349 cpu_arch_isa_flags
12350 = cpu_flags_or (cpu_arch_isa_flags,
12351 cpu_arch[j].flags);
12352 break;
12353 }
12354 }
12355
12356 if (j >= ARRAY_SIZE (cpu_arch))
12357 {
12358 /* Disable an ISA extension. */
12359 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12360 if (strcmp (arch, cpu_noarch [j].name) == 0)
12361 {
12362 i386_cpu_flags flags;
12363
12364 flags = cpu_flags_and_not (cpu_arch_flags,
12365 cpu_noarch[j].flags);
12366 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12367 {
12368 if (cpu_sub_arch_name)
12369 {
12370 char *name = cpu_sub_arch_name;
12371 cpu_sub_arch_name = concat (arch,
12372 (const char *) NULL);
12373 free (name);
12374 }
12375 else
12376 cpu_sub_arch_name = xstrdup (arch);
12377 cpu_arch_flags = flags;
12378 cpu_arch_isa_flags = flags;
12379 }
12380 break;
12381 }
12382
12383 if (j >= ARRAY_SIZE (cpu_noarch))
12384 j = ARRAY_SIZE (cpu_arch);
12385 }
12386
12387 if (j >= ARRAY_SIZE (cpu_arch))
12388 as_fatal (_("invalid -march= option: `%s'"), arg);
12389
12390 arch = next;
12391 }
12392 while (next != NULL);
12393 free (saved);
12394 break;
12395
12396 case OPTION_MTUNE:
12397 if (*arg == '.')
12398 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12399 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12400 {
12401 if (strcmp (arg, cpu_arch [j].name) == 0)
12402 {
12403 cpu_arch_tune_set = 1;
12404 cpu_arch_tune = cpu_arch [j].type;
12405 cpu_arch_tune_flags = cpu_arch[j].flags;
12406 break;
12407 }
12408 }
12409 if (j >= ARRAY_SIZE (cpu_arch))
12410 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12411 break;
12412
12413 case OPTION_MMNEMONIC:
12414 if (strcasecmp (arg, "att") == 0)
12415 intel_mnemonic = 0;
12416 else if (strcasecmp (arg, "intel") == 0)
12417 intel_mnemonic = 1;
12418 else
12419 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12420 break;
12421
12422 case OPTION_MSYNTAX:
12423 if (strcasecmp (arg, "att") == 0)
12424 intel_syntax = 0;
12425 else if (strcasecmp (arg, "intel") == 0)
12426 intel_syntax = 1;
12427 else
12428 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12429 break;
12430
12431 case OPTION_MINDEX_REG:
12432 allow_index_reg = 1;
12433 break;
12434
12435 case OPTION_MNAKED_REG:
12436 allow_naked_reg = 1;
12437 break;
12438
12439 case OPTION_MSSE2AVX:
12440 sse2avx = 1;
12441 break;
12442
12443 case OPTION_MSSE_CHECK:
12444 if (strcasecmp (arg, "error") == 0)
12445 sse_check = check_error;
12446 else if (strcasecmp (arg, "warning") == 0)
12447 sse_check = check_warning;
12448 else if (strcasecmp (arg, "none") == 0)
12449 sse_check = check_none;
12450 else
12451 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12452 break;
12453
12454 case OPTION_MOPERAND_CHECK:
12455 if (strcasecmp (arg, "error") == 0)
12456 operand_check = check_error;
12457 else if (strcasecmp (arg, "warning") == 0)
12458 operand_check = check_warning;
12459 else if (strcasecmp (arg, "none") == 0)
12460 operand_check = check_none;
12461 else
12462 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12463 break;
12464
12465 case OPTION_MAVXSCALAR:
12466 if (strcasecmp (arg, "128") == 0)
12467 avxscalar = vex128;
12468 else if (strcasecmp (arg, "256") == 0)
12469 avxscalar = vex256;
12470 else
12471 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12472 break;
12473
12474 case OPTION_MVEXWIG:
12475 if (strcmp (arg, "0") == 0)
12476 vexwig = vexw0;
12477 else if (strcmp (arg, "1") == 0)
12478 vexwig = vexw1;
12479 else
12480 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12481 break;
12482
12483 case OPTION_MADD_BND_PREFIX:
12484 add_bnd_prefix = 1;
12485 break;
12486
12487 case OPTION_MEVEXLIG:
12488 if (strcmp (arg, "128") == 0)
12489 evexlig = evexl128;
12490 else if (strcmp (arg, "256") == 0)
12491 evexlig = evexl256;
12492 else if (strcmp (arg, "512") == 0)
12493 evexlig = evexl512;
12494 else
12495 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
12496 break;
12497
12498 case OPTION_MEVEXRCIG:
12499 if (strcmp (arg, "rne") == 0)
12500 evexrcig = rne;
12501 else if (strcmp (arg, "rd") == 0)
12502 evexrcig = rd;
12503 else if (strcmp (arg, "ru") == 0)
12504 evexrcig = ru;
12505 else if (strcmp (arg, "rz") == 0)
12506 evexrcig = rz;
12507 else
12508 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
12509 break;
12510
12511 case OPTION_MEVEXWIG:
12512 if (strcmp (arg, "0") == 0)
12513 evexwig = evexw0;
12514 else if (strcmp (arg, "1") == 0)
12515 evexwig = evexw1;
12516 else
12517 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
12518 break;
12519
12520 # if defined (TE_PE) || defined (TE_PEP)
12521 case OPTION_MBIG_OBJ:
12522 use_big_obj = 1;
12523 break;
12524 #endif
12525
12526 case OPTION_MOMIT_LOCK_PREFIX:
12527 if (strcasecmp (arg, "yes") == 0)
12528 omit_lock_prefix = 1;
12529 else if (strcasecmp (arg, "no") == 0)
12530 omit_lock_prefix = 0;
12531 else
12532 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
12533 break;
12534
12535 case OPTION_MFENCE_AS_LOCK_ADD:
12536 if (strcasecmp (arg, "yes") == 0)
12537 avoid_fence = 1;
12538 else if (strcasecmp (arg, "no") == 0)
12539 avoid_fence = 0;
12540 else
12541 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
12542 break;
12543
12544 case OPTION_MRELAX_RELOCATIONS:
12545 if (strcasecmp (arg, "yes") == 0)
12546 generate_relax_relocations = 1;
12547 else if (strcasecmp (arg, "no") == 0)
12548 generate_relax_relocations = 0;
12549 else
12550 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
12551 break;
12552
12553 case OPTION_MALIGN_BRANCH_BOUNDARY:
12554 {
12555 char *end;
12556 long int align = strtoul (arg, &end, 0);
12557 if (*end == '\0')
12558 {
12559 if (align == 0)
12560 {
12561 align_branch_power = 0;
12562 break;
12563 }
12564 else if (align >= 16)
12565 {
12566 int align_power;
12567 for (align_power = 0;
12568 (align & 1) == 0;
12569 align >>= 1, align_power++)
12570 continue;
12571 /* Limit alignment power to 31. */
12572 if (align == 1 && align_power < 32)
12573 {
12574 align_branch_power = align_power;
12575 break;
12576 }
12577 }
12578 }
12579 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
12580 }
12581 break;
12582
12583 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
12584 {
12585 char *end;
12586 int align = strtoul (arg, &end, 0);
12587 /* Some processors only support 5 prefixes. */
12588 if (*end == '\0' && align >= 0 && align < 6)
12589 {
12590 align_branch_prefix_size = align;
12591 break;
12592 }
12593 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
12594 arg);
12595 }
12596 break;
12597
12598 case OPTION_MALIGN_BRANCH:
12599 align_branch = 0;
12600 saved = xstrdup (arg);
12601 type = saved;
12602 do
12603 {
12604 next = strchr (type, '+');
12605 if (next)
12606 *next++ = '\0';
12607 if (strcasecmp (type, "jcc") == 0)
12608 align_branch |= align_branch_jcc_bit;
12609 else if (strcasecmp (type, "fused") == 0)
12610 align_branch |= align_branch_fused_bit;
12611 else if (strcasecmp (type, "jmp") == 0)
12612 align_branch |= align_branch_jmp_bit;
12613 else if (strcasecmp (type, "call") == 0)
12614 align_branch |= align_branch_call_bit;
12615 else if (strcasecmp (type, "ret") == 0)
12616 align_branch |= align_branch_ret_bit;
12617 else if (strcasecmp (type, "indirect") == 0)
12618 align_branch |= align_branch_indirect_bit;
12619 else
12620 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
12621 type = next;
12622 }
12623 while (next != NULL);
12624 free (saved);
12625 break;
12626
12627 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
12628 align_branch_power = 5;
12629 align_branch_prefix_size = 5;
12630 align_branch = (align_branch_jcc_bit
12631 | align_branch_fused_bit
12632 | align_branch_jmp_bit);
12633 break;
12634
12635 case OPTION_MAMD64:
12636 isa64 = amd64;
12637 break;
12638
12639 case OPTION_MINTEL64:
12640 isa64 = intel64;
12641 break;
12642
12643 case 'O':
12644 if (arg == NULL)
12645 {
12646 optimize = 1;
12647 /* Turn off -Os. */
12648 optimize_for_space = 0;
12649 }
12650 else if (*arg == 's')
12651 {
12652 optimize_for_space = 1;
12653 /* Turn on all encoding optimizations. */
12654 optimize = INT_MAX;
12655 }
12656 else
12657 {
12658 optimize = atoi (arg);
12659 /* Turn off -Os. */
12660 optimize_for_space = 0;
12661 }
12662 break;
12663
12664 default:
12665 return 0;
12666 }
12667 return 1;
12668 }
12669
12670 #define MESSAGE_TEMPLATE \
12671 " "
12672
12673 static char *
12674 output_message (FILE *stream, char *p, char *message, char *start,
12675 int *left_p, const char *name, int len)
12676 {
12677 int size = sizeof (MESSAGE_TEMPLATE);
12678 int left = *left_p;
12679
12680 /* Reserve 2 spaces for ", " or ",\0" */
12681 left -= len + 2;
12682
12683 /* Check if there is any room. */
12684 if (left >= 0)
12685 {
12686 if (p != start)
12687 {
12688 *p++ = ',';
12689 *p++ = ' ';
12690 }
12691 p = mempcpy (p, name, len);
12692 }
12693 else
12694 {
12695 /* Output the current message now and start a new one. */
12696 *p++ = ',';
12697 *p = '\0';
12698 fprintf (stream, "%s\n", message);
12699 p = start;
12700 left = size - (start - message) - len - 2;
12701
12702 gas_assert (left >= 0);
12703
12704 p = mempcpy (p, name, len);
12705 }
12706
12707 *left_p = left;
12708 return p;
12709 }
12710
12711 static void
12712 show_arch (FILE *stream, int ext, int check)
12713 {
12714 static char message[] = MESSAGE_TEMPLATE;
12715 char *start = message + 27;
12716 char *p;
12717 int size = sizeof (MESSAGE_TEMPLATE);
12718 int left;
12719 const char *name;
12720 int len;
12721 unsigned int j;
12722
12723 p = start;
12724 left = size - (start - message);
12725 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12726 {
12727 /* Should it be skipped? */
12728 if (cpu_arch [j].skip)
12729 continue;
12730
12731 name = cpu_arch [j].name;
12732 len = cpu_arch [j].len;
12733 if (*name == '.')
12734 {
12735 /* It is an extension. Skip if we aren't asked to show it. */
12736 if (ext)
12737 {
12738 name++;
12739 len--;
12740 }
12741 else
12742 continue;
12743 }
12744 else if (ext)
12745 {
12746 /* It is an processor. Skip if we show only extension. */
12747 continue;
12748 }
12749 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
12750 {
12751 /* It is an impossible processor - skip. */
12752 continue;
12753 }
12754
12755 p = output_message (stream, p, message, start, &left, name, len);
12756 }
12757
12758 /* Display disabled extensions. */
12759 if (ext)
12760 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12761 {
12762 name = cpu_noarch [j].name;
12763 len = cpu_noarch [j].len;
12764 p = output_message (stream, p, message, start, &left, name,
12765 len);
12766 }
12767
12768 *p = '\0';
12769 fprintf (stream, "%s\n", message);
12770 }
12771
12772 void
12773 md_show_usage (FILE *stream)
12774 {
12775 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12776 fprintf (stream, _("\
12777 -Qy, -Qn ignored\n\
12778 -V print assembler version number\n\
12779 -k ignored\n"));
12780 #endif
12781 fprintf (stream, _("\
12782 -n Do not optimize code alignment\n\
12783 -q quieten some warnings\n"));
12784 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12785 fprintf (stream, _("\
12786 -s ignored\n"));
12787 #endif
12788 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12789 || defined (TE_PE) || defined (TE_PEP))
12790 fprintf (stream, _("\
12791 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
12792 #endif
12793 #ifdef SVR4_COMMENT_CHARS
12794 fprintf (stream, _("\
12795 --divide do not treat `/' as a comment character\n"));
12796 #else
12797 fprintf (stream, _("\
12798 --divide ignored\n"));
12799 #endif
12800 fprintf (stream, _("\
12801 -march=CPU[,+EXTENSION...]\n\
12802 generate code for CPU and EXTENSION, CPU is one of:\n"));
12803 show_arch (stream, 0, 1);
12804 fprintf (stream, _("\
12805 EXTENSION is combination of:\n"));
12806 show_arch (stream, 1, 0);
12807 fprintf (stream, _("\
12808 -mtune=CPU optimize for CPU, CPU is one of:\n"));
12809 show_arch (stream, 0, 0);
12810 fprintf (stream, _("\
12811 -msse2avx encode SSE instructions with VEX prefix\n"));
12812 fprintf (stream, _("\
12813 -msse-check=[none|error|warning] (default: warning)\n\
12814 check SSE instructions\n"));
12815 fprintf (stream, _("\
12816 -moperand-check=[none|error|warning] (default: warning)\n\
12817 check operand combinations for validity\n"));
12818 fprintf (stream, _("\
12819 -mavxscalar=[128|256] (default: 128)\n\
12820 encode scalar AVX instructions with specific vector\n\
12821 length\n"));
12822 fprintf (stream, _("\
12823 -mvexwig=[0|1] (default: 0)\n\
12824 encode VEX instructions with specific VEX.W value\n\
12825 for VEX.W bit ignored instructions\n"));
12826 fprintf (stream, _("\
12827 -mevexlig=[128|256|512] (default: 128)\n\
12828 encode scalar EVEX instructions with specific vector\n\
12829 length\n"));
12830 fprintf (stream, _("\
12831 -mevexwig=[0|1] (default: 0)\n\
12832 encode EVEX instructions with specific EVEX.W value\n\
12833 for EVEX.W bit ignored instructions\n"));
12834 fprintf (stream, _("\
12835 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
12836 encode EVEX instructions with specific EVEX.RC value\n\
12837 for SAE-only ignored instructions\n"));
12838 fprintf (stream, _("\
12839 -mmnemonic=[att|intel] "));
12840 if (SYSV386_COMPAT)
12841 fprintf (stream, _("(default: att)\n"));
12842 else
12843 fprintf (stream, _("(default: intel)\n"));
12844 fprintf (stream, _("\
12845 use AT&T/Intel mnemonic\n"));
12846 fprintf (stream, _("\
12847 -msyntax=[att|intel] (default: att)\n\
12848 use AT&T/Intel syntax\n"));
12849 fprintf (stream, _("\
12850 -mindex-reg support pseudo index registers\n"));
12851 fprintf (stream, _("\
12852 -mnaked-reg don't require `%%' prefix for registers\n"));
12853 fprintf (stream, _("\
12854 -madd-bnd-prefix add BND prefix for all valid branches\n"));
12855 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12856 fprintf (stream, _("\
12857 -mshared disable branch optimization for shared code\n"));
12858 fprintf (stream, _("\
12859 -mx86-used-note=[no|yes] "));
12860 if (DEFAULT_X86_USED_NOTE)
12861 fprintf (stream, _("(default: yes)\n"));
12862 else
12863 fprintf (stream, _("(default: no)\n"));
12864 fprintf (stream, _("\
12865 generate x86 used ISA and feature properties\n"));
12866 #endif
12867 #if defined (TE_PE) || defined (TE_PEP)
12868 fprintf (stream, _("\
12869 -mbig-obj generate big object files\n"));
12870 #endif
12871 fprintf (stream, _("\
12872 -momit-lock-prefix=[no|yes] (default: no)\n\
12873 strip all lock prefixes\n"));
12874 fprintf (stream, _("\
12875 -mfence-as-lock-add=[no|yes] (default: no)\n\
12876 encode lfence, mfence and sfence as\n\
12877 lock addl $0x0, (%%{re}sp)\n"));
12878 fprintf (stream, _("\
12879 -mrelax-relocations=[no|yes] "));
12880 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
12881 fprintf (stream, _("(default: yes)\n"));
12882 else
12883 fprintf (stream, _("(default: no)\n"));
12884 fprintf (stream, _("\
12885 generate relax relocations\n"));
12886 fprintf (stream, _("\
12887 -malign-branch-boundary=NUM (default: 0)\n\
12888 align branches within NUM byte boundary\n"));
12889 fprintf (stream, _("\
12890 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
12891 TYPE is combination of jcc, fused, jmp, call, ret,\n\
12892 indirect\n\
12893 specify types of branches to align\n"));
12894 fprintf (stream, _("\
12895 -malign-branch-prefix-size=NUM (default: 5)\n\
12896 align branches with NUM prefixes per instruction\n"));
12897 fprintf (stream, _("\
12898 -mbranches-within-32B-boundaries\n\
12899 align branches within 32 byte boundary\n"));
12900 fprintf (stream, _("\
12901 -mamd64 accept only AMD64 ISA [default]\n"));
12902 fprintf (stream, _("\
12903 -mintel64 accept only Intel64 ISA\n"));
12904 }
12905
12906 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
12907 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12908 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12909
12910 /* Pick the target format to use. */
12911
12912 const char *
12913 i386_target_format (void)
12914 {
12915 if (!strncmp (default_arch, "x86_64", 6))
12916 {
12917 update_code_flag (CODE_64BIT, 1);
12918 if (default_arch[6] == '\0')
12919 x86_elf_abi = X86_64_ABI;
12920 else
12921 x86_elf_abi = X86_64_X32_ABI;
12922 }
12923 else if (!strcmp (default_arch, "i386"))
12924 update_code_flag (CODE_32BIT, 1);
12925 else if (!strcmp (default_arch, "iamcu"))
12926 {
12927 update_code_flag (CODE_32BIT, 1);
12928 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
12929 {
12930 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
12931 cpu_arch_name = "iamcu";
12932 cpu_sub_arch_name = NULL;
12933 cpu_arch_flags = iamcu_flags;
12934 cpu_arch_isa = PROCESSOR_IAMCU;
12935 cpu_arch_isa_flags = iamcu_flags;
12936 if (!cpu_arch_tune_set)
12937 {
12938 cpu_arch_tune = cpu_arch_isa;
12939 cpu_arch_tune_flags = cpu_arch_isa_flags;
12940 }
12941 }
12942 else if (cpu_arch_isa != PROCESSOR_IAMCU)
12943 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
12944 cpu_arch_name);
12945 }
12946 else
12947 as_fatal (_("unknown architecture"));
12948
12949 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
12950 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12951 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
12952 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12953
12954 switch (OUTPUT_FLAVOR)
12955 {
12956 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
12957 case bfd_target_aout_flavour:
12958 return AOUT_TARGET_FORMAT;
12959 #endif
12960 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
12961 # if defined (TE_PE) || defined (TE_PEP)
12962 case bfd_target_coff_flavour:
12963 if (flag_code == CODE_64BIT)
12964 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
12965 else
12966 return "pe-i386";
12967 # elif defined (TE_GO32)
12968 case bfd_target_coff_flavour:
12969 return "coff-go32";
12970 # else
12971 case bfd_target_coff_flavour:
12972 return "coff-i386";
12973 # endif
12974 #endif
12975 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12976 case bfd_target_elf_flavour:
12977 {
12978 const char *format;
12979
12980 switch (x86_elf_abi)
12981 {
12982 default:
12983 format = ELF_TARGET_FORMAT;
12984 #ifndef TE_SOLARIS
12985 tls_get_addr = "___tls_get_addr";
12986 #endif
12987 break;
12988 case X86_64_ABI:
12989 use_rela_relocations = 1;
12990 object_64bit = 1;
12991 #ifndef TE_SOLARIS
12992 tls_get_addr = "__tls_get_addr";
12993 #endif
12994 format = ELF_TARGET_FORMAT64;
12995 break;
12996 case X86_64_X32_ABI:
12997 use_rela_relocations = 1;
12998 object_64bit = 1;
12999 #ifndef TE_SOLARIS
13000 tls_get_addr = "__tls_get_addr";
13001 #endif
13002 disallow_64bit_reloc = 1;
13003 format = ELF_TARGET_FORMAT32;
13004 break;
13005 }
13006 if (cpu_arch_isa == PROCESSOR_L1OM)
13007 {
13008 if (x86_elf_abi != X86_64_ABI)
13009 as_fatal (_("Intel L1OM is 64bit only"));
13010 return ELF_TARGET_L1OM_FORMAT;
13011 }
13012 else if (cpu_arch_isa == PROCESSOR_K1OM)
13013 {
13014 if (x86_elf_abi != X86_64_ABI)
13015 as_fatal (_("Intel K1OM is 64bit only"));
13016 return ELF_TARGET_K1OM_FORMAT;
13017 }
13018 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13019 {
13020 if (x86_elf_abi != I386_ABI)
13021 as_fatal (_("Intel MCU is 32bit only"));
13022 return ELF_TARGET_IAMCU_FORMAT;
13023 }
13024 else
13025 return format;
13026 }
13027 #endif
13028 #if defined (OBJ_MACH_O)
13029 case bfd_target_mach_o_flavour:
13030 if (flag_code == CODE_64BIT)
13031 {
13032 use_rela_relocations = 1;
13033 object_64bit = 1;
13034 return "mach-o-x86-64";
13035 }
13036 else
13037 return "mach-o-i386";
13038 #endif
13039 default:
13040 abort ();
13041 return NULL;
13042 }
13043 }
13044
13045 #endif /* OBJ_MAYBE_ more than one */
13046 \f
13047 symbolS *
13048 md_undefined_symbol (char *name)
13049 {
13050 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13051 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13052 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13053 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13054 {
13055 if (!GOT_symbol)
13056 {
13057 if (symbol_find (name))
13058 as_bad (_("GOT already in symbol table"));
13059 GOT_symbol = symbol_new (name, undefined_section,
13060 (valueT) 0, &zero_address_frag);
13061 };
13062 return GOT_symbol;
13063 }
13064 return 0;
13065 }
13066
13067 /* Round up a section size to the appropriate boundary. */
13068
13069 valueT
13070 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13071 {
13072 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13073 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13074 {
13075 /* For a.out, force the section size to be aligned. If we don't do
13076 this, BFD will align it for us, but it will not write out the
13077 final bytes of the section. This may be a bug in BFD, but it is
13078 easier to fix it here since that is how the other a.out targets
13079 work. */
13080 int align;
13081
13082 align = bfd_section_alignment (segment);
13083 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13084 }
13085 #endif
13086
13087 return size;
13088 }
13089
13090 /* On the i386, PC-relative offsets are relative to the start of the
13091 next instruction. That is, the address of the offset, plus its
13092 size, since the offset is always the last part of the insn. */
13093
13094 long
13095 md_pcrel_from (fixS *fixP)
13096 {
13097 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13098 }
13099
13100 #ifndef I386COFF
13101
13102 static void
13103 s_bss (int ignore ATTRIBUTE_UNUSED)
13104 {
13105 int temp;
13106
13107 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13108 if (IS_ELF)
13109 obj_elf_section_change_hook ();
13110 #endif
13111 temp = get_absolute_expression ();
13112 subseg_set (bss_section, (subsegT) temp);
13113 demand_empty_rest_of_line ();
13114 }
13115
13116 #endif
13117
13118 /* Remember constant directive. */
13119
13120 void
13121 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13122 {
13123 if (last_insn.kind != last_insn_directive
13124 && (bfd_section_flags (now_seg) & SEC_CODE))
13125 {
13126 last_insn.seg = now_seg;
13127 last_insn.kind = last_insn_directive;
13128 last_insn.name = "constant directive";
13129 last_insn.file = as_where (&last_insn.line);
13130 }
13131 }
13132
13133 void
13134 i386_validate_fix (fixS *fixp)
13135 {
13136 if (fixp->fx_subsy)
13137 {
13138 if (fixp->fx_subsy == GOT_symbol)
13139 {
13140 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13141 {
13142 if (!object_64bit)
13143 abort ();
13144 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13145 if (fixp->fx_tcbit2)
13146 fixp->fx_r_type = (fixp->fx_tcbit
13147 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13148 : BFD_RELOC_X86_64_GOTPCRELX);
13149 else
13150 #endif
13151 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13152 }
13153 else
13154 {
13155 if (!object_64bit)
13156 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13157 else
13158 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13159 }
13160 fixp->fx_subsy = 0;
13161 }
13162 }
13163 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13164 else if (!object_64bit)
13165 {
13166 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13167 && fixp->fx_tcbit2)
13168 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13169 }
13170 #endif
13171 }
13172
13173 arelent *
13174 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13175 {
13176 arelent *rel;
13177 bfd_reloc_code_real_type code;
13178
13179 switch (fixp->fx_r_type)
13180 {
13181 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13182 case BFD_RELOC_SIZE32:
13183 case BFD_RELOC_SIZE64:
13184 if (S_IS_DEFINED (fixp->fx_addsy)
13185 && !S_IS_EXTERNAL (fixp->fx_addsy))
13186 {
13187 /* Resolve size relocation against local symbol to size of
13188 the symbol plus addend. */
13189 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13190 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13191 && !fits_in_unsigned_long (value))
13192 as_bad_where (fixp->fx_file, fixp->fx_line,
13193 _("symbol size computation overflow"));
13194 fixp->fx_addsy = NULL;
13195 fixp->fx_subsy = NULL;
13196 md_apply_fix (fixp, (valueT *) &value, NULL);
13197 return NULL;
13198 }
13199 #endif
13200 /* Fall through. */
13201
13202 case BFD_RELOC_X86_64_PLT32:
13203 case BFD_RELOC_X86_64_GOT32:
13204 case BFD_RELOC_X86_64_GOTPCREL:
13205 case BFD_RELOC_X86_64_GOTPCRELX:
13206 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13207 case BFD_RELOC_386_PLT32:
13208 case BFD_RELOC_386_GOT32:
13209 case BFD_RELOC_386_GOT32X:
13210 case BFD_RELOC_386_GOTOFF:
13211 case BFD_RELOC_386_GOTPC:
13212 case BFD_RELOC_386_TLS_GD:
13213 case BFD_RELOC_386_TLS_LDM:
13214 case BFD_RELOC_386_TLS_LDO_32:
13215 case BFD_RELOC_386_TLS_IE_32:
13216 case BFD_RELOC_386_TLS_IE:
13217 case BFD_RELOC_386_TLS_GOTIE:
13218 case BFD_RELOC_386_TLS_LE_32:
13219 case BFD_RELOC_386_TLS_LE:
13220 case BFD_RELOC_386_TLS_GOTDESC:
13221 case BFD_RELOC_386_TLS_DESC_CALL:
13222 case BFD_RELOC_X86_64_TLSGD:
13223 case BFD_RELOC_X86_64_TLSLD:
13224 case BFD_RELOC_X86_64_DTPOFF32:
13225 case BFD_RELOC_X86_64_DTPOFF64:
13226 case BFD_RELOC_X86_64_GOTTPOFF:
13227 case BFD_RELOC_X86_64_TPOFF32:
13228 case BFD_RELOC_X86_64_TPOFF64:
13229 case BFD_RELOC_X86_64_GOTOFF64:
13230 case BFD_RELOC_X86_64_GOTPC32:
13231 case BFD_RELOC_X86_64_GOT64:
13232 case BFD_RELOC_X86_64_GOTPCREL64:
13233 case BFD_RELOC_X86_64_GOTPC64:
13234 case BFD_RELOC_X86_64_GOTPLT64:
13235 case BFD_RELOC_X86_64_PLTOFF64:
13236 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13237 case BFD_RELOC_X86_64_TLSDESC_CALL:
13238 case BFD_RELOC_RVA:
13239 case BFD_RELOC_VTABLE_ENTRY:
13240 case BFD_RELOC_VTABLE_INHERIT:
13241 #ifdef TE_PE
13242 case BFD_RELOC_32_SECREL:
13243 #endif
13244 code = fixp->fx_r_type;
13245 break;
13246 case BFD_RELOC_X86_64_32S:
13247 if (!fixp->fx_pcrel)
13248 {
13249 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13250 code = fixp->fx_r_type;
13251 break;
13252 }
13253 /* Fall through. */
13254 default:
13255 if (fixp->fx_pcrel)
13256 {
13257 switch (fixp->fx_size)
13258 {
13259 default:
13260 as_bad_where (fixp->fx_file, fixp->fx_line,
13261 _("can not do %d byte pc-relative relocation"),
13262 fixp->fx_size);
13263 code = BFD_RELOC_32_PCREL;
13264 break;
13265 case 1: code = BFD_RELOC_8_PCREL; break;
13266 case 2: code = BFD_RELOC_16_PCREL; break;
13267 case 4: code = BFD_RELOC_32_PCREL; break;
13268 #ifdef BFD64
13269 case 8: code = BFD_RELOC_64_PCREL; break;
13270 #endif
13271 }
13272 }
13273 else
13274 {
13275 switch (fixp->fx_size)
13276 {
13277 default:
13278 as_bad_where (fixp->fx_file, fixp->fx_line,
13279 _("can not do %d byte relocation"),
13280 fixp->fx_size);
13281 code = BFD_RELOC_32;
13282 break;
13283 case 1: code = BFD_RELOC_8; break;
13284 case 2: code = BFD_RELOC_16; break;
13285 case 4: code = BFD_RELOC_32; break;
13286 #ifdef BFD64
13287 case 8: code = BFD_RELOC_64; break;
13288 #endif
13289 }
13290 }
13291 break;
13292 }
13293
13294 if ((code == BFD_RELOC_32
13295 || code == BFD_RELOC_32_PCREL
13296 || code == BFD_RELOC_X86_64_32S)
13297 && GOT_symbol
13298 && fixp->fx_addsy == GOT_symbol)
13299 {
13300 if (!object_64bit)
13301 code = BFD_RELOC_386_GOTPC;
13302 else
13303 code = BFD_RELOC_X86_64_GOTPC32;
13304 }
13305 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13306 && GOT_symbol
13307 && fixp->fx_addsy == GOT_symbol)
13308 {
13309 code = BFD_RELOC_X86_64_GOTPC64;
13310 }
13311
13312 rel = XNEW (arelent);
13313 rel->sym_ptr_ptr = XNEW (asymbol *);
13314 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13315
13316 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13317
13318 if (!use_rela_relocations)
13319 {
13320 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13321 vtable entry to be used in the relocation's section offset. */
13322 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13323 rel->address = fixp->fx_offset;
13324 #if defined (OBJ_COFF) && defined (TE_PE)
13325 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13326 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13327 else
13328 #endif
13329 rel->addend = 0;
13330 }
13331 /* Use the rela in 64bit mode. */
13332 else
13333 {
13334 if (disallow_64bit_reloc)
13335 switch (code)
13336 {
13337 case BFD_RELOC_X86_64_DTPOFF64:
13338 case BFD_RELOC_X86_64_TPOFF64:
13339 case BFD_RELOC_64_PCREL:
13340 case BFD_RELOC_X86_64_GOTOFF64:
13341 case BFD_RELOC_X86_64_GOT64:
13342 case BFD_RELOC_X86_64_GOTPCREL64:
13343 case BFD_RELOC_X86_64_GOTPC64:
13344 case BFD_RELOC_X86_64_GOTPLT64:
13345 case BFD_RELOC_X86_64_PLTOFF64:
13346 as_bad_where (fixp->fx_file, fixp->fx_line,
13347 _("cannot represent relocation type %s in x32 mode"),
13348 bfd_get_reloc_code_name (code));
13349 break;
13350 default:
13351 break;
13352 }
13353
13354 if (!fixp->fx_pcrel)
13355 rel->addend = fixp->fx_offset;
13356 else
13357 switch (code)
13358 {
13359 case BFD_RELOC_X86_64_PLT32:
13360 case BFD_RELOC_X86_64_GOT32:
13361 case BFD_RELOC_X86_64_GOTPCREL:
13362 case BFD_RELOC_X86_64_GOTPCRELX:
13363 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13364 case BFD_RELOC_X86_64_TLSGD:
13365 case BFD_RELOC_X86_64_TLSLD:
13366 case BFD_RELOC_X86_64_GOTTPOFF:
13367 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13368 case BFD_RELOC_X86_64_TLSDESC_CALL:
13369 rel->addend = fixp->fx_offset - fixp->fx_size;
13370 break;
13371 default:
13372 rel->addend = (section->vma
13373 - fixp->fx_size
13374 + fixp->fx_addnumber
13375 + md_pcrel_from (fixp));
13376 break;
13377 }
13378 }
13379
13380 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13381 if (rel->howto == NULL)
13382 {
13383 as_bad_where (fixp->fx_file, fixp->fx_line,
13384 _("cannot represent relocation type %s"),
13385 bfd_get_reloc_code_name (code));
13386 /* Set howto to a garbage value so that we can keep going. */
13387 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13388 gas_assert (rel->howto != NULL);
13389 }
13390
13391 return rel;
13392 }
13393
13394 #include "tc-i386-intel.c"
13395
13396 void
13397 tc_x86_parse_to_dw2regnum (expressionS *exp)
13398 {
13399 int saved_naked_reg;
13400 char saved_register_dot;
13401
13402 saved_naked_reg = allow_naked_reg;
13403 allow_naked_reg = 1;
13404 saved_register_dot = register_chars['.'];
13405 register_chars['.'] = '.';
13406 allow_pseudo_reg = 1;
13407 expression_and_evaluate (exp);
13408 allow_pseudo_reg = 0;
13409 register_chars['.'] = saved_register_dot;
13410 allow_naked_reg = saved_naked_reg;
13411
13412 if (exp->X_op == O_register && exp->X_add_number >= 0)
13413 {
13414 if ((addressT) exp->X_add_number < i386_regtab_size)
13415 {
13416 exp->X_op = O_constant;
13417 exp->X_add_number = i386_regtab[exp->X_add_number]
13418 .dw2_regnum[flag_code >> 1];
13419 }
13420 else
13421 exp->X_op = O_illegal;
13422 }
13423 }
13424
13425 void
13426 tc_x86_frame_initial_instructions (void)
13427 {
13428 static unsigned int sp_regno[2];
13429
13430 if (!sp_regno[flag_code >> 1])
13431 {
13432 char *saved_input = input_line_pointer;
13433 char sp[][4] = {"esp", "rsp"};
13434 expressionS exp;
13435
13436 input_line_pointer = sp[flag_code >> 1];
13437 tc_x86_parse_to_dw2regnum (&exp);
13438 gas_assert (exp.X_op == O_constant);
13439 sp_regno[flag_code >> 1] = exp.X_add_number;
13440 input_line_pointer = saved_input;
13441 }
13442
13443 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
13444 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
13445 }
13446
13447 int
13448 x86_dwarf2_addr_size (void)
13449 {
13450 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13451 if (x86_elf_abi == X86_64_X32_ABI)
13452 return 4;
13453 #endif
13454 return bfd_arch_bits_per_address (stdoutput) / 8;
13455 }
13456
13457 int
13458 i386_elf_section_type (const char *str, size_t len)
13459 {
13460 if (flag_code == CODE_64BIT
13461 && len == sizeof ("unwind") - 1
13462 && strncmp (str, "unwind", 6) == 0)
13463 return SHT_X86_64_UNWIND;
13464
13465 return -1;
13466 }
13467
13468 #ifdef TE_SOLARIS
13469 void
13470 i386_solaris_fix_up_eh_frame (segT sec)
13471 {
13472 if (flag_code == CODE_64BIT)
13473 elf_section_type (sec) = SHT_X86_64_UNWIND;
13474 }
13475 #endif
13476
13477 #ifdef TE_PE
13478 void
13479 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
13480 {
13481 expressionS exp;
13482
13483 exp.X_op = O_secrel;
13484 exp.X_add_symbol = symbol;
13485 exp.X_add_number = 0;
13486 emit_expr (&exp, size);
13487 }
13488 #endif
13489
13490 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13491 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
13492
13493 bfd_vma
13494 x86_64_section_letter (int letter, const char **ptr_msg)
13495 {
13496 if (flag_code == CODE_64BIT)
13497 {
13498 if (letter == 'l')
13499 return SHF_X86_64_LARGE;
13500
13501 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
13502 }
13503 else
13504 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
13505 return -1;
13506 }
13507
13508 bfd_vma
13509 x86_64_section_word (char *str, size_t len)
13510 {
13511 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
13512 return SHF_X86_64_LARGE;
13513
13514 return -1;
13515 }
13516
13517 static void
13518 handle_large_common (int small ATTRIBUTE_UNUSED)
13519 {
13520 if (flag_code != CODE_64BIT)
13521 {
13522 s_comm_internal (0, elf_common_parse);
13523 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
13524 }
13525 else
13526 {
13527 static segT lbss_section;
13528 asection *saved_com_section_ptr = elf_com_section_ptr;
13529 asection *saved_bss_section = bss_section;
13530
13531 if (lbss_section == NULL)
13532 {
13533 flagword applicable;
13534 segT seg = now_seg;
13535 subsegT subseg = now_subseg;
13536
13537 /* The .lbss section is for local .largecomm symbols. */
13538 lbss_section = subseg_new (".lbss", 0);
13539 applicable = bfd_applicable_section_flags (stdoutput);
13540 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
13541 seg_info (lbss_section)->bss = 1;
13542
13543 subseg_set (seg, subseg);
13544 }
13545
13546 elf_com_section_ptr = &_bfd_elf_large_com_section;
13547 bss_section = lbss_section;
13548
13549 s_comm_internal (0, elf_common_parse);
13550
13551 elf_com_section_ptr = saved_com_section_ptr;
13552 bss_section = saved_bss_section;
13553 }
13554 }
13555 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 0.296701 seconds and 5 git commands to generate.