i386: Also check R12-R15 registers when optimizing testq to testb
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2019 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef REGISTER_WARNINGS
48 #define REGISTER_WARNINGS 1
49 #endif
50
51 #ifndef INFER_ADDR_PREFIX
52 #define INFER_ADDR_PREFIX 1
53 #endif
54
55 #ifndef DEFAULT_ARCH
56 #define DEFAULT_ARCH "i386"
57 #endif
58
59 #ifndef INLINE
60 #if __GNUC__ >= 2
61 #define INLINE __inline__
62 #else
63 #define INLINE
64 #endif
65 #endif
66
67 /* Prefixes will be emitted in the order defined below.
68 WAIT_PREFIX must be the first prefix since FWAIT is really is an
69 instruction, and so must come before any prefixes.
70 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
71 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
72 #define WAIT_PREFIX 0
73 #define SEG_PREFIX 1
74 #define ADDR_PREFIX 2
75 #define DATA_PREFIX 3
76 #define REP_PREFIX 4
77 #define HLE_PREFIX REP_PREFIX
78 #define BND_PREFIX REP_PREFIX
79 #define LOCK_PREFIX 5
80 #define REX_PREFIX 6 /* must come last. */
81 #define MAX_PREFIXES 7 /* max prefixes per opcode */
82
83 /* we define the syntax here (modulo base,index,scale syntax) */
84 #define REGISTER_PREFIX '%'
85 #define IMMEDIATE_PREFIX '$'
86 #define ABSOLUTE_PREFIX '*'
87
88 /* these are the instruction mnemonic suffixes in AT&T syntax or
89 memory operand size in Intel syntax. */
90 #define WORD_MNEM_SUFFIX 'w'
91 #define BYTE_MNEM_SUFFIX 'b'
92 #define SHORT_MNEM_SUFFIX 's'
93 #define LONG_MNEM_SUFFIX 'l'
94 #define QWORD_MNEM_SUFFIX 'q'
95 /* Intel Syntax. Use a non-ascii letter since since it never appears
96 in instructions. */
97 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
98
99 #define END_OF_INSN '\0'
100
101 /* This matches the C -> StaticRounding alias in the opcode table. */
102 #define commutative staticrounding
103
104 /*
105 'templates' is for grouping together 'template' structures for opcodes
106 of the same name. This is only used for storing the insns in the grand
107 ole hash table of insns.
108 The templates themselves start at START and range up to (but not including)
109 END.
110 */
111 typedef struct
112 {
113 const insn_template *start;
114 const insn_template *end;
115 }
116 templates;
117
118 /* 386 operand encoding bytes: see 386 book for details of this. */
119 typedef struct
120 {
121 unsigned int regmem; /* codes register or memory operand */
122 unsigned int reg; /* codes register operand (or extended opcode) */
123 unsigned int mode; /* how to interpret regmem & reg */
124 }
125 modrm_byte;
126
127 /* x86-64 extension prefix. */
128 typedef int rex_byte;
129
130 /* 386 opcode byte to code indirect addressing. */
131 typedef struct
132 {
133 unsigned base;
134 unsigned index;
135 unsigned scale;
136 }
137 sib_byte;
138
139 /* x86 arch names, types and features */
140 typedef struct
141 {
142 const char *name; /* arch name */
143 unsigned int len; /* arch string length */
144 enum processor_type type; /* arch type */
145 i386_cpu_flags flags; /* cpu feature flags */
146 unsigned int skip; /* show_arch should skip this. */
147 }
148 arch_entry;
149
150 /* Used to turn off indicated flags. */
151 typedef struct
152 {
153 const char *name; /* arch name */
154 unsigned int len; /* arch string length */
155 i386_cpu_flags flags; /* cpu feature flags */
156 }
157 noarch_entry;
158
159 static void update_code_flag (int, int);
160 static void set_code_flag (int);
161 static void set_16bit_gcc_code_flag (int);
162 static void set_intel_syntax (int);
163 static void set_intel_mnemonic (int);
164 static void set_allow_index_reg (int);
165 static void set_check (int);
166 static void set_cpu_arch (int);
167 #ifdef TE_PE
168 static void pe_directive_secrel (int);
169 #endif
170 static void signed_cons (int);
171 static char *output_invalid (int c);
172 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
173 const char *);
174 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
175 const char *);
176 static int i386_att_operand (char *);
177 static int i386_intel_operand (char *, int);
178 static int i386_intel_simplify (expressionS *);
179 static int i386_intel_parse_name (const char *, expressionS *);
180 static const reg_entry *parse_register (char *, char **);
181 static char *parse_insn (char *, char *);
182 static char *parse_operands (char *, const char *);
183 static void swap_operands (void);
184 static void swap_2_operands (int, int);
185 static void optimize_imm (void);
186 static void optimize_disp (void);
187 static const insn_template *match_template (char);
188 static int check_string (void);
189 static int process_suffix (void);
190 static int check_byte_reg (void);
191 static int check_long_reg (void);
192 static int check_qword_reg (void);
193 static int check_word_reg (void);
194 static int finalize_imm (void);
195 static int process_operands (void);
196 static const seg_entry *build_modrm_byte (void);
197 static void output_insn (void);
198 static void output_imm (fragS *, offsetT);
199 static void output_disp (fragS *, offsetT);
200 #ifndef I386COFF
201 static void s_bss (int);
202 #endif
203 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
204 static void handle_large_common (int small ATTRIBUTE_UNUSED);
205
206 /* GNU_PROPERTY_X86_ISA_1_USED. */
207 static unsigned int x86_isa_1_used;
208 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
209 static unsigned int x86_feature_2_used;
210 /* Generate x86 used ISA and feature properties. */
211 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
212 #endif
213
214 static const char *default_arch = DEFAULT_ARCH;
215
216 /* This struct describes rounding control and SAE in the instruction. */
217 struct RC_Operation
218 {
219 enum rc_type
220 {
221 rne = 0,
222 rd,
223 ru,
224 rz,
225 saeonly
226 } type;
227 int operand;
228 };
229
230 static struct RC_Operation rc_op;
231
232 /* The struct describes masking, applied to OPERAND in the instruction.
233 MASK is a pointer to the corresponding mask register. ZEROING tells
234 whether merging or zeroing mask is used. */
235 struct Mask_Operation
236 {
237 const reg_entry *mask;
238 unsigned int zeroing;
239 /* The operand where this operation is associated. */
240 int operand;
241 };
242
243 static struct Mask_Operation mask_op;
244
245 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
246 broadcast factor. */
247 struct Broadcast_Operation
248 {
249 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
250 int type;
251
252 /* Index of broadcasted operand. */
253 int operand;
254
255 /* Number of bytes to broadcast. */
256 int bytes;
257 };
258
259 static struct Broadcast_Operation broadcast_op;
260
261 /* VEX prefix. */
262 typedef struct
263 {
264 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
265 unsigned char bytes[4];
266 unsigned int length;
267 /* Destination or source register specifier. */
268 const reg_entry *register_specifier;
269 } vex_prefix;
270
271 /* 'md_assemble ()' gathers together information and puts it into a
272 i386_insn. */
273
274 union i386_op
275 {
276 expressionS *disps;
277 expressionS *imms;
278 const reg_entry *regs;
279 };
280
281 enum i386_error
282 {
283 operand_size_mismatch,
284 operand_type_mismatch,
285 register_type_mismatch,
286 number_of_operands_mismatch,
287 invalid_instruction_suffix,
288 bad_imm4,
289 unsupported_with_intel_mnemonic,
290 unsupported_syntax,
291 unsupported,
292 invalid_vsib_address,
293 invalid_vector_register_set,
294 unsupported_vector_index_register,
295 unsupported_broadcast,
296 broadcast_needed,
297 unsupported_masking,
298 mask_not_on_destination,
299 no_default_mask,
300 unsupported_rc_sae,
301 rc_sae_operand_not_last_imm,
302 invalid_register_operand,
303 };
304
305 struct _i386_insn
306 {
307 /* TM holds the template for the insn were currently assembling. */
308 insn_template tm;
309
310 /* SUFFIX holds the instruction size suffix for byte, word, dword
311 or qword, if given. */
312 char suffix;
313
314 /* OPERANDS gives the number of given operands. */
315 unsigned int operands;
316
317 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
318 of given register, displacement, memory operands and immediate
319 operands. */
320 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
321
322 /* TYPES [i] is the type (see above #defines) which tells us how to
323 use OP[i] for the corresponding operand. */
324 i386_operand_type types[MAX_OPERANDS];
325
326 /* Displacement expression, immediate expression, or register for each
327 operand. */
328 union i386_op op[MAX_OPERANDS];
329
330 /* Flags for operands. */
331 unsigned int flags[MAX_OPERANDS];
332 #define Operand_PCrel 1
333 #define Operand_Mem 2
334
335 /* Relocation type for operand */
336 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
337
338 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
339 the base index byte below. */
340 const reg_entry *base_reg;
341 const reg_entry *index_reg;
342 unsigned int log2_scale_factor;
343
344 /* SEG gives the seg_entries of this insn. They are zero unless
345 explicit segment overrides are given. */
346 const seg_entry *seg[2];
347
348 /* Copied first memory operand string, for re-checking. */
349 char *memop1_string;
350
351 /* PREFIX holds all the given prefix opcodes (usually null).
352 PREFIXES is the number of prefix opcodes. */
353 unsigned int prefixes;
354 unsigned char prefix[MAX_PREFIXES];
355
356 /* The operand to a branch insn indicates an absolute branch. */
357 bfd_boolean jumpabsolute;
358
359 /* Has MMX register operands. */
360 bfd_boolean has_regmmx;
361
362 /* Has XMM register operands. */
363 bfd_boolean has_regxmm;
364
365 /* Has YMM register operands. */
366 bfd_boolean has_regymm;
367
368 /* Has ZMM register operands. */
369 bfd_boolean has_regzmm;
370
371 /* Has GOTPC or TLS relocation. */
372 bfd_boolean has_gotpc_tls_reloc;
373
374 /* RM and SIB are the modrm byte and the sib byte where the
375 addressing modes of this insn are encoded. */
376 modrm_byte rm;
377 rex_byte rex;
378 rex_byte vrex;
379 sib_byte sib;
380 vex_prefix vex;
381
382 /* Masking attributes. */
383 struct Mask_Operation *mask;
384
385 /* Rounding control and SAE attributes. */
386 struct RC_Operation *rounding;
387
388 /* Broadcasting attributes. */
389 struct Broadcast_Operation *broadcast;
390
391 /* Compressed disp8*N attribute. */
392 unsigned int memshift;
393
394 /* Prefer load or store in encoding. */
395 enum
396 {
397 dir_encoding_default = 0,
398 dir_encoding_load,
399 dir_encoding_store,
400 dir_encoding_swap
401 } dir_encoding;
402
403 /* Prefer 8bit or 32bit displacement in encoding. */
404 enum
405 {
406 disp_encoding_default = 0,
407 disp_encoding_8bit,
408 disp_encoding_32bit
409 } disp_encoding;
410
411 /* Prefer the REX byte in encoding. */
412 bfd_boolean rex_encoding;
413
414 /* Disable instruction size optimization. */
415 bfd_boolean no_optimize;
416
417 /* How to encode vector instructions. */
418 enum
419 {
420 vex_encoding_default = 0,
421 vex_encoding_vex2,
422 vex_encoding_vex3,
423 vex_encoding_evex
424 } vec_encoding;
425
426 /* REP prefix. */
427 const char *rep_prefix;
428
429 /* HLE prefix. */
430 const char *hle_prefix;
431
432 /* Have BND prefix. */
433 const char *bnd_prefix;
434
435 /* Have NOTRACK prefix. */
436 const char *notrack_prefix;
437
438 /* Error message. */
439 enum i386_error error;
440 };
441
442 typedef struct _i386_insn i386_insn;
443
444 /* Link RC type with corresponding string, that'll be looked for in
445 asm. */
446 struct RC_name
447 {
448 enum rc_type type;
449 const char *name;
450 unsigned int len;
451 };
452
453 static const struct RC_name RC_NamesTable[] =
454 {
455 { rne, STRING_COMMA_LEN ("rn-sae") },
456 { rd, STRING_COMMA_LEN ("rd-sae") },
457 { ru, STRING_COMMA_LEN ("ru-sae") },
458 { rz, STRING_COMMA_LEN ("rz-sae") },
459 { saeonly, STRING_COMMA_LEN ("sae") },
460 };
461
462 /* List of chars besides those in app.c:symbol_chars that can start an
463 operand. Used to prevent the scrubber eating vital white-space. */
464 const char extra_symbol_chars[] = "*%-([{}"
465 #ifdef LEX_AT
466 "@"
467 #endif
468 #ifdef LEX_QM
469 "?"
470 #endif
471 ;
472
473 #if (defined (TE_I386AIX) \
474 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
475 && !defined (TE_GNU) \
476 && !defined (TE_LINUX) \
477 && !defined (TE_NACL) \
478 && !defined (TE_FreeBSD) \
479 && !defined (TE_DragonFly) \
480 && !defined (TE_NetBSD)))
481 /* This array holds the chars that always start a comment. If the
482 pre-processor is disabled, these aren't very useful. The option
483 --divide will remove '/' from this list. */
484 const char *i386_comment_chars = "#/";
485 #define SVR4_COMMENT_CHARS 1
486 #define PREFIX_SEPARATOR '\\'
487
488 #else
489 const char *i386_comment_chars = "#";
490 #define PREFIX_SEPARATOR '/'
491 #endif
492
493 /* This array holds the chars that only start a comment at the beginning of
494 a line. If the line seems to have the form '# 123 filename'
495 .line and .file directives will appear in the pre-processed output.
496 Note that input_file.c hand checks for '#' at the beginning of the
497 first line of the input file. This is because the compiler outputs
498 #NO_APP at the beginning of its output.
499 Also note that comments started like this one will always work if
500 '/' isn't otherwise defined. */
501 const char line_comment_chars[] = "#/";
502
503 const char line_separator_chars[] = ";";
504
505 /* Chars that can be used to separate mant from exp in floating point
506 nums. */
507 const char EXP_CHARS[] = "eE";
508
509 /* Chars that mean this number is a floating point constant
510 As in 0f12.456
511 or 0d1.2345e12. */
512 const char FLT_CHARS[] = "fFdDxX";
513
514 /* Tables for lexical analysis. */
515 static char mnemonic_chars[256];
516 static char register_chars[256];
517 static char operand_chars[256];
518 static char identifier_chars[256];
519 static char digit_chars[256];
520
521 /* Lexical macros. */
522 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
523 #define is_operand_char(x) (operand_chars[(unsigned char) x])
524 #define is_register_char(x) (register_chars[(unsigned char) x])
525 #define is_space_char(x) ((x) == ' ')
526 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
527 #define is_digit_char(x) (digit_chars[(unsigned char) x])
528
529 /* All non-digit non-letter characters that may occur in an operand. */
530 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
531
532 /* md_assemble() always leaves the strings it's passed unaltered. To
533 effect this we maintain a stack of saved characters that we've smashed
534 with '\0's (indicating end of strings for various sub-fields of the
535 assembler instruction). */
536 static char save_stack[32];
537 static char *save_stack_p;
538 #define END_STRING_AND_SAVE(s) \
539 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
540 #define RESTORE_END_STRING(s) \
541 do { *(s) = *--save_stack_p; } while (0)
542
543 /* The instruction we're assembling. */
544 static i386_insn i;
545
546 /* Possible templates for current insn. */
547 static const templates *current_templates;
548
549 /* Per instruction expressionS buffers: max displacements & immediates. */
550 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
551 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
552
553 /* Current operand we are working on. */
554 static int this_operand = -1;
555
556 /* We support four different modes. FLAG_CODE variable is used to distinguish
557 these. */
558
559 enum flag_code {
560 CODE_32BIT,
561 CODE_16BIT,
562 CODE_64BIT };
563
564 static enum flag_code flag_code;
565 static unsigned int object_64bit;
566 static unsigned int disallow_64bit_reloc;
567 static int use_rela_relocations = 0;
568 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
569 static const char *tls_get_addr;
570
571 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
572 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
573 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
574
575 /* The ELF ABI to use. */
576 enum x86_elf_abi
577 {
578 I386_ABI,
579 X86_64_ABI,
580 X86_64_X32_ABI
581 };
582
583 static enum x86_elf_abi x86_elf_abi = I386_ABI;
584 #endif
585
586 #if defined (TE_PE) || defined (TE_PEP)
587 /* Use big object file format. */
588 static int use_big_obj = 0;
589 #endif
590
591 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
592 /* 1 if generating code for a shared library. */
593 static int shared = 0;
594 #endif
595
596 /* 1 for intel syntax,
597 0 if att syntax. */
598 static int intel_syntax = 0;
599
600 /* 1 for Intel64 ISA,
601 0 if AMD64 ISA. */
602 static int intel64;
603
604 /* 1 for intel mnemonic,
605 0 if att mnemonic. */
606 static int intel_mnemonic = !SYSV386_COMPAT;
607
608 /* 1 if pseudo registers are permitted. */
609 static int allow_pseudo_reg = 0;
610
611 /* 1 if register prefix % not required. */
612 static int allow_naked_reg = 0;
613
614 /* 1 if the assembler should add BND prefix for all control-transferring
615 instructions supporting it, even if this prefix wasn't specified
616 explicitly. */
617 static int add_bnd_prefix = 0;
618
619 /* 1 if pseudo index register, eiz/riz, is allowed . */
620 static int allow_index_reg = 0;
621
622 /* 1 if the assembler should ignore LOCK prefix, even if it was
623 specified explicitly. */
624 static int omit_lock_prefix = 0;
625
626 /* 1 if the assembler should encode lfence, mfence, and sfence as
627 "lock addl $0, (%{re}sp)". */
628 static int avoid_fence = 0;
629
630 /* Type of the previous instruction. */
631 static struct
632 {
633 segT seg;
634 const char *file;
635 const char *name;
636 unsigned int line;
637 enum last_insn_kind
638 {
639 last_insn_other = 0,
640 last_insn_directive,
641 last_insn_prefix
642 } kind;
643 } last_insn;
644
645 /* 1 if the assembler should generate relax relocations. */
646
647 static int generate_relax_relocations
648 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
649
650 static enum check_kind
651 {
652 check_none = 0,
653 check_warning,
654 check_error
655 }
656 sse_check, operand_check = check_warning;
657
658 /* Non-zero if branches should be aligned within power of 2 boundary. */
659 static int align_branch_power = 0;
660
661 /* Types of branches to align. */
662 enum align_branch_kind
663 {
664 align_branch_none = 0,
665 align_branch_jcc = 1,
666 align_branch_fused = 2,
667 align_branch_jmp = 3,
668 align_branch_call = 4,
669 align_branch_indirect = 5,
670 align_branch_ret = 6
671 };
672
673 /* Type bits of branches to align. */
674 enum align_branch_bit
675 {
676 align_branch_jcc_bit = 1 << align_branch_jcc,
677 align_branch_fused_bit = 1 << align_branch_fused,
678 align_branch_jmp_bit = 1 << align_branch_jmp,
679 align_branch_call_bit = 1 << align_branch_call,
680 align_branch_indirect_bit = 1 << align_branch_indirect,
681 align_branch_ret_bit = 1 << align_branch_ret
682 };
683
684 static unsigned int align_branch = (align_branch_jcc_bit
685 | align_branch_fused_bit
686 | align_branch_jmp_bit);
687
688 /* The maximum padding size for fused jcc. CMP like instruction can
689 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
690 prefixes. */
691 #define MAX_FUSED_JCC_PADDING_SIZE 20
692
693 /* The maximum number of prefixes added for an instruction. */
694 static unsigned int align_branch_prefix_size = 5;
695
696 /* Optimization:
697 1. Clear the REX_W bit with register operand if possible.
698 2. Above plus use 128bit vector instruction to clear the full vector
699 register.
700 */
701 static int optimize = 0;
702
703 /* Optimization:
704 1. Clear the REX_W bit with register operand if possible.
705 2. Above plus use 128bit vector instruction to clear the full vector
706 register.
707 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
708 "testb $imm7,%r8".
709 */
710 static int optimize_for_space = 0;
711
712 /* Register prefix used for error message. */
713 static const char *register_prefix = "%";
714
715 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
716 leave, push, and pop instructions so that gcc has the same stack
717 frame as in 32 bit mode. */
718 static char stackop_size = '\0';
719
720 /* Non-zero to optimize code alignment. */
721 int optimize_align_code = 1;
722
723 /* Non-zero to quieten some warnings. */
724 static int quiet_warnings = 0;
725
726 /* CPU name. */
727 static const char *cpu_arch_name = NULL;
728 static char *cpu_sub_arch_name = NULL;
729
730 /* CPU feature flags. */
731 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
732
733 /* If we have selected a cpu we are generating instructions for. */
734 static int cpu_arch_tune_set = 0;
735
736 /* Cpu we are generating instructions for. */
737 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
738
739 /* CPU feature flags of cpu we are generating instructions for. */
740 static i386_cpu_flags cpu_arch_tune_flags;
741
742 /* CPU instruction set architecture used. */
743 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
744
745 /* CPU feature flags of instruction set architecture used. */
746 i386_cpu_flags cpu_arch_isa_flags;
747
748 /* If set, conditional jumps are not automatically promoted to handle
749 larger than a byte offset. */
750 static unsigned int no_cond_jump_promotion = 0;
751
752 /* Encode SSE instructions with VEX prefix. */
753 static unsigned int sse2avx;
754
755 /* Encode scalar AVX instructions with specific vector length. */
756 static enum
757 {
758 vex128 = 0,
759 vex256
760 } avxscalar;
761
762 /* Encode VEX WIG instructions with specific vex.w. */
763 static enum
764 {
765 vexw0 = 0,
766 vexw1
767 } vexwig;
768
769 /* Encode scalar EVEX LIG instructions with specific vector length. */
770 static enum
771 {
772 evexl128 = 0,
773 evexl256,
774 evexl512
775 } evexlig;
776
777 /* Encode EVEX WIG instructions with specific evex.w. */
778 static enum
779 {
780 evexw0 = 0,
781 evexw1
782 } evexwig;
783
784 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
785 static enum rc_type evexrcig = rne;
786
787 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
788 static symbolS *GOT_symbol;
789
790 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
791 unsigned int x86_dwarf2_return_column;
792
793 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
794 int x86_cie_data_alignment;
795
796 /* Interface to relax_segment.
797 There are 3 major relax states for 386 jump insns because the
798 different types of jumps add different sizes to frags when we're
799 figuring out what sort of jump to choose to reach a given label.
800
801 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
802 branches which are handled by md_estimate_size_before_relax() and
803 i386_generic_table_relax_frag(). */
804
805 /* Types. */
806 #define UNCOND_JUMP 0
807 #define COND_JUMP 1
808 #define COND_JUMP86 2
809 #define BRANCH_PADDING 3
810 #define BRANCH_PREFIX 4
811 #define FUSED_JCC_PADDING 5
812
813 /* Sizes. */
814 #define CODE16 1
815 #define SMALL 0
816 #define SMALL16 (SMALL | CODE16)
817 #define BIG 2
818 #define BIG16 (BIG | CODE16)
819
820 #ifndef INLINE
821 #ifdef __GNUC__
822 #define INLINE __inline__
823 #else
824 #define INLINE
825 #endif
826 #endif
827
828 #define ENCODE_RELAX_STATE(type, size) \
829 ((relax_substateT) (((type) << 2) | (size)))
830 #define TYPE_FROM_RELAX_STATE(s) \
831 ((s) >> 2)
832 #define DISP_SIZE_FROM_RELAX_STATE(s) \
833 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
834
835 /* This table is used by relax_frag to promote short jumps to long
836 ones where necessary. SMALL (short) jumps may be promoted to BIG
837 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
838 don't allow a short jump in a 32 bit code segment to be promoted to
839 a 16 bit offset jump because it's slower (requires data size
840 prefix), and doesn't work, unless the destination is in the bottom
841 64k of the code segment (The top 16 bits of eip are zeroed). */
842
843 const relax_typeS md_relax_table[] =
844 {
845 /* The fields are:
846 1) most positive reach of this state,
847 2) most negative reach of this state,
848 3) how many bytes this mode will have in the variable part of the frag
849 4) which index into the table to try if we can't fit into this one. */
850
851 /* UNCOND_JUMP states. */
852 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
853 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
854 /* dword jmp adds 4 bytes to frag:
855 0 extra opcode bytes, 4 displacement bytes. */
856 {0, 0, 4, 0},
857 /* word jmp adds 2 byte2 to frag:
858 0 extra opcode bytes, 2 displacement bytes. */
859 {0, 0, 2, 0},
860
861 /* COND_JUMP states. */
862 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
863 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
864 /* dword conditionals adds 5 bytes to frag:
865 1 extra opcode byte, 4 displacement bytes. */
866 {0, 0, 5, 0},
867 /* word conditionals add 3 bytes to frag:
868 1 extra opcode byte, 2 displacement bytes. */
869 {0, 0, 3, 0},
870
871 /* COND_JUMP86 states. */
872 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
873 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
874 /* dword conditionals adds 5 bytes to frag:
875 1 extra opcode byte, 4 displacement bytes. */
876 {0, 0, 5, 0},
877 /* word conditionals add 4 bytes to frag:
878 1 displacement byte and a 3 byte long branch insn. */
879 {0, 0, 4, 0}
880 };
881
882 static const arch_entry cpu_arch[] =
883 {
884 /* Do not replace the first two entries - i386_target_format()
885 relies on them being there in this order. */
886 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
887 CPU_GENERIC32_FLAGS, 0 },
888 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
889 CPU_GENERIC64_FLAGS, 0 },
890 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
891 CPU_NONE_FLAGS, 0 },
892 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
893 CPU_I186_FLAGS, 0 },
894 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
895 CPU_I286_FLAGS, 0 },
896 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
897 CPU_I386_FLAGS, 0 },
898 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
899 CPU_I486_FLAGS, 0 },
900 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
901 CPU_I586_FLAGS, 0 },
902 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
903 CPU_I686_FLAGS, 0 },
904 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
905 CPU_I586_FLAGS, 0 },
906 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
907 CPU_PENTIUMPRO_FLAGS, 0 },
908 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
909 CPU_P2_FLAGS, 0 },
910 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
911 CPU_P3_FLAGS, 0 },
912 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
913 CPU_P4_FLAGS, 0 },
914 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
915 CPU_CORE_FLAGS, 0 },
916 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
917 CPU_NOCONA_FLAGS, 0 },
918 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
919 CPU_CORE_FLAGS, 1 },
920 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
921 CPU_CORE_FLAGS, 0 },
922 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
923 CPU_CORE2_FLAGS, 1 },
924 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
925 CPU_CORE2_FLAGS, 0 },
926 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
927 CPU_COREI7_FLAGS, 0 },
928 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
929 CPU_L1OM_FLAGS, 0 },
930 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
931 CPU_K1OM_FLAGS, 0 },
932 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
933 CPU_IAMCU_FLAGS, 0 },
934 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
935 CPU_K6_FLAGS, 0 },
936 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
937 CPU_K6_2_FLAGS, 0 },
938 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
939 CPU_ATHLON_FLAGS, 0 },
940 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
941 CPU_K8_FLAGS, 1 },
942 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
943 CPU_K8_FLAGS, 0 },
944 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
945 CPU_K8_FLAGS, 0 },
946 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
947 CPU_AMDFAM10_FLAGS, 0 },
948 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
949 CPU_BDVER1_FLAGS, 0 },
950 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
951 CPU_BDVER2_FLAGS, 0 },
952 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
953 CPU_BDVER3_FLAGS, 0 },
954 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
955 CPU_BDVER4_FLAGS, 0 },
956 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
957 CPU_ZNVER1_FLAGS, 0 },
958 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
959 CPU_ZNVER2_FLAGS, 0 },
960 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
961 CPU_BTVER1_FLAGS, 0 },
962 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
963 CPU_BTVER2_FLAGS, 0 },
964 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
965 CPU_8087_FLAGS, 0 },
966 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
967 CPU_287_FLAGS, 0 },
968 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
969 CPU_387_FLAGS, 0 },
970 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
971 CPU_687_FLAGS, 0 },
972 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
973 CPU_CMOV_FLAGS, 0 },
974 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
975 CPU_FXSR_FLAGS, 0 },
976 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
977 CPU_MMX_FLAGS, 0 },
978 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
979 CPU_SSE_FLAGS, 0 },
980 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
981 CPU_SSE2_FLAGS, 0 },
982 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
983 CPU_SSE3_FLAGS, 0 },
984 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
985 CPU_SSSE3_FLAGS, 0 },
986 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
987 CPU_SSE4_1_FLAGS, 0 },
988 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
989 CPU_SSE4_2_FLAGS, 0 },
990 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
991 CPU_SSE4_2_FLAGS, 0 },
992 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
993 CPU_AVX_FLAGS, 0 },
994 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
995 CPU_AVX2_FLAGS, 0 },
996 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
997 CPU_AVX512F_FLAGS, 0 },
998 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
999 CPU_AVX512CD_FLAGS, 0 },
1000 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1001 CPU_AVX512ER_FLAGS, 0 },
1002 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1003 CPU_AVX512PF_FLAGS, 0 },
1004 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1005 CPU_AVX512DQ_FLAGS, 0 },
1006 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1007 CPU_AVX512BW_FLAGS, 0 },
1008 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1009 CPU_AVX512VL_FLAGS, 0 },
1010 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1011 CPU_VMX_FLAGS, 0 },
1012 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1013 CPU_VMFUNC_FLAGS, 0 },
1014 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1015 CPU_SMX_FLAGS, 0 },
1016 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1017 CPU_XSAVE_FLAGS, 0 },
1018 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1019 CPU_XSAVEOPT_FLAGS, 0 },
1020 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1021 CPU_XSAVEC_FLAGS, 0 },
1022 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1023 CPU_XSAVES_FLAGS, 0 },
1024 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1025 CPU_AES_FLAGS, 0 },
1026 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1027 CPU_PCLMUL_FLAGS, 0 },
1028 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1029 CPU_PCLMUL_FLAGS, 1 },
1030 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1031 CPU_FSGSBASE_FLAGS, 0 },
1032 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1033 CPU_RDRND_FLAGS, 0 },
1034 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1035 CPU_F16C_FLAGS, 0 },
1036 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1037 CPU_BMI2_FLAGS, 0 },
1038 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1039 CPU_FMA_FLAGS, 0 },
1040 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1041 CPU_FMA4_FLAGS, 0 },
1042 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1043 CPU_XOP_FLAGS, 0 },
1044 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1045 CPU_LWP_FLAGS, 0 },
1046 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1047 CPU_MOVBE_FLAGS, 0 },
1048 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1049 CPU_CX16_FLAGS, 0 },
1050 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1051 CPU_EPT_FLAGS, 0 },
1052 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1053 CPU_LZCNT_FLAGS, 0 },
1054 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1055 CPU_HLE_FLAGS, 0 },
1056 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1057 CPU_RTM_FLAGS, 0 },
1058 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1059 CPU_INVPCID_FLAGS, 0 },
1060 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1061 CPU_CLFLUSH_FLAGS, 0 },
1062 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1063 CPU_NOP_FLAGS, 0 },
1064 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1065 CPU_SYSCALL_FLAGS, 0 },
1066 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1067 CPU_RDTSCP_FLAGS, 0 },
1068 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1069 CPU_3DNOW_FLAGS, 0 },
1070 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1071 CPU_3DNOWA_FLAGS, 0 },
1072 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1073 CPU_PADLOCK_FLAGS, 0 },
1074 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1075 CPU_SVME_FLAGS, 1 },
1076 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1077 CPU_SVME_FLAGS, 0 },
1078 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1079 CPU_SSE4A_FLAGS, 0 },
1080 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1081 CPU_ABM_FLAGS, 0 },
1082 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1083 CPU_BMI_FLAGS, 0 },
1084 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1085 CPU_TBM_FLAGS, 0 },
1086 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1087 CPU_ADX_FLAGS, 0 },
1088 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1089 CPU_RDSEED_FLAGS, 0 },
1090 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1091 CPU_PRFCHW_FLAGS, 0 },
1092 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1093 CPU_SMAP_FLAGS, 0 },
1094 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1095 CPU_MPX_FLAGS, 0 },
1096 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1097 CPU_SHA_FLAGS, 0 },
1098 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1099 CPU_CLFLUSHOPT_FLAGS, 0 },
1100 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1101 CPU_PREFETCHWT1_FLAGS, 0 },
1102 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1103 CPU_SE1_FLAGS, 0 },
1104 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1105 CPU_CLWB_FLAGS, 0 },
1106 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1107 CPU_AVX512IFMA_FLAGS, 0 },
1108 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1109 CPU_AVX512VBMI_FLAGS, 0 },
1110 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1111 CPU_AVX512_4FMAPS_FLAGS, 0 },
1112 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1113 CPU_AVX512_4VNNIW_FLAGS, 0 },
1114 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1115 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1116 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1117 CPU_AVX512_VBMI2_FLAGS, 0 },
1118 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1119 CPU_AVX512_VNNI_FLAGS, 0 },
1120 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1121 CPU_AVX512_BITALG_FLAGS, 0 },
1122 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1123 CPU_CLZERO_FLAGS, 0 },
1124 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1125 CPU_MWAITX_FLAGS, 0 },
1126 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1127 CPU_OSPKE_FLAGS, 0 },
1128 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1129 CPU_RDPID_FLAGS, 0 },
1130 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1131 CPU_PTWRITE_FLAGS, 0 },
1132 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1133 CPU_IBT_FLAGS, 0 },
1134 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1135 CPU_SHSTK_FLAGS, 0 },
1136 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1137 CPU_GFNI_FLAGS, 0 },
1138 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1139 CPU_VAES_FLAGS, 0 },
1140 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1141 CPU_VPCLMULQDQ_FLAGS, 0 },
1142 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1143 CPU_WBNOINVD_FLAGS, 0 },
1144 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1145 CPU_PCONFIG_FLAGS, 0 },
1146 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1147 CPU_WAITPKG_FLAGS, 0 },
1148 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1149 CPU_CLDEMOTE_FLAGS, 0 },
1150 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1151 CPU_MOVDIRI_FLAGS, 0 },
1152 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1153 CPU_MOVDIR64B_FLAGS, 0 },
1154 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1155 CPU_AVX512_BF16_FLAGS, 0 },
1156 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1157 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1158 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1159 CPU_ENQCMD_FLAGS, 0 },
1160 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1161 CPU_RDPRU_FLAGS, 0 },
1162 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1163 CPU_MCOMMIT_FLAGS, 0 },
1164 };
1165
1166 static const noarch_entry cpu_noarch[] =
1167 {
1168 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1169 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1170 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1171 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1172 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1173 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1174 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1175 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1176 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1177 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1178 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1179 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1180 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1181 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1182 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1183 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1184 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1185 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1186 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1187 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1188 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1189 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1190 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1191 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1192 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1193 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1194 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1195 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1196 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1197 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1198 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1199 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1200 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1201 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1202 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1203 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1204 { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1205 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1206 };
1207
1208 #ifdef I386COFF
1209 /* Like s_lcomm_internal in gas/read.c but the alignment string
1210 is allowed to be optional. */
1211
1212 static symbolS *
1213 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1214 {
1215 addressT align = 0;
1216
1217 SKIP_WHITESPACE ();
1218
1219 if (needs_align
1220 && *input_line_pointer == ',')
1221 {
1222 align = parse_align (needs_align - 1);
1223
1224 if (align == (addressT) -1)
1225 return NULL;
1226 }
1227 else
1228 {
1229 if (size >= 8)
1230 align = 3;
1231 else if (size >= 4)
1232 align = 2;
1233 else if (size >= 2)
1234 align = 1;
1235 else
1236 align = 0;
1237 }
1238
1239 bss_alloc (symbolP, size, align);
1240 return symbolP;
1241 }
1242
1243 static void
1244 pe_lcomm (int needs_align)
1245 {
1246 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1247 }
1248 #endif
1249
1250 const pseudo_typeS md_pseudo_table[] =
1251 {
1252 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1253 {"align", s_align_bytes, 0},
1254 #else
1255 {"align", s_align_ptwo, 0},
1256 #endif
1257 {"arch", set_cpu_arch, 0},
1258 #ifndef I386COFF
1259 {"bss", s_bss, 0},
1260 #else
1261 {"lcomm", pe_lcomm, 1},
1262 #endif
1263 {"ffloat", float_cons, 'f'},
1264 {"dfloat", float_cons, 'd'},
1265 {"tfloat", float_cons, 'x'},
1266 {"value", cons, 2},
1267 {"slong", signed_cons, 4},
1268 {"noopt", s_ignore, 0},
1269 {"optim", s_ignore, 0},
1270 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1271 {"code16", set_code_flag, CODE_16BIT},
1272 {"code32", set_code_flag, CODE_32BIT},
1273 #ifdef BFD64
1274 {"code64", set_code_flag, CODE_64BIT},
1275 #endif
1276 {"intel_syntax", set_intel_syntax, 1},
1277 {"att_syntax", set_intel_syntax, 0},
1278 {"intel_mnemonic", set_intel_mnemonic, 1},
1279 {"att_mnemonic", set_intel_mnemonic, 0},
1280 {"allow_index_reg", set_allow_index_reg, 1},
1281 {"disallow_index_reg", set_allow_index_reg, 0},
1282 {"sse_check", set_check, 0},
1283 {"operand_check", set_check, 1},
1284 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1285 {"largecomm", handle_large_common, 0},
1286 #else
1287 {"file", dwarf2_directive_file, 0},
1288 {"loc", dwarf2_directive_loc, 0},
1289 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1290 #endif
1291 #ifdef TE_PE
1292 {"secrel32", pe_directive_secrel, 0},
1293 #endif
1294 {0, 0, 0}
1295 };
1296
1297 /* For interface with expression (). */
1298 extern char *input_line_pointer;
1299
1300 /* Hash table for instruction mnemonic lookup. */
1301 static struct hash_control *op_hash;
1302
1303 /* Hash table for register lookup. */
1304 static struct hash_control *reg_hash;
1305 \f
1306 /* Various efficient no-op patterns for aligning code labels.
1307 Note: Don't try to assemble the instructions in the comments.
1308 0L and 0w are not legal. */
1309 static const unsigned char f32_1[] =
1310 {0x90}; /* nop */
1311 static const unsigned char f32_2[] =
1312 {0x66,0x90}; /* xchg %ax,%ax */
1313 static const unsigned char f32_3[] =
1314 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1315 static const unsigned char f32_4[] =
1316 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1317 static const unsigned char f32_6[] =
1318 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1319 static const unsigned char f32_7[] =
1320 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1321 static const unsigned char f16_3[] =
1322 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1323 static const unsigned char f16_4[] =
1324 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1325 static const unsigned char jump_disp8[] =
1326 {0xeb}; /* jmp disp8 */
1327 static const unsigned char jump32_disp32[] =
1328 {0xe9}; /* jmp disp32 */
1329 static const unsigned char jump16_disp32[] =
1330 {0x66,0xe9}; /* jmp disp32 */
1331 /* 32-bit NOPs patterns. */
1332 static const unsigned char *const f32_patt[] = {
1333 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1334 };
1335 /* 16-bit NOPs patterns. */
1336 static const unsigned char *const f16_patt[] = {
1337 f32_1, f32_2, f16_3, f16_4
1338 };
1339 /* nopl (%[re]ax) */
1340 static const unsigned char alt_3[] =
1341 {0x0f,0x1f,0x00};
1342 /* nopl 0(%[re]ax) */
1343 static const unsigned char alt_4[] =
1344 {0x0f,0x1f,0x40,0x00};
1345 /* nopl 0(%[re]ax,%[re]ax,1) */
1346 static const unsigned char alt_5[] =
1347 {0x0f,0x1f,0x44,0x00,0x00};
1348 /* nopw 0(%[re]ax,%[re]ax,1) */
1349 static const unsigned char alt_6[] =
1350 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1351 /* nopl 0L(%[re]ax) */
1352 static const unsigned char alt_7[] =
1353 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1354 /* nopl 0L(%[re]ax,%[re]ax,1) */
1355 static const unsigned char alt_8[] =
1356 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1357 /* nopw 0L(%[re]ax,%[re]ax,1) */
1358 static const unsigned char alt_9[] =
1359 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1360 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1361 static const unsigned char alt_10[] =
1362 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1363 /* data16 nopw %cs:0L(%eax,%eax,1) */
1364 static const unsigned char alt_11[] =
1365 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1366 /* 32-bit and 64-bit NOPs patterns. */
1367 static const unsigned char *const alt_patt[] = {
1368 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1369 alt_9, alt_10, alt_11
1370 };
1371
1372 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1373 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1374
1375 static void
1376 i386_output_nops (char *where, const unsigned char *const *patt,
1377 int count, int max_single_nop_size)
1378
1379 {
1380 /* Place the longer NOP first. */
1381 int last;
1382 int offset;
1383 const unsigned char *nops;
1384
1385 if (max_single_nop_size < 1)
1386 {
1387 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1388 max_single_nop_size);
1389 return;
1390 }
1391
1392 nops = patt[max_single_nop_size - 1];
1393
1394 /* Use the smaller one if the requsted one isn't available. */
1395 if (nops == NULL)
1396 {
1397 max_single_nop_size--;
1398 nops = patt[max_single_nop_size - 1];
1399 }
1400
1401 last = count % max_single_nop_size;
1402
1403 count -= last;
1404 for (offset = 0; offset < count; offset += max_single_nop_size)
1405 memcpy (where + offset, nops, max_single_nop_size);
1406
1407 if (last)
1408 {
1409 nops = patt[last - 1];
1410 if (nops == NULL)
1411 {
1412 /* Use the smaller one plus one-byte NOP if the needed one
1413 isn't available. */
1414 last--;
1415 nops = patt[last - 1];
1416 memcpy (where + offset, nops, last);
1417 where[offset + last] = *patt[0];
1418 }
1419 else
1420 memcpy (where + offset, nops, last);
1421 }
1422 }
1423
1424 static INLINE int
1425 fits_in_imm7 (offsetT num)
1426 {
1427 return (num & 0x7f) == num;
1428 }
1429
1430 static INLINE int
1431 fits_in_imm31 (offsetT num)
1432 {
1433 return (num & 0x7fffffff) == num;
1434 }
1435
1436 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1437 single NOP instruction LIMIT. */
1438
1439 void
1440 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1441 {
1442 const unsigned char *const *patt = NULL;
1443 int max_single_nop_size;
1444 /* Maximum number of NOPs before switching to jump over NOPs. */
1445 int max_number_of_nops;
1446
1447 switch (fragP->fr_type)
1448 {
1449 case rs_fill_nop:
1450 case rs_align_code:
1451 break;
1452 case rs_machine_dependent:
1453 /* Allow NOP padding for jumps and calls. */
1454 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1455 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1456 break;
1457 /* Fall through. */
1458 default:
1459 return;
1460 }
1461
1462 /* We need to decide which NOP sequence to use for 32bit and
1463 64bit. When -mtune= is used:
1464
1465 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1466 PROCESSOR_GENERIC32, f32_patt will be used.
1467 2. For the rest, alt_patt will be used.
1468
1469 When -mtune= isn't used, alt_patt will be used if
1470 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1471 be used.
1472
1473 When -march= or .arch is used, we can't use anything beyond
1474 cpu_arch_isa_flags. */
1475
1476 if (flag_code == CODE_16BIT)
1477 {
1478 patt = f16_patt;
1479 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1480 /* Limit number of NOPs to 2 in 16-bit mode. */
1481 max_number_of_nops = 2;
1482 }
1483 else
1484 {
1485 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1486 {
1487 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1488 switch (cpu_arch_tune)
1489 {
1490 case PROCESSOR_UNKNOWN:
1491 /* We use cpu_arch_isa_flags to check if we SHOULD
1492 optimize with nops. */
1493 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1494 patt = alt_patt;
1495 else
1496 patt = f32_patt;
1497 break;
1498 case PROCESSOR_PENTIUM4:
1499 case PROCESSOR_NOCONA:
1500 case PROCESSOR_CORE:
1501 case PROCESSOR_CORE2:
1502 case PROCESSOR_COREI7:
1503 case PROCESSOR_L1OM:
1504 case PROCESSOR_K1OM:
1505 case PROCESSOR_GENERIC64:
1506 case PROCESSOR_K6:
1507 case PROCESSOR_ATHLON:
1508 case PROCESSOR_K8:
1509 case PROCESSOR_AMDFAM10:
1510 case PROCESSOR_BD:
1511 case PROCESSOR_ZNVER:
1512 case PROCESSOR_BT:
1513 patt = alt_patt;
1514 break;
1515 case PROCESSOR_I386:
1516 case PROCESSOR_I486:
1517 case PROCESSOR_PENTIUM:
1518 case PROCESSOR_PENTIUMPRO:
1519 case PROCESSOR_IAMCU:
1520 case PROCESSOR_GENERIC32:
1521 patt = f32_patt;
1522 break;
1523 }
1524 }
1525 else
1526 {
1527 switch (fragP->tc_frag_data.tune)
1528 {
1529 case PROCESSOR_UNKNOWN:
1530 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1531 PROCESSOR_UNKNOWN. */
1532 abort ();
1533 break;
1534
1535 case PROCESSOR_I386:
1536 case PROCESSOR_I486:
1537 case PROCESSOR_PENTIUM:
1538 case PROCESSOR_IAMCU:
1539 case PROCESSOR_K6:
1540 case PROCESSOR_ATHLON:
1541 case PROCESSOR_K8:
1542 case PROCESSOR_AMDFAM10:
1543 case PROCESSOR_BD:
1544 case PROCESSOR_ZNVER:
1545 case PROCESSOR_BT:
1546 case PROCESSOR_GENERIC32:
1547 /* We use cpu_arch_isa_flags to check if we CAN optimize
1548 with nops. */
1549 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1550 patt = alt_patt;
1551 else
1552 patt = f32_patt;
1553 break;
1554 case PROCESSOR_PENTIUMPRO:
1555 case PROCESSOR_PENTIUM4:
1556 case PROCESSOR_NOCONA:
1557 case PROCESSOR_CORE:
1558 case PROCESSOR_CORE2:
1559 case PROCESSOR_COREI7:
1560 case PROCESSOR_L1OM:
1561 case PROCESSOR_K1OM:
1562 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1563 patt = alt_patt;
1564 else
1565 patt = f32_patt;
1566 break;
1567 case PROCESSOR_GENERIC64:
1568 patt = alt_patt;
1569 break;
1570 }
1571 }
1572
1573 if (patt == f32_patt)
1574 {
1575 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1576 /* Limit number of NOPs to 2 for older processors. */
1577 max_number_of_nops = 2;
1578 }
1579 else
1580 {
1581 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1582 /* Limit number of NOPs to 7 for newer processors. */
1583 max_number_of_nops = 7;
1584 }
1585 }
1586
1587 if (limit == 0)
1588 limit = max_single_nop_size;
1589
1590 if (fragP->fr_type == rs_fill_nop)
1591 {
1592 /* Output NOPs for .nop directive. */
1593 if (limit > max_single_nop_size)
1594 {
1595 as_bad_where (fragP->fr_file, fragP->fr_line,
1596 _("invalid single nop size: %d "
1597 "(expect within [0, %d])"),
1598 limit, max_single_nop_size);
1599 return;
1600 }
1601 }
1602 else if (fragP->fr_type != rs_machine_dependent)
1603 fragP->fr_var = count;
1604
1605 if ((count / max_single_nop_size) > max_number_of_nops)
1606 {
1607 /* Generate jump over NOPs. */
1608 offsetT disp = count - 2;
1609 if (fits_in_imm7 (disp))
1610 {
1611 /* Use "jmp disp8" if possible. */
1612 count = disp;
1613 where[0] = jump_disp8[0];
1614 where[1] = count;
1615 where += 2;
1616 }
1617 else
1618 {
1619 unsigned int size_of_jump;
1620
1621 if (flag_code == CODE_16BIT)
1622 {
1623 where[0] = jump16_disp32[0];
1624 where[1] = jump16_disp32[1];
1625 size_of_jump = 2;
1626 }
1627 else
1628 {
1629 where[0] = jump32_disp32[0];
1630 size_of_jump = 1;
1631 }
1632
1633 count -= size_of_jump + 4;
1634 if (!fits_in_imm31 (count))
1635 {
1636 as_bad_where (fragP->fr_file, fragP->fr_line,
1637 _("jump over nop padding out of range"));
1638 return;
1639 }
1640
1641 md_number_to_chars (where + size_of_jump, count, 4);
1642 where += size_of_jump + 4;
1643 }
1644 }
1645
1646 /* Generate multiple NOPs. */
1647 i386_output_nops (where, patt, count, limit);
1648 }
1649
1650 static INLINE int
1651 operand_type_all_zero (const union i386_operand_type *x)
1652 {
1653 switch (ARRAY_SIZE(x->array))
1654 {
1655 case 3:
1656 if (x->array[2])
1657 return 0;
1658 /* Fall through. */
1659 case 2:
1660 if (x->array[1])
1661 return 0;
1662 /* Fall through. */
1663 case 1:
1664 return !x->array[0];
1665 default:
1666 abort ();
1667 }
1668 }
1669
1670 static INLINE void
1671 operand_type_set (union i386_operand_type *x, unsigned int v)
1672 {
1673 switch (ARRAY_SIZE(x->array))
1674 {
1675 case 3:
1676 x->array[2] = v;
1677 /* Fall through. */
1678 case 2:
1679 x->array[1] = v;
1680 /* Fall through. */
1681 case 1:
1682 x->array[0] = v;
1683 /* Fall through. */
1684 break;
1685 default:
1686 abort ();
1687 }
1688
1689 x->bitfield.class = ClassNone;
1690 x->bitfield.instance = InstanceNone;
1691 }
1692
1693 static INLINE int
1694 operand_type_equal (const union i386_operand_type *x,
1695 const union i386_operand_type *y)
1696 {
1697 switch (ARRAY_SIZE(x->array))
1698 {
1699 case 3:
1700 if (x->array[2] != y->array[2])
1701 return 0;
1702 /* Fall through. */
1703 case 2:
1704 if (x->array[1] != y->array[1])
1705 return 0;
1706 /* Fall through. */
1707 case 1:
1708 return x->array[0] == y->array[0];
1709 break;
1710 default:
1711 abort ();
1712 }
1713 }
1714
1715 static INLINE int
1716 cpu_flags_all_zero (const union i386_cpu_flags *x)
1717 {
1718 switch (ARRAY_SIZE(x->array))
1719 {
1720 case 4:
1721 if (x->array[3])
1722 return 0;
1723 /* Fall through. */
1724 case 3:
1725 if (x->array[2])
1726 return 0;
1727 /* Fall through. */
1728 case 2:
1729 if (x->array[1])
1730 return 0;
1731 /* Fall through. */
1732 case 1:
1733 return !x->array[0];
1734 default:
1735 abort ();
1736 }
1737 }
1738
1739 static INLINE int
1740 cpu_flags_equal (const union i386_cpu_flags *x,
1741 const union i386_cpu_flags *y)
1742 {
1743 switch (ARRAY_SIZE(x->array))
1744 {
1745 case 4:
1746 if (x->array[3] != y->array[3])
1747 return 0;
1748 /* Fall through. */
1749 case 3:
1750 if (x->array[2] != y->array[2])
1751 return 0;
1752 /* Fall through. */
1753 case 2:
1754 if (x->array[1] != y->array[1])
1755 return 0;
1756 /* Fall through. */
1757 case 1:
1758 return x->array[0] == y->array[0];
1759 break;
1760 default:
1761 abort ();
1762 }
1763 }
1764
1765 static INLINE int
1766 cpu_flags_check_cpu64 (i386_cpu_flags f)
1767 {
1768 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1769 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1770 }
1771
1772 static INLINE i386_cpu_flags
1773 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1774 {
1775 switch (ARRAY_SIZE (x.array))
1776 {
1777 case 4:
1778 x.array [3] &= y.array [3];
1779 /* Fall through. */
1780 case 3:
1781 x.array [2] &= y.array [2];
1782 /* Fall through. */
1783 case 2:
1784 x.array [1] &= y.array [1];
1785 /* Fall through. */
1786 case 1:
1787 x.array [0] &= y.array [0];
1788 break;
1789 default:
1790 abort ();
1791 }
1792 return x;
1793 }
1794
1795 static INLINE i386_cpu_flags
1796 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1797 {
1798 switch (ARRAY_SIZE (x.array))
1799 {
1800 case 4:
1801 x.array [3] |= y.array [3];
1802 /* Fall through. */
1803 case 3:
1804 x.array [2] |= y.array [2];
1805 /* Fall through. */
1806 case 2:
1807 x.array [1] |= y.array [1];
1808 /* Fall through. */
1809 case 1:
1810 x.array [0] |= y.array [0];
1811 break;
1812 default:
1813 abort ();
1814 }
1815 return x;
1816 }
1817
1818 static INLINE i386_cpu_flags
1819 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1820 {
1821 switch (ARRAY_SIZE (x.array))
1822 {
1823 case 4:
1824 x.array [3] &= ~y.array [3];
1825 /* Fall through. */
1826 case 3:
1827 x.array [2] &= ~y.array [2];
1828 /* Fall through. */
1829 case 2:
1830 x.array [1] &= ~y.array [1];
1831 /* Fall through. */
1832 case 1:
1833 x.array [0] &= ~y.array [0];
1834 break;
1835 default:
1836 abort ();
1837 }
1838 return x;
1839 }
1840
1841 #define CPU_FLAGS_ARCH_MATCH 0x1
1842 #define CPU_FLAGS_64BIT_MATCH 0x2
1843
1844 #define CPU_FLAGS_PERFECT_MATCH \
1845 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1846
1847 /* Return CPU flags match bits. */
1848
1849 static int
1850 cpu_flags_match (const insn_template *t)
1851 {
1852 i386_cpu_flags x = t->cpu_flags;
1853 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1854
1855 x.bitfield.cpu64 = 0;
1856 x.bitfield.cpuno64 = 0;
1857
1858 if (cpu_flags_all_zero (&x))
1859 {
1860 /* This instruction is available on all archs. */
1861 match |= CPU_FLAGS_ARCH_MATCH;
1862 }
1863 else
1864 {
1865 /* This instruction is available only on some archs. */
1866 i386_cpu_flags cpu = cpu_arch_flags;
1867
1868 /* AVX512VL is no standalone feature - match it and then strip it. */
1869 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1870 return match;
1871 x.bitfield.cpuavx512vl = 0;
1872
1873 cpu = cpu_flags_and (x, cpu);
1874 if (!cpu_flags_all_zero (&cpu))
1875 {
1876 if (x.bitfield.cpuavx)
1877 {
1878 /* We need to check a few extra flags with AVX. */
1879 if (cpu.bitfield.cpuavx
1880 && (!t->opcode_modifier.sse2avx || sse2avx)
1881 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1882 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1883 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1884 match |= CPU_FLAGS_ARCH_MATCH;
1885 }
1886 else if (x.bitfield.cpuavx512f)
1887 {
1888 /* We need to check a few extra flags with AVX512F. */
1889 if (cpu.bitfield.cpuavx512f
1890 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1891 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1892 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1893 match |= CPU_FLAGS_ARCH_MATCH;
1894 }
1895 else
1896 match |= CPU_FLAGS_ARCH_MATCH;
1897 }
1898 }
1899 return match;
1900 }
1901
1902 static INLINE i386_operand_type
1903 operand_type_and (i386_operand_type x, i386_operand_type y)
1904 {
1905 if (x.bitfield.class != y.bitfield.class)
1906 x.bitfield.class = ClassNone;
1907 if (x.bitfield.instance != y.bitfield.instance)
1908 x.bitfield.instance = InstanceNone;
1909
1910 switch (ARRAY_SIZE (x.array))
1911 {
1912 case 3:
1913 x.array [2] &= y.array [2];
1914 /* Fall through. */
1915 case 2:
1916 x.array [1] &= y.array [1];
1917 /* Fall through. */
1918 case 1:
1919 x.array [0] &= y.array [0];
1920 break;
1921 default:
1922 abort ();
1923 }
1924 return x;
1925 }
1926
1927 static INLINE i386_operand_type
1928 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1929 {
1930 gas_assert (y.bitfield.class == ClassNone);
1931 gas_assert (y.bitfield.instance == InstanceNone);
1932
1933 switch (ARRAY_SIZE (x.array))
1934 {
1935 case 3:
1936 x.array [2] &= ~y.array [2];
1937 /* Fall through. */
1938 case 2:
1939 x.array [1] &= ~y.array [1];
1940 /* Fall through. */
1941 case 1:
1942 x.array [0] &= ~y.array [0];
1943 break;
1944 default:
1945 abort ();
1946 }
1947 return x;
1948 }
1949
1950 static INLINE i386_operand_type
1951 operand_type_or (i386_operand_type x, i386_operand_type y)
1952 {
1953 gas_assert (x.bitfield.class == ClassNone ||
1954 y.bitfield.class == ClassNone ||
1955 x.bitfield.class == y.bitfield.class);
1956 gas_assert (x.bitfield.instance == InstanceNone ||
1957 y.bitfield.instance == InstanceNone ||
1958 x.bitfield.instance == y.bitfield.instance);
1959
1960 switch (ARRAY_SIZE (x.array))
1961 {
1962 case 3:
1963 x.array [2] |= y.array [2];
1964 /* Fall through. */
1965 case 2:
1966 x.array [1] |= y.array [1];
1967 /* Fall through. */
1968 case 1:
1969 x.array [0] |= y.array [0];
1970 break;
1971 default:
1972 abort ();
1973 }
1974 return x;
1975 }
1976
1977 static INLINE i386_operand_type
1978 operand_type_xor (i386_operand_type x, i386_operand_type y)
1979 {
1980 gas_assert (y.bitfield.class == ClassNone);
1981 gas_assert (y.bitfield.instance == InstanceNone);
1982
1983 switch (ARRAY_SIZE (x.array))
1984 {
1985 case 3:
1986 x.array [2] ^= y.array [2];
1987 /* Fall through. */
1988 case 2:
1989 x.array [1] ^= y.array [1];
1990 /* Fall through. */
1991 case 1:
1992 x.array [0] ^= y.array [0];
1993 break;
1994 default:
1995 abort ();
1996 }
1997 return x;
1998 }
1999
2000 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2001 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2002 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2003 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2004 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2005 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2006 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2007 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2008 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2009 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2010 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2011 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2012 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2013 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2014 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2015 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2016 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2017
2018 enum operand_type
2019 {
2020 reg,
2021 imm,
2022 disp,
2023 anymem
2024 };
2025
2026 static INLINE int
2027 operand_type_check (i386_operand_type t, enum operand_type c)
2028 {
2029 switch (c)
2030 {
2031 case reg:
2032 return t.bitfield.class == Reg;
2033
2034 case imm:
2035 return (t.bitfield.imm8
2036 || t.bitfield.imm8s
2037 || t.bitfield.imm16
2038 || t.bitfield.imm32
2039 || t.bitfield.imm32s
2040 || t.bitfield.imm64);
2041
2042 case disp:
2043 return (t.bitfield.disp8
2044 || t.bitfield.disp16
2045 || t.bitfield.disp32
2046 || t.bitfield.disp32s
2047 || t.bitfield.disp64);
2048
2049 case anymem:
2050 return (t.bitfield.disp8
2051 || t.bitfield.disp16
2052 || t.bitfield.disp32
2053 || t.bitfield.disp32s
2054 || t.bitfield.disp64
2055 || t.bitfield.baseindex);
2056
2057 default:
2058 abort ();
2059 }
2060
2061 return 0;
2062 }
2063
2064 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2065 between operand GIVEN and opeand WANTED for instruction template T. */
2066
2067 static INLINE int
2068 match_operand_size (const insn_template *t, unsigned int wanted,
2069 unsigned int given)
2070 {
2071 return !((i.types[given].bitfield.byte
2072 && !t->operand_types[wanted].bitfield.byte)
2073 || (i.types[given].bitfield.word
2074 && !t->operand_types[wanted].bitfield.word)
2075 || (i.types[given].bitfield.dword
2076 && !t->operand_types[wanted].bitfield.dword)
2077 || (i.types[given].bitfield.qword
2078 && !t->operand_types[wanted].bitfield.qword)
2079 || (i.types[given].bitfield.tbyte
2080 && !t->operand_types[wanted].bitfield.tbyte));
2081 }
2082
2083 /* Return 1 if there is no conflict in SIMD register between operand
2084 GIVEN and opeand WANTED for instruction template T. */
2085
2086 static INLINE int
2087 match_simd_size (const insn_template *t, unsigned int wanted,
2088 unsigned int given)
2089 {
2090 return !((i.types[given].bitfield.xmmword
2091 && !t->operand_types[wanted].bitfield.xmmword)
2092 || (i.types[given].bitfield.ymmword
2093 && !t->operand_types[wanted].bitfield.ymmword)
2094 || (i.types[given].bitfield.zmmword
2095 && !t->operand_types[wanted].bitfield.zmmword));
2096 }
2097
2098 /* Return 1 if there is no conflict in any size between operand GIVEN
2099 and opeand WANTED for instruction template T. */
2100
2101 static INLINE int
2102 match_mem_size (const insn_template *t, unsigned int wanted,
2103 unsigned int given)
2104 {
2105 return (match_operand_size (t, wanted, given)
2106 && !((i.types[given].bitfield.unspecified
2107 && !i.broadcast
2108 && !t->operand_types[wanted].bitfield.unspecified)
2109 || (i.types[given].bitfield.fword
2110 && !t->operand_types[wanted].bitfield.fword)
2111 /* For scalar opcode templates to allow register and memory
2112 operands at the same time, some special casing is needed
2113 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2114 down-conversion vpmov*. */
2115 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2116 && !t->opcode_modifier.broadcast
2117 && (t->operand_types[wanted].bitfield.byte
2118 || t->operand_types[wanted].bitfield.word
2119 || t->operand_types[wanted].bitfield.dword
2120 || t->operand_types[wanted].bitfield.qword))
2121 ? (i.types[given].bitfield.xmmword
2122 || i.types[given].bitfield.ymmword
2123 || i.types[given].bitfield.zmmword)
2124 : !match_simd_size(t, wanted, given))));
2125 }
2126
2127 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2128 operands for instruction template T, and it has MATCH_REVERSE set if there
2129 is no size conflict on any operands for the template with operands reversed
2130 (and the template allows for reversing in the first place). */
2131
2132 #define MATCH_STRAIGHT 1
2133 #define MATCH_REVERSE 2
2134
2135 static INLINE unsigned int
2136 operand_size_match (const insn_template *t)
2137 {
2138 unsigned int j, match = MATCH_STRAIGHT;
2139
2140 /* Don't check non-absolute jump instructions. */
2141 if (t->opcode_modifier.jump
2142 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2143 return match;
2144
2145 /* Check memory and accumulator operand size. */
2146 for (j = 0; j < i.operands; j++)
2147 {
2148 if (i.types[j].bitfield.class != Reg
2149 && i.types[j].bitfield.class != RegSIMD
2150 && t->opcode_modifier.anysize)
2151 continue;
2152
2153 if (t->operand_types[j].bitfield.class == Reg
2154 && !match_operand_size (t, j, j))
2155 {
2156 match = 0;
2157 break;
2158 }
2159
2160 if (t->operand_types[j].bitfield.class == RegSIMD
2161 && !match_simd_size (t, j, j))
2162 {
2163 match = 0;
2164 break;
2165 }
2166
2167 if (t->operand_types[j].bitfield.instance == Accum
2168 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2169 {
2170 match = 0;
2171 break;
2172 }
2173
2174 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2175 {
2176 match = 0;
2177 break;
2178 }
2179 }
2180
2181 if (!t->opcode_modifier.d)
2182 {
2183 mismatch:
2184 if (!match)
2185 i.error = operand_size_mismatch;
2186 return match;
2187 }
2188
2189 /* Check reverse. */
2190 gas_assert (i.operands >= 2 && i.operands <= 3);
2191
2192 for (j = 0; j < i.operands; j++)
2193 {
2194 unsigned int given = i.operands - j - 1;
2195
2196 if (t->operand_types[j].bitfield.class == Reg
2197 && !match_operand_size (t, j, given))
2198 goto mismatch;
2199
2200 if (t->operand_types[j].bitfield.class == RegSIMD
2201 && !match_simd_size (t, j, given))
2202 goto mismatch;
2203
2204 if (t->operand_types[j].bitfield.instance == Accum
2205 && (!match_operand_size (t, j, given)
2206 || !match_simd_size (t, j, given)))
2207 goto mismatch;
2208
2209 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2210 goto mismatch;
2211 }
2212
2213 return match | MATCH_REVERSE;
2214 }
2215
2216 static INLINE int
2217 operand_type_match (i386_operand_type overlap,
2218 i386_operand_type given)
2219 {
2220 i386_operand_type temp = overlap;
2221
2222 temp.bitfield.unspecified = 0;
2223 temp.bitfield.byte = 0;
2224 temp.bitfield.word = 0;
2225 temp.bitfield.dword = 0;
2226 temp.bitfield.fword = 0;
2227 temp.bitfield.qword = 0;
2228 temp.bitfield.tbyte = 0;
2229 temp.bitfield.xmmword = 0;
2230 temp.bitfield.ymmword = 0;
2231 temp.bitfield.zmmword = 0;
2232 if (operand_type_all_zero (&temp))
2233 goto mismatch;
2234
2235 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2236 return 1;
2237
2238 mismatch:
2239 i.error = operand_type_mismatch;
2240 return 0;
2241 }
2242
2243 /* If given types g0 and g1 are registers they must be of the same type
2244 unless the expected operand type register overlap is null.
2245 Memory operand size of certain SIMD instructions is also being checked
2246 here. */
2247
2248 static INLINE int
2249 operand_type_register_match (i386_operand_type g0,
2250 i386_operand_type t0,
2251 i386_operand_type g1,
2252 i386_operand_type t1)
2253 {
2254 if (g0.bitfield.class != Reg
2255 && g0.bitfield.class != RegSIMD
2256 && (!operand_type_check (g0, anymem)
2257 || g0.bitfield.unspecified
2258 || t0.bitfield.class != RegSIMD))
2259 return 1;
2260
2261 if (g1.bitfield.class != Reg
2262 && g1.bitfield.class != RegSIMD
2263 && (!operand_type_check (g1, anymem)
2264 || g1.bitfield.unspecified
2265 || t1.bitfield.class != RegSIMD))
2266 return 1;
2267
2268 if (g0.bitfield.byte == g1.bitfield.byte
2269 && g0.bitfield.word == g1.bitfield.word
2270 && g0.bitfield.dword == g1.bitfield.dword
2271 && g0.bitfield.qword == g1.bitfield.qword
2272 && g0.bitfield.xmmword == g1.bitfield.xmmword
2273 && g0.bitfield.ymmword == g1.bitfield.ymmword
2274 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2275 return 1;
2276
2277 if (!(t0.bitfield.byte & t1.bitfield.byte)
2278 && !(t0.bitfield.word & t1.bitfield.word)
2279 && !(t0.bitfield.dword & t1.bitfield.dword)
2280 && !(t0.bitfield.qword & t1.bitfield.qword)
2281 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2282 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2283 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2284 return 1;
2285
2286 i.error = register_type_mismatch;
2287
2288 return 0;
2289 }
2290
2291 static INLINE unsigned int
2292 register_number (const reg_entry *r)
2293 {
2294 unsigned int nr = r->reg_num;
2295
2296 if (r->reg_flags & RegRex)
2297 nr += 8;
2298
2299 if (r->reg_flags & RegVRex)
2300 nr += 16;
2301
2302 return nr;
2303 }
2304
2305 static INLINE unsigned int
2306 mode_from_disp_size (i386_operand_type t)
2307 {
2308 if (t.bitfield.disp8)
2309 return 1;
2310 else if (t.bitfield.disp16
2311 || t.bitfield.disp32
2312 || t.bitfield.disp32s)
2313 return 2;
2314 else
2315 return 0;
2316 }
2317
2318 static INLINE int
2319 fits_in_signed_byte (addressT num)
2320 {
2321 return num + 0x80 <= 0xff;
2322 }
2323
2324 static INLINE int
2325 fits_in_unsigned_byte (addressT num)
2326 {
2327 return num <= 0xff;
2328 }
2329
2330 static INLINE int
2331 fits_in_unsigned_word (addressT num)
2332 {
2333 return num <= 0xffff;
2334 }
2335
2336 static INLINE int
2337 fits_in_signed_word (addressT num)
2338 {
2339 return num + 0x8000 <= 0xffff;
2340 }
2341
2342 static INLINE int
2343 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2344 {
2345 #ifndef BFD64
2346 return 1;
2347 #else
2348 return num + 0x80000000 <= 0xffffffff;
2349 #endif
2350 } /* fits_in_signed_long() */
2351
2352 static INLINE int
2353 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2354 {
2355 #ifndef BFD64
2356 return 1;
2357 #else
2358 return num <= 0xffffffff;
2359 #endif
2360 } /* fits_in_unsigned_long() */
2361
2362 static INLINE int
2363 fits_in_disp8 (offsetT num)
2364 {
2365 int shift = i.memshift;
2366 unsigned int mask;
2367
2368 if (shift == -1)
2369 abort ();
2370
2371 mask = (1 << shift) - 1;
2372
2373 /* Return 0 if NUM isn't properly aligned. */
2374 if ((num & mask))
2375 return 0;
2376
2377 /* Check if NUM will fit in 8bit after shift. */
2378 return fits_in_signed_byte (num >> shift);
2379 }
2380
2381 static INLINE int
2382 fits_in_imm4 (offsetT num)
2383 {
2384 return (num & 0xf) == num;
2385 }
2386
2387 static i386_operand_type
2388 smallest_imm_type (offsetT num)
2389 {
2390 i386_operand_type t;
2391
2392 operand_type_set (&t, 0);
2393 t.bitfield.imm64 = 1;
2394
2395 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2396 {
2397 /* This code is disabled on the 486 because all the Imm1 forms
2398 in the opcode table are slower on the i486. They're the
2399 versions with the implicitly specified single-position
2400 displacement, which has another syntax if you really want to
2401 use that form. */
2402 t.bitfield.imm1 = 1;
2403 t.bitfield.imm8 = 1;
2404 t.bitfield.imm8s = 1;
2405 t.bitfield.imm16 = 1;
2406 t.bitfield.imm32 = 1;
2407 t.bitfield.imm32s = 1;
2408 }
2409 else if (fits_in_signed_byte (num))
2410 {
2411 t.bitfield.imm8 = 1;
2412 t.bitfield.imm8s = 1;
2413 t.bitfield.imm16 = 1;
2414 t.bitfield.imm32 = 1;
2415 t.bitfield.imm32s = 1;
2416 }
2417 else if (fits_in_unsigned_byte (num))
2418 {
2419 t.bitfield.imm8 = 1;
2420 t.bitfield.imm16 = 1;
2421 t.bitfield.imm32 = 1;
2422 t.bitfield.imm32s = 1;
2423 }
2424 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2425 {
2426 t.bitfield.imm16 = 1;
2427 t.bitfield.imm32 = 1;
2428 t.bitfield.imm32s = 1;
2429 }
2430 else if (fits_in_signed_long (num))
2431 {
2432 t.bitfield.imm32 = 1;
2433 t.bitfield.imm32s = 1;
2434 }
2435 else if (fits_in_unsigned_long (num))
2436 t.bitfield.imm32 = 1;
2437
2438 return t;
2439 }
2440
2441 static offsetT
2442 offset_in_range (offsetT val, int size)
2443 {
2444 addressT mask;
2445
2446 switch (size)
2447 {
2448 case 1: mask = ((addressT) 1 << 8) - 1; break;
2449 case 2: mask = ((addressT) 1 << 16) - 1; break;
2450 case 4: mask = ((addressT) 2 << 31) - 1; break;
2451 #ifdef BFD64
2452 case 8: mask = ((addressT) 2 << 63) - 1; break;
2453 #endif
2454 default: abort ();
2455 }
2456
2457 #ifdef BFD64
2458 /* If BFD64, sign extend val for 32bit address mode. */
2459 if (flag_code != CODE_64BIT
2460 || i.prefix[ADDR_PREFIX])
2461 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2462 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2463 #endif
2464
2465 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2466 {
2467 char buf1[40], buf2[40];
2468
2469 sprint_value (buf1, val);
2470 sprint_value (buf2, val & mask);
2471 as_warn (_("%s shortened to %s"), buf1, buf2);
2472 }
2473 return val & mask;
2474 }
2475
2476 enum PREFIX_GROUP
2477 {
2478 PREFIX_EXIST = 0,
2479 PREFIX_LOCK,
2480 PREFIX_REP,
2481 PREFIX_DS,
2482 PREFIX_OTHER
2483 };
2484
2485 /* Returns
2486 a. PREFIX_EXIST if attempting to add a prefix where one from the
2487 same class already exists.
2488 b. PREFIX_LOCK if lock prefix is added.
2489 c. PREFIX_REP if rep/repne prefix is added.
2490 d. PREFIX_DS if ds prefix is added.
2491 e. PREFIX_OTHER if other prefix is added.
2492 */
2493
2494 static enum PREFIX_GROUP
2495 add_prefix (unsigned int prefix)
2496 {
2497 enum PREFIX_GROUP ret = PREFIX_OTHER;
2498 unsigned int q;
2499
2500 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2501 && flag_code == CODE_64BIT)
2502 {
2503 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2504 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2505 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2506 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2507 ret = PREFIX_EXIST;
2508 q = REX_PREFIX;
2509 }
2510 else
2511 {
2512 switch (prefix)
2513 {
2514 default:
2515 abort ();
2516
2517 case DS_PREFIX_OPCODE:
2518 ret = PREFIX_DS;
2519 /* Fall through. */
2520 case CS_PREFIX_OPCODE:
2521 case ES_PREFIX_OPCODE:
2522 case FS_PREFIX_OPCODE:
2523 case GS_PREFIX_OPCODE:
2524 case SS_PREFIX_OPCODE:
2525 q = SEG_PREFIX;
2526 break;
2527
2528 case REPNE_PREFIX_OPCODE:
2529 case REPE_PREFIX_OPCODE:
2530 q = REP_PREFIX;
2531 ret = PREFIX_REP;
2532 break;
2533
2534 case LOCK_PREFIX_OPCODE:
2535 q = LOCK_PREFIX;
2536 ret = PREFIX_LOCK;
2537 break;
2538
2539 case FWAIT_OPCODE:
2540 q = WAIT_PREFIX;
2541 break;
2542
2543 case ADDR_PREFIX_OPCODE:
2544 q = ADDR_PREFIX;
2545 break;
2546
2547 case DATA_PREFIX_OPCODE:
2548 q = DATA_PREFIX;
2549 break;
2550 }
2551 if (i.prefix[q] != 0)
2552 ret = PREFIX_EXIST;
2553 }
2554
2555 if (ret)
2556 {
2557 if (!i.prefix[q])
2558 ++i.prefixes;
2559 i.prefix[q] |= prefix;
2560 }
2561 else
2562 as_bad (_("same type of prefix used twice"));
2563
2564 return ret;
2565 }
2566
2567 static void
2568 update_code_flag (int value, int check)
2569 {
2570 PRINTF_LIKE ((*as_error));
2571
2572 flag_code = (enum flag_code) value;
2573 if (flag_code == CODE_64BIT)
2574 {
2575 cpu_arch_flags.bitfield.cpu64 = 1;
2576 cpu_arch_flags.bitfield.cpuno64 = 0;
2577 }
2578 else
2579 {
2580 cpu_arch_flags.bitfield.cpu64 = 0;
2581 cpu_arch_flags.bitfield.cpuno64 = 1;
2582 }
2583 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2584 {
2585 if (check)
2586 as_error = as_fatal;
2587 else
2588 as_error = as_bad;
2589 (*as_error) (_("64bit mode not supported on `%s'."),
2590 cpu_arch_name ? cpu_arch_name : default_arch);
2591 }
2592 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2593 {
2594 if (check)
2595 as_error = as_fatal;
2596 else
2597 as_error = as_bad;
2598 (*as_error) (_("32bit mode not supported on `%s'."),
2599 cpu_arch_name ? cpu_arch_name : default_arch);
2600 }
2601 stackop_size = '\0';
2602 }
2603
2604 static void
2605 set_code_flag (int value)
2606 {
2607 update_code_flag (value, 0);
2608 }
2609
2610 static void
2611 set_16bit_gcc_code_flag (int new_code_flag)
2612 {
2613 flag_code = (enum flag_code) new_code_flag;
2614 if (flag_code != CODE_16BIT)
2615 abort ();
2616 cpu_arch_flags.bitfield.cpu64 = 0;
2617 cpu_arch_flags.bitfield.cpuno64 = 1;
2618 stackop_size = LONG_MNEM_SUFFIX;
2619 }
2620
2621 static void
2622 set_intel_syntax (int syntax_flag)
2623 {
2624 /* Find out if register prefixing is specified. */
2625 int ask_naked_reg = 0;
2626
2627 SKIP_WHITESPACE ();
2628 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2629 {
2630 char *string;
2631 int e = get_symbol_name (&string);
2632
2633 if (strcmp (string, "prefix") == 0)
2634 ask_naked_reg = 1;
2635 else if (strcmp (string, "noprefix") == 0)
2636 ask_naked_reg = -1;
2637 else
2638 as_bad (_("bad argument to syntax directive."));
2639 (void) restore_line_pointer (e);
2640 }
2641 demand_empty_rest_of_line ();
2642
2643 intel_syntax = syntax_flag;
2644
2645 if (ask_naked_reg == 0)
2646 allow_naked_reg = (intel_syntax
2647 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2648 else
2649 allow_naked_reg = (ask_naked_reg < 0);
2650
2651 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2652
2653 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2654 identifier_chars['$'] = intel_syntax ? '$' : 0;
2655 register_prefix = allow_naked_reg ? "" : "%";
2656 }
2657
2658 static void
2659 set_intel_mnemonic (int mnemonic_flag)
2660 {
2661 intel_mnemonic = mnemonic_flag;
2662 }
2663
2664 static void
2665 set_allow_index_reg (int flag)
2666 {
2667 allow_index_reg = flag;
2668 }
2669
2670 static void
2671 set_check (int what)
2672 {
2673 enum check_kind *kind;
2674 const char *str;
2675
2676 if (what)
2677 {
2678 kind = &operand_check;
2679 str = "operand";
2680 }
2681 else
2682 {
2683 kind = &sse_check;
2684 str = "sse";
2685 }
2686
2687 SKIP_WHITESPACE ();
2688
2689 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2690 {
2691 char *string;
2692 int e = get_symbol_name (&string);
2693
2694 if (strcmp (string, "none") == 0)
2695 *kind = check_none;
2696 else if (strcmp (string, "warning") == 0)
2697 *kind = check_warning;
2698 else if (strcmp (string, "error") == 0)
2699 *kind = check_error;
2700 else
2701 as_bad (_("bad argument to %s_check directive."), str);
2702 (void) restore_line_pointer (e);
2703 }
2704 else
2705 as_bad (_("missing argument for %s_check directive"), str);
2706
2707 demand_empty_rest_of_line ();
2708 }
2709
2710 static void
2711 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2712 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2713 {
2714 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2715 static const char *arch;
2716
2717 /* Intel LIOM is only supported on ELF. */
2718 if (!IS_ELF)
2719 return;
2720
2721 if (!arch)
2722 {
2723 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2724 use default_arch. */
2725 arch = cpu_arch_name;
2726 if (!arch)
2727 arch = default_arch;
2728 }
2729
2730 /* If we are targeting Intel MCU, we must enable it. */
2731 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2732 || new_flag.bitfield.cpuiamcu)
2733 return;
2734
2735 /* If we are targeting Intel L1OM, we must enable it. */
2736 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2737 || new_flag.bitfield.cpul1om)
2738 return;
2739
2740 /* If we are targeting Intel K1OM, we must enable it. */
2741 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2742 || new_flag.bitfield.cpuk1om)
2743 return;
2744
2745 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2746 #endif
2747 }
2748
2749 static void
2750 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2751 {
2752 SKIP_WHITESPACE ();
2753
2754 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2755 {
2756 char *string;
2757 int e = get_symbol_name (&string);
2758 unsigned int j;
2759 i386_cpu_flags flags;
2760
2761 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2762 {
2763 if (strcmp (string, cpu_arch[j].name) == 0)
2764 {
2765 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2766
2767 if (*string != '.')
2768 {
2769 cpu_arch_name = cpu_arch[j].name;
2770 cpu_sub_arch_name = NULL;
2771 cpu_arch_flags = cpu_arch[j].flags;
2772 if (flag_code == CODE_64BIT)
2773 {
2774 cpu_arch_flags.bitfield.cpu64 = 1;
2775 cpu_arch_flags.bitfield.cpuno64 = 0;
2776 }
2777 else
2778 {
2779 cpu_arch_flags.bitfield.cpu64 = 0;
2780 cpu_arch_flags.bitfield.cpuno64 = 1;
2781 }
2782 cpu_arch_isa = cpu_arch[j].type;
2783 cpu_arch_isa_flags = cpu_arch[j].flags;
2784 if (!cpu_arch_tune_set)
2785 {
2786 cpu_arch_tune = cpu_arch_isa;
2787 cpu_arch_tune_flags = cpu_arch_isa_flags;
2788 }
2789 break;
2790 }
2791
2792 flags = cpu_flags_or (cpu_arch_flags,
2793 cpu_arch[j].flags);
2794
2795 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2796 {
2797 if (cpu_sub_arch_name)
2798 {
2799 char *name = cpu_sub_arch_name;
2800 cpu_sub_arch_name = concat (name,
2801 cpu_arch[j].name,
2802 (const char *) NULL);
2803 free (name);
2804 }
2805 else
2806 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2807 cpu_arch_flags = flags;
2808 cpu_arch_isa_flags = flags;
2809 }
2810 else
2811 cpu_arch_isa_flags
2812 = cpu_flags_or (cpu_arch_isa_flags,
2813 cpu_arch[j].flags);
2814 (void) restore_line_pointer (e);
2815 demand_empty_rest_of_line ();
2816 return;
2817 }
2818 }
2819
2820 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2821 {
2822 /* Disable an ISA extension. */
2823 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2824 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2825 {
2826 flags = cpu_flags_and_not (cpu_arch_flags,
2827 cpu_noarch[j].flags);
2828 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2829 {
2830 if (cpu_sub_arch_name)
2831 {
2832 char *name = cpu_sub_arch_name;
2833 cpu_sub_arch_name = concat (name, string,
2834 (const char *) NULL);
2835 free (name);
2836 }
2837 else
2838 cpu_sub_arch_name = xstrdup (string);
2839 cpu_arch_flags = flags;
2840 cpu_arch_isa_flags = flags;
2841 }
2842 (void) restore_line_pointer (e);
2843 demand_empty_rest_of_line ();
2844 return;
2845 }
2846
2847 j = ARRAY_SIZE (cpu_arch);
2848 }
2849
2850 if (j >= ARRAY_SIZE (cpu_arch))
2851 as_bad (_("no such architecture: `%s'"), string);
2852
2853 *input_line_pointer = e;
2854 }
2855 else
2856 as_bad (_("missing cpu architecture"));
2857
2858 no_cond_jump_promotion = 0;
2859 if (*input_line_pointer == ','
2860 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2861 {
2862 char *string;
2863 char e;
2864
2865 ++input_line_pointer;
2866 e = get_symbol_name (&string);
2867
2868 if (strcmp (string, "nojumps") == 0)
2869 no_cond_jump_promotion = 1;
2870 else if (strcmp (string, "jumps") == 0)
2871 ;
2872 else
2873 as_bad (_("no such architecture modifier: `%s'"), string);
2874
2875 (void) restore_line_pointer (e);
2876 }
2877
2878 demand_empty_rest_of_line ();
2879 }
2880
2881 enum bfd_architecture
2882 i386_arch (void)
2883 {
2884 if (cpu_arch_isa == PROCESSOR_L1OM)
2885 {
2886 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2887 || flag_code != CODE_64BIT)
2888 as_fatal (_("Intel L1OM is 64bit ELF only"));
2889 return bfd_arch_l1om;
2890 }
2891 else if (cpu_arch_isa == PROCESSOR_K1OM)
2892 {
2893 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2894 || flag_code != CODE_64BIT)
2895 as_fatal (_("Intel K1OM is 64bit ELF only"));
2896 return bfd_arch_k1om;
2897 }
2898 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2899 {
2900 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2901 || flag_code == CODE_64BIT)
2902 as_fatal (_("Intel MCU is 32bit ELF only"));
2903 return bfd_arch_iamcu;
2904 }
2905 else
2906 return bfd_arch_i386;
2907 }
2908
2909 unsigned long
2910 i386_mach (void)
2911 {
2912 if (!strncmp (default_arch, "x86_64", 6))
2913 {
2914 if (cpu_arch_isa == PROCESSOR_L1OM)
2915 {
2916 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2917 || default_arch[6] != '\0')
2918 as_fatal (_("Intel L1OM is 64bit ELF only"));
2919 return bfd_mach_l1om;
2920 }
2921 else if (cpu_arch_isa == PROCESSOR_K1OM)
2922 {
2923 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2924 || default_arch[6] != '\0')
2925 as_fatal (_("Intel K1OM is 64bit ELF only"));
2926 return bfd_mach_k1om;
2927 }
2928 else if (default_arch[6] == '\0')
2929 return bfd_mach_x86_64;
2930 else
2931 return bfd_mach_x64_32;
2932 }
2933 else if (!strcmp (default_arch, "i386")
2934 || !strcmp (default_arch, "iamcu"))
2935 {
2936 if (cpu_arch_isa == PROCESSOR_IAMCU)
2937 {
2938 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2939 as_fatal (_("Intel MCU is 32bit ELF only"));
2940 return bfd_mach_i386_iamcu;
2941 }
2942 else
2943 return bfd_mach_i386_i386;
2944 }
2945 else
2946 as_fatal (_("unknown architecture"));
2947 }
2948 \f
2949 void
2950 md_begin (void)
2951 {
2952 const char *hash_err;
2953
2954 /* Support pseudo prefixes like {disp32}. */
2955 lex_type ['{'] = LEX_BEGIN_NAME;
2956
2957 /* Initialize op_hash hash table. */
2958 op_hash = hash_new ();
2959
2960 {
2961 const insn_template *optab;
2962 templates *core_optab;
2963
2964 /* Setup for loop. */
2965 optab = i386_optab;
2966 core_optab = XNEW (templates);
2967 core_optab->start = optab;
2968
2969 while (1)
2970 {
2971 ++optab;
2972 if (optab->name == NULL
2973 || strcmp (optab->name, (optab - 1)->name) != 0)
2974 {
2975 /* different name --> ship out current template list;
2976 add to hash table; & begin anew. */
2977 core_optab->end = optab;
2978 hash_err = hash_insert (op_hash,
2979 (optab - 1)->name,
2980 (void *) core_optab);
2981 if (hash_err)
2982 {
2983 as_fatal (_("can't hash %s: %s"),
2984 (optab - 1)->name,
2985 hash_err);
2986 }
2987 if (optab->name == NULL)
2988 break;
2989 core_optab = XNEW (templates);
2990 core_optab->start = optab;
2991 }
2992 }
2993 }
2994
2995 /* Initialize reg_hash hash table. */
2996 reg_hash = hash_new ();
2997 {
2998 const reg_entry *regtab;
2999 unsigned int regtab_size = i386_regtab_size;
3000
3001 for (regtab = i386_regtab; regtab_size--; regtab++)
3002 {
3003 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3004 if (hash_err)
3005 as_fatal (_("can't hash %s: %s"),
3006 regtab->reg_name,
3007 hash_err);
3008 }
3009 }
3010
3011 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3012 {
3013 int c;
3014 char *p;
3015
3016 for (c = 0; c < 256; c++)
3017 {
3018 if (ISDIGIT (c))
3019 {
3020 digit_chars[c] = c;
3021 mnemonic_chars[c] = c;
3022 register_chars[c] = c;
3023 operand_chars[c] = c;
3024 }
3025 else if (ISLOWER (c))
3026 {
3027 mnemonic_chars[c] = c;
3028 register_chars[c] = c;
3029 operand_chars[c] = c;
3030 }
3031 else if (ISUPPER (c))
3032 {
3033 mnemonic_chars[c] = TOLOWER (c);
3034 register_chars[c] = mnemonic_chars[c];
3035 operand_chars[c] = c;
3036 }
3037 else if (c == '{' || c == '}')
3038 {
3039 mnemonic_chars[c] = c;
3040 operand_chars[c] = c;
3041 }
3042
3043 if (ISALPHA (c) || ISDIGIT (c))
3044 identifier_chars[c] = c;
3045 else if (c >= 128)
3046 {
3047 identifier_chars[c] = c;
3048 operand_chars[c] = c;
3049 }
3050 }
3051
3052 #ifdef LEX_AT
3053 identifier_chars['@'] = '@';
3054 #endif
3055 #ifdef LEX_QM
3056 identifier_chars['?'] = '?';
3057 operand_chars['?'] = '?';
3058 #endif
3059 digit_chars['-'] = '-';
3060 mnemonic_chars['_'] = '_';
3061 mnemonic_chars['-'] = '-';
3062 mnemonic_chars['.'] = '.';
3063 identifier_chars['_'] = '_';
3064 identifier_chars['.'] = '.';
3065
3066 for (p = operand_special_chars; *p != '\0'; p++)
3067 operand_chars[(unsigned char) *p] = *p;
3068 }
3069
3070 if (flag_code == CODE_64BIT)
3071 {
3072 #if defined (OBJ_COFF) && defined (TE_PE)
3073 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3074 ? 32 : 16);
3075 #else
3076 x86_dwarf2_return_column = 16;
3077 #endif
3078 x86_cie_data_alignment = -8;
3079 }
3080 else
3081 {
3082 x86_dwarf2_return_column = 8;
3083 x86_cie_data_alignment = -4;
3084 }
3085
3086 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3087 can be turned into BRANCH_PREFIX frag. */
3088 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3089 abort ();
3090 }
3091
3092 void
3093 i386_print_statistics (FILE *file)
3094 {
3095 hash_print_statistics (file, "i386 opcode", op_hash);
3096 hash_print_statistics (file, "i386 register", reg_hash);
3097 }
3098 \f
3099 #ifdef DEBUG386
3100
3101 /* Debugging routines for md_assemble. */
3102 static void pte (insn_template *);
3103 static void pt (i386_operand_type);
3104 static void pe (expressionS *);
3105 static void ps (symbolS *);
3106
3107 static void
3108 pi (const char *line, i386_insn *x)
3109 {
3110 unsigned int j;
3111
3112 fprintf (stdout, "%s: template ", line);
3113 pte (&x->tm);
3114 fprintf (stdout, " address: base %s index %s scale %x\n",
3115 x->base_reg ? x->base_reg->reg_name : "none",
3116 x->index_reg ? x->index_reg->reg_name : "none",
3117 x->log2_scale_factor);
3118 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3119 x->rm.mode, x->rm.reg, x->rm.regmem);
3120 fprintf (stdout, " sib: base %x index %x scale %x\n",
3121 x->sib.base, x->sib.index, x->sib.scale);
3122 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3123 (x->rex & REX_W) != 0,
3124 (x->rex & REX_R) != 0,
3125 (x->rex & REX_X) != 0,
3126 (x->rex & REX_B) != 0);
3127 for (j = 0; j < x->operands; j++)
3128 {
3129 fprintf (stdout, " #%d: ", j + 1);
3130 pt (x->types[j]);
3131 fprintf (stdout, "\n");
3132 if (x->types[j].bitfield.class == Reg
3133 || x->types[j].bitfield.class == RegMMX
3134 || x->types[j].bitfield.class == RegSIMD
3135 || x->types[j].bitfield.class == SReg
3136 || x->types[j].bitfield.class == RegCR
3137 || x->types[j].bitfield.class == RegDR
3138 || x->types[j].bitfield.class == RegTR)
3139 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3140 if (operand_type_check (x->types[j], imm))
3141 pe (x->op[j].imms);
3142 if (operand_type_check (x->types[j], disp))
3143 pe (x->op[j].disps);
3144 }
3145 }
3146
3147 static void
3148 pte (insn_template *t)
3149 {
3150 unsigned int j;
3151 fprintf (stdout, " %d operands ", t->operands);
3152 fprintf (stdout, "opcode %x ", t->base_opcode);
3153 if (t->extension_opcode != None)
3154 fprintf (stdout, "ext %x ", t->extension_opcode);
3155 if (t->opcode_modifier.d)
3156 fprintf (stdout, "D");
3157 if (t->opcode_modifier.w)
3158 fprintf (stdout, "W");
3159 fprintf (stdout, "\n");
3160 for (j = 0; j < t->operands; j++)
3161 {
3162 fprintf (stdout, " #%d type ", j + 1);
3163 pt (t->operand_types[j]);
3164 fprintf (stdout, "\n");
3165 }
3166 }
3167
3168 static void
3169 pe (expressionS *e)
3170 {
3171 fprintf (stdout, " operation %d\n", e->X_op);
3172 fprintf (stdout, " add_number %ld (%lx)\n",
3173 (long) e->X_add_number, (long) e->X_add_number);
3174 if (e->X_add_symbol)
3175 {
3176 fprintf (stdout, " add_symbol ");
3177 ps (e->X_add_symbol);
3178 fprintf (stdout, "\n");
3179 }
3180 if (e->X_op_symbol)
3181 {
3182 fprintf (stdout, " op_symbol ");
3183 ps (e->X_op_symbol);
3184 fprintf (stdout, "\n");
3185 }
3186 }
3187
3188 static void
3189 ps (symbolS *s)
3190 {
3191 fprintf (stdout, "%s type %s%s",
3192 S_GET_NAME (s),
3193 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3194 segment_name (S_GET_SEGMENT (s)));
3195 }
3196
3197 static struct type_name
3198 {
3199 i386_operand_type mask;
3200 const char *name;
3201 }
3202 const type_names[] =
3203 {
3204 { OPERAND_TYPE_REG8, "r8" },
3205 { OPERAND_TYPE_REG16, "r16" },
3206 { OPERAND_TYPE_REG32, "r32" },
3207 { OPERAND_TYPE_REG64, "r64" },
3208 { OPERAND_TYPE_ACC8, "acc8" },
3209 { OPERAND_TYPE_ACC16, "acc16" },
3210 { OPERAND_TYPE_ACC32, "acc32" },
3211 { OPERAND_TYPE_ACC64, "acc64" },
3212 { OPERAND_TYPE_IMM8, "i8" },
3213 { OPERAND_TYPE_IMM8, "i8s" },
3214 { OPERAND_TYPE_IMM16, "i16" },
3215 { OPERAND_TYPE_IMM32, "i32" },
3216 { OPERAND_TYPE_IMM32S, "i32s" },
3217 { OPERAND_TYPE_IMM64, "i64" },
3218 { OPERAND_TYPE_IMM1, "i1" },
3219 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3220 { OPERAND_TYPE_DISP8, "d8" },
3221 { OPERAND_TYPE_DISP16, "d16" },
3222 { OPERAND_TYPE_DISP32, "d32" },
3223 { OPERAND_TYPE_DISP32S, "d32s" },
3224 { OPERAND_TYPE_DISP64, "d64" },
3225 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3226 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3227 { OPERAND_TYPE_CONTROL, "control reg" },
3228 { OPERAND_TYPE_TEST, "test reg" },
3229 { OPERAND_TYPE_DEBUG, "debug reg" },
3230 { OPERAND_TYPE_FLOATREG, "FReg" },
3231 { OPERAND_TYPE_FLOATACC, "FAcc" },
3232 { OPERAND_TYPE_SREG, "SReg" },
3233 { OPERAND_TYPE_REGMMX, "rMMX" },
3234 { OPERAND_TYPE_REGXMM, "rXMM" },
3235 { OPERAND_TYPE_REGYMM, "rYMM" },
3236 { OPERAND_TYPE_REGZMM, "rZMM" },
3237 { OPERAND_TYPE_REGMASK, "Mask reg" },
3238 };
3239
3240 static void
3241 pt (i386_operand_type t)
3242 {
3243 unsigned int j;
3244 i386_operand_type a;
3245
3246 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3247 {
3248 a = operand_type_and (t, type_names[j].mask);
3249 if (operand_type_equal (&a, &type_names[j].mask))
3250 fprintf (stdout, "%s, ", type_names[j].name);
3251 }
3252 fflush (stdout);
3253 }
3254
3255 #endif /* DEBUG386 */
3256 \f
3257 static bfd_reloc_code_real_type
3258 reloc (unsigned int size,
3259 int pcrel,
3260 int sign,
3261 bfd_reloc_code_real_type other)
3262 {
3263 if (other != NO_RELOC)
3264 {
3265 reloc_howto_type *rel;
3266
3267 if (size == 8)
3268 switch (other)
3269 {
3270 case BFD_RELOC_X86_64_GOT32:
3271 return BFD_RELOC_X86_64_GOT64;
3272 break;
3273 case BFD_RELOC_X86_64_GOTPLT64:
3274 return BFD_RELOC_X86_64_GOTPLT64;
3275 break;
3276 case BFD_RELOC_X86_64_PLTOFF64:
3277 return BFD_RELOC_X86_64_PLTOFF64;
3278 break;
3279 case BFD_RELOC_X86_64_GOTPC32:
3280 other = BFD_RELOC_X86_64_GOTPC64;
3281 break;
3282 case BFD_RELOC_X86_64_GOTPCREL:
3283 other = BFD_RELOC_X86_64_GOTPCREL64;
3284 break;
3285 case BFD_RELOC_X86_64_TPOFF32:
3286 other = BFD_RELOC_X86_64_TPOFF64;
3287 break;
3288 case BFD_RELOC_X86_64_DTPOFF32:
3289 other = BFD_RELOC_X86_64_DTPOFF64;
3290 break;
3291 default:
3292 break;
3293 }
3294
3295 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3296 if (other == BFD_RELOC_SIZE32)
3297 {
3298 if (size == 8)
3299 other = BFD_RELOC_SIZE64;
3300 if (pcrel)
3301 {
3302 as_bad (_("there are no pc-relative size relocations"));
3303 return NO_RELOC;
3304 }
3305 }
3306 #endif
3307
3308 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3309 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3310 sign = -1;
3311
3312 rel = bfd_reloc_type_lookup (stdoutput, other);
3313 if (!rel)
3314 as_bad (_("unknown relocation (%u)"), other);
3315 else if (size != bfd_get_reloc_size (rel))
3316 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3317 bfd_get_reloc_size (rel),
3318 size);
3319 else if (pcrel && !rel->pc_relative)
3320 as_bad (_("non-pc-relative relocation for pc-relative field"));
3321 else if ((rel->complain_on_overflow == complain_overflow_signed
3322 && !sign)
3323 || (rel->complain_on_overflow == complain_overflow_unsigned
3324 && sign > 0))
3325 as_bad (_("relocated field and relocation type differ in signedness"));
3326 else
3327 return other;
3328 return NO_RELOC;
3329 }
3330
3331 if (pcrel)
3332 {
3333 if (!sign)
3334 as_bad (_("there are no unsigned pc-relative relocations"));
3335 switch (size)
3336 {
3337 case 1: return BFD_RELOC_8_PCREL;
3338 case 2: return BFD_RELOC_16_PCREL;
3339 case 4: return BFD_RELOC_32_PCREL;
3340 case 8: return BFD_RELOC_64_PCREL;
3341 }
3342 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3343 }
3344 else
3345 {
3346 if (sign > 0)
3347 switch (size)
3348 {
3349 case 4: return BFD_RELOC_X86_64_32S;
3350 }
3351 else
3352 switch (size)
3353 {
3354 case 1: return BFD_RELOC_8;
3355 case 2: return BFD_RELOC_16;
3356 case 4: return BFD_RELOC_32;
3357 case 8: return BFD_RELOC_64;
3358 }
3359 as_bad (_("cannot do %s %u byte relocation"),
3360 sign > 0 ? "signed" : "unsigned", size);
3361 }
3362
3363 return NO_RELOC;
3364 }
3365
3366 /* Here we decide which fixups can be adjusted to make them relative to
3367 the beginning of the section instead of the symbol. Basically we need
3368 to make sure that the dynamic relocations are done correctly, so in
3369 some cases we force the original symbol to be used. */
3370
3371 int
3372 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3373 {
3374 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3375 if (!IS_ELF)
3376 return 1;
3377
3378 /* Don't adjust pc-relative references to merge sections in 64-bit
3379 mode. */
3380 if (use_rela_relocations
3381 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3382 && fixP->fx_pcrel)
3383 return 0;
3384
3385 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3386 and changed later by validate_fix. */
3387 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3388 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3389 return 0;
3390
3391 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3392 for size relocations. */
3393 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3394 || fixP->fx_r_type == BFD_RELOC_SIZE64
3395 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3396 || fixP->fx_r_type == BFD_RELOC_386_PLT32
3397 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3398 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3399 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3400 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3401 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3402 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3403 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3404 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3405 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3406 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3407 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3408 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3409 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3410 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3411 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3412 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3413 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3414 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3415 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3416 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3417 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3418 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3419 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3420 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3421 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3422 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3423 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3424 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3425 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3426 return 0;
3427 #endif
3428 return 1;
3429 }
3430
3431 static int
3432 intel_float_operand (const char *mnemonic)
3433 {
3434 /* Note that the value returned is meaningful only for opcodes with (memory)
3435 operands, hence the code here is free to improperly handle opcodes that
3436 have no operands (for better performance and smaller code). */
3437
3438 if (mnemonic[0] != 'f')
3439 return 0; /* non-math */
3440
3441 switch (mnemonic[1])
3442 {
3443 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3444 the fs segment override prefix not currently handled because no
3445 call path can make opcodes without operands get here */
3446 case 'i':
3447 return 2 /* integer op */;
3448 case 'l':
3449 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3450 return 3; /* fldcw/fldenv */
3451 break;
3452 case 'n':
3453 if (mnemonic[2] != 'o' /* fnop */)
3454 return 3; /* non-waiting control op */
3455 break;
3456 case 'r':
3457 if (mnemonic[2] == 's')
3458 return 3; /* frstor/frstpm */
3459 break;
3460 case 's':
3461 if (mnemonic[2] == 'a')
3462 return 3; /* fsave */
3463 if (mnemonic[2] == 't')
3464 {
3465 switch (mnemonic[3])
3466 {
3467 case 'c': /* fstcw */
3468 case 'd': /* fstdw */
3469 case 'e': /* fstenv */
3470 case 's': /* fsts[gw] */
3471 return 3;
3472 }
3473 }
3474 break;
3475 case 'x':
3476 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3477 return 0; /* fxsave/fxrstor are not really math ops */
3478 break;
3479 }
3480
3481 return 1;
3482 }
3483
3484 /* Build the VEX prefix. */
3485
3486 static void
3487 build_vex_prefix (const insn_template *t)
3488 {
3489 unsigned int register_specifier;
3490 unsigned int implied_prefix;
3491 unsigned int vector_length;
3492 unsigned int w;
3493
3494 /* Check register specifier. */
3495 if (i.vex.register_specifier)
3496 {
3497 register_specifier =
3498 ~register_number (i.vex.register_specifier) & 0xf;
3499 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3500 }
3501 else
3502 register_specifier = 0xf;
3503
3504 /* Use 2-byte VEX prefix by swapping destination and source operand
3505 if there are more than 1 register operand. */
3506 if (i.reg_operands > 1
3507 && i.vec_encoding != vex_encoding_vex3
3508 && i.dir_encoding == dir_encoding_default
3509 && i.operands == i.reg_operands
3510 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3511 && i.tm.opcode_modifier.vexopcode == VEX0F
3512 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3513 && i.rex == REX_B)
3514 {
3515 unsigned int xchg = i.operands - 1;
3516 union i386_op temp_op;
3517 i386_operand_type temp_type;
3518
3519 temp_type = i.types[xchg];
3520 i.types[xchg] = i.types[0];
3521 i.types[0] = temp_type;
3522 temp_op = i.op[xchg];
3523 i.op[xchg] = i.op[0];
3524 i.op[0] = temp_op;
3525
3526 gas_assert (i.rm.mode == 3);
3527
3528 i.rex = REX_R;
3529 xchg = i.rm.regmem;
3530 i.rm.regmem = i.rm.reg;
3531 i.rm.reg = xchg;
3532
3533 if (i.tm.opcode_modifier.d)
3534 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3535 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3536 else /* Use the next insn. */
3537 i.tm = t[1];
3538 }
3539
3540 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3541 are no memory operands and at least 3 register ones. */
3542 if (i.reg_operands >= 3
3543 && i.vec_encoding != vex_encoding_vex3
3544 && i.reg_operands == i.operands - i.imm_operands
3545 && i.tm.opcode_modifier.vex
3546 && i.tm.opcode_modifier.commutative
3547 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3548 && i.rex == REX_B
3549 && i.vex.register_specifier
3550 && !(i.vex.register_specifier->reg_flags & RegRex))
3551 {
3552 unsigned int xchg = i.operands - i.reg_operands;
3553 union i386_op temp_op;
3554 i386_operand_type temp_type;
3555
3556 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3557 gas_assert (!i.tm.opcode_modifier.sae);
3558 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3559 &i.types[i.operands - 3]));
3560 gas_assert (i.rm.mode == 3);
3561
3562 temp_type = i.types[xchg];
3563 i.types[xchg] = i.types[xchg + 1];
3564 i.types[xchg + 1] = temp_type;
3565 temp_op = i.op[xchg];
3566 i.op[xchg] = i.op[xchg + 1];
3567 i.op[xchg + 1] = temp_op;
3568
3569 i.rex = 0;
3570 xchg = i.rm.regmem | 8;
3571 i.rm.regmem = ~register_specifier & 0xf;
3572 gas_assert (!(i.rm.regmem & 8));
3573 i.vex.register_specifier += xchg - i.rm.regmem;
3574 register_specifier = ~xchg & 0xf;
3575 }
3576
3577 if (i.tm.opcode_modifier.vex == VEXScalar)
3578 vector_length = avxscalar;
3579 else if (i.tm.opcode_modifier.vex == VEX256)
3580 vector_length = 1;
3581 else
3582 {
3583 unsigned int op;
3584
3585 /* Determine vector length from the last multi-length vector
3586 operand. */
3587 vector_length = 0;
3588 for (op = t->operands; op--;)
3589 if (t->operand_types[op].bitfield.xmmword
3590 && t->operand_types[op].bitfield.ymmword
3591 && i.types[op].bitfield.ymmword)
3592 {
3593 vector_length = 1;
3594 break;
3595 }
3596 }
3597
3598 switch ((i.tm.base_opcode >> 8) & 0xff)
3599 {
3600 case 0:
3601 implied_prefix = 0;
3602 break;
3603 case DATA_PREFIX_OPCODE:
3604 implied_prefix = 1;
3605 break;
3606 case REPE_PREFIX_OPCODE:
3607 implied_prefix = 2;
3608 break;
3609 case REPNE_PREFIX_OPCODE:
3610 implied_prefix = 3;
3611 break;
3612 default:
3613 abort ();
3614 }
3615
3616 /* Check the REX.W bit and VEXW. */
3617 if (i.tm.opcode_modifier.vexw == VEXWIG)
3618 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3619 else if (i.tm.opcode_modifier.vexw)
3620 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3621 else
3622 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3623
3624 /* Use 2-byte VEX prefix if possible. */
3625 if (w == 0
3626 && i.vec_encoding != vex_encoding_vex3
3627 && i.tm.opcode_modifier.vexopcode == VEX0F
3628 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3629 {
3630 /* 2-byte VEX prefix. */
3631 unsigned int r;
3632
3633 i.vex.length = 2;
3634 i.vex.bytes[0] = 0xc5;
3635
3636 /* Check the REX.R bit. */
3637 r = (i.rex & REX_R) ? 0 : 1;
3638 i.vex.bytes[1] = (r << 7
3639 | register_specifier << 3
3640 | vector_length << 2
3641 | implied_prefix);
3642 }
3643 else
3644 {
3645 /* 3-byte VEX prefix. */
3646 unsigned int m;
3647
3648 i.vex.length = 3;
3649
3650 switch (i.tm.opcode_modifier.vexopcode)
3651 {
3652 case VEX0F:
3653 m = 0x1;
3654 i.vex.bytes[0] = 0xc4;
3655 break;
3656 case VEX0F38:
3657 m = 0x2;
3658 i.vex.bytes[0] = 0xc4;
3659 break;
3660 case VEX0F3A:
3661 m = 0x3;
3662 i.vex.bytes[0] = 0xc4;
3663 break;
3664 case XOP08:
3665 m = 0x8;
3666 i.vex.bytes[0] = 0x8f;
3667 break;
3668 case XOP09:
3669 m = 0x9;
3670 i.vex.bytes[0] = 0x8f;
3671 break;
3672 case XOP0A:
3673 m = 0xa;
3674 i.vex.bytes[0] = 0x8f;
3675 break;
3676 default:
3677 abort ();
3678 }
3679
3680 /* The high 3 bits of the second VEX byte are 1's compliment
3681 of RXB bits from REX. */
3682 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3683
3684 i.vex.bytes[2] = (w << 7
3685 | register_specifier << 3
3686 | vector_length << 2
3687 | implied_prefix);
3688 }
3689 }
3690
3691 static INLINE bfd_boolean
3692 is_evex_encoding (const insn_template *t)
3693 {
3694 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3695 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3696 || t->opcode_modifier.sae;
3697 }
3698
3699 static INLINE bfd_boolean
3700 is_any_vex_encoding (const insn_template *t)
3701 {
3702 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3703 || is_evex_encoding (t);
3704 }
3705
3706 /* Build the EVEX prefix. */
3707
3708 static void
3709 build_evex_prefix (void)
3710 {
3711 unsigned int register_specifier;
3712 unsigned int implied_prefix;
3713 unsigned int m, w;
3714 rex_byte vrex_used = 0;
3715
3716 /* Check register specifier. */
3717 if (i.vex.register_specifier)
3718 {
3719 gas_assert ((i.vrex & REX_X) == 0);
3720
3721 register_specifier = i.vex.register_specifier->reg_num;
3722 if ((i.vex.register_specifier->reg_flags & RegRex))
3723 register_specifier += 8;
3724 /* The upper 16 registers are encoded in the fourth byte of the
3725 EVEX prefix. */
3726 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3727 i.vex.bytes[3] = 0x8;
3728 register_specifier = ~register_specifier & 0xf;
3729 }
3730 else
3731 {
3732 register_specifier = 0xf;
3733
3734 /* Encode upper 16 vector index register in the fourth byte of
3735 the EVEX prefix. */
3736 if (!(i.vrex & REX_X))
3737 i.vex.bytes[3] = 0x8;
3738 else
3739 vrex_used |= REX_X;
3740 }
3741
3742 switch ((i.tm.base_opcode >> 8) & 0xff)
3743 {
3744 case 0:
3745 implied_prefix = 0;
3746 break;
3747 case DATA_PREFIX_OPCODE:
3748 implied_prefix = 1;
3749 break;
3750 case REPE_PREFIX_OPCODE:
3751 implied_prefix = 2;
3752 break;
3753 case REPNE_PREFIX_OPCODE:
3754 implied_prefix = 3;
3755 break;
3756 default:
3757 abort ();
3758 }
3759
3760 /* 4 byte EVEX prefix. */
3761 i.vex.length = 4;
3762 i.vex.bytes[0] = 0x62;
3763
3764 /* mmmm bits. */
3765 switch (i.tm.opcode_modifier.vexopcode)
3766 {
3767 case VEX0F:
3768 m = 1;
3769 break;
3770 case VEX0F38:
3771 m = 2;
3772 break;
3773 case VEX0F3A:
3774 m = 3;
3775 break;
3776 default:
3777 abort ();
3778 break;
3779 }
3780
3781 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3782 bits from REX. */
3783 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3784
3785 /* The fifth bit of the second EVEX byte is 1's compliment of the
3786 REX_R bit in VREX. */
3787 if (!(i.vrex & REX_R))
3788 i.vex.bytes[1] |= 0x10;
3789 else
3790 vrex_used |= REX_R;
3791
3792 if ((i.reg_operands + i.imm_operands) == i.operands)
3793 {
3794 /* When all operands are registers, the REX_X bit in REX is not
3795 used. We reuse it to encode the upper 16 registers, which is
3796 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3797 as 1's compliment. */
3798 if ((i.vrex & REX_B))
3799 {
3800 vrex_used |= REX_B;
3801 i.vex.bytes[1] &= ~0x40;
3802 }
3803 }
3804
3805 /* EVEX instructions shouldn't need the REX prefix. */
3806 i.vrex &= ~vrex_used;
3807 gas_assert (i.vrex == 0);
3808
3809 /* Check the REX.W bit and VEXW. */
3810 if (i.tm.opcode_modifier.vexw == VEXWIG)
3811 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3812 else if (i.tm.opcode_modifier.vexw)
3813 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3814 else
3815 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3816
3817 /* Encode the U bit. */
3818 implied_prefix |= 0x4;
3819
3820 /* The third byte of the EVEX prefix. */
3821 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3822
3823 /* The fourth byte of the EVEX prefix. */
3824 /* The zeroing-masking bit. */
3825 if (i.mask && i.mask->zeroing)
3826 i.vex.bytes[3] |= 0x80;
3827
3828 /* Don't always set the broadcast bit if there is no RC. */
3829 if (!i.rounding)
3830 {
3831 /* Encode the vector length. */
3832 unsigned int vec_length;
3833
3834 if (!i.tm.opcode_modifier.evex
3835 || i.tm.opcode_modifier.evex == EVEXDYN)
3836 {
3837 unsigned int op;
3838
3839 /* Determine vector length from the last multi-length vector
3840 operand. */
3841 vec_length = 0;
3842 for (op = i.operands; op--;)
3843 if (i.tm.operand_types[op].bitfield.xmmword
3844 + i.tm.operand_types[op].bitfield.ymmword
3845 + i.tm.operand_types[op].bitfield.zmmword > 1)
3846 {
3847 if (i.types[op].bitfield.zmmword)
3848 {
3849 i.tm.opcode_modifier.evex = EVEX512;
3850 break;
3851 }
3852 else if (i.types[op].bitfield.ymmword)
3853 {
3854 i.tm.opcode_modifier.evex = EVEX256;
3855 break;
3856 }
3857 else if (i.types[op].bitfield.xmmword)
3858 {
3859 i.tm.opcode_modifier.evex = EVEX128;
3860 break;
3861 }
3862 else if (i.broadcast && (int) op == i.broadcast->operand)
3863 {
3864 switch (i.broadcast->bytes)
3865 {
3866 case 64:
3867 i.tm.opcode_modifier.evex = EVEX512;
3868 break;
3869 case 32:
3870 i.tm.opcode_modifier.evex = EVEX256;
3871 break;
3872 case 16:
3873 i.tm.opcode_modifier.evex = EVEX128;
3874 break;
3875 default:
3876 abort ();
3877 }
3878 break;
3879 }
3880 }
3881
3882 if (op >= MAX_OPERANDS)
3883 abort ();
3884 }
3885
3886 switch (i.tm.opcode_modifier.evex)
3887 {
3888 case EVEXLIG: /* LL' is ignored */
3889 vec_length = evexlig << 5;
3890 break;
3891 case EVEX128:
3892 vec_length = 0 << 5;
3893 break;
3894 case EVEX256:
3895 vec_length = 1 << 5;
3896 break;
3897 case EVEX512:
3898 vec_length = 2 << 5;
3899 break;
3900 default:
3901 abort ();
3902 break;
3903 }
3904 i.vex.bytes[3] |= vec_length;
3905 /* Encode the broadcast bit. */
3906 if (i.broadcast)
3907 i.vex.bytes[3] |= 0x10;
3908 }
3909 else
3910 {
3911 if (i.rounding->type != saeonly)
3912 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3913 else
3914 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3915 }
3916
3917 if (i.mask && i.mask->mask)
3918 i.vex.bytes[3] |= i.mask->mask->reg_num;
3919 }
3920
3921 static void
3922 process_immext (void)
3923 {
3924 expressionS *exp;
3925
3926 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3927 which is coded in the same place as an 8-bit immediate field
3928 would be. Here we fake an 8-bit immediate operand from the
3929 opcode suffix stored in tm.extension_opcode.
3930
3931 AVX instructions also use this encoding, for some of
3932 3 argument instructions. */
3933
3934 gas_assert (i.imm_operands <= 1
3935 && (i.operands <= 2
3936 || (is_any_vex_encoding (&i.tm)
3937 && i.operands <= 4)));
3938
3939 exp = &im_expressions[i.imm_operands++];
3940 i.op[i.operands].imms = exp;
3941 i.types[i.operands] = imm8;
3942 i.operands++;
3943 exp->X_op = O_constant;
3944 exp->X_add_number = i.tm.extension_opcode;
3945 i.tm.extension_opcode = None;
3946 }
3947
3948
3949 static int
3950 check_hle (void)
3951 {
3952 switch (i.tm.opcode_modifier.hleprefixok)
3953 {
3954 default:
3955 abort ();
3956 case HLEPrefixNone:
3957 as_bad (_("invalid instruction `%s' after `%s'"),
3958 i.tm.name, i.hle_prefix);
3959 return 0;
3960 case HLEPrefixLock:
3961 if (i.prefix[LOCK_PREFIX])
3962 return 1;
3963 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3964 return 0;
3965 case HLEPrefixAny:
3966 return 1;
3967 case HLEPrefixRelease:
3968 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3969 {
3970 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3971 i.tm.name);
3972 return 0;
3973 }
3974 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3975 {
3976 as_bad (_("memory destination needed for instruction `%s'"
3977 " after `xrelease'"), i.tm.name);
3978 return 0;
3979 }
3980 return 1;
3981 }
3982 }
3983
3984 /* Try the shortest encoding by shortening operand size. */
3985
3986 static void
3987 optimize_encoding (void)
3988 {
3989 unsigned int j;
3990
3991 if (optimize_for_space
3992 && i.reg_operands == 1
3993 && i.imm_operands == 1
3994 && !i.types[1].bitfield.byte
3995 && i.op[0].imms->X_op == O_constant
3996 && fits_in_imm7 (i.op[0].imms->X_add_number)
3997 && ((i.tm.base_opcode == 0xa8
3998 && i.tm.extension_opcode == None)
3999 || (i.tm.base_opcode == 0xf6
4000 && i.tm.extension_opcode == 0x0)))
4001 {
4002 /* Optimize: -Os:
4003 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4004 */
4005 unsigned int base_regnum = i.op[1].regs->reg_num;
4006 if (flag_code == CODE_64BIT || base_regnum < 4)
4007 {
4008 i.types[1].bitfield.byte = 1;
4009 /* Ignore the suffix. */
4010 i.suffix = 0;
4011 if (base_regnum >= 4)
4012 {
4013 /* Handle SP, BP, SI, DI and R12-R15 registers. */
4014 if (i.types[1].bitfield.word)
4015 j = 16;
4016 else if (i.types[1].bitfield.dword)
4017 j = 32;
4018 else
4019 j = 48;
4020 i.op[1].regs -= j;
4021 }
4022 }
4023 }
4024 else if (flag_code == CODE_64BIT
4025 && ((i.types[1].bitfield.qword
4026 && i.reg_operands == 1
4027 && i.imm_operands == 1
4028 && i.op[0].imms->X_op == O_constant
4029 && ((i.tm.base_opcode == 0xb8
4030 && i.tm.extension_opcode == None
4031 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4032 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4033 && (((i.tm.base_opcode == 0x24
4034 || i.tm.base_opcode == 0xa8)
4035 && i.tm.extension_opcode == None)
4036 || (i.tm.base_opcode == 0x80
4037 && i.tm.extension_opcode == 0x4)
4038 || ((i.tm.base_opcode == 0xf6
4039 || (i.tm.base_opcode | 1) == 0xc7)
4040 && i.tm.extension_opcode == 0x0)))
4041 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4042 && i.tm.base_opcode == 0x83
4043 && i.tm.extension_opcode == 0x4)))
4044 || (i.types[0].bitfield.qword
4045 && ((i.reg_operands == 2
4046 && i.op[0].regs == i.op[1].regs
4047 && ((i.tm.base_opcode == 0x30
4048 || i.tm.base_opcode == 0x28)
4049 && i.tm.extension_opcode == None))
4050 || (i.reg_operands == 1
4051 && i.operands == 1
4052 && i.tm.base_opcode == 0x30
4053 && i.tm.extension_opcode == None)))))
4054 {
4055 /* Optimize: -O:
4056 andq $imm31, %r64 -> andl $imm31, %r32
4057 andq $imm7, %r64 -> andl $imm7, %r32
4058 testq $imm31, %r64 -> testl $imm31, %r32
4059 xorq %r64, %r64 -> xorl %r32, %r32
4060 subq %r64, %r64 -> subl %r32, %r32
4061 movq $imm31, %r64 -> movl $imm31, %r32
4062 movq $imm32, %r64 -> movl $imm32, %r32
4063 */
4064 i.tm.opcode_modifier.norex64 = 1;
4065 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4066 {
4067 /* Handle
4068 movq $imm31, %r64 -> movl $imm31, %r32
4069 movq $imm32, %r64 -> movl $imm32, %r32
4070 */
4071 i.tm.operand_types[0].bitfield.imm32 = 1;
4072 i.tm.operand_types[0].bitfield.imm32s = 0;
4073 i.tm.operand_types[0].bitfield.imm64 = 0;
4074 i.types[0].bitfield.imm32 = 1;
4075 i.types[0].bitfield.imm32s = 0;
4076 i.types[0].bitfield.imm64 = 0;
4077 i.types[1].bitfield.dword = 1;
4078 i.types[1].bitfield.qword = 0;
4079 if ((i.tm.base_opcode | 1) == 0xc7)
4080 {
4081 /* Handle
4082 movq $imm31, %r64 -> movl $imm31, %r32
4083 */
4084 i.tm.base_opcode = 0xb8;
4085 i.tm.extension_opcode = None;
4086 i.tm.opcode_modifier.w = 0;
4087 i.tm.opcode_modifier.shortform = 1;
4088 i.tm.opcode_modifier.modrm = 0;
4089 }
4090 }
4091 }
4092 else if (optimize > 1
4093 && !optimize_for_space
4094 && i.reg_operands == 2
4095 && i.op[0].regs == i.op[1].regs
4096 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4097 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4098 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4099 {
4100 /* Optimize: -O2:
4101 andb %rN, %rN -> testb %rN, %rN
4102 andw %rN, %rN -> testw %rN, %rN
4103 andq %rN, %rN -> testq %rN, %rN
4104 orb %rN, %rN -> testb %rN, %rN
4105 orw %rN, %rN -> testw %rN, %rN
4106 orq %rN, %rN -> testq %rN, %rN
4107
4108 and outside of 64-bit mode
4109
4110 andl %rN, %rN -> testl %rN, %rN
4111 orl %rN, %rN -> testl %rN, %rN
4112 */
4113 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4114 }
4115 else if (i.reg_operands == 3
4116 && i.op[0].regs == i.op[1].regs
4117 && !i.types[2].bitfield.xmmword
4118 && (i.tm.opcode_modifier.vex
4119 || ((!i.mask || i.mask->zeroing)
4120 && !i.rounding
4121 && is_evex_encoding (&i.tm)
4122 && (i.vec_encoding != vex_encoding_evex
4123 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4124 || i.tm.cpu_flags.bitfield.cpuavx512vl
4125 || (i.tm.operand_types[2].bitfield.zmmword
4126 && i.types[2].bitfield.ymmword))))
4127 && ((i.tm.base_opcode == 0x55
4128 || i.tm.base_opcode == 0x6655
4129 || i.tm.base_opcode == 0x66df
4130 || i.tm.base_opcode == 0x57
4131 || i.tm.base_opcode == 0x6657
4132 || i.tm.base_opcode == 0x66ef
4133 || i.tm.base_opcode == 0x66f8
4134 || i.tm.base_opcode == 0x66f9
4135 || i.tm.base_opcode == 0x66fa
4136 || i.tm.base_opcode == 0x66fb
4137 || i.tm.base_opcode == 0x42
4138 || i.tm.base_opcode == 0x6642
4139 || i.tm.base_opcode == 0x47
4140 || i.tm.base_opcode == 0x6647)
4141 && i.tm.extension_opcode == None))
4142 {
4143 /* Optimize: -O1:
4144 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4145 vpsubq and vpsubw:
4146 EVEX VOP %zmmM, %zmmM, %zmmN
4147 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4148 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4149 EVEX VOP %ymmM, %ymmM, %ymmN
4150 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4151 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4152 VEX VOP %ymmM, %ymmM, %ymmN
4153 -> VEX VOP %xmmM, %xmmM, %xmmN
4154 VOP, one of vpandn and vpxor:
4155 VEX VOP %ymmM, %ymmM, %ymmN
4156 -> VEX VOP %xmmM, %xmmM, %xmmN
4157 VOP, one of vpandnd and vpandnq:
4158 EVEX VOP %zmmM, %zmmM, %zmmN
4159 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4160 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4161 EVEX VOP %ymmM, %ymmM, %ymmN
4162 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4163 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4164 VOP, one of vpxord and vpxorq:
4165 EVEX VOP %zmmM, %zmmM, %zmmN
4166 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4167 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4168 EVEX VOP %ymmM, %ymmM, %ymmN
4169 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4170 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4171 VOP, one of kxord and kxorq:
4172 VEX VOP %kM, %kM, %kN
4173 -> VEX kxorw %kM, %kM, %kN
4174 VOP, one of kandnd and kandnq:
4175 VEX VOP %kM, %kM, %kN
4176 -> VEX kandnw %kM, %kM, %kN
4177 */
4178 if (is_evex_encoding (&i.tm))
4179 {
4180 if (i.vec_encoding != vex_encoding_evex)
4181 {
4182 i.tm.opcode_modifier.vex = VEX128;
4183 i.tm.opcode_modifier.vexw = VEXW0;
4184 i.tm.opcode_modifier.evex = 0;
4185 }
4186 else if (optimize > 1)
4187 i.tm.opcode_modifier.evex = EVEX128;
4188 else
4189 return;
4190 }
4191 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4192 {
4193 i.tm.base_opcode &= 0xff;
4194 i.tm.opcode_modifier.vexw = VEXW0;
4195 }
4196 else
4197 i.tm.opcode_modifier.vex = VEX128;
4198
4199 if (i.tm.opcode_modifier.vex)
4200 for (j = 0; j < 3; j++)
4201 {
4202 i.types[j].bitfield.xmmword = 1;
4203 i.types[j].bitfield.ymmword = 0;
4204 }
4205 }
4206 else if (i.vec_encoding != vex_encoding_evex
4207 && !i.types[0].bitfield.zmmword
4208 && !i.types[1].bitfield.zmmword
4209 && !i.mask
4210 && !i.broadcast
4211 && is_evex_encoding (&i.tm)
4212 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4213 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4214 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4215 || (i.tm.base_opcode & ~4) == 0x66db
4216 || (i.tm.base_opcode & ~4) == 0x66eb)
4217 && i.tm.extension_opcode == None)
4218 {
4219 /* Optimize: -O1:
4220 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4221 vmovdqu32 and vmovdqu64:
4222 EVEX VOP %xmmM, %xmmN
4223 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4224 EVEX VOP %ymmM, %ymmN
4225 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4226 EVEX VOP %xmmM, mem
4227 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4228 EVEX VOP %ymmM, mem
4229 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4230 EVEX VOP mem, %xmmN
4231 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4232 EVEX VOP mem, %ymmN
4233 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4234 VOP, one of vpand, vpandn, vpor, vpxor:
4235 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4236 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4237 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4238 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4239 EVEX VOP{d,q} mem, %xmmM, %xmmN
4240 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4241 EVEX VOP{d,q} mem, %ymmM, %ymmN
4242 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4243 */
4244 for (j = 0; j < i.operands; j++)
4245 if (operand_type_check (i.types[j], disp)
4246 && i.op[j].disps->X_op == O_constant)
4247 {
4248 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4249 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4250 bytes, we choose EVEX Disp8 over VEX Disp32. */
4251 int evex_disp8, vex_disp8;
4252 unsigned int memshift = i.memshift;
4253 offsetT n = i.op[j].disps->X_add_number;
4254
4255 evex_disp8 = fits_in_disp8 (n);
4256 i.memshift = 0;
4257 vex_disp8 = fits_in_disp8 (n);
4258 if (evex_disp8 != vex_disp8)
4259 {
4260 i.memshift = memshift;
4261 return;
4262 }
4263
4264 i.types[j].bitfield.disp8 = vex_disp8;
4265 break;
4266 }
4267 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4268 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4269 i.tm.opcode_modifier.vex
4270 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4271 i.tm.opcode_modifier.vexw = VEXW0;
4272 /* VPAND, VPOR, and VPXOR are commutative. */
4273 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4274 i.tm.opcode_modifier.commutative = 1;
4275 i.tm.opcode_modifier.evex = 0;
4276 i.tm.opcode_modifier.masking = 0;
4277 i.tm.opcode_modifier.broadcast = 0;
4278 i.tm.opcode_modifier.disp8memshift = 0;
4279 i.memshift = 0;
4280 if (j < i.operands)
4281 i.types[j].bitfield.disp8
4282 = fits_in_disp8 (i.op[j].disps->X_add_number);
4283 }
4284 }
4285
4286 /* This is the guts of the machine-dependent assembler. LINE points to a
4287 machine dependent instruction. This function is supposed to emit
4288 the frags/bytes it assembles to. */
4289
4290 void
4291 md_assemble (char *line)
4292 {
4293 unsigned int j;
4294 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4295 const insn_template *t;
4296
4297 /* Initialize globals. */
4298 memset (&i, '\0', sizeof (i));
4299 for (j = 0; j < MAX_OPERANDS; j++)
4300 i.reloc[j] = NO_RELOC;
4301 memset (disp_expressions, '\0', sizeof (disp_expressions));
4302 memset (im_expressions, '\0', sizeof (im_expressions));
4303 save_stack_p = save_stack;
4304
4305 /* First parse an instruction mnemonic & call i386_operand for the operands.
4306 We assume that the scrubber has arranged it so that line[0] is the valid
4307 start of a (possibly prefixed) mnemonic. */
4308
4309 line = parse_insn (line, mnemonic);
4310 if (line == NULL)
4311 return;
4312 mnem_suffix = i.suffix;
4313
4314 line = parse_operands (line, mnemonic);
4315 this_operand = -1;
4316 xfree (i.memop1_string);
4317 i.memop1_string = NULL;
4318 if (line == NULL)
4319 return;
4320
4321 /* Now we've parsed the mnemonic into a set of templates, and have the
4322 operands at hand. */
4323
4324 /* All intel opcodes have reversed operands except for "bound" and
4325 "enter". We also don't reverse intersegment "jmp" and "call"
4326 instructions with 2 immediate operands so that the immediate segment
4327 precedes the offset, as it does when in AT&T mode. */
4328 if (intel_syntax
4329 && i.operands > 1
4330 && (strcmp (mnemonic, "bound") != 0)
4331 && (strcmp (mnemonic, "invlpga") != 0)
4332 && !(operand_type_check (i.types[0], imm)
4333 && operand_type_check (i.types[1], imm)))
4334 swap_operands ();
4335
4336 /* The order of the immediates should be reversed
4337 for 2 immediates extrq and insertq instructions */
4338 if (i.imm_operands == 2
4339 && (strcmp (mnemonic, "extrq") == 0
4340 || strcmp (mnemonic, "insertq") == 0))
4341 swap_2_operands (0, 1);
4342
4343 if (i.imm_operands)
4344 optimize_imm ();
4345
4346 /* Don't optimize displacement for movabs since it only takes 64bit
4347 displacement. */
4348 if (i.disp_operands
4349 && i.disp_encoding != disp_encoding_32bit
4350 && (flag_code != CODE_64BIT
4351 || strcmp (mnemonic, "movabs") != 0))
4352 optimize_disp ();
4353
4354 /* Next, we find a template that matches the given insn,
4355 making sure the overlap of the given operands types is consistent
4356 with the template operand types. */
4357
4358 if (!(t = match_template (mnem_suffix)))
4359 return;
4360
4361 if (sse_check != check_none
4362 && !i.tm.opcode_modifier.noavx
4363 && !i.tm.cpu_flags.bitfield.cpuavx
4364 && !i.tm.cpu_flags.bitfield.cpuavx512f
4365 && (i.tm.cpu_flags.bitfield.cpusse
4366 || i.tm.cpu_flags.bitfield.cpusse2
4367 || i.tm.cpu_flags.bitfield.cpusse3
4368 || i.tm.cpu_flags.bitfield.cpussse3
4369 || i.tm.cpu_flags.bitfield.cpusse4_1
4370 || i.tm.cpu_flags.bitfield.cpusse4_2
4371 || i.tm.cpu_flags.bitfield.cpusse4a
4372 || i.tm.cpu_flags.bitfield.cpupclmul
4373 || i.tm.cpu_flags.bitfield.cpuaes
4374 || i.tm.cpu_flags.bitfield.cpusha
4375 || i.tm.cpu_flags.bitfield.cpugfni))
4376 {
4377 (sse_check == check_warning
4378 ? as_warn
4379 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4380 }
4381
4382 /* Zap movzx and movsx suffix. The suffix has been set from
4383 "word ptr" or "byte ptr" on the source operand in Intel syntax
4384 or extracted from mnemonic in AT&T syntax. But we'll use
4385 the destination register to choose the suffix for encoding. */
4386 if ((i.tm.base_opcode & ~9) == 0x0fb6)
4387 {
4388 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
4389 there is no suffix, the default will be byte extension. */
4390 if (i.reg_operands != 2
4391 && !i.suffix
4392 && intel_syntax)
4393 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4394
4395 i.suffix = 0;
4396 }
4397
4398 if (i.tm.opcode_modifier.fwait)
4399 if (!add_prefix (FWAIT_OPCODE))
4400 return;
4401
4402 /* Check if REP prefix is OK. */
4403 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4404 {
4405 as_bad (_("invalid instruction `%s' after `%s'"),
4406 i.tm.name, i.rep_prefix);
4407 return;
4408 }
4409
4410 /* Check for lock without a lockable instruction. Destination operand
4411 must be memory unless it is xchg (0x86). */
4412 if (i.prefix[LOCK_PREFIX]
4413 && (!i.tm.opcode_modifier.islockable
4414 || i.mem_operands == 0
4415 || (i.tm.base_opcode != 0x86
4416 && !(i.flags[i.operands - 1] & Operand_Mem))))
4417 {
4418 as_bad (_("expecting lockable instruction after `lock'"));
4419 return;
4420 }
4421
4422 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4423 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4424 {
4425 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4426 return;
4427 }
4428
4429 /* Check if HLE prefix is OK. */
4430 if (i.hle_prefix && !check_hle ())
4431 return;
4432
4433 /* Check BND prefix. */
4434 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4435 as_bad (_("expecting valid branch instruction after `bnd'"));
4436
4437 /* Check NOTRACK prefix. */
4438 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4439 as_bad (_("expecting indirect branch instruction after `notrack'"));
4440
4441 if (i.tm.cpu_flags.bitfield.cpumpx)
4442 {
4443 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4444 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4445 else if (flag_code != CODE_16BIT
4446 ? i.prefix[ADDR_PREFIX]
4447 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4448 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4449 }
4450
4451 /* Insert BND prefix. */
4452 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4453 {
4454 if (!i.prefix[BND_PREFIX])
4455 add_prefix (BND_PREFIX_OPCODE);
4456 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4457 {
4458 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4459 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4460 }
4461 }
4462
4463 /* Check string instruction segment overrides. */
4464 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4465 {
4466 gas_assert (i.mem_operands);
4467 if (!check_string ())
4468 return;
4469 i.disp_operands = 0;
4470 }
4471
4472 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4473 optimize_encoding ();
4474
4475 if (!process_suffix ())
4476 return;
4477
4478 /* Update operand types. */
4479 for (j = 0; j < i.operands; j++)
4480 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4481
4482 /* Make still unresolved immediate matches conform to size of immediate
4483 given in i.suffix. */
4484 if (!finalize_imm ())
4485 return;
4486
4487 if (i.types[0].bitfield.imm1)
4488 i.imm_operands = 0; /* kludge for shift insns. */
4489
4490 /* We only need to check those implicit registers for instructions
4491 with 3 operands or less. */
4492 if (i.operands <= 3)
4493 for (j = 0; j < i.operands; j++)
4494 if (i.types[j].bitfield.instance != InstanceNone
4495 && !i.types[j].bitfield.xmmword)
4496 i.reg_operands--;
4497
4498 /* ImmExt should be processed after SSE2AVX. */
4499 if (!i.tm.opcode_modifier.sse2avx
4500 && i.tm.opcode_modifier.immext)
4501 process_immext ();
4502
4503 /* For insns with operands there are more diddles to do to the opcode. */
4504 if (i.operands)
4505 {
4506 if (!process_operands ())
4507 return;
4508 }
4509 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4510 {
4511 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4512 as_warn (_("translating to `%sp'"), i.tm.name);
4513 }
4514
4515 if (is_any_vex_encoding (&i.tm))
4516 {
4517 if (!cpu_arch_flags.bitfield.cpui286)
4518 {
4519 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4520 i.tm.name);
4521 return;
4522 }
4523
4524 if (i.tm.opcode_modifier.vex)
4525 build_vex_prefix (t);
4526 else
4527 build_evex_prefix ();
4528 }
4529
4530 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4531 instructions may define INT_OPCODE as well, so avoid this corner
4532 case for those instructions that use MODRM. */
4533 if (i.tm.base_opcode == INT_OPCODE
4534 && !i.tm.opcode_modifier.modrm
4535 && i.op[0].imms->X_add_number == 3)
4536 {
4537 i.tm.base_opcode = INT3_OPCODE;
4538 i.imm_operands = 0;
4539 }
4540
4541 if ((i.tm.opcode_modifier.jump == JUMP
4542 || i.tm.opcode_modifier.jump == JUMP_BYTE
4543 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4544 && i.op[0].disps->X_op == O_constant)
4545 {
4546 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4547 the absolute address given by the constant. Since ix86 jumps and
4548 calls are pc relative, we need to generate a reloc. */
4549 i.op[0].disps->X_add_symbol = &abs_symbol;
4550 i.op[0].disps->X_op = O_symbol;
4551 }
4552
4553 if (i.tm.opcode_modifier.rex64)
4554 i.rex |= REX_W;
4555
4556 /* For 8 bit registers we need an empty rex prefix. Also if the
4557 instruction already has a prefix, we need to convert old
4558 registers to new ones. */
4559
4560 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4561 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4562 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4563 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4564 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4565 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4566 && i.rex != 0))
4567 {
4568 int x;
4569
4570 i.rex |= REX_OPCODE;
4571 for (x = 0; x < 2; x++)
4572 {
4573 /* Look for 8 bit operand that uses old registers. */
4574 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4575 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4576 {
4577 /* In case it is "hi" register, give up. */
4578 if (i.op[x].regs->reg_num > 3)
4579 as_bad (_("can't encode register '%s%s' in an "
4580 "instruction requiring REX prefix."),
4581 register_prefix, i.op[x].regs->reg_name);
4582
4583 /* Otherwise it is equivalent to the extended register.
4584 Since the encoding doesn't change this is merely
4585 cosmetic cleanup for debug output. */
4586
4587 i.op[x].regs = i.op[x].regs + 8;
4588 }
4589 }
4590 }
4591
4592 if (i.rex == 0 && i.rex_encoding)
4593 {
4594 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4595 that uses legacy register. If it is "hi" register, don't add
4596 the REX_OPCODE byte. */
4597 int x;
4598 for (x = 0; x < 2; x++)
4599 if (i.types[x].bitfield.class == Reg
4600 && i.types[x].bitfield.byte
4601 && (i.op[x].regs->reg_flags & RegRex64) == 0
4602 && i.op[x].regs->reg_num > 3)
4603 {
4604 i.rex_encoding = FALSE;
4605 break;
4606 }
4607
4608 if (i.rex_encoding)
4609 i.rex = REX_OPCODE;
4610 }
4611
4612 if (i.rex != 0)
4613 add_prefix (REX_OPCODE | i.rex);
4614
4615 /* We are ready to output the insn. */
4616 output_insn ();
4617
4618 last_insn.seg = now_seg;
4619
4620 if (i.tm.opcode_modifier.isprefix)
4621 {
4622 last_insn.kind = last_insn_prefix;
4623 last_insn.name = i.tm.name;
4624 last_insn.file = as_where (&last_insn.line);
4625 }
4626 else
4627 last_insn.kind = last_insn_other;
4628 }
4629
4630 static char *
4631 parse_insn (char *line, char *mnemonic)
4632 {
4633 char *l = line;
4634 char *token_start = l;
4635 char *mnem_p;
4636 int supported;
4637 const insn_template *t;
4638 char *dot_p = NULL;
4639
4640 while (1)
4641 {
4642 mnem_p = mnemonic;
4643 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4644 {
4645 if (*mnem_p == '.')
4646 dot_p = mnem_p;
4647 mnem_p++;
4648 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4649 {
4650 as_bad (_("no such instruction: `%s'"), token_start);
4651 return NULL;
4652 }
4653 l++;
4654 }
4655 if (!is_space_char (*l)
4656 && *l != END_OF_INSN
4657 && (intel_syntax
4658 || (*l != PREFIX_SEPARATOR
4659 && *l != ',')))
4660 {
4661 as_bad (_("invalid character %s in mnemonic"),
4662 output_invalid (*l));
4663 return NULL;
4664 }
4665 if (token_start == l)
4666 {
4667 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4668 as_bad (_("expecting prefix; got nothing"));
4669 else
4670 as_bad (_("expecting mnemonic; got nothing"));
4671 return NULL;
4672 }
4673
4674 /* Look up instruction (or prefix) via hash table. */
4675 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4676
4677 if (*l != END_OF_INSN
4678 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4679 && current_templates
4680 && current_templates->start->opcode_modifier.isprefix)
4681 {
4682 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4683 {
4684 as_bad ((flag_code != CODE_64BIT
4685 ? _("`%s' is only supported in 64-bit mode")
4686 : _("`%s' is not supported in 64-bit mode")),
4687 current_templates->start->name);
4688 return NULL;
4689 }
4690 /* If we are in 16-bit mode, do not allow addr16 or data16.
4691 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4692 if ((current_templates->start->opcode_modifier.size == SIZE16
4693 || current_templates->start->opcode_modifier.size == SIZE32)
4694 && flag_code != CODE_64BIT
4695 && ((current_templates->start->opcode_modifier.size == SIZE32)
4696 ^ (flag_code == CODE_16BIT)))
4697 {
4698 as_bad (_("redundant %s prefix"),
4699 current_templates->start->name);
4700 return NULL;
4701 }
4702 if (current_templates->start->opcode_length == 0)
4703 {
4704 /* Handle pseudo prefixes. */
4705 switch (current_templates->start->base_opcode)
4706 {
4707 case 0x0:
4708 /* {disp8} */
4709 i.disp_encoding = disp_encoding_8bit;
4710 break;
4711 case 0x1:
4712 /* {disp32} */
4713 i.disp_encoding = disp_encoding_32bit;
4714 break;
4715 case 0x2:
4716 /* {load} */
4717 i.dir_encoding = dir_encoding_load;
4718 break;
4719 case 0x3:
4720 /* {store} */
4721 i.dir_encoding = dir_encoding_store;
4722 break;
4723 case 0x4:
4724 /* {vex2} */
4725 i.vec_encoding = vex_encoding_vex2;
4726 break;
4727 case 0x5:
4728 /* {vex3} */
4729 i.vec_encoding = vex_encoding_vex3;
4730 break;
4731 case 0x6:
4732 /* {evex} */
4733 i.vec_encoding = vex_encoding_evex;
4734 break;
4735 case 0x7:
4736 /* {rex} */
4737 i.rex_encoding = TRUE;
4738 break;
4739 case 0x8:
4740 /* {nooptimize} */
4741 i.no_optimize = TRUE;
4742 break;
4743 default:
4744 abort ();
4745 }
4746 }
4747 else
4748 {
4749 /* Add prefix, checking for repeated prefixes. */
4750 switch (add_prefix (current_templates->start->base_opcode))
4751 {
4752 case PREFIX_EXIST:
4753 return NULL;
4754 case PREFIX_DS:
4755 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4756 i.notrack_prefix = current_templates->start->name;
4757 break;
4758 case PREFIX_REP:
4759 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4760 i.hle_prefix = current_templates->start->name;
4761 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4762 i.bnd_prefix = current_templates->start->name;
4763 else
4764 i.rep_prefix = current_templates->start->name;
4765 break;
4766 default:
4767 break;
4768 }
4769 }
4770 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4771 token_start = ++l;
4772 }
4773 else
4774 break;
4775 }
4776
4777 if (!current_templates)
4778 {
4779 /* Deprecated functionality (new code should use pseudo-prefixes instead):
4780 Check if we should swap operand or force 32bit displacement in
4781 encoding. */
4782 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4783 i.dir_encoding = dir_encoding_swap;
4784 else if (mnem_p - 3 == dot_p
4785 && dot_p[1] == 'd'
4786 && dot_p[2] == '8')
4787 i.disp_encoding = disp_encoding_8bit;
4788 else if (mnem_p - 4 == dot_p
4789 && dot_p[1] == 'd'
4790 && dot_p[2] == '3'
4791 && dot_p[3] == '2')
4792 i.disp_encoding = disp_encoding_32bit;
4793 else
4794 goto check_suffix;
4795 mnem_p = dot_p;
4796 *dot_p = '\0';
4797 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4798 }
4799
4800 if (!current_templates)
4801 {
4802 check_suffix:
4803 if (mnem_p > mnemonic)
4804 {
4805 /* See if we can get a match by trimming off a suffix. */
4806 switch (mnem_p[-1])
4807 {
4808 case WORD_MNEM_SUFFIX:
4809 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4810 i.suffix = SHORT_MNEM_SUFFIX;
4811 else
4812 /* Fall through. */
4813 case BYTE_MNEM_SUFFIX:
4814 case QWORD_MNEM_SUFFIX:
4815 i.suffix = mnem_p[-1];
4816 mnem_p[-1] = '\0';
4817 current_templates = (const templates *) hash_find (op_hash,
4818 mnemonic);
4819 break;
4820 case SHORT_MNEM_SUFFIX:
4821 case LONG_MNEM_SUFFIX:
4822 if (!intel_syntax)
4823 {
4824 i.suffix = mnem_p[-1];
4825 mnem_p[-1] = '\0';
4826 current_templates = (const templates *) hash_find (op_hash,
4827 mnemonic);
4828 }
4829 break;
4830
4831 /* Intel Syntax. */
4832 case 'd':
4833 if (intel_syntax)
4834 {
4835 if (intel_float_operand (mnemonic) == 1)
4836 i.suffix = SHORT_MNEM_SUFFIX;
4837 else
4838 i.suffix = LONG_MNEM_SUFFIX;
4839 mnem_p[-1] = '\0';
4840 current_templates = (const templates *) hash_find (op_hash,
4841 mnemonic);
4842 }
4843 break;
4844 }
4845 }
4846
4847 if (!current_templates)
4848 {
4849 as_bad (_("no such instruction: `%s'"), token_start);
4850 return NULL;
4851 }
4852 }
4853
4854 if (current_templates->start->opcode_modifier.jump == JUMP
4855 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
4856 {
4857 /* Check for a branch hint. We allow ",pt" and ",pn" for
4858 predict taken and predict not taken respectively.
4859 I'm not sure that branch hints actually do anything on loop
4860 and jcxz insns (JumpByte) for current Pentium4 chips. They
4861 may work in the future and it doesn't hurt to accept them
4862 now. */
4863 if (l[0] == ',' && l[1] == 'p')
4864 {
4865 if (l[2] == 't')
4866 {
4867 if (!add_prefix (DS_PREFIX_OPCODE))
4868 return NULL;
4869 l += 3;
4870 }
4871 else if (l[2] == 'n')
4872 {
4873 if (!add_prefix (CS_PREFIX_OPCODE))
4874 return NULL;
4875 l += 3;
4876 }
4877 }
4878 }
4879 /* Any other comma loses. */
4880 if (*l == ',')
4881 {
4882 as_bad (_("invalid character %s in mnemonic"),
4883 output_invalid (*l));
4884 return NULL;
4885 }
4886
4887 /* Check if instruction is supported on specified architecture. */
4888 supported = 0;
4889 for (t = current_templates->start; t < current_templates->end; ++t)
4890 {
4891 supported |= cpu_flags_match (t);
4892 if (supported == CPU_FLAGS_PERFECT_MATCH)
4893 {
4894 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4895 as_warn (_("use .code16 to ensure correct addressing mode"));
4896
4897 return l;
4898 }
4899 }
4900
4901 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4902 as_bad (flag_code == CODE_64BIT
4903 ? _("`%s' is not supported in 64-bit mode")
4904 : _("`%s' is only supported in 64-bit mode"),
4905 current_templates->start->name);
4906 else
4907 as_bad (_("`%s' is not supported on `%s%s'"),
4908 current_templates->start->name,
4909 cpu_arch_name ? cpu_arch_name : default_arch,
4910 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4911
4912 return NULL;
4913 }
4914
4915 static char *
4916 parse_operands (char *l, const char *mnemonic)
4917 {
4918 char *token_start;
4919
4920 /* 1 if operand is pending after ','. */
4921 unsigned int expecting_operand = 0;
4922
4923 /* Non-zero if operand parens not balanced. */
4924 unsigned int paren_not_balanced;
4925
4926 while (*l != END_OF_INSN)
4927 {
4928 /* Skip optional white space before operand. */
4929 if (is_space_char (*l))
4930 ++l;
4931 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4932 {
4933 as_bad (_("invalid character %s before operand %d"),
4934 output_invalid (*l),
4935 i.operands + 1);
4936 return NULL;
4937 }
4938 token_start = l; /* After white space. */
4939 paren_not_balanced = 0;
4940 while (paren_not_balanced || *l != ',')
4941 {
4942 if (*l == END_OF_INSN)
4943 {
4944 if (paren_not_balanced)
4945 {
4946 if (!intel_syntax)
4947 as_bad (_("unbalanced parenthesis in operand %d."),
4948 i.operands + 1);
4949 else
4950 as_bad (_("unbalanced brackets in operand %d."),
4951 i.operands + 1);
4952 return NULL;
4953 }
4954 else
4955 break; /* we are done */
4956 }
4957 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4958 {
4959 as_bad (_("invalid character %s in operand %d"),
4960 output_invalid (*l),
4961 i.operands + 1);
4962 return NULL;
4963 }
4964 if (!intel_syntax)
4965 {
4966 if (*l == '(')
4967 ++paren_not_balanced;
4968 if (*l == ')')
4969 --paren_not_balanced;
4970 }
4971 else
4972 {
4973 if (*l == '[')
4974 ++paren_not_balanced;
4975 if (*l == ']')
4976 --paren_not_balanced;
4977 }
4978 l++;
4979 }
4980 if (l != token_start)
4981 { /* Yes, we've read in another operand. */
4982 unsigned int operand_ok;
4983 this_operand = i.operands++;
4984 if (i.operands > MAX_OPERANDS)
4985 {
4986 as_bad (_("spurious operands; (%d operands/instruction max)"),
4987 MAX_OPERANDS);
4988 return NULL;
4989 }
4990 i.types[this_operand].bitfield.unspecified = 1;
4991 /* Now parse operand adding info to 'i' as we go along. */
4992 END_STRING_AND_SAVE (l);
4993
4994 if (i.mem_operands > 1)
4995 {
4996 as_bad (_("too many memory references for `%s'"),
4997 mnemonic);
4998 return 0;
4999 }
5000
5001 if (intel_syntax)
5002 operand_ok =
5003 i386_intel_operand (token_start,
5004 intel_float_operand (mnemonic));
5005 else
5006 operand_ok = i386_att_operand (token_start);
5007
5008 RESTORE_END_STRING (l);
5009 if (!operand_ok)
5010 return NULL;
5011 }
5012 else
5013 {
5014 if (expecting_operand)
5015 {
5016 expecting_operand_after_comma:
5017 as_bad (_("expecting operand after ','; got nothing"));
5018 return NULL;
5019 }
5020 if (*l == ',')
5021 {
5022 as_bad (_("expecting operand before ','; got nothing"));
5023 return NULL;
5024 }
5025 }
5026
5027 /* Now *l must be either ',' or END_OF_INSN. */
5028 if (*l == ',')
5029 {
5030 if (*++l == END_OF_INSN)
5031 {
5032 /* Just skip it, if it's \n complain. */
5033 goto expecting_operand_after_comma;
5034 }
5035 expecting_operand = 1;
5036 }
5037 }
5038 return l;
5039 }
5040
5041 static void
5042 swap_2_operands (int xchg1, int xchg2)
5043 {
5044 union i386_op temp_op;
5045 i386_operand_type temp_type;
5046 unsigned int temp_flags;
5047 enum bfd_reloc_code_real temp_reloc;
5048
5049 temp_type = i.types[xchg2];
5050 i.types[xchg2] = i.types[xchg1];
5051 i.types[xchg1] = temp_type;
5052
5053 temp_flags = i.flags[xchg2];
5054 i.flags[xchg2] = i.flags[xchg1];
5055 i.flags[xchg1] = temp_flags;
5056
5057 temp_op = i.op[xchg2];
5058 i.op[xchg2] = i.op[xchg1];
5059 i.op[xchg1] = temp_op;
5060
5061 temp_reloc = i.reloc[xchg2];
5062 i.reloc[xchg2] = i.reloc[xchg1];
5063 i.reloc[xchg1] = temp_reloc;
5064
5065 if (i.mask)
5066 {
5067 if (i.mask->operand == xchg1)
5068 i.mask->operand = xchg2;
5069 else if (i.mask->operand == xchg2)
5070 i.mask->operand = xchg1;
5071 }
5072 if (i.broadcast)
5073 {
5074 if (i.broadcast->operand == xchg1)
5075 i.broadcast->operand = xchg2;
5076 else if (i.broadcast->operand == xchg2)
5077 i.broadcast->operand = xchg1;
5078 }
5079 if (i.rounding)
5080 {
5081 if (i.rounding->operand == xchg1)
5082 i.rounding->operand = xchg2;
5083 else if (i.rounding->operand == xchg2)
5084 i.rounding->operand = xchg1;
5085 }
5086 }
5087
5088 static void
5089 swap_operands (void)
5090 {
5091 switch (i.operands)
5092 {
5093 case 5:
5094 case 4:
5095 swap_2_operands (1, i.operands - 2);
5096 /* Fall through. */
5097 case 3:
5098 case 2:
5099 swap_2_operands (0, i.operands - 1);
5100 break;
5101 default:
5102 abort ();
5103 }
5104
5105 if (i.mem_operands == 2)
5106 {
5107 const seg_entry *temp_seg;
5108 temp_seg = i.seg[0];
5109 i.seg[0] = i.seg[1];
5110 i.seg[1] = temp_seg;
5111 }
5112 }
5113
5114 /* Try to ensure constant immediates are represented in the smallest
5115 opcode possible. */
5116 static void
5117 optimize_imm (void)
5118 {
5119 char guess_suffix = 0;
5120 int op;
5121
5122 if (i.suffix)
5123 guess_suffix = i.suffix;
5124 else if (i.reg_operands)
5125 {
5126 /* Figure out a suffix from the last register operand specified.
5127 We can't do this properly yet, i.e. excluding special register
5128 instances, but the following works for instructions with
5129 immediates. In any case, we can't set i.suffix yet. */
5130 for (op = i.operands; --op >= 0;)
5131 if (i.types[op].bitfield.class != Reg)
5132 continue;
5133 else if (i.types[op].bitfield.byte)
5134 {
5135 guess_suffix = BYTE_MNEM_SUFFIX;
5136 break;
5137 }
5138 else if (i.types[op].bitfield.word)
5139 {
5140 guess_suffix = WORD_MNEM_SUFFIX;
5141 break;
5142 }
5143 else if (i.types[op].bitfield.dword)
5144 {
5145 guess_suffix = LONG_MNEM_SUFFIX;
5146 break;
5147 }
5148 else if (i.types[op].bitfield.qword)
5149 {
5150 guess_suffix = QWORD_MNEM_SUFFIX;
5151 break;
5152 }
5153 }
5154 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5155 guess_suffix = WORD_MNEM_SUFFIX;
5156
5157 for (op = i.operands; --op >= 0;)
5158 if (operand_type_check (i.types[op], imm))
5159 {
5160 switch (i.op[op].imms->X_op)
5161 {
5162 case O_constant:
5163 /* If a suffix is given, this operand may be shortened. */
5164 switch (guess_suffix)
5165 {
5166 case LONG_MNEM_SUFFIX:
5167 i.types[op].bitfield.imm32 = 1;
5168 i.types[op].bitfield.imm64 = 1;
5169 break;
5170 case WORD_MNEM_SUFFIX:
5171 i.types[op].bitfield.imm16 = 1;
5172 i.types[op].bitfield.imm32 = 1;
5173 i.types[op].bitfield.imm32s = 1;
5174 i.types[op].bitfield.imm64 = 1;
5175 break;
5176 case BYTE_MNEM_SUFFIX:
5177 i.types[op].bitfield.imm8 = 1;
5178 i.types[op].bitfield.imm8s = 1;
5179 i.types[op].bitfield.imm16 = 1;
5180 i.types[op].bitfield.imm32 = 1;
5181 i.types[op].bitfield.imm32s = 1;
5182 i.types[op].bitfield.imm64 = 1;
5183 break;
5184 }
5185
5186 /* If this operand is at most 16 bits, convert it
5187 to a signed 16 bit number before trying to see
5188 whether it will fit in an even smaller size.
5189 This allows a 16-bit operand such as $0xffe0 to
5190 be recognised as within Imm8S range. */
5191 if ((i.types[op].bitfield.imm16)
5192 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5193 {
5194 i.op[op].imms->X_add_number =
5195 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5196 }
5197 #ifdef BFD64
5198 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5199 if ((i.types[op].bitfield.imm32)
5200 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5201 == 0))
5202 {
5203 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5204 ^ ((offsetT) 1 << 31))
5205 - ((offsetT) 1 << 31));
5206 }
5207 #endif
5208 i.types[op]
5209 = operand_type_or (i.types[op],
5210 smallest_imm_type (i.op[op].imms->X_add_number));
5211
5212 /* We must avoid matching of Imm32 templates when 64bit
5213 only immediate is available. */
5214 if (guess_suffix == QWORD_MNEM_SUFFIX)
5215 i.types[op].bitfield.imm32 = 0;
5216 break;
5217
5218 case O_absent:
5219 case O_register:
5220 abort ();
5221
5222 /* Symbols and expressions. */
5223 default:
5224 /* Convert symbolic operand to proper sizes for matching, but don't
5225 prevent matching a set of insns that only supports sizes other
5226 than those matching the insn suffix. */
5227 {
5228 i386_operand_type mask, allowed;
5229 const insn_template *t;
5230
5231 operand_type_set (&mask, 0);
5232 operand_type_set (&allowed, 0);
5233
5234 for (t = current_templates->start;
5235 t < current_templates->end;
5236 ++t)
5237 {
5238 allowed = operand_type_or (allowed, t->operand_types[op]);
5239 allowed = operand_type_and (allowed, anyimm);
5240 }
5241 switch (guess_suffix)
5242 {
5243 case QWORD_MNEM_SUFFIX:
5244 mask.bitfield.imm64 = 1;
5245 mask.bitfield.imm32s = 1;
5246 break;
5247 case LONG_MNEM_SUFFIX:
5248 mask.bitfield.imm32 = 1;
5249 break;
5250 case WORD_MNEM_SUFFIX:
5251 mask.bitfield.imm16 = 1;
5252 break;
5253 case BYTE_MNEM_SUFFIX:
5254 mask.bitfield.imm8 = 1;
5255 break;
5256 default:
5257 break;
5258 }
5259 allowed = operand_type_and (mask, allowed);
5260 if (!operand_type_all_zero (&allowed))
5261 i.types[op] = operand_type_and (i.types[op], mask);
5262 }
5263 break;
5264 }
5265 }
5266 }
5267
5268 /* Try to use the smallest displacement type too. */
5269 static void
5270 optimize_disp (void)
5271 {
5272 int op;
5273
5274 for (op = i.operands; --op >= 0;)
5275 if (operand_type_check (i.types[op], disp))
5276 {
5277 if (i.op[op].disps->X_op == O_constant)
5278 {
5279 offsetT op_disp = i.op[op].disps->X_add_number;
5280
5281 if (i.types[op].bitfield.disp16
5282 && (op_disp & ~(offsetT) 0xffff) == 0)
5283 {
5284 /* If this operand is at most 16 bits, convert
5285 to a signed 16 bit number and don't use 64bit
5286 displacement. */
5287 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5288 i.types[op].bitfield.disp64 = 0;
5289 }
5290 #ifdef BFD64
5291 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5292 if (i.types[op].bitfield.disp32
5293 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5294 {
5295 /* If this operand is at most 32 bits, convert
5296 to a signed 32 bit number and don't use 64bit
5297 displacement. */
5298 op_disp &= (((offsetT) 2 << 31) - 1);
5299 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5300 i.types[op].bitfield.disp64 = 0;
5301 }
5302 #endif
5303 if (!op_disp && i.types[op].bitfield.baseindex)
5304 {
5305 i.types[op].bitfield.disp8 = 0;
5306 i.types[op].bitfield.disp16 = 0;
5307 i.types[op].bitfield.disp32 = 0;
5308 i.types[op].bitfield.disp32s = 0;
5309 i.types[op].bitfield.disp64 = 0;
5310 i.op[op].disps = 0;
5311 i.disp_operands--;
5312 }
5313 else if (flag_code == CODE_64BIT)
5314 {
5315 if (fits_in_signed_long (op_disp))
5316 {
5317 i.types[op].bitfield.disp64 = 0;
5318 i.types[op].bitfield.disp32s = 1;
5319 }
5320 if (i.prefix[ADDR_PREFIX]
5321 && fits_in_unsigned_long (op_disp))
5322 i.types[op].bitfield.disp32 = 1;
5323 }
5324 if ((i.types[op].bitfield.disp32
5325 || i.types[op].bitfield.disp32s
5326 || i.types[op].bitfield.disp16)
5327 && fits_in_disp8 (op_disp))
5328 i.types[op].bitfield.disp8 = 1;
5329 }
5330 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5331 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5332 {
5333 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5334 i.op[op].disps, 0, i.reloc[op]);
5335 i.types[op].bitfield.disp8 = 0;
5336 i.types[op].bitfield.disp16 = 0;
5337 i.types[op].bitfield.disp32 = 0;
5338 i.types[op].bitfield.disp32s = 0;
5339 i.types[op].bitfield.disp64 = 0;
5340 }
5341 else
5342 /* We only support 64bit displacement on constants. */
5343 i.types[op].bitfield.disp64 = 0;
5344 }
5345 }
5346
5347 /* Return 1 if there is a match in broadcast bytes between operand
5348 GIVEN and instruction template T. */
5349
5350 static INLINE int
5351 match_broadcast_size (const insn_template *t, unsigned int given)
5352 {
5353 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5354 && i.types[given].bitfield.byte)
5355 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5356 && i.types[given].bitfield.word)
5357 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5358 && i.types[given].bitfield.dword)
5359 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5360 && i.types[given].bitfield.qword));
5361 }
5362
5363 /* Check if operands are valid for the instruction. */
5364
5365 static int
5366 check_VecOperands (const insn_template *t)
5367 {
5368 unsigned int op;
5369 i386_cpu_flags cpu;
5370 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5371
5372 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5373 any one operand are implicity requiring AVX512VL support if the actual
5374 operand size is YMMword or XMMword. Since this function runs after
5375 template matching, there's no need to check for YMMword/XMMword in
5376 the template. */
5377 cpu = cpu_flags_and (t->cpu_flags, avx512);
5378 if (!cpu_flags_all_zero (&cpu)
5379 && !t->cpu_flags.bitfield.cpuavx512vl
5380 && !cpu_arch_flags.bitfield.cpuavx512vl)
5381 {
5382 for (op = 0; op < t->operands; ++op)
5383 {
5384 if (t->operand_types[op].bitfield.zmmword
5385 && (i.types[op].bitfield.ymmword
5386 || i.types[op].bitfield.xmmword))
5387 {
5388 i.error = unsupported;
5389 return 1;
5390 }
5391 }
5392 }
5393
5394 /* Without VSIB byte, we can't have a vector register for index. */
5395 if (!t->opcode_modifier.vecsib
5396 && i.index_reg
5397 && (i.index_reg->reg_type.bitfield.xmmword
5398 || i.index_reg->reg_type.bitfield.ymmword
5399 || i.index_reg->reg_type.bitfield.zmmword))
5400 {
5401 i.error = unsupported_vector_index_register;
5402 return 1;
5403 }
5404
5405 /* Check if default mask is allowed. */
5406 if (t->opcode_modifier.nodefmask
5407 && (!i.mask || i.mask->mask->reg_num == 0))
5408 {
5409 i.error = no_default_mask;
5410 return 1;
5411 }
5412
5413 /* For VSIB byte, we need a vector register for index, and all vector
5414 registers must be distinct. */
5415 if (t->opcode_modifier.vecsib)
5416 {
5417 if (!i.index_reg
5418 || !((t->opcode_modifier.vecsib == VecSIB128
5419 && i.index_reg->reg_type.bitfield.xmmword)
5420 || (t->opcode_modifier.vecsib == VecSIB256
5421 && i.index_reg->reg_type.bitfield.ymmword)
5422 || (t->opcode_modifier.vecsib == VecSIB512
5423 && i.index_reg->reg_type.bitfield.zmmword)))
5424 {
5425 i.error = invalid_vsib_address;
5426 return 1;
5427 }
5428
5429 gas_assert (i.reg_operands == 2 || i.mask);
5430 if (i.reg_operands == 2 && !i.mask)
5431 {
5432 gas_assert (i.types[0].bitfield.class == RegSIMD);
5433 gas_assert (i.types[0].bitfield.xmmword
5434 || i.types[0].bitfield.ymmword);
5435 gas_assert (i.types[2].bitfield.class == RegSIMD);
5436 gas_assert (i.types[2].bitfield.xmmword
5437 || i.types[2].bitfield.ymmword);
5438 if (operand_check == check_none)
5439 return 0;
5440 if (register_number (i.op[0].regs)
5441 != register_number (i.index_reg)
5442 && register_number (i.op[2].regs)
5443 != register_number (i.index_reg)
5444 && register_number (i.op[0].regs)
5445 != register_number (i.op[2].regs))
5446 return 0;
5447 if (operand_check == check_error)
5448 {
5449 i.error = invalid_vector_register_set;
5450 return 1;
5451 }
5452 as_warn (_("mask, index, and destination registers should be distinct"));
5453 }
5454 else if (i.reg_operands == 1 && i.mask)
5455 {
5456 if (i.types[1].bitfield.class == RegSIMD
5457 && (i.types[1].bitfield.xmmword
5458 || i.types[1].bitfield.ymmword
5459 || i.types[1].bitfield.zmmword)
5460 && (register_number (i.op[1].regs)
5461 == register_number (i.index_reg)))
5462 {
5463 if (operand_check == check_error)
5464 {
5465 i.error = invalid_vector_register_set;
5466 return 1;
5467 }
5468 if (operand_check != check_none)
5469 as_warn (_("index and destination registers should be distinct"));
5470 }
5471 }
5472 }
5473
5474 /* Check if broadcast is supported by the instruction and is applied
5475 to the memory operand. */
5476 if (i.broadcast)
5477 {
5478 i386_operand_type type, overlap;
5479
5480 /* Check if specified broadcast is supported in this instruction,
5481 and its broadcast bytes match the memory operand. */
5482 op = i.broadcast->operand;
5483 if (!t->opcode_modifier.broadcast
5484 || !(i.flags[op] & Operand_Mem)
5485 || (!i.types[op].bitfield.unspecified
5486 && !match_broadcast_size (t, op)))
5487 {
5488 bad_broadcast:
5489 i.error = unsupported_broadcast;
5490 return 1;
5491 }
5492
5493 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5494 * i.broadcast->type);
5495 operand_type_set (&type, 0);
5496 switch (i.broadcast->bytes)
5497 {
5498 case 2:
5499 type.bitfield.word = 1;
5500 break;
5501 case 4:
5502 type.bitfield.dword = 1;
5503 break;
5504 case 8:
5505 type.bitfield.qword = 1;
5506 break;
5507 case 16:
5508 type.bitfield.xmmword = 1;
5509 break;
5510 case 32:
5511 type.bitfield.ymmword = 1;
5512 break;
5513 case 64:
5514 type.bitfield.zmmword = 1;
5515 break;
5516 default:
5517 goto bad_broadcast;
5518 }
5519
5520 overlap = operand_type_and (type, t->operand_types[op]);
5521 if (operand_type_all_zero (&overlap))
5522 goto bad_broadcast;
5523
5524 if (t->opcode_modifier.checkregsize)
5525 {
5526 unsigned int j;
5527
5528 type.bitfield.baseindex = 1;
5529 for (j = 0; j < i.operands; ++j)
5530 {
5531 if (j != op
5532 && !operand_type_register_match(i.types[j],
5533 t->operand_types[j],
5534 type,
5535 t->operand_types[op]))
5536 goto bad_broadcast;
5537 }
5538 }
5539 }
5540 /* If broadcast is supported in this instruction, we need to check if
5541 operand of one-element size isn't specified without broadcast. */
5542 else if (t->opcode_modifier.broadcast && i.mem_operands)
5543 {
5544 /* Find memory operand. */
5545 for (op = 0; op < i.operands; op++)
5546 if (i.flags[op] & Operand_Mem)
5547 break;
5548 gas_assert (op < i.operands);
5549 /* Check size of the memory operand. */
5550 if (match_broadcast_size (t, op))
5551 {
5552 i.error = broadcast_needed;
5553 return 1;
5554 }
5555 }
5556 else
5557 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5558
5559 /* Check if requested masking is supported. */
5560 if (i.mask)
5561 {
5562 switch (t->opcode_modifier.masking)
5563 {
5564 case BOTH_MASKING:
5565 break;
5566 case MERGING_MASKING:
5567 if (i.mask->zeroing)
5568 {
5569 case 0:
5570 i.error = unsupported_masking;
5571 return 1;
5572 }
5573 break;
5574 case DYNAMIC_MASKING:
5575 /* Memory destinations allow only merging masking. */
5576 if (i.mask->zeroing && i.mem_operands)
5577 {
5578 /* Find memory operand. */
5579 for (op = 0; op < i.operands; op++)
5580 if (i.flags[op] & Operand_Mem)
5581 break;
5582 gas_assert (op < i.operands);
5583 if (op == i.operands - 1)
5584 {
5585 i.error = unsupported_masking;
5586 return 1;
5587 }
5588 }
5589 break;
5590 default:
5591 abort ();
5592 }
5593 }
5594
5595 /* Check if masking is applied to dest operand. */
5596 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5597 {
5598 i.error = mask_not_on_destination;
5599 return 1;
5600 }
5601
5602 /* Check RC/SAE. */
5603 if (i.rounding)
5604 {
5605 if (!t->opcode_modifier.sae
5606 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5607 {
5608 i.error = unsupported_rc_sae;
5609 return 1;
5610 }
5611 /* If the instruction has several immediate operands and one of
5612 them is rounding, the rounding operand should be the last
5613 immediate operand. */
5614 if (i.imm_operands > 1
5615 && i.rounding->operand != (int) (i.imm_operands - 1))
5616 {
5617 i.error = rc_sae_operand_not_last_imm;
5618 return 1;
5619 }
5620 }
5621
5622 /* Check vector Disp8 operand. */
5623 if (t->opcode_modifier.disp8memshift
5624 && i.disp_encoding != disp_encoding_32bit)
5625 {
5626 if (i.broadcast)
5627 i.memshift = t->opcode_modifier.broadcast - 1;
5628 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5629 i.memshift = t->opcode_modifier.disp8memshift;
5630 else
5631 {
5632 const i386_operand_type *type = NULL;
5633
5634 i.memshift = 0;
5635 for (op = 0; op < i.operands; op++)
5636 if (i.flags[op] & Operand_Mem)
5637 {
5638 if (t->opcode_modifier.evex == EVEXLIG)
5639 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5640 else if (t->operand_types[op].bitfield.xmmword
5641 + t->operand_types[op].bitfield.ymmword
5642 + t->operand_types[op].bitfield.zmmword <= 1)
5643 type = &t->operand_types[op];
5644 else if (!i.types[op].bitfield.unspecified)
5645 type = &i.types[op];
5646 }
5647 else if (i.types[op].bitfield.class == RegSIMD
5648 && t->opcode_modifier.evex != EVEXLIG)
5649 {
5650 if (i.types[op].bitfield.zmmword)
5651 i.memshift = 6;
5652 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5653 i.memshift = 5;
5654 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5655 i.memshift = 4;
5656 }
5657
5658 if (type)
5659 {
5660 if (type->bitfield.zmmword)
5661 i.memshift = 6;
5662 else if (type->bitfield.ymmword)
5663 i.memshift = 5;
5664 else if (type->bitfield.xmmword)
5665 i.memshift = 4;
5666 }
5667
5668 /* For the check in fits_in_disp8(). */
5669 if (i.memshift == 0)
5670 i.memshift = -1;
5671 }
5672
5673 for (op = 0; op < i.operands; op++)
5674 if (operand_type_check (i.types[op], disp)
5675 && i.op[op].disps->X_op == O_constant)
5676 {
5677 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5678 {
5679 i.types[op].bitfield.disp8 = 1;
5680 return 0;
5681 }
5682 i.types[op].bitfield.disp8 = 0;
5683 }
5684 }
5685
5686 i.memshift = 0;
5687
5688 return 0;
5689 }
5690
5691 /* Check if operands are valid for the instruction. Update VEX
5692 operand types. */
5693
5694 static int
5695 VEX_check_operands (const insn_template *t)
5696 {
5697 if (i.vec_encoding == vex_encoding_evex)
5698 {
5699 /* This instruction must be encoded with EVEX prefix. */
5700 if (!is_evex_encoding (t))
5701 {
5702 i.error = unsupported;
5703 return 1;
5704 }
5705 return 0;
5706 }
5707
5708 if (!t->opcode_modifier.vex)
5709 {
5710 /* This instruction template doesn't have VEX prefix. */
5711 if (i.vec_encoding != vex_encoding_default)
5712 {
5713 i.error = unsupported;
5714 return 1;
5715 }
5716 return 0;
5717 }
5718
5719 /* Check the special Imm4 cases; must be the first operand. */
5720 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5721 {
5722 if (i.op[0].imms->X_op != O_constant
5723 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5724 {
5725 i.error = bad_imm4;
5726 return 1;
5727 }
5728
5729 /* Turn off Imm<N> so that update_imm won't complain. */
5730 operand_type_set (&i.types[0], 0);
5731 }
5732
5733 return 0;
5734 }
5735
5736 static const insn_template *
5737 match_template (char mnem_suffix)
5738 {
5739 /* Points to template once we've found it. */
5740 const insn_template *t;
5741 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5742 i386_operand_type overlap4;
5743 unsigned int found_reverse_match;
5744 i386_opcode_modifier suffix_check;
5745 i386_operand_type operand_types [MAX_OPERANDS];
5746 int addr_prefix_disp;
5747 unsigned int j;
5748 unsigned int found_cpu_match, size_match;
5749 unsigned int check_register;
5750 enum i386_error specific_error = 0;
5751
5752 #if MAX_OPERANDS != 5
5753 # error "MAX_OPERANDS must be 5."
5754 #endif
5755
5756 found_reverse_match = 0;
5757 addr_prefix_disp = -1;
5758
5759 /* Prepare for mnemonic suffix check. */
5760 memset (&suffix_check, 0, sizeof (suffix_check));
5761 switch (mnem_suffix)
5762 {
5763 case BYTE_MNEM_SUFFIX:
5764 suffix_check.no_bsuf = 1;
5765 break;
5766 case WORD_MNEM_SUFFIX:
5767 suffix_check.no_wsuf = 1;
5768 break;
5769 case SHORT_MNEM_SUFFIX:
5770 suffix_check.no_ssuf = 1;
5771 break;
5772 case LONG_MNEM_SUFFIX:
5773 suffix_check.no_lsuf = 1;
5774 break;
5775 case QWORD_MNEM_SUFFIX:
5776 suffix_check.no_qsuf = 1;
5777 break;
5778 default:
5779 /* NB: In Intel syntax, normally we can check for memory operand
5780 size when there is no mnemonic suffix. But jmp and call have
5781 2 different encodings with Dword memory operand size, one with
5782 No_ldSuf and the other without. i.suffix is set to
5783 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
5784 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5785 suffix_check.no_ldsuf = 1;
5786 }
5787
5788 /* Must have right number of operands. */
5789 i.error = number_of_operands_mismatch;
5790
5791 for (t = current_templates->start; t < current_templates->end; t++)
5792 {
5793 addr_prefix_disp = -1;
5794 found_reverse_match = 0;
5795
5796 if (i.operands != t->operands)
5797 continue;
5798
5799 /* Check processor support. */
5800 i.error = unsupported;
5801 found_cpu_match = (cpu_flags_match (t)
5802 == CPU_FLAGS_PERFECT_MATCH);
5803 if (!found_cpu_match)
5804 continue;
5805
5806 /* Check AT&T mnemonic. */
5807 i.error = unsupported_with_intel_mnemonic;
5808 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5809 continue;
5810
5811 /* Check AT&T/Intel syntax and Intel64/AMD64 ISA. */
5812 i.error = unsupported_syntax;
5813 if ((intel_syntax && t->opcode_modifier.attsyntax)
5814 || (!intel_syntax && t->opcode_modifier.intelsyntax)
5815 || (intel64 && t->opcode_modifier.amd64)
5816 || (!intel64 && t->opcode_modifier.intel64))
5817 continue;
5818
5819 /* Check the suffix. */
5820 i.error = invalid_instruction_suffix;
5821 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5822 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5823 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5824 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5825 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5826 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5827 continue;
5828
5829 size_match = operand_size_match (t);
5830 if (!size_match)
5831 continue;
5832
5833 /* This is intentionally not
5834
5835 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
5836
5837 as the case of a missing * on the operand is accepted (perhaps with
5838 a warning, issued further down). */
5839 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5840 {
5841 i.error = operand_type_mismatch;
5842 continue;
5843 }
5844
5845 for (j = 0; j < MAX_OPERANDS; j++)
5846 operand_types[j] = t->operand_types[j];
5847
5848 /* In general, don't allow 64-bit operands in 32-bit mode. */
5849 if (i.suffix == QWORD_MNEM_SUFFIX
5850 && flag_code != CODE_64BIT
5851 && (intel_syntax
5852 ? (!t->opcode_modifier.ignoresize
5853 && !t->opcode_modifier.broadcast
5854 && !intel_float_operand (t->name))
5855 : intel_float_operand (t->name) != 2)
5856 && ((operand_types[0].bitfield.class != RegMMX
5857 && operand_types[0].bitfield.class != RegSIMD)
5858 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5859 && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5860 && (t->base_opcode != 0x0fc7
5861 || t->extension_opcode != 1 /* cmpxchg8b */))
5862 continue;
5863
5864 /* In general, don't allow 32-bit operands on pre-386. */
5865 else if (i.suffix == LONG_MNEM_SUFFIX
5866 && !cpu_arch_flags.bitfield.cpui386
5867 && (intel_syntax
5868 ? (!t->opcode_modifier.ignoresize
5869 && !intel_float_operand (t->name))
5870 : intel_float_operand (t->name) != 2)
5871 && ((operand_types[0].bitfield.class != RegMMX
5872 && operand_types[0].bitfield.class != RegSIMD)
5873 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5874 && operand_types[t->operands > 1].bitfield.class
5875 != RegSIMD)))
5876 continue;
5877
5878 /* Do not verify operands when there are none. */
5879 else
5880 {
5881 if (!t->operands)
5882 /* We've found a match; break out of loop. */
5883 break;
5884 }
5885
5886 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
5887 into Disp32/Disp16/Disp32 operand. */
5888 if (i.prefix[ADDR_PREFIX] != 0)
5889 {
5890 /* There should be only one Disp operand. */
5891 switch (flag_code)
5892 {
5893 case CODE_16BIT:
5894 for (j = 0; j < MAX_OPERANDS; j++)
5895 {
5896 if (operand_types[j].bitfield.disp16)
5897 {
5898 addr_prefix_disp = j;
5899 operand_types[j].bitfield.disp32 = 1;
5900 operand_types[j].bitfield.disp16 = 0;
5901 break;
5902 }
5903 }
5904 break;
5905 case CODE_32BIT:
5906 for (j = 0; j < MAX_OPERANDS; j++)
5907 {
5908 if (operand_types[j].bitfield.disp32)
5909 {
5910 addr_prefix_disp = j;
5911 operand_types[j].bitfield.disp32 = 0;
5912 operand_types[j].bitfield.disp16 = 1;
5913 break;
5914 }
5915 }
5916 break;
5917 case CODE_64BIT:
5918 for (j = 0; j < MAX_OPERANDS; j++)
5919 {
5920 if (operand_types[j].bitfield.disp64)
5921 {
5922 addr_prefix_disp = j;
5923 operand_types[j].bitfield.disp64 = 0;
5924 operand_types[j].bitfield.disp32 = 1;
5925 break;
5926 }
5927 }
5928 break;
5929 }
5930 }
5931
5932 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5933 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5934 continue;
5935
5936 /* We check register size if needed. */
5937 if (t->opcode_modifier.checkregsize)
5938 {
5939 check_register = (1 << t->operands) - 1;
5940 if (i.broadcast)
5941 check_register &= ~(1 << i.broadcast->operand);
5942 }
5943 else
5944 check_register = 0;
5945
5946 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5947 switch (t->operands)
5948 {
5949 case 1:
5950 if (!operand_type_match (overlap0, i.types[0]))
5951 continue;
5952 break;
5953 case 2:
5954 /* xchg %eax, %eax is a special case. It is an alias for nop
5955 only in 32bit mode and we can use opcode 0x90. In 64bit
5956 mode, we can't use 0x90 for xchg %eax, %eax since it should
5957 zero-extend %eax to %rax. */
5958 if (flag_code == CODE_64BIT
5959 && t->base_opcode == 0x90
5960 && i.types[0].bitfield.instance == Accum
5961 && i.types[0].bitfield.dword
5962 && i.types[1].bitfield.instance == Accum
5963 && i.types[1].bitfield.dword)
5964 continue;
5965 /* xrelease mov %eax, <disp> is another special case. It must not
5966 match the accumulator-only encoding of mov. */
5967 if (flag_code != CODE_64BIT
5968 && i.hle_prefix
5969 && t->base_opcode == 0xa0
5970 && i.types[0].bitfield.instance == Accum
5971 && (i.flags[1] & Operand_Mem))
5972 continue;
5973 /* Fall through. */
5974
5975 case 3:
5976 if (!(size_match & MATCH_STRAIGHT))
5977 goto check_reverse;
5978 /* Reverse direction of operands if swapping is possible in the first
5979 place (operands need to be symmetric) and
5980 - the load form is requested, and the template is a store form,
5981 - the store form is requested, and the template is a load form,
5982 - the non-default (swapped) form is requested. */
5983 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5984 if (t->opcode_modifier.d && i.reg_operands == i.operands
5985 && !operand_type_all_zero (&overlap1))
5986 switch (i.dir_encoding)
5987 {
5988 case dir_encoding_load:
5989 if (operand_type_check (operand_types[i.operands - 1], anymem)
5990 || t->opcode_modifier.regmem)
5991 goto check_reverse;
5992 break;
5993
5994 case dir_encoding_store:
5995 if (!operand_type_check (operand_types[i.operands - 1], anymem)
5996 && !t->opcode_modifier.regmem)
5997 goto check_reverse;
5998 break;
5999
6000 case dir_encoding_swap:
6001 goto check_reverse;
6002
6003 case dir_encoding_default:
6004 break;
6005 }
6006 /* If we want store form, we skip the current load. */
6007 if ((i.dir_encoding == dir_encoding_store
6008 || i.dir_encoding == dir_encoding_swap)
6009 && i.mem_operands == 0
6010 && t->opcode_modifier.load)
6011 continue;
6012 /* Fall through. */
6013 case 4:
6014 case 5:
6015 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6016 if (!operand_type_match (overlap0, i.types[0])
6017 || !operand_type_match (overlap1, i.types[1])
6018 || ((check_register & 3) == 3
6019 && !operand_type_register_match (i.types[0],
6020 operand_types[0],
6021 i.types[1],
6022 operand_types[1])))
6023 {
6024 /* Check if other direction is valid ... */
6025 if (!t->opcode_modifier.d)
6026 continue;
6027
6028 check_reverse:
6029 if (!(size_match & MATCH_REVERSE))
6030 continue;
6031 /* Try reversing direction of operands. */
6032 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6033 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6034 if (!operand_type_match (overlap0, i.types[0])
6035 || !operand_type_match (overlap1, i.types[i.operands - 1])
6036 || (check_register
6037 && !operand_type_register_match (i.types[0],
6038 operand_types[i.operands - 1],
6039 i.types[i.operands - 1],
6040 operand_types[0])))
6041 {
6042 /* Does not match either direction. */
6043 continue;
6044 }
6045 /* found_reverse_match holds which of D or FloatR
6046 we've found. */
6047 if (!t->opcode_modifier.d)
6048 found_reverse_match = 0;
6049 else if (operand_types[0].bitfield.tbyte)
6050 found_reverse_match = Opcode_FloatD;
6051 else if (operand_types[0].bitfield.xmmword
6052 || operand_types[i.operands - 1].bitfield.xmmword
6053 || operand_types[0].bitfield.class == RegMMX
6054 || operand_types[i.operands - 1].bitfield.class == RegMMX
6055 || is_any_vex_encoding(t))
6056 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6057 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6058 else
6059 found_reverse_match = Opcode_D;
6060 if (t->opcode_modifier.floatr)
6061 found_reverse_match |= Opcode_FloatR;
6062 }
6063 else
6064 {
6065 /* Found a forward 2 operand match here. */
6066 switch (t->operands)
6067 {
6068 case 5:
6069 overlap4 = operand_type_and (i.types[4],
6070 operand_types[4]);
6071 /* Fall through. */
6072 case 4:
6073 overlap3 = operand_type_and (i.types[3],
6074 operand_types[3]);
6075 /* Fall through. */
6076 case 3:
6077 overlap2 = operand_type_and (i.types[2],
6078 operand_types[2]);
6079 break;
6080 }
6081
6082 switch (t->operands)
6083 {
6084 case 5:
6085 if (!operand_type_match (overlap4, i.types[4])
6086 || !operand_type_register_match (i.types[3],
6087 operand_types[3],
6088 i.types[4],
6089 operand_types[4]))
6090 continue;
6091 /* Fall through. */
6092 case 4:
6093 if (!operand_type_match (overlap3, i.types[3])
6094 || ((check_register & 0xa) == 0xa
6095 && !operand_type_register_match (i.types[1],
6096 operand_types[1],
6097 i.types[3],
6098 operand_types[3]))
6099 || ((check_register & 0xc) == 0xc
6100 && !operand_type_register_match (i.types[2],
6101 operand_types[2],
6102 i.types[3],
6103 operand_types[3])))
6104 continue;
6105 /* Fall through. */
6106 case 3:
6107 /* Here we make use of the fact that there are no
6108 reverse match 3 operand instructions. */
6109 if (!operand_type_match (overlap2, i.types[2])
6110 || ((check_register & 5) == 5
6111 && !operand_type_register_match (i.types[0],
6112 operand_types[0],
6113 i.types[2],
6114 operand_types[2]))
6115 || ((check_register & 6) == 6
6116 && !operand_type_register_match (i.types[1],
6117 operand_types[1],
6118 i.types[2],
6119 operand_types[2])))
6120 continue;
6121 break;
6122 }
6123 }
6124 /* Found either forward/reverse 2, 3 or 4 operand match here:
6125 slip through to break. */
6126 }
6127 if (!found_cpu_match)
6128 continue;
6129
6130 /* Check if vector and VEX operands are valid. */
6131 if (check_VecOperands (t) || VEX_check_operands (t))
6132 {
6133 specific_error = i.error;
6134 continue;
6135 }
6136
6137 /* We've found a match; break out of loop. */
6138 break;
6139 }
6140
6141 if (t == current_templates->end)
6142 {
6143 /* We found no match. */
6144 const char *err_msg;
6145 switch (specific_error ? specific_error : i.error)
6146 {
6147 default:
6148 abort ();
6149 case operand_size_mismatch:
6150 err_msg = _("operand size mismatch");
6151 break;
6152 case operand_type_mismatch:
6153 err_msg = _("operand type mismatch");
6154 break;
6155 case register_type_mismatch:
6156 err_msg = _("register type mismatch");
6157 break;
6158 case number_of_operands_mismatch:
6159 err_msg = _("number of operands mismatch");
6160 break;
6161 case invalid_instruction_suffix:
6162 err_msg = _("invalid instruction suffix");
6163 break;
6164 case bad_imm4:
6165 err_msg = _("constant doesn't fit in 4 bits");
6166 break;
6167 case unsupported_with_intel_mnemonic:
6168 err_msg = _("unsupported with Intel mnemonic");
6169 break;
6170 case unsupported_syntax:
6171 err_msg = _("unsupported syntax");
6172 break;
6173 case unsupported:
6174 as_bad (_("unsupported instruction `%s'"),
6175 current_templates->start->name);
6176 return NULL;
6177 case invalid_vsib_address:
6178 err_msg = _("invalid VSIB address");
6179 break;
6180 case invalid_vector_register_set:
6181 err_msg = _("mask, index, and destination registers must be distinct");
6182 break;
6183 case unsupported_vector_index_register:
6184 err_msg = _("unsupported vector index register");
6185 break;
6186 case unsupported_broadcast:
6187 err_msg = _("unsupported broadcast");
6188 break;
6189 case broadcast_needed:
6190 err_msg = _("broadcast is needed for operand of such type");
6191 break;
6192 case unsupported_masking:
6193 err_msg = _("unsupported masking");
6194 break;
6195 case mask_not_on_destination:
6196 err_msg = _("mask not on destination operand");
6197 break;
6198 case no_default_mask:
6199 err_msg = _("default mask isn't allowed");
6200 break;
6201 case unsupported_rc_sae:
6202 err_msg = _("unsupported static rounding/sae");
6203 break;
6204 case rc_sae_operand_not_last_imm:
6205 if (intel_syntax)
6206 err_msg = _("RC/SAE operand must precede immediate operands");
6207 else
6208 err_msg = _("RC/SAE operand must follow immediate operands");
6209 break;
6210 case invalid_register_operand:
6211 err_msg = _("invalid register operand");
6212 break;
6213 }
6214 as_bad (_("%s for `%s'"), err_msg,
6215 current_templates->start->name);
6216 return NULL;
6217 }
6218
6219 if (!quiet_warnings)
6220 {
6221 if (!intel_syntax
6222 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6223 as_warn (_("indirect %s without `*'"), t->name);
6224
6225 if (t->opcode_modifier.isprefix
6226 && t->opcode_modifier.ignoresize)
6227 {
6228 /* Warn them that a data or address size prefix doesn't
6229 affect assembly of the next line of code. */
6230 as_warn (_("stand-alone `%s' prefix"), t->name);
6231 }
6232 }
6233
6234 /* Copy the template we found. */
6235 i.tm = *t;
6236
6237 if (addr_prefix_disp != -1)
6238 i.tm.operand_types[addr_prefix_disp]
6239 = operand_types[addr_prefix_disp];
6240
6241 if (found_reverse_match)
6242 {
6243 /* If we found a reverse match we must alter the opcode direction
6244 bit and clear/flip the regmem modifier one. found_reverse_match
6245 holds bits to change (different for int & float insns). */
6246
6247 i.tm.base_opcode ^= found_reverse_match;
6248
6249 i.tm.operand_types[0] = operand_types[i.operands - 1];
6250 i.tm.operand_types[i.operands - 1] = operand_types[0];
6251
6252 /* Certain SIMD insns have their load forms specified in the opcode
6253 table, and hence we need to _set_ RegMem instead of clearing it.
6254 We need to avoid setting the bit though on insns like KMOVW. */
6255 i.tm.opcode_modifier.regmem
6256 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6257 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6258 && !i.tm.opcode_modifier.regmem;
6259 }
6260
6261 return t;
6262 }
6263
6264 static int
6265 check_string (void)
6266 {
6267 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6268 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6269
6270 if (i.seg[op] != NULL && i.seg[op] != &es)
6271 {
6272 as_bad (_("`%s' operand %u must use `%ses' segment"),
6273 i.tm.name,
6274 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6275 register_prefix);
6276 return 0;
6277 }
6278
6279 /* There's only ever one segment override allowed per instruction.
6280 This instruction possibly has a legal segment override on the
6281 second operand, so copy the segment to where non-string
6282 instructions store it, allowing common code. */
6283 i.seg[op] = i.seg[1];
6284
6285 return 1;
6286 }
6287
6288 static int
6289 process_suffix (void)
6290 {
6291 /* If matched instruction specifies an explicit instruction mnemonic
6292 suffix, use it. */
6293 if (i.tm.opcode_modifier.size == SIZE16)
6294 i.suffix = WORD_MNEM_SUFFIX;
6295 else if (i.tm.opcode_modifier.size == SIZE32)
6296 i.suffix = LONG_MNEM_SUFFIX;
6297 else if (i.tm.opcode_modifier.size == SIZE64)
6298 i.suffix = QWORD_MNEM_SUFFIX;
6299 else if (i.reg_operands
6300 && (i.operands > 1 || i.types[0].bitfield.class == Reg))
6301 {
6302 /* If there's no instruction mnemonic suffix we try to invent one
6303 based on GPR operands. */
6304 if (!i.suffix)
6305 {
6306 /* We take i.suffix from the last register operand specified,
6307 Destination register type is more significant than source
6308 register type. crc32 in SSE4.2 prefers source register
6309 type. */
6310 if (i.tm.base_opcode == 0xf20f38f0
6311 && i.types[0].bitfield.class == Reg)
6312 {
6313 if (i.types[0].bitfield.byte)
6314 i.suffix = BYTE_MNEM_SUFFIX;
6315 else if (i.types[0].bitfield.word)
6316 i.suffix = WORD_MNEM_SUFFIX;
6317 else if (i.types[0].bitfield.dword)
6318 i.suffix = LONG_MNEM_SUFFIX;
6319 else if (i.types[0].bitfield.qword)
6320 i.suffix = QWORD_MNEM_SUFFIX;
6321 }
6322
6323 if (!i.suffix)
6324 {
6325 int op;
6326
6327 if (i.tm.base_opcode == 0xf20f38f0)
6328 {
6329 /* We have to know the operand size for crc32. */
6330 as_bad (_("ambiguous memory operand size for `%s`"),
6331 i.tm.name);
6332 return 0;
6333 }
6334
6335 for (op = i.operands; --op >= 0;)
6336 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6337 || i.tm.operand_types[op].bitfield.instance == Accum)
6338 {
6339 if (i.types[op].bitfield.class != Reg)
6340 continue;
6341 if (i.types[op].bitfield.byte)
6342 i.suffix = BYTE_MNEM_SUFFIX;
6343 else if (i.types[op].bitfield.word)
6344 i.suffix = WORD_MNEM_SUFFIX;
6345 else if (i.types[op].bitfield.dword)
6346 i.suffix = LONG_MNEM_SUFFIX;
6347 else if (i.types[op].bitfield.qword)
6348 i.suffix = QWORD_MNEM_SUFFIX;
6349 else
6350 continue;
6351 break;
6352 }
6353 }
6354 }
6355 else if (i.suffix == BYTE_MNEM_SUFFIX)
6356 {
6357 if (intel_syntax
6358 && i.tm.opcode_modifier.ignoresize
6359 && i.tm.opcode_modifier.no_bsuf)
6360 i.suffix = 0;
6361 else if (!check_byte_reg ())
6362 return 0;
6363 }
6364 else if (i.suffix == LONG_MNEM_SUFFIX)
6365 {
6366 if (intel_syntax
6367 && i.tm.opcode_modifier.ignoresize
6368 && i.tm.opcode_modifier.no_lsuf
6369 && !i.tm.opcode_modifier.todword
6370 && !i.tm.opcode_modifier.toqword)
6371 i.suffix = 0;
6372 else if (!check_long_reg ())
6373 return 0;
6374 }
6375 else if (i.suffix == QWORD_MNEM_SUFFIX)
6376 {
6377 if (intel_syntax
6378 && i.tm.opcode_modifier.ignoresize
6379 && i.tm.opcode_modifier.no_qsuf
6380 && !i.tm.opcode_modifier.todword
6381 && !i.tm.opcode_modifier.toqword)
6382 i.suffix = 0;
6383 else if (!check_qword_reg ())
6384 return 0;
6385 }
6386 else if (i.suffix == WORD_MNEM_SUFFIX)
6387 {
6388 if (intel_syntax
6389 && i.tm.opcode_modifier.ignoresize
6390 && i.tm.opcode_modifier.no_wsuf)
6391 i.suffix = 0;
6392 else if (!check_word_reg ())
6393 return 0;
6394 }
6395 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6396 /* Do nothing if the instruction is going to ignore the prefix. */
6397 ;
6398 else
6399 abort ();
6400 }
6401 else if (i.tm.opcode_modifier.defaultsize
6402 && !i.suffix
6403 /* exclude fldenv/frstor/fsave/fstenv */
6404 && i.tm.opcode_modifier.no_ssuf
6405 /* exclude sysret */
6406 && i.tm.base_opcode != 0x0f07)
6407 {
6408 i.suffix = stackop_size;
6409 if (stackop_size == LONG_MNEM_SUFFIX)
6410 {
6411 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6412 .code16gcc directive to support 16-bit mode with
6413 32-bit address. For IRET without a suffix, generate
6414 16-bit IRET (opcode 0xcf) to return from an interrupt
6415 handler. */
6416 if (i.tm.base_opcode == 0xcf)
6417 {
6418 i.suffix = WORD_MNEM_SUFFIX;
6419 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6420 }
6421 /* Warn about changed behavior for segment register push/pop. */
6422 else if ((i.tm.base_opcode | 1) == 0x07)
6423 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6424 i.tm.name);
6425 }
6426 }
6427 else if (intel_syntax
6428 && !i.suffix
6429 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6430 || i.tm.opcode_modifier.jump == JUMP_BYTE
6431 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6432 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6433 && i.tm.extension_opcode <= 3)))
6434 {
6435 switch (flag_code)
6436 {
6437 case CODE_64BIT:
6438 if (!i.tm.opcode_modifier.no_qsuf)
6439 {
6440 i.suffix = QWORD_MNEM_SUFFIX;
6441 break;
6442 }
6443 /* Fall through. */
6444 case CODE_32BIT:
6445 if (!i.tm.opcode_modifier.no_lsuf)
6446 i.suffix = LONG_MNEM_SUFFIX;
6447 break;
6448 case CODE_16BIT:
6449 if (!i.tm.opcode_modifier.no_wsuf)
6450 i.suffix = WORD_MNEM_SUFFIX;
6451 break;
6452 }
6453 }
6454
6455 if (!i.suffix)
6456 {
6457 if (!intel_syntax)
6458 {
6459 if (i.tm.opcode_modifier.w)
6460 {
6461 as_bad (_("no instruction mnemonic suffix given and "
6462 "no register operands; can't size instruction"));
6463 return 0;
6464 }
6465 }
6466 else
6467 {
6468 unsigned int suffixes;
6469
6470 suffixes = !i.tm.opcode_modifier.no_bsuf;
6471 if (!i.tm.opcode_modifier.no_wsuf)
6472 suffixes |= 1 << 1;
6473 if (!i.tm.opcode_modifier.no_lsuf)
6474 suffixes |= 1 << 2;
6475 if (!i.tm.opcode_modifier.no_ldsuf)
6476 suffixes |= 1 << 3;
6477 if (!i.tm.opcode_modifier.no_ssuf)
6478 suffixes |= 1 << 4;
6479 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6480 suffixes |= 1 << 5;
6481
6482 /* There are more than suffix matches. */
6483 if (i.tm.opcode_modifier.w
6484 || ((suffixes & (suffixes - 1))
6485 && !i.tm.opcode_modifier.defaultsize
6486 && !i.tm.opcode_modifier.ignoresize))
6487 {
6488 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6489 return 0;
6490 }
6491 }
6492 }
6493
6494 /* Change the opcode based on the operand size given by i.suffix. */
6495 switch (i.suffix)
6496 {
6497 /* Size floating point instruction. */
6498 case LONG_MNEM_SUFFIX:
6499 if (i.tm.opcode_modifier.floatmf)
6500 {
6501 i.tm.base_opcode ^= 4;
6502 break;
6503 }
6504 /* fall through */
6505 case WORD_MNEM_SUFFIX:
6506 case QWORD_MNEM_SUFFIX:
6507 /* It's not a byte, select word/dword operation. */
6508 if (i.tm.opcode_modifier.w)
6509 {
6510 if (i.tm.opcode_modifier.shortform)
6511 i.tm.base_opcode |= 8;
6512 else
6513 i.tm.base_opcode |= 1;
6514 }
6515 /* fall through */
6516 case SHORT_MNEM_SUFFIX:
6517 /* Now select between word & dword operations via the operand
6518 size prefix, except for instructions that will ignore this
6519 prefix anyway. */
6520 if (i.reg_operands > 0
6521 && i.types[0].bitfield.class == Reg
6522 && i.tm.opcode_modifier.addrprefixopreg
6523 && (i.tm.operand_types[0].bitfield.instance == Accum
6524 || i.operands == 1))
6525 {
6526 /* The address size override prefix changes the size of the
6527 first operand. */
6528 if ((flag_code == CODE_32BIT
6529 && i.op[0].regs->reg_type.bitfield.word)
6530 || (flag_code != CODE_32BIT
6531 && i.op[0].regs->reg_type.bitfield.dword))
6532 if (!add_prefix (ADDR_PREFIX_OPCODE))
6533 return 0;
6534 }
6535 else if (i.suffix != QWORD_MNEM_SUFFIX
6536 && !i.tm.opcode_modifier.ignoresize
6537 && !i.tm.opcode_modifier.floatmf
6538 && !is_any_vex_encoding (&i.tm)
6539 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6540 || (flag_code == CODE_64BIT
6541 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
6542 {
6543 unsigned int prefix = DATA_PREFIX_OPCODE;
6544
6545 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
6546 prefix = ADDR_PREFIX_OPCODE;
6547
6548 if (!add_prefix (prefix))
6549 return 0;
6550 }
6551
6552 /* Set mode64 for an operand. */
6553 if (i.suffix == QWORD_MNEM_SUFFIX
6554 && flag_code == CODE_64BIT
6555 && !i.tm.opcode_modifier.norex64
6556 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6557 need rex64. */
6558 && ! (i.operands == 2
6559 && i.tm.base_opcode == 0x90
6560 && i.tm.extension_opcode == None
6561 && i.types[0].bitfield.instance == Accum
6562 && i.types[0].bitfield.qword
6563 && i.types[1].bitfield.instance == Accum
6564 && i.types[1].bitfield.qword))
6565 i.rex |= REX_W;
6566
6567 break;
6568 }
6569
6570 if (i.reg_operands != 0
6571 && i.operands > 1
6572 && i.tm.opcode_modifier.addrprefixopreg
6573 && i.tm.operand_types[0].bitfield.instance != Accum)
6574 {
6575 /* Check invalid register operand when the address size override
6576 prefix changes the size of register operands. */
6577 unsigned int op;
6578 enum { need_word, need_dword, need_qword } need;
6579
6580 if (flag_code == CODE_32BIT)
6581 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6582 else
6583 {
6584 if (i.prefix[ADDR_PREFIX])
6585 need = need_dword;
6586 else
6587 need = flag_code == CODE_64BIT ? need_qword : need_word;
6588 }
6589
6590 for (op = 0; op < i.operands; op++)
6591 if (i.types[op].bitfield.class == Reg
6592 && ((need == need_word
6593 && !i.op[op].regs->reg_type.bitfield.word)
6594 || (need == need_dword
6595 && !i.op[op].regs->reg_type.bitfield.dword)
6596 || (need == need_qword
6597 && !i.op[op].regs->reg_type.bitfield.qword)))
6598 {
6599 as_bad (_("invalid register operand size for `%s'"),
6600 i.tm.name);
6601 return 0;
6602 }
6603 }
6604
6605 return 1;
6606 }
6607
6608 static int
6609 check_byte_reg (void)
6610 {
6611 int op;
6612
6613 for (op = i.operands; --op >= 0;)
6614 {
6615 /* Skip non-register operands. */
6616 if (i.types[op].bitfield.class != Reg)
6617 continue;
6618
6619 /* If this is an eight bit register, it's OK. If it's the 16 or
6620 32 bit version of an eight bit register, we will just use the
6621 low portion, and that's OK too. */
6622 if (i.types[op].bitfield.byte)
6623 continue;
6624
6625 /* I/O port address operands are OK too. */
6626 if (i.tm.operand_types[op].bitfield.instance == RegD
6627 && i.tm.operand_types[op].bitfield.word)
6628 continue;
6629
6630 /* crc32 doesn't generate this warning. */
6631 if (i.tm.base_opcode == 0xf20f38f0)
6632 continue;
6633
6634 if ((i.types[op].bitfield.word
6635 || i.types[op].bitfield.dword
6636 || i.types[op].bitfield.qword)
6637 && i.op[op].regs->reg_num < 4
6638 /* Prohibit these changes in 64bit mode, since the lowering
6639 would be more complicated. */
6640 && flag_code != CODE_64BIT)
6641 {
6642 #if REGISTER_WARNINGS
6643 if (!quiet_warnings)
6644 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6645 register_prefix,
6646 (i.op[op].regs + (i.types[op].bitfield.word
6647 ? REGNAM_AL - REGNAM_AX
6648 : REGNAM_AL - REGNAM_EAX))->reg_name,
6649 register_prefix,
6650 i.op[op].regs->reg_name,
6651 i.suffix);
6652 #endif
6653 continue;
6654 }
6655 /* Any other register is bad. */
6656 if (i.types[op].bitfield.class == Reg
6657 || i.types[op].bitfield.class == RegMMX
6658 || i.types[op].bitfield.class == RegSIMD
6659 || i.types[op].bitfield.class == SReg
6660 || i.types[op].bitfield.class == RegCR
6661 || i.types[op].bitfield.class == RegDR
6662 || i.types[op].bitfield.class == RegTR)
6663 {
6664 as_bad (_("`%s%s' not allowed with `%s%c'"),
6665 register_prefix,
6666 i.op[op].regs->reg_name,
6667 i.tm.name,
6668 i.suffix);
6669 return 0;
6670 }
6671 }
6672 return 1;
6673 }
6674
6675 static int
6676 check_long_reg (void)
6677 {
6678 int op;
6679
6680 for (op = i.operands; --op >= 0;)
6681 /* Skip non-register operands. */
6682 if (i.types[op].bitfield.class != Reg)
6683 continue;
6684 /* Reject eight bit registers, except where the template requires
6685 them. (eg. movzb) */
6686 else if (i.types[op].bitfield.byte
6687 && (i.tm.operand_types[op].bitfield.class == Reg
6688 || i.tm.operand_types[op].bitfield.instance == Accum)
6689 && (i.tm.operand_types[op].bitfield.word
6690 || i.tm.operand_types[op].bitfield.dword))
6691 {
6692 as_bad (_("`%s%s' not allowed with `%s%c'"),
6693 register_prefix,
6694 i.op[op].regs->reg_name,
6695 i.tm.name,
6696 i.suffix);
6697 return 0;
6698 }
6699 /* Warn if the e prefix on a general reg is missing. */
6700 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6701 && i.types[op].bitfield.word
6702 && (i.tm.operand_types[op].bitfield.class == Reg
6703 || i.tm.operand_types[op].bitfield.instance == Accum)
6704 && i.tm.operand_types[op].bitfield.dword)
6705 {
6706 /* Prohibit these changes in the 64bit mode, since the
6707 lowering is more complicated. */
6708 if (flag_code == CODE_64BIT)
6709 {
6710 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6711 register_prefix, i.op[op].regs->reg_name,
6712 i.suffix);
6713 return 0;
6714 }
6715 #if REGISTER_WARNINGS
6716 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6717 register_prefix,
6718 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6719 register_prefix, i.op[op].regs->reg_name, i.suffix);
6720 #endif
6721 }
6722 /* Warn if the r prefix on a general reg is present. */
6723 else if (i.types[op].bitfield.qword
6724 && (i.tm.operand_types[op].bitfield.class == Reg
6725 || i.tm.operand_types[op].bitfield.instance == Accum)
6726 && i.tm.operand_types[op].bitfield.dword)
6727 {
6728 if (intel_syntax
6729 && i.tm.opcode_modifier.toqword
6730 && i.types[0].bitfield.class != RegSIMD)
6731 {
6732 /* Convert to QWORD. We want REX byte. */
6733 i.suffix = QWORD_MNEM_SUFFIX;
6734 }
6735 else
6736 {
6737 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6738 register_prefix, i.op[op].regs->reg_name,
6739 i.suffix);
6740 return 0;
6741 }
6742 }
6743 return 1;
6744 }
6745
6746 static int
6747 check_qword_reg (void)
6748 {
6749 int op;
6750
6751 for (op = i.operands; --op >= 0; )
6752 /* Skip non-register operands. */
6753 if (i.types[op].bitfield.class != Reg)
6754 continue;
6755 /* Reject eight bit registers, except where the template requires
6756 them. (eg. movzb) */
6757 else if (i.types[op].bitfield.byte
6758 && (i.tm.operand_types[op].bitfield.class == Reg
6759 || i.tm.operand_types[op].bitfield.instance == Accum)
6760 && (i.tm.operand_types[op].bitfield.word
6761 || i.tm.operand_types[op].bitfield.dword))
6762 {
6763 as_bad (_("`%s%s' not allowed with `%s%c'"),
6764 register_prefix,
6765 i.op[op].regs->reg_name,
6766 i.tm.name,
6767 i.suffix);
6768 return 0;
6769 }
6770 /* Warn if the r prefix on a general reg is missing. */
6771 else if ((i.types[op].bitfield.word
6772 || i.types[op].bitfield.dword)
6773 && (i.tm.operand_types[op].bitfield.class == Reg
6774 || i.tm.operand_types[op].bitfield.instance == Accum)
6775 && i.tm.operand_types[op].bitfield.qword)
6776 {
6777 /* Prohibit these changes in the 64bit mode, since the
6778 lowering is more complicated. */
6779 if (intel_syntax
6780 && i.tm.opcode_modifier.todword
6781 && i.types[0].bitfield.class != RegSIMD)
6782 {
6783 /* Convert to DWORD. We don't want REX byte. */
6784 i.suffix = LONG_MNEM_SUFFIX;
6785 }
6786 else
6787 {
6788 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6789 register_prefix, i.op[op].regs->reg_name,
6790 i.suffix);
6791 return 0;
6792 }
6793 }
6794 return 1;
6795 }
6796
6797 static int
6798 check_word_reg (void)
6799 {
6800 int op;
6801 for (op = i.operands; --op >= 0;)
6802 /* Skip non-register operands. */
6803 if (i.types[op].bitfield.class != Reg)
6804 continue;
6805 /* Reject eight bit registers, except where the template requires
6806 them. (eg. movzb) */
6807 else if (i.types[op].bitfield.byte
6808 && (i.tm.operand_types[op].bitfield.class == Reg
6809 || i.tm.operand_types[op].bitfield.instance == Accum)
6810 && (i.tm.operand_types[op].bitfield.word
6811 || i.tm.operand_types[op].bitfield.dword))
6812 {
6813 as_bad (_("`%s%s' not allowed with `%s%c'"),
6814 register_prefix,
6815 i.op[op].regs->reg_name,
6816 i.tm.name,
6817 i.suffix);
6818 return 0;
6819 }
6820 /* Warn if the e or r prefix on a general reg is present. */
6821 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6822 && (i.types[op].bitfield.dword
6823 || i.types[op].bitfield.qword)
6824 && (i.tm.operand_types[op].bitfield.class == Reg
6825 || i.tm.operand_types[op].bitfield.instance == Accum)
6826 && i.tm.operand_types[op].bitfield.word)
6827 {
6828 /* Prohibit these changes in the 64bit mode, since the
6829 lowering is more complicated. */
6830 if (flag_code == CODE_64BIT)
6831 {
6832 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6833 register_prefix, i.op[op].regs->reg_name,
6834 i.suffix);
6835 return 0;
6836 }
6837 #if REGISTER_WARNINGS
6838 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6839 register_prefix,
6840 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6841 register_prefix, i.op[op].regs->reg_name, i.suffix);
6842 #endif
6843 }
6844 return 1;
6845 }
6846
6847 static int
6848 update_imm (unsigned int j)
6849 {
6850 i386_operand_type overlap = i.types[j];
6851 if ((overlap.bitfield.imm8
6852 || overlap.bitfield.imm8s
6853 || overlap.bitfield.imm16
6854 || overlap.bitfield.imm32
6855 || overlap.bitfield.imm32s
6856 || overlap.bitfield.imm64)
6857 && !operand_type_equal (&overlap, &imm8)
6858 && !operand_type_equal (&overlap, &imm8s)
6859 && !operand_type_equal (&overlap, &imm16)
6860 && !operand_type_equal (&overlap, &imm32)
6861 && !operand_type_equal (&overlap, &imm32s)
6862 && !operand_type_equal (&overlap, &imm64))
6863 {
6864 if (i.suffix)
6865 {
6866 i386_operand_type temp;
6867
6868 operand_type_set (&temp, 0);
6869 if (i.suffix == BYTE_MNEM_SUFFIX)
6870 {
6871 temp.bitfield.imm8 = overlap.bitfield.imm8;
6872 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6873 }
6874 else if (i.suffix == WORD_MNEM_SUFFIX)
6875 temp.bitfield.imm16 = overlap.bitfield.imm16;
6876 else if (i.suffix == QWORD_MNEM_SUFFIX)
6877 {
6878 temp.bitfield.imm64 = overlap.bitfield.imm64;
6879 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6880 }
6881 else
6882 temp.bitfield.imm32 = overlap.bitfield.imm32;
6883 overlap = temp;
6884 }
6885 else if (operand_type_equal (&overlap, &imm16_32_32s)
6886 || operand_type_equal (&overlap, &imm16_32)
6887 || operand_type_equal (&overlap, &imm16_32s))
6888 {
6889 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6890 overlap = imm16;
6891 else
6892 overlap = imm32s;
6893 }
6894 if (!operand_type_equal (&overlap, &imm8)
6895 && !operand_type_equal (&overlap, &imm8s)
6896 && !operand_type_equal (&overlap, &imm16)
6897 && !operand_type_equal (&overlap, &imm32)
6898 && !operand_type_equal (&overlap, &imm32s)
6899 && !operand_type_equal (&overlap, &imm64))
6900 {
6901 as_bad (_("no instruction mnemonic suffix given; "
6902 "can't determine immediate size"));
6903 return 0;
6904 }
6905 }
6906 i.types[j] = overlap;
6907
6908 return 1;
6909 }
6910
6911 static int
6912 finalize_imm (void)
6913 {
6914 unsigned int j, n;
6915
6916 /* Update the first 2 immediate operands. */
6917 n = i.operands > 2 ? 2 : i.operands;
6918 if (n)
6919 {
6920 for (j = 0; j < n; j++)
6921 if (update_imm (j) == 0)
6922 return 0;
6923
6924 /* The 3rd operand can't be immediate operand. */
6925 gas_assert (operand_type_check (i.types[2], imm) == 0);
6926 }
6927
6928 return 1;
6929 }
6930
6931 static int
6932 process_operands (void)
6933 {
6934 /* Default segment register this instruction will use for memory
6935 accesses. 0 means unknown. This is only for optimizing out
6936 unnecessary segment overrides. */
6937 const seg_entry *default_seg = 0;
6938
6939 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6940 {
6941 unsigned int dupl = i.operands;
6942 unsigned int dest = dupl - 1;
6943 unsigned int j;
6944
6945 /* The destination must be an xmm register. */
6946 gas_assert (i.reg_operands
6947 && MAX_OPERANDS > dupl
6948 && operand_type_equal (&i.types[dest], &regxmm));
6949
6950 if (i.tm.operand_types[0].bitfield.instance == Accum
6951 && i.tm.operand_types[0].bitfield.xmmword)
6952 {
6953 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6954 {
6955 /* Keep xmm0 for instructions with VEX prefix and 3
6956 sources. */
6957 i.tm.operand_types[0].bitfield.instance = InstanceNone;
6958 i.tm.operand_types[0].bitfield.class = RegSIMD;
6959 goto duplicate;
6960 }
6961 else
6962 {
6963 /* We remove the first xmm0 and keep the number of
6964 operands unchanged, which in fact duplicates the
6965 destination. */
6966 for (j = 1; j < i.operands; j++)
6967 {
6968 i.op[j - 1] = i.op[j];
6969 i.types[j - 1] = i.types[j];
6970 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6971 i.flags[j - 1] = i.flags[j];
6972 }
6973 }
6974 }
6975 else if (i.tm.opcode_modifier.implicit1stxmm0)
6976 {
6977 gas_assert ((MAX_OPERANDS - 1) > dupl
6978 && (i.tm.opcode_modifier.vexsources
6979 == VEX3SOURCES));
6980
6981 /* Add the implicit xmm0 for instructions with VEX prefix
6982 and 3 sources. */
6983 for (j = i.operands; j > 0; j--)
6984 {
6985 i.op[j] = i.op[j - 1];
6986 i.types[j] = i.types[j - 1];
6987 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6988 i.flags[j] = i.flags[j - 1];
6989 }
6990 i.op[0].regs
6991 = (const reg_entry *) hash_find (reg_hash, "xmm0");
6992 i.types[0] = regxmm;
6993 i.tm.operand_types[0] = regxmm;
6994
6995 i.operands += 2;
6996 i.reg_operands += 2;
6997 i.tm.operands += 2;
6998
6999 dupl++;
7000 dest++;
7001 i.op[dupl] = i.op[dest];
7002 i.types[dupl] = i.types[dest];
7003 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7004 i.flags[dupl] = i.flags[dest];
7005 }
7006 else
7007 {
7008 duplicate:
7009 i.operands++;
7010 i.reg_operands++;
7011 i.tm.operands++;
7012
7013 i.op[dupl] = i.op[dest];
7014 i.types[dupl] = i.types[dest];
7015 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7016 i.flags[dupl] = i.flags[dest];
7017 }
7018
7019 if (i.tm.opcode_modifier.immext)
7020 process_immext ();
7021 }
7022 else if (i.tm.operand_types[0].bitfield.instance == Accum
7023 && i.tm.operand_types[0].bitfield.xmmword)
7024 {
7025 unsigned int j;
7026
7027 for (j = 1; j < i.operands; j++)
7028 {
7029 i.op[j - 1] = i.op[j];
7030 i.types[j - 1] = i.types[j];
7031
7032 /* We need to adjust fields in i.tm since they are used by
7033 build_modrm_byte. */
7034 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7035
7036 i.flags[j - 1] = i.flags[j];
7037 }
7038
7039 i.operands--;
7040 i.reg_operands--;
7041 i.tm.operands--;
7042 }
7043 else if (i.tm.opcode_modifier.implicitquadgroup)
7044 {
7045 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7046
7047 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7048 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7049 regnum = register_number (i.op[1].regs);
7050 first_reg_in_group = regnum & ~3;
7051 last_reg_in_group = first_reg_in_group + 3;
7052 if (regnum != first_reg_in_group)
7053 as_warn (_("source register `%s%s' implicitly denotes"
7054 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7055 register_prefix, i.op[1].regs->reg_name,
7056 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7057 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7058 i.tm.name);
7059 }
7060 else if (i.tm.opcode_modifier.regkludge)
7061 {
7062 /* The imul $imm, %reg instruction is converted into
7063 imul $imm, %reg, %reg, and the clr %reg instruction
7064 is converted into xor %reg, %reg. */
7065
7066 unsigned int first_reg_op;
7067
7068 if (operand_type_check (i.types[0], reg))
7069 first_reg_op = 0;
7070 else
7071 first_reg_op = 1;
7072 /* Pretend we saw the extra register operand. */
7073 gas_assert (i.reg_operands == 1
7074 && i.op[first_reg_op + 1].regs == 0);
7075 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7076 i.types[first_reg_op + 1] = i.types[first_reg_op];
7077 i.operands++;
7078 i.reg_operands++;
7079 }
7080
7081 if (i.tm.opcode_modifier.modrm)
7082 {
7083 /* The opcode is completed (modulo i.tm.extension_opcode which
7084 must be put into the modrm byte). Now, we make the modrm and
7085 index base bytes based on all the info we've collected. */
7086
7087 default_seg = build_modrm_byte ();
7088 }
7089 else if (i.types[0].bitfield.class == SReg)
7090 {
7091 if (flag_code != CODE_64BIT
7092 ? i.tm.base_opcode == POP_SEG_SHORT
7093 && i.op[0].regs->reg_num == 1
7094 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7095 && i.op[0].regs->reg_num < 4)
7096 {
7097 as_bad (_("you can't `%s %s%s'"),
7098 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7099 return 0;
7100 }
7101 if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7102 {
7103 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7104 i.tm.opcode_length = 2;
7105 }
7106 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7107 }
7108 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7109 {
7110 default_seg = &ds;
7111 }
7112 else if (i.tm.opcode_modifier.isstring)
7113 {
7114 /* For the string instructions that allow a segment override
7115 on one of their operands, the default segment is ds. */
7116 default_seg = &ds;
7117 }
7118 else if (i.tm.opcode_modifier.shortform)
7119 {
7120 /* The register or float register operand is in operand
7121 0 or 1. */
7122 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7123
7124 /* Register goes in low 3 bits of opcode. */
7125 i.tm.base_opcode |= i.op[op].regs->reg_num;
7126 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7127 i.rex |= REX_B;
7128 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7129 {
7130 /* Warn about some common errors, but press on regardless.
7131 The first case can be generated by gcc (<= 2.8.1). */
7132 if (i.operands == 2)
7133 {
7134 /* Reversed arguments on faddp, fsubp, etc. */
7135 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7136 register_prefix, i.op[!intel_syntax].regs->reg_name,
7137 register_prefix, i.op[intel_syntax].regs->reg_name);
7138 }
7139 else
7140 {
7141 /* Extraneous `l' suffix on fp insn. */
7142 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7143 register_prefix, i.op[0].regs->reg_name);
7144 }
7145 }
7146 }
7147
7148 if (i.tm.base_opcode == 0x8d /* lea */
7149 && i.seg[0]
7150 && !quiet_warnings)
7151 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7152
7153 /* If a segment was explicitly specified, and the specified segment
7154 is not the default, use an opcode prefix to select it. If we
7155 never figured out what the default segment is, then default_seg
7156 will be zero at this point, and the specified segment prefix will
7157 always be used. */
7158 if ((i.seg[0]) && (i.seg[0] != default_seg))
7159 {
7160 if (!add_prefix (i.seg[0]->seg_prefix))
7161 return 0;
7162 }
7163 return 1;
7164 }
7165
7166 static const seg_entry *
7167 build_modrm_byte (void)
7168 {
7169 const seg_entry *default_seg = 0;
7170 unsigned int source, dest;
7171 int vex_3_sources;
7172
7173 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7174 if (vex_3_sources)
7175 {
7176 unsigned int nds, reg_slot;
7177 expressionS *exp;
7178
7179 dest = i.operands - 1;
7180 nds = dest - 1;
7181
7182 /* There are 2 kinds of instructions:
7183 1. 5 operands: 4 register operands or 3 register operands
7184 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7185 VexW0 or VexW1. The destination must be either XMM, YMM or
7186 ZMM register.
7187 2. 4 operands: 4 register operands or 3 register operands
7188 plus 1 memory operand, with VexXDS. */
7189 gas_assert ((i.reg_operands == 4
7190 || (i.reg_operands == 3 && i.mem_operands == 1))
7191 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7192 && i.tm.opcode_modifier.vexw
7193 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7194
7195 /* If VexW1 is set, the first non-immediate operand is the source and
7196 the second non-immediate one is encoded in the immediate operand. */
7197 if (i.tm.opcode_modifier.vexw == VEXW1)
7198 {
7199 source = i.imm_operands;
7200 reg_slot = i.imm_operands + 1;
7201 }
7202 else
7203 {
7204 source = i.imm_operands + 1;
7205 reg_slot = i.imm_operands;
7206 }
7207
7208 if (i.imm_operands == 0)
7209 {
7210 /* When there is no immediate operand, generate an 8bit
7211 immediate operand to encode the first operand. */
7212 exp = &im_expressions[i.imm_operands++];
7213 i.op[i.operands].imms = exp;
7214 i.types[i.operands] = imm8;
7215 i.operands++;
7216
7217 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7218 exp->X_op = O_constant;
7219 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7220 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7221 }
7222 else
7223 {
7224 gas_assert (i.imm_operands == 1);
7225 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7226 gas_assert (!i.tm.opcode_modifier.immext);
7227
7228 /* Turn on Imm8 again so that output_imm will generate it. */
7229 i.types[0].bitfield.imm8 = 1;
7230
7231 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7232 i.op[0].imms->X_add_number
7233 |= register_number (i.op[reg_slot].regs) << 4;
7234 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7235 }
7236
7237 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7238 i.vex.register_specifier = i.op[nds].regs;
7239 }
7240 else
7241 source = dest = 0;
7242
7243 /* i.reg_operands MUST be the number of real register operands;
7244 implicit registers do not count. If there are 3 register
7245 operands, it must be a instruction with VexNDS. For a
7246 instruction with VexNDD, the destination register is encoded
7247 in VEX prefix. If there are 4 register operands, it must be
7248 a instruction with VEX prefix and 3 sources. */
7249 if (i.mem_operands == 0
7250 && ((i.reg_operands == 2
7251 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7252 || (i.reg_operands == 3
7253 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7254 || (i.reg_operands == 4 && vex_3_sources)))
7255 {
7256 switch (i.operands)
7257 {
7258 case 2:
7259 source = 0;
7260 break;
7261 case 3:
7262 /* When there are 3 operands, one of them may be immediate,
7263 which may be the first or the last operand. Otherwise,
7264 the first operand must be shift count register (cl) or it
7265 is an instruction with VexNDS. */
7266 gas_assert (i.imm_operands == 1
7267 || (i.imm_operands == 0
7268 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7269 || (i.types[0].bitfield.instance == RegC
7270 && i.types[0].bitfield.byte))));
7271 if (operand_type_check (i.types[0], imm)
7272 || (i.types[0].bitfield.instance == RegC
7273 && i.types[0].bitfield.byte))
7274 source = 1;
7275 else
7276 source = 0;
7277 break;
7278 case 4:
7279 /* When there are 4 operands, the first two must be 8bit
7280 immediate operands. The source operand will be the 3rd
7281 one.
7282
7283 For instructions with VexNDS, if the first operand
7284 an imm8, the source operand is the 2nd one. If the last
7285 operand is imm8, the source operand is the first one. */
7286 gas_assert ((i.imm_operands == 2
7287 && i.types[0].bitfield.imm8
7288 && i.types[1].bitfield.imm8)
7289 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7290 && i.imm_operands == 1
7291 && (i.types[0].bitfield.imm8
7292 || i.types[i.operands - 1].bitfield.imm8
7293 || i.rounding)));
7294 if (i.imm_operands == 2)
7295 source = 2;
7296 else
7297 {
7298 if (i.types[0].bitfield.imm8)
7299 source = 1;
7300 else
7301 source = 0;
7302 }
7303 break;
7304 case 5:
7305 if (is_evex_encoding (&i.tm))
7306 {
7307 /* For EVEX instructions, when there are 5 operands, the
7308 first one must be immediate operand. If the second one
7309 is immediate operand, the source operand is the 3th
7310 one. If the last one is immediate operand, the source
7311 operand is the 2nd one. */
7312 gas_assert (i.imm_operands == 2
7313 && i.tm.opcode_modifier.sae
7314 && operand_type_check (i.types[0], imm));
7315 if (operand_type_check (i.types[1], imm))
7316 source = 2;
7317 else if (operand_type_check (i.types[4], imm))
7318 source = 1;
7319 else
7320 abort ();
7321 }
7322 break;
7323 default:
7324 abort ();
7325 }
7326
7327 if (!vex_3_sources)
7328 {
7329 dest = source + 1;
7330
7331 /* RC/SAE operand could be between DEST and SRC. That happens
7332 when one operand is GPR and the other one is XMM/YMM/ZMM
7333 register. */
7334 if (i.rounding && i.rounding->operand == (int) dest)
7335 dest++;
7336
7337 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7338 {
7339 /* For instructions with VexNDS, the register-only source
7340 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7341 register. It is encoded in VEX prefix. */
7342
7343 i386_operand_type op;
7344 unsigned int vvvv;
7345
7346 /* Check register-only source operand when two source
7347 operands are swapped. */
7348 if (!i.tm.operand_types[source].bitfield.baseindex
7349 && i.tm.operand_types[dest].bitfield.baseindex)
7350 {
7351 vvvv = source;
7352 source = dest;
7353 }
7354 else
7355 vvvv = dest;
7356
7357 op = i.tm.operand_types[vvvv];
7358 if ((dest + 1) >= i.operands
7359 || ((op.bitfield.class != Reg
7360 || (!op.bitfield.dword && !op.bitfield.qword))
7361 && op.bitfield.class != RegSIMD
7362 && !operand_type_equal (&op, &regmask)))
7363 abort ();
7364 i.vex.register_specifier = i.op[vvvv].regs;
7365 dest++;
7366 }
7367 }
7368
7369 i.rm.mode = 3;
7370 /* One of the register operands will be encoded in the i.rm.reg
7371 field, the other in the combined i.rm.mode and i.rm.regmem
7372 fields. If no form of this instruction supports a memory
7373 destination operand, then we assume the source operand may
7374 sometimes be a memory operand and so we need to store the
7375 destination in the i.rm.reg field. */
7376 if (!i.tm.opcode_modifier.regmem
7377 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7378 {
7379 i.rm.reg = i.op[dest].regs->reg_num;
7380 i.rm.regmem = i.op[source].regs->reg_num;
7381 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7382 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7383 i.has_regmmx = TRUE;
7384 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7385 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7386 {
7387 if (i.types[dest].bitfield.zmmword
7388 || i.types[source].bitfield.zmmword)
7389 i.has_regzmm = TRUE;
7390 else if (i.types[dest].bitfield.ymmword
7391 || i.types[source].bitfield.ymmword)
7392 i.has_regymm = TRUE;
7393 else
7394 i.has_regxmm = TRUE;
7395 }
7396 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7397 i.rex |= REX_R;
7398 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7399 i.vrex |= REX_R;
7400 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7401 i.rex |= REX_B;
7402 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7403 i.vrex |= REX_B;
7404 }
7405 else
7406 {
7407 i.rm.reg = i.op[source].regs->reg_num;
7408 i.rm.regmem = i.op[dest].regs->reg_num;
7409 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7410 i.rex |= REX_B;
7411 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7412 i.vrex |= REX_B;
7413 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7414 i.rex |= REX_R;
7415 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7416 i.vrex |= REX_R;
7417 }
7418 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7419 {
7420 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7421 abort ();
7422 i.rex &= ~REX_R;
7423 add_prefix (LOCK_PREFIX_OPCODE);
7424 }
7425 }
7426 else
7427 { /* If it's not 2 reg operands... */
7428 unsigned int mem;
7429
7430 if (i.mem_operands)
7431 {
7432 unsigned int fake_zero_displacement = 0;
7433 unsigned int op;
7434
7435 for (op = 0; op < i.operands; op++)
7436 if (i.flags[op] & Operand_Mem)
7437 break;
7438 gas_assert (op < i.operands);
7439
7440 if (i.tm.opcode_modifier.vecsib)
7441 {
7442 if (i.index_reg->reg_num == RegIZ)
7443 abort ();
7444
7445 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7446 if (!i.base_reg)
7447 {
7448 i.sib.base = NO_BASE_REGISTER;
7449 i.sib.scale = i.log2_scale_factor;
7450 i.types[op].bitfield.disp8 = 0;
7451 i.types[op].bitfield.disp16 = 0;
7452 i.types[op].bitfield.disp64 = 0;
7453 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7454 {
7455 /* Must be 32 bit */
7456 i.types[op].bitfield.disp32 = 1;
7457 i.types[op].bitfield.disp32s = 0;
7458 }
7459 else
7460 {
7461 i.types[op].bitfield.disp32 = 0;
7462 i.types[op].bitfield.disp32s = 1;
7463 }
7464 }
7465 i.sib.index = i.index_reg->reg_num;
7466 if ((i.index_reg->reg_flags & RegRex) != 0)
7467 i.rex |= REX_X;
7468 if ((i.index_reg->reg_flags & RegVRex) != 0)
7469 i.vrex |= REX_X;
7470 }
7471
7472 default_seg = &ds;
7473
7474 if (i.base_reg == 0)
7475 {
7476 i.rm.mode = 0;
7477 if (!i.disp_operands)
7478 fake_zero_displacement = 1;
7479 if (i.index_reg == 0)
7480 {
7481 i386_operand_type newdisp;
7482
7483 gas_assert (!i.tm.opcode_modifier.vecsib);
7484 /* Operand is just <disp> */
7485 if (flag_code == CODE_64BIT)
7486 {
7487 /* 64bit mode overwrites the 32bit absolute
7488 addressing by RIP relative addressing and
7489 absolute addressing is encoded by one of the
7490 redundant SIB forms. */
7491 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7492 i.sib.base = NO_BASE_REGISTER;
7493 i.sib.index = NO_INDEX_REGISTER;
7494 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7495 }
7496 else if ((flag_code == CODE_16BIT)
7497 ^ (i.prefix[ADDR_PREFIX] != 0))
7498 {
7499 i.rm.regmem = NO_BASE_REGISTER_16;
7500 newdisp = disp16;
7501 }
7502 else
7503 {
7504 i.rm.regmem = NO_BASE_REGISTER;
7505 newdisp = disp32;
7506 }
7507 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7508 i.types[op] = operand_type_or (i.types[op], newdisp);
7509 }
7510 else if (!i.tm.opcode_modifier.vecsib)
7511 {
7512 /* !i.base_reg && i.index_reg */
7513 if (i.index_reg->reg_num == RegIZ)
7514 i.sib.index = NO_INDEX_REGISTER;
7515 else
7516 i.sib.index = i.index_reg->reg_num;
7517 i.sib.base = NO_BASE_REGISTER;
7518 i.sib.scale = i.log2_scale_factor;
7519 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7520 i.types[op].bitfield.disp8 = 0;
7521 i.types[op].bitfield.disp16 = 0;
7522 i.types[op].bitfield.disp64 = 0;
7523 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7524 {
7525 /* Must be 32 bit */
7526 i.types[op].bitfield.disp32 = 1;
7527 i.types[op].bitfield.disp32s = 0;
7528 }
7529 else
7530 {
7531 i.types[op].bitfield.disp32 = 0;
7532 i.types[op].bitfield.disp32s = 1;
7533 }
7534 if ((i.index_reg->reg_flags & RegRex) != 0)
7535 i.rex |= REX_X;
7536 }
7537 }
7538 /* RIP addressing for 64bit mode. */
7539 else if (i.base_reg->reg_num == RegIP)
7540 {
7541 gas_assert (!i.tm.opcode_modifier.vecsib);
7542 i.rm.regmem = NO_BASE_REGISTER;
7543 i.types[op].bitfield.disp8 = 0;
7544 i.types[op].bitfield.disp16 = 0;
7545 i.types[op].bitfield.disp32 = 0;
7546 i.types[op].bitfield.disp32s = 1;
7547 i.types[op].bitfield.disp64 = 0;
7548 i.flags[op] |= Operand_PCrel;
7549 if (! i.disp_operands)
7550 fake_zero_displacement = 1;
7551 }
7552 else if (i.base_reg->reg_type.bitfield.word)
7553 {
7554 gas_assert (!i.tm.opcode_modifier.vecsib);
7555 switch (i.base_reg->reg_num)
7556 {
7557 case 3: /* (%bx) */
7558 if (i.index_reg == 0)
7559 i.rm.regmem = 7;
7560 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7561 i.rm.regmem = i.index_reg->reg_num - 6;
7562 break;
7563 case 5: /* (%bp) */
7564 default_seg = &ss;
7565 if (i.index_reg == 0)
7566 {
7567 i.rm.regmem = 6;
7568 if (operand_type_check (i.types[op], disp) == 0)
7569 {
7570 /* fake (%bp) into 0(%bp) */
7571 i.types[op].bitfield.disp8 = 1;
7572 fake_zero_displacement = 1;
7573 }
7574 }
7575 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7576 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7577 break;
7578 default: /* (%si) -> 4 or (%di) -> 5 */
7579 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7580 }
7581 i.rm.mode = mode_from_disp_size (i.types[op]);
7582 }
7583 else /* i.base_reg and 32/64 bit mode */
7584 {
7585 if (flag_code == CODE_64BIT
7586 && operand_type_check (i.types[op], disp))
7587 {
7588 i.types[op].bitfield.disp16 = 0;
7589 i.types[op].bitfield.disp64 = 0;
7590 if (i.prefix[ADDR_PREFIX] == 0)
7591 {
7592 i.types[op].bitfield.disp32 = 0;
7593 i.types[op].bitfield.disp32s = 1;
7594 }
7595 else
7596 {
7597 i.types[op].bitfield.disp32 = 1;
7598 i.types[op].bitfield.disp32s = 0;
7599 }
7600 }
7601
7602 if (!i.tm.opcode_modifier.vecsib)
7603 i.rm.regmem = i.base_reg->reg_num;
7604 if ((i.base_reg->reg_flags & RegRex) != 0)
7605 i.rex |= REX_B;
7606 i.sib.base = i.base_reg->reg_num;
7607 /* x86-64 ignores REX prefix bit here to avoid decoder
7608 complications. */
7609 if (!(i.base_reg->reg_flags & RegRex)
7610 && (i.base_reg->reg_num == EBP_REG_NUM
7611 || i.base_reg->reg_num == ESP_REG_NUM))
7612 default_seg = &ss;
7613 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7614 {
7615 fake_zero_displacement = 1;
7616 i.types[op].bitfield.disp8 = 1;
7617 }
7618 i.sib.scale = i.log2_scale_factor;
7619 if (i.index_reg == 0)
7620 {
7621 gas_assert (!i.tm.opcode_modifier.vecsib);
7622 /* <disp>(%esp) becomes two byte modrm with no index
7623 register. We've already stored the code for esp
7624 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7625 Any base register besides %esp will not use the
7626 extra modrm byte. */
7627 i.sib.index = NO_INDEX_REGISTER;
7628 }
7629 else if (!i.tm.opcode_modifier.vecsib)
7630 {
7631 if (i.index_reg->reg_num == RegIZ)
7632 i.sib.index = NO_INDEX_REGISTER;
7633 else
7634 i.sib.index = i.index_reg->reg_num;
7635 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7636 if ((i.index_reg->reg_flags & RegRex) != 0)
7637 i.rex |= REX_X;
7638 }
7639
7640 if (i.disp_operands
7641 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7642 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7643 i.rm.mode = 0;
7644 else
7645 {
7646 if (!fake_zero_displacement
7647 && !i.disp_operands
7648 && i.disp_encoding)
7649 {
7650 fake_zero_displacement = 1;
7651 if (i.disp_encoding == disp_encoding_8bit)
7652 i.types[op].bitfield.disp8 = 1;
7653 else
7654 i.types[op].bitfield.disp32 = 1;
7655 }
7656 i.rm.mode = mode_from_disp_size (i.types[op]);
7657 }
7658 }
7659
7660 if (fake_zero_displacement)
7661 {
7662 /* Fakes a zero displacement assuming that i.types[op]
7663 holds the correct displacement size. */
7664 expressionS *exp;
7665
7666 gas_assert (i.op[op].disps == 0);
7667 exp = &disp_expressions[i.disp_operands++];
7668 i.op[op].disps = exp;
7669 exp->X_op = O_constant;
7670 exp->X_add_number = 0;
7671 exp->X_add_symbol = (symbolS *) 0;
7672 exp->X_op_symbol = (symbolS *) 0;
7673 }
7674
7675 mem = op;
7676 }
7677 else
7678 mem = ~0;
7679
7680 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7681 {
7682 if (operand_type_check (i.types[0], imm))
7683 i.vex.register_specifier = NULL;
7684 else
7685 {
7686 /* VEX.vvvv encodes one of the sources when the first
7687 operand is not an immediate. */
7688 if (i.tm.opcode_modifier.vexw == VEXW0)
7689 i.vex.register_specifier = i.op[0].regs;
7690 else
7691 i.vex.register_specifier = i.op[1].regs;
7692 }
7693
7694 /* Destination is a XMM register encoded in the ModRM.reg
7695 and VEX.R bit. */
7696 i.rm.reg = i.op[2].regs->reg_num;
7697 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7698 i.rex |= REX_R;
7699
7700 /* ModRM.rm and VEX.B encodes the other source. */
7701 if (!i.mem_operands)
7702 {
7703 i.rm.mode = 3;
7704
7705 if (i.tm.opcode_modifier.vexw == VEXW0)
7706 i.rm.regmem = i.op[1].regs->reg_num;
7707 else
7708 i.rm.regmem = i.op[0].regs->reg_num;
7709
7710 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7711 i.rex |= REX_B;
7712 }
7713 }
7714 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7715 {
7716 i.vex.register_specifier = i.op[2].regs;
7717 if (!i.mem_operands)
7718 {
7719 i.rm.mode = 3;
7720 i.rm.regmem = i.op[1].regs->reg_num;
7721 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7722 i.rex |= REX_B;
7723 }
7724 }
7725 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7726 (if any) based on i.tm.extension_opcode. Again, we must be
7727 careful to make sure that segment/control/debug/test/MMX
7728 registers are coded into the i.rm.reg field. */
7729 else if (i.reg_operands)
7730 {
7731 unsigned int op;
7732 unsigned int vex_reg = ~0;
7733
7734 for (op = 0; op < i.operands; op++)
7735 {
7736 if (i.types[op].bitfield.class == Reg
7737 || i.types[op].bitfield.class == RegBND
7738 || i.types[op].bitfield.class == RegMask
7739 || i.types[op].bitfield.class == SReg
7740 || i.types[op].bitfield.class == RegCR
7741 || i.types[op].bitfield.class == RegDR
7742 || i.types[op].bitfield.class == RegTR)
7743 break;
7744 if (i.types[op].bitfield.class == RegSIMD)
7745 {
7746 if (i.types[op].bitfield.zmmword)
7747 i.has_regzmm = TRUE;
7748 else if (i.types[op].bitfield.ymmword)
7749 i.has_regymm = TRUE;
7750 else
7751 i.has_regxmm = TRUE;
7752 break;
7753 }
7754 if (i.types[op].bitfield.class == RegMMX)
7755 {
7756 i.has_regmmx = TRUE;
7757 break;
7758 }
7759 }
7760
7761 if (vex_3_sources)
7762 op = dest;
7763 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7764 {
7765 /* For instructions with VexNDS, the register-only
7766 source operand is encoded in VEX prefix. */
7767 gas_assert (mem != (unsigned int) ~0);
7768
7769 if (op > mem)
7770 {
7771 vex_reg = op++;
7772 gas_assert (op < i.operands);
7773 }
7774 else
7775 {
7776 /* Check register-only source operand when two source
7777 operands are swapped. */
7778 if (!i.tm.operand_types[op].bitfield.baseindex
7779 && i.tm.operand_types[op + 1].bitfield.baseindex)
7780 {
7781 vex_reg = op;
7782 op += 2;
7783 gas_assert (mem == (vex_reg + 1)
7784 && op < i.operands);
7785 }
7786 else
7787 {
7788 vex_reg = op + 1;
7789 gas_assert (vex_reg < i.operands);
7790 }
7791 }
7792 }
7793 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7794 {
7795 /* For instructions with VexNDD, the register destination
7796 is encoded in VEX prefix. */
7797 if (i.mem_operands == 0)
7798 {
7799 /* There is no memory operand. */
7800 gas_assert ((op + 2) == i.operands);
7801 vex_reg = op + 1;
7802 }
7803 else
7804 {
7805 /* There are only 2 non-immediate operands. */
7806 gas_assert (op < i.imm_operands + 2
7807 && i.operands == i.imm_operands + 2);
7808 vex_reg = i.imm_operands + 1;
7809 }
7810 }
7811 else
7812 gas_assert (op < i.operands);
7813
7814 if (vex_reg != (unsigned int) ~0)
7815 {
7816 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7817
7818 if ((type->bitfield.class != Reg
7819 || (!type->bitfield.dword && !type->bitfield.qword))
7820 && type->bitfield.class != RegSIMD
7821 && !operand_type_equal (type, &regmask))
7822 abort ();
7823
7824 i.vex.register_specifier = i.op[vex_reg].regs;
7825 }
7826
7827 /* Don't set OP operand twice. */
7828 if (vex_reg != op)
7829 {
7830 /* If there is an extension opcode to put here, the
7831 register number must be put into the regmem field. */
7832 if (i.tm.extension_opcode != None)
7833 {
7834 i.rm.regmem = i.op[op].regs->reg_num;
7835 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7836 i.rex |= REX_B;
7837 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7838 i.vrex |= REX_B;
7839 }
7840 else
7841 {
7842 i.rm.reg = i.op[op].regs->reg_num;
7843 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7844 i.rex |= REX_R;
7845 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7846 i.vrex |= REX_R;
7847 }
7848 }
7849
7850 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7851 must set it to 3 to indicate this is a register operand
7852 in the regmem field. */
7853 if (!i.mem_operands)
7854 i.rm.mode = 3;
7855 }
7856
7857 /* Fill in i.rm.reg field with extension opcode (if any). */
7858 if (i.tm.extension_opcode != None)
7859 i.rm.reg = i.tm.extension_opcode;
7860 }
7861 return default_seg;
7862 }
7863
7864 static void
7865 output_branch (void)
7866 {
7867 char *p;
7868 int size;
7869 int code16;
7870 int prefix;
7871 relax_substateT subtype;
7872 symbolS *sym;
7873 offsetT off;
7874
7875 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7876 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7877
7878 prefix = 0;
7879 if (i.prefix[DATA_PREFIX] != 0)
7880 {
7881 prefix = 1;
7882 i.prefixes -= 1;
7883 code16 ^= CODE16;
7884 }
7885 /* Pentium4 branch hints. */
7886 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7887 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7888 {
7889 prefix++;
7890 i.prefixes--;
7891 }
7892 if (i.prefix[REX_PREFIX] != 0)
7893 {
7894 prefix++;
7895 i.prefixes--;
7896 }
7897
7898 /* BND prefixed jump. */
7899 if (i.prefix[BND_PREFIX] != 0)
7900 {
7901 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7902 i.prefixes -= 1;
7903 }
7904
7905 if (i.prefixes != 0 && !intel_syntax)
7906 as_warn (_("skipping prefixes on this instruction"));
7907
7908 /* It's always a symbol; End frag & setup for relax.
7909 Make sure there is enough room in this frag for the largest
7910 instruction we may generate in md_convert_frag. This is 2
7911 bytes for the opcode and room for the prefix and largest
7912 displacement. */
7913 frag_grow (prefix + 2 + 4);
7914 /* Prefix and 1 opcode byte go in fr_fix. */
7915 p = frag_more (prefix + 1);
7916 if (i.prefix[DATA_PREFIX] != 0)
7917 *p++ = DATA_PREFIX_OPCODE;
7918 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7919 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7920 *p++ = i.prefix[SEG_PREFIX];
7921 if (i.prefix[REX_PREFIX] != 0)
7922 *p++ = i.prefix[REX_PREFIX];
7923 *p = i.tm.base_opcode;
7924
7925 if ((unsigned char) *p == JUMP_PC_RELATIVE)
7926 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7927 else if (cpu_arch_flags.bitfield.cpui386)
7928 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7929 else
7930 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7931 subtype |= code16;
7932
7933 sym = i.op[0].disps->X_add_symbol;
7934 off = i.op[0].disps->X_add_number;
7935
7936 if (i.op[0].disps->X_op != O_constant
7937 && i.op[0].disps->X_op != O_symbol)
7938 {
7939 /* Handle complex expressions. */
7940 sym = make_expr_symbol (i.op[0].disps);
7941 off = 0;
7942 }
7943
7944 /* 1 possible extra opcode + 4 byte displacement go in var part.
7945 Pass reloc in fr_var. */
7946 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7947 }
7948
7949 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7950 /* Return TRUE iff PLT32 relocation should be used for branching to
7951 symbol S. */
7952
7953 static bfd_boolean
7954 need_plt32_p (symbolS *s)
7955 {
7956 /* PLT32 relocation is ELF only. */
7957 if (!IS_ELF)
7958 return FALSE;
7959
7960 #ifdef TE_SOLARIS
7961 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
7962 krtld support it. */
7963 return FALSE;
7964 #endif
7965
7966 /* Since there is no need to prepare for PLT branch on x86-64, we
7967 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7968 be used as a marker for 32-bit PC-relative branches. */
7969 if (!object_64bit)
7970 return FALSE;
7971
7972 /* Weak or undefined symbol need PLT32 relocation. */
7973 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7974 return TRUE;
7975
7976 /* Non-global symbol doesn't need PLT32 relocation. */
7977 if (! S_IS_EXTERNAL (s))
7978 return FALSE;
7979
7980 /* Other global symbols need PLT32 relocation. NB: Symbol with
7981 non-default visibilities are treated as normal global symbol
7982 so that PLT32 relocation can be used as a marker for 32-bit
7983 PC-relative branches. It is useful for linker relaxation. */
7984 return TRUE;
7985 }
7986 #endif
7987
7988 static void
7989 output_jump (void)
7990 {
7991 char *p;
7992 int size;
7993 fixS *fixP;
7994 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
7995
7996 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
7997 {
7998 /* This is a loop or jecxz type instruction. */
7999 size = 1;
8000 if (i.prefix[ADDR_PREFIX] != 0)
8001 {
8002 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8003 i.prefixes -= 1;
8004 }
8005 /* Pentium4 branch hints. */
8006 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8007 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8008 {
8009 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8010 i.prefixes--;
8011 }
8012 }
8013 else
8014 {
8015 int code16;
8016
8017 code16 = 0;
8018 if (flag_code == CODE_16BIT)
8019 code16 = CODE16;
8020
8021 if (i.prefix[DATA_PREFIX] != 0)
8022 {
8023 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8024 i.prefixes -= 1;
8025 code16 ^= CODE16;
8026 }
8027
8028 size = 4;
8029 if (code16)
8030 size = 2;
8031 }
8032
8033 if (i.prefix[REX_PREFIX] != 0)
8034 {
8035 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8036 i.prefixes -= 1;
8037 }
8038
8039 /* BND prefixed jump. */
8040 if (i.prefix[BND_PREFIX] != 0)
8041 {
8042 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8043 i.prefixes -= 1;
8044 }
8045
8046 if (i.prefixes != 0 && !intel_syntax)
8047 as_warn (_("skipping prefixes on this instruction"));
8048
8049 p = frag_more (i.tm.opcode_length + size);
8050 switch (i.tm.opcode_length)
8051 {
8052 case 2:
8053 *p++ = i.tm.base_opcode >> 8;
8054 /* Fall through. */
8055 case 1:
8056 *p++ = i.tm.base_opcode;
8057 break;
8058 default:
8059 abort ();
8060 }
8061
8062 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8063 if (size == 4
8064 && jump_reloc == NO_RELOC
8065 && need_plt32_p (i.op[0].disps->X_add_symbol))
8066 jump_reloc = BFD_RELOC_X86_64_PLT32;
8067 #endif
8068
8069 jump_reloc = reloc (size, 1, 1, jump_reloc);
8070
8071 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8072 i.op[0].disps, 1, jump_reloc);
8073
8074 /* All jumps handled here are signed, but don't use a signed limit
8075 check for 32 and 16 bit jumps as we want to allow wrap around at
8076 4G and 64k respectively. */
8077 if (size == 1)
8078 fixP->fx_signed = 1;
8079 }
8080
8081 static void
8082 output_interseg_jump (void)
8083 {
8084 char *p;
8085 int size;
8086 int prefix;
8087 int code16;
8088
8089 code16 = 0;
8090 if (flag_code == CODE_16BIT)
8091 code16 = CODE16;
8092
8093 prefix = 0;
8094 if (i.prefix[DATA_PREFIX] != 0)
8095 {
8096 prefix = 1;
8097 i.prefixes -= 1;
8098 code16 ^= CODE16;
8099 }
8100 if (i.prefix[REX_PREFIX] != 0)
8101 {
8102 prefix++;
8103 i.prefixes -= 1;
8104 }
8105
8106 size = 4;
8107 if (code16)
8108 size = 2;
8109
8110 if (i.prefixes != 0 && !intel_syntax)
8111 as_warn (_("skipping prefixes on this instruction"));
8112
8113 /* 1 opcode; 2 segment; offset */
8114 p = frag_more (prefix + 1 + 2 + size);
8115
8116 if (i.prefix[DATA_PREFIX] != 0)
8117 *p++ = DATA_PREFIX_OPCODE;
8118
8119 if (i.prefix[REX_PREFIX] != 0)
8120 *p++ = i.prefix[REX_PREFIX];
8121
8122 *p++ = i.tm.base_opcode;
8123 if (i.op[1].imms->X_op == O_constant)
8124 {
8125 offsetT n = i.op[1].imms->X_add_number;
8126
8127 if (size == 2
8128 && !fits_in_unsigned_word (n)
8129 && !fits_in_signed_word (n))
8130 {
8131 as_bad (_("16-bit jump out of range"));
8132 return;
8133 }
8134 md_number_to_chars (p, n, size);
8135 }
8136 else
8137 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8138 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8139 if (i.op[0].imms->X_op != O_constant)
8140 as_bad (_("can't handle non absolute segment in `%s'"),
8141 i.tm.name);
8142 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8143 }
8144
8145 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8146 void
8147 x86_cleanup (void)
8148 {
8149 char *p;
8150 asection *seg = now_seg;
8151 subsegT subseg = now_subseg;
8152 asection *sec;
8153 unsigned int alignment, align_size_1;
8154 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8155 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8156 unsigned int padding;
8157
8158 if (!IS_ELF || !x86_used_note)
8159 return;
8160
8161 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8162
8163 /* The .note.gnu.property section layout:
8164
8165 Field Length Contents
8166 ---- ---- ----
8167 n_namsz 4 4
8168 n_descsz 4 The note descriptor size
8169 n_type 4 NT_GNU_PROPERTY_TYPE_0
8170 n_name 4 "GNU"
8171 n_desc n_descsz The program property array
8172 .... .... ....
8173 */
8174
8175 /* Create the .note.gnu.property section. */
8176 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8177 bfd_set_section_flags (sec,
8178 (SEC_ALLOC
8179 | SEC_LOAD
8180 | SEC_DATA
8181 | SEC_HAS_CONTENTS
8182 | SEC_READONLY));
8183
8184 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8185 {
8186 align_size_1 = 7;
8187 alignment = 3;
8188 }
8189 else
8190 {
8191 align_size_1 = 3;
8192 alignment = 2;
8193 }
8194
8195 bfd_set_section_alignment (sec, alignment);
8196 elf_section_type (sec) = SHT_NOTE;
8197
8198 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8199 + 4-byte data */
8200 isa_1_descsz_raw = 4 + 4 + 4;
8201 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8202 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8203
8204 feature_2_descsz_raw = isa_1_descsz;
8205 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8206 + 4-byte data */
8207 feature_2_descsz_raw += 4 + 4 + 4;
8208 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8209 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8210 & ~align_size_1);
8211
8212 descsz = feature_2_descsz;
8213 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8214 p = frag_more (4 + 4 + 4 + 4 + descsz);
8215
8216 /* Write n_namsz. */
8217 md_number_to_chars (p, (valueT) 4, 4);
8218
8219 /* Write n_descsz. */
8220 md_number_to_chars (p + 4, (valueT) descsz, 4);
8221
8222 /* Write n_type. */
8223 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8224
8225 /* Write n_name. */
8226 memcpy (p + 4 * 3, "GNU", 4);
8227
8228 /* Write 4-byte type. */
8229 md_number_to_chars (p + 4 * 4,
8230 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8231
8232 /* Write 4-byte data size. */
8233 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8234
8235 /* Write 4-byte data. */
8236 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8237
8238 /* Zero out paddings. */
8239 padding = isa_1_descsz - isa_1_descsz_raw;
8240 if (padding)
8241 memset (p + 4 * 7, 0, padding);
8242
8243 /* Write 4-byte type. */
8244 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8245 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8246
8247 /* Write 4-byte data size. */
8248 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8249
8250 /* Write 4-byte data. */
8251 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8252 (valueT) x86_feature_2_used, 4);
8253
8254 /* Zero out paddings. */
8255 padding = feature_2_descsz - feature_2_descsz_raw;
8256 if (padding)
8257 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8258
8259 /* We probably can't restore the current segment, for there likely
8260 isn't one yet... */
8261 if (seg && subseg)
8262 subseg_set (seg, subseg);
8263 }
8264 #endif
8265
8266 static unsigned int
8267 encoding_length (const fragS *start_frag, offsetT start_off,
8268 const char *frag_now_ptr)
8269 {
8270 unsigned int len = 0;
8271
8272 if (start_frag != frag_now)
8273 {
8274 const fragS *fr = start_frag;
8275
8276 do {
8277 len += fr->fr_fix;
8278 fr = fr->fr_next;
8279 } while (fr && fr != frag_now);
8280 }
8281
8282 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8283 }
8284
8285 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8286 be macro-fused with conditional jumps. */
8287
8288 static int
8289 maybe_fused_with_jcc_p (void)
8290 {
8291 /* No RIP address. */
8292 if (i.base_reg && i.base_reg->reg_num == RegIP)
8293 return 0;
8294
8295 /* No VEX/EVEX encoding. */
8296 if (is_any_vex_encoding (&i.tm))
8297 return 0;
8298
8299 /* and, add, sub with destination register. */
8300 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8301 || i.tm.base_opcode <= 5
8302 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8303 || ((i.tm.base_opcode | 3) == 0x83
8304 && ((i.tm.extension_opcode | 1) == 0x5
8305 || i.tm.extension_opcode == 0x0)))
8306 return (i.types[1].bitfield.class == Reg
8307 || i.types[1].bitfield.instance == Accum);
8308
8309 /* test, cmp with any register. */
8310 if ((i.tm.base_opcode | 1) == 0x85
8311 || (i.tm.base_opcode | 1) == 0xa9
8312 || ((i.tm.base_opcode | 1) == 0xf7
8313 && i.tm.extension_opcode == 0)
8314 || (i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8315 || ((i.tm.base_opcode | 3) == 0x83
8316 && (i.tm.extension_opcode == 0x7)))
8317 return (i.types[0].bitfield.class == Reg
8318 || i.types[0].bitfield.instance == Accum
8319 || i.types[1].bitfield.class == Reg
8320 || i.types[1].bitfield.instance == Accum);
8321
8322 /* inc, dec with any register. */
8323 if ((i.tm.cpu_flags.bitfield.cpuno64
8324 && (i.tm.base_opcode | 0xf) == 0x4f)
8325 || ((i.tm.base_opcode | 1) == 0xff
8326 && i.tm.extension_opcode <= 0x1))
8327 return (i.types[0].bitfield.class == Reg
8328 || i.types[0].bitfield.instance == Accum);
8329
8330 return 0;
8331 }
8332
8333 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8334
8335 static int
8336 add_fused_jcc_padding_frag_p (void)
8337 {
8338 /* NB: Don't work with COND_JUMP86 without i386. */
8339 if (!align_branch_power
8340 || now_seg == absolute_section
8341 || !cpu_arch_flags.bitfield.cpui386
8342 || !(align_branch & align_branch_fused_bit))
8343 return 0;
8344
8345 if (maybe_fused_with_jcc_p ())
8346 {
8347 if (last_insn.kind == last_insn_other
8348 || last_insn.seg != now_seg)
8349 return 1;
8350 if (flag_debug)
8351 as_warn_where (last_insn.file, last_insn.line,
8352 _("`%s` skips -malign-branch-boundary on `%s`"),
8353 last_insn.name, i.tm.name);
8354 }
8355
8356 return 0;
8357 }
8358
8359 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8360
8361 static int
8362 add_branch_prefix_frag_p (void)
8363 {
8364 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
8365 to PadLock instructions since they include prefixes in opcode. */
8366 if (!align_branch_power
8367 || !align_branch_prefix_size
8368 || now_seg == absolute_section
8369 || i.tm.cpu_flags.bitfield.cpupadlock
8370 || !cpu_arch_flags.bitfield.cpui386)
8371 return 0;
8372
8373 /* Don't add prefix if it is a prefix or there is no operand in case
8374 that segment prefix is special. */
8375 if (!i.operands || i.tm.opcode_modifier.isprefix)
8376 return 0;
8377
8378 if (last_insn.kind == last_insn_other
8379 || last_insn.seg != now_seg)
8380 return 1;
8381
8382 if (flag_debug)
8383 as_warn_where (last_insn.file, last_insn.line,
8384 _("`%s` skips -malign-branch-boundary on `%s`"),
8385 last_insn.name, i.tm.name);
8386
8387 return 0;
8388 }
8389
8390 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8391
8392 static int
8393 add_branch_padding_frag_p (enum align_branch_kind *branch_p)
8394 {
8395 int add_padding;
8396
8397 /* NB: Don't work with COND_JUMP86 without i386. */
8398 if (!align_branch_power
8399 || now_seg == absolute_section
8400 || !cpu_arch_flags.bitfield.cpui386)
8401 return 0;
8402
8403 add_padding = 0;
8404
8405 /* Check for jcc and direct jmp. */
8406 if (i.tm.opcode_modifier.jump == JUMP)
8407 {
8408 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8409 {
8410 *branch_p = align_branch_jmp;
8411 add_padding = align_branch & align_branch_jmp_bit;
8412 }
8413 else
8414 {
8415 *branch_p = align_branch_jcc;
8416 if ((align_branch & align_branch_jcc_bit))
8417 add_padding = 1;
8418 }
8419 }
8420 else if (is_any_vex_encoding (&i.tm))
8421 return 0;
8422 else if ((i.tm.base_opcode | 1) == 0xc3)
8423 {
8424 /* Near ret. */
8425 *branch_p = align_branch_ret;
8426 if ((align_branch & align_branch_ret_bit))
8427 add_padding = 1;
8428 }
8429 else
8430 {
8431 /* Check for indirect jmp, direct and indirect calls. */
8432 if (i.tm.base_opcode == 0xe8)
8433 {
8434 /* Direct call. */
8435 *branch_p = align_branch_call;
8436 if ((align_branch & align_branch_call_bit))
8437 add_padding = 1;
8438 }
8439 else if (i.tm.base_opcode == 0xff
8440 && (i.tm.extension_opcode == 2
8441 || i.tm.extension_opcode == 4))
8442 {
8443 /* Indirect call and jmp. */
8444 *branch_p = align_branch_indirect;
8445 if ((align_branch & align_branch_indirect_bit))
8446 add_padding = 1;
8447 }
8448
8449 if (add_padding
8450 && i.disp_operands
8451 && tls_get_addr
8452 && (i.op[0].disps->X_op == O_symbol
8453 || (i.op[0].disps->X_op == O_subtract
8454 && i.op[0].disps->X_op_symbol == GOT_symbol)))
8455 {
8456 symbolS *s = i.op[0].disps->X_add_symbol;
8457 /* No padding to call to global or undefined tls_get_addr. */
8458 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8459 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8460 return 0;
8461 }
8462 }
8463
8464 if (add_padding
8465 && last_insn.kind != last_insn_other
8466 && last_insn.seg == now_seg)
8467 {
8468 if (flag_debug)
8469 as_warn_where (last_insn.file, last_insn.line,
8470 _("`%s` skips -malign-branch-boundary on `%s`"),
8471 last_insn.name, i.tm.name);
8472 return 0;
8473 }
8474
8475 return add_padding;
8476 }
8477
8478 static void
8479 output_insn (void)
8480 {
8481 fragS *insn_start_frag;
8482 offsetT insn_start_off;
8483 fragS *fragP = NULL;
8484 enum align_branch_kind branch = align_branch_none;
8485
8486 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8487 if (IS_ELF && x86_used_note)
8488 {
8489 if (i.tm.cpu_flags.bitfield.cpucmov)
8490 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8491 if (i.tm.cpu_flags.bitfield.cpusse)
8492 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8493 if (i.tm.cpu_flags.bitfield.cpusse2)
8494 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8495 if (i.tm.cpu_flags.bitfield.cpusse3)
8496 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8497 if (i.tm.cpu_flags.bitfield.cpussse3)
8498 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8499 if (i.tm.cpu_flags.bitfield.cpusse4_1)
8500 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8501 if (i.tm.cpu_flags.bitfield.cpusse4_2)
8502 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8503 if (i.tm.cpu_flags.bitfield.cpuavx)
8504 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8505 if (i.tm.cpu_flags.bitfield.cpuavx2)
8506 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8507 if (i.tm.cpu_flags.bitfield.cpufma)
8508 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8509 if (i.tm.cpu_flags.bitfield.cpuavx512f)
8510 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8511 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8512 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8513 if (i.tm.cpu_flags.bitfield.cpuavx512er)
8514 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8515 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8516 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8517 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8518 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8519 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8520 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8521 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8522 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8523 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8524 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8525 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8526 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8527 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8528 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8529 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8530 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8531 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8532 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8533 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8534 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8535 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8536 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8537 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8538 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8539
8540 if (i.tm.cpu_flags.bitfield.cpu8087
8541 || i.tm.cpu_flags.bitfield.cpu287
8542 || i.tm.cpu_flags.bitfield.cpu387
8543 || i.tm.cpu_flags.bitfield.cpu687
8544 || i.tm.cpu_flags.bitfield.cpufisttp)
8545 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8546 if (i.has_regmmx
8547 || i.tm.base_opcode == 0xf77 /* emms */
8548 || i.tm.base_opcode == 0xf0e /* femms */)
8549 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8550 if (i.has_regxmm)
8551 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8552 if (i.has_regymm)
8553 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8554 if (i.has_regzmm)
8555 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8556 if (i.tm.cpu_flags.bitfield.cpufxsr)
8557 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8558 if (i.tm.cpu_flags.bitfield.cpuxsave)
8559 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8560 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8561 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8562 if (i.tm.cpu_flags.bitfield.cpuxsavec)
8563 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8564 }
8565 #endif
8566
8567 /* Tie dwarf2 debug info to the address at the start of the insn.
8568 We can't do this after the insn has been output as the current
8569 frag may have been closed off. eg. by frag_var. */
8570 dwarf2_emit_insn (0);
8571
8572 insn_start_frag = frag_now;
8573 insn_start_off = frag_now_fix ();
8574
8575 if (add_branch_padding_frag_p (&branch))
8576 {
8577 char *p;
8578 /* Branch can be 8 bytes. Leave some room for prefixes. */
8579 unsigned int max_branch_padding_size = 14;
8580
8581 /* Align section to boundary. */
8582 record_alignment (now_seg, align_branch_power);
8583
8584 /* Make room for padding. */
8585 frag_grow (max_branch_padding_size);
8586
8587 /* Start of the padding. */
8588 p = frag_more (0);
8589
8590 fragP = frag_now;
8591
8592 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
8593 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
8594 NULL, 0, p);
8595
8596 fragP->tc_frag_data.branch_type = branch;
8597 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
8598 }
8599
8600 /* Output jumps. */
8601 if (i.tm.opcode_modifier.jump == JUMP)
8602 output_branch ();
8603 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
8604 || i.tm.opcode_modifier.jump == JUMP_DWORD)
8605 output_jump ();
8606 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
8607 output_interseg_jump ();
8608 else
8609 {
8610 /* Output normal instructions here. */
8611 char *p;
8612 unsigned char *q;
8613 unsigned int j;
8614 unsigned int prefix;
8615
8616 if (avoid_fence
8617 && (i.tm.base_opcode == 0xfaee8
8618 || i.tm.base_opcode == 0xfaef0
8619 || i.tm.base_opcode == 0xfaef8))
8620 {
8621 /* Encode lfence, mfence, and sfence as
8622 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
8623 offsetT val = 0x240483f0ULL;
8624 p = frag_more (5);
8625 md_number_to_chars (p, val, 5);
8626 return;
8627 }
8628
8629 /* Some processors fail on LOCK prefix. This options makes
8630 assembler ignore LOCK prefix and serves as a workaround. */
8631 if (omit_lock_prefix)
8632 {
8633 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8634 return;
8635 i.prefix[LOCK_PREFIX] = 0;
8636 }
8637
8638 if (branch)
8639 /* Skip if this is a branch. */
8640 ;
8641 else if (add_fused_jcc_padding_frag_p ())
8642 {
8643 /* Make room for padding. */
8644 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
8645 p = frag_more (0);
8646
8647 fragP = frag_now;
8648
8649 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
8650 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
8651 NULL, 0, p);
8652
8653 fragP->tc_frag_data.branch_type = align_branch_fused;
8654 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
8655 }
8656 else if (add_branch_prefix_frag_p ())
8657 {
8658 unsigned int max_prefix_size = align_branch_prefix_size;
8659
8660 /* Make room for padding. */
8661 frag_grow (max_prefix_size);
8662 p = frag_more (0);
8663
8664 fragP = frag_now;
8665
8666 frag_var (rs_machine_dependent, max_prefix_size, 0,
8667 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
8668 NULL, 0, p);
8669
8670 fragP->tc_frag_data.max_bytes = max_prefix_size;
8671 }
8672
8673 /* Since the VEX/EVEX prefix contains the implicit prefix, we
8674 don't need the explicit prefix. */
8675 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8676 {
8677 switch (i.tm.opcode_length)
8678 {
8679 case 3:
8680 if (i.tm.base_opcode & 0xff000000)
8681 {
8682 prefix = (i.tm.base_opcode >> 24) & 0xff;
8683 if (!i.tm.cpu_flags.bitfield.cpupadlock
8684 || prefix != REPE_PREFIX_OPCODE
8685 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8686 add_prefix (prefix);
8687 }
8688 break;
8689 case 2:
8690 if ((i.tm.base_opcode & 0xff0000) != 0)
8691 {
8692 prefix = (i.tm.base_opcode >> 16) & 0xff;
8693 add_prefix (prefix);
8694 }
8695 break;
8696 case 1:
8697 break;
8698 case 0:
8699 /* Check for pseudo prefixes. */
8700 as_bad_where (insn_start_frag->fr_file,
8701 insn_start_frag->fr_line,
8702 _("pseudo prefix without instruction"));
8703 return;
8704 default:
8705 abort ();
8706 }
8707
8708 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8709 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8710 R_X86_64_GOTTPOFF relocation so that linker can safely
8711 perform IE->LE optimization. */
8712 if (x86_elf_abi == X86_64_X32_ABI
8713 && i.operands == 2
8714 && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8715 && i.prefix[REX_PREFIX] == 0)
8716 add_prefix (REX_OPCODE);
8717 #endif
8718
8719 /* The prefix bytes. */
8720 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8721 if (*q)
8722 FRAG_APPEND_1_CHAR (*q);
8723 }
8724 else
8725 {
8726 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8727 if (*q)
8728 switch (j)
8729 {
8730 case REX_PREFIX:
8731 /* REX byte is encoded in VEX prefix. */
8732 break;
8733 case SEG_PREFIX:
8734 case ADDR_PREFIX:
8735 FRAG_APPEND_1_CHAR (*q);
8736 break;
8737 default:
8738 /* There should be no other prefixes for instructions
8739 with VEX prefix. */
8740 abort ();
8741 }
8742
8743 /* For EVEX instructions i.vrex should become 0 after
8744 build_evex_prefix. For VEX instructions upper 16 registers
8745 aren't available, so VREX should be 0. */
8746 if (i.vrex)
8747 abort ();
8748 /* Now the VEX prefix. */
8749 p = frag_more (i.vex.length);
8750 for (j = 0; j < i.vex.length; j++)
8751 p[j] = i.vex.bytes[j];
8752 }
8753
8754 /* Now the opcode; be careful about word order here! */
8755 if (i.tm.opcode_length == 1)
8756 {
8757 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8758 }
8759 else
8760 {
8761 switch (i.tm.opcode_length)
8762 {
8763 case 4:
8764 p = frag_more (4);
8765 *p++ = (i.tm.base_opcode >> 24) & 0xff;
8766 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8767 break;
8768 case 3:
8769 p = frag_more (3);
8770 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8771 break;
8772 case 2:
8773 p = frag_more (2);
8774 break;
8775 default:
8776 abort ();
8777 break;
8778 }
8779
8780 /* Put out high byte first: can't use md_number_to_chars! */
8781 *p++ = (i.tm.base_opcode >> 8) & 0xff;
8782 *p = i.tm.base_opcode & 0xff;
8783 }
8784
8785 /* Now the modrm byte and sib byte (if present). */
8786 if (i.tm.opcode_modifier.modrm)
8787 {
8788 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8789 | i.rm.reg << 3
8790 | i.rm.mode << 6));
8791 /* If i.rm.regmem == ESP (4)
8792 && i.rm.mode != (Register mode)
8793 && not 16 bit
8794 ==> need second modrm byte. */
8795 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8796 && i.rm.mode != 3
8797 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8798 FRAG_APPEND_1_CHAR ((i.sib.base << 0
8799 | i.sib.index << 3
8800 | i.sib.scale << 6));
8801 }
8802
8803 if (i.disp_operands)
8804 output_disp (insn_start_frag, insn_start_off);
8805
8806 if (i.imm_operands)
8807 output_imm (insn_start_frag, insn_start_off);
8808
8809 /*
8810 * frag_now_fix () returning plain abs_section_offset when we're in the
8811 * absolute section, and abs_section_offset not getting updated as data
8812 * gets added to the frag breaks the logic below.
8813 */
8814 if (now_seg != absolute_section)
8815 {
8816 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8817 if (j > 15)
8818 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8819 j);
8820 else if (fragP)
8821 {
8822 /* NB: Don't add prefix with GOTPC relocation since
8823 output_disp() above depends on the fixed encoding
8824 length. Can't add prefix with TLS relocation since
8825 it breaks TLS linker optimization. */
8826 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
8827 /* Prefix count on the current instruction. */
8828 unsigned int count = i.vex.length;
8829 unsigned int k;
8830 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
8831 /* REX byte is encoded in VEX/EVEX prefix. */
8832 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
8833 count++;
8834
8835 /* Count prefixes for extended opcode maps. */
8836 if (!i.vex.length)
8837 switch (i.tm.opcode_length)
8838 {
8839 case 3:
8840 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
8841 {
8842 count++;
8843 switch ((i.tm.base_opcode >> 8) & 0xff)
8844 {
8845 case 0x38:
8846 case 0x3a:
8847 count++;
8848 break;
8849 default:
8850 break;
8851 }
8852 }
8853 break;
8854 case 2:
8855 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
8856 count++;
8857 break;
8858 case 1:
8859 break;
8860 default:
8861 abort ();
8862 }
8863
8864 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
8865 == BRANCH_PREFIX)
8866 {
8867 /* Set the maximum prefix size in BRANCH_PREFIX
8868 frag. */
8869 if (fragP->tc_frag_data.max_bytes > max)
8870 fragP->tc_frag_data.max_bytes = max;
8871 if (fragP->tc_frag_data.max_bytes > count)
8872 fragP->tc_frag_data.max_bytes -= count;
8873 else
8874 fragP->tc_frag_data.max_bytes = 0;
8875 }
8876 else
8877 {
8878 /* Remember the maximum prefix size in FUSED_JCC_PADDING
8879 frag. */
8880 unsigned int max_prefix_size;
8881 if (align_branch_prefix_size > max)
8882 max_prefix_size = max;
8883 else
8884 max_prefix_size = align_branch_prefix_size;
8885 if (max_prefix_size > count)
8886 fragP->tc_frag_data.max_prefix_length
8887 = max_prefix_size - count;
8888 }
8889
8890 /* Use existing segment prefix if possible. Use CS
8891 segment prefix in 64-bit mode. In 32-bit mode, use SS
8892 segment prefix with ESP/EBP base register and use DS
8893 segment prefix without ESP/EBP base register. */
8894 if (i.prefix[SEG_PREFIX])
8895 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
8896 else if (flag_code == CODE_64BIT)
8897 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
8898 else if (i.base_reg
8899 && (i.base_reg->reg_num == 4
8900 || i.base_reg->reg_num == 5))
8901 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
8902 else
8903 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
8904 }
8905 }
8906 }
8907
8908 /* NB: Don't work with COND_JUMP86 without i386. */
8909 if (align_branch_power
8910 && now_seg != absolute_section
8911 && cpu_arch_flags.bitfield.cpui386)
8912 {
8913 /* Terminate each frag so that we can add prefix and check for
8914 fused jcc. */
8915 frag_wane (frag_now);
8916 frag_new (0);
8917 }
8918
8919 #ifdef DEBUG386
8920 if (flag_debug)
8921 {
8922 pi ("" /*line*/, &i);
8923 }
8924 #endif /* DEBUG386 */
8925 }
8926
8927 /* Return the size of the displacement operand N. */
8928
8929 static int
8930 disp_size (unsigned int n)
8931 {
8932 int size = 4;
8933
8934 if (i.types[n].bitfield.disp64)
8935 size = 8;
8936 else if (i.types[n].bitfield.disp8)
8937 size = 1;
8938 else if (i.types[n].bitfield.disp16)
8939 size = 2;
8940 return size;
8941 }
8942
8943 /* Return the size of the immediate operand N. */
8944
8945 static int
8946 imm_size (unsigned int n)
8947 {
8948 int size = 4;
8949 if (i.types[n].bitfield.imm64)
8950 size = 8;
8951 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8952 size = 1;
8953 else if (i.types[n].bitfield.imm16)
8954 size = 2;
8955 return size;
8956 }
8957
8958 static void
8959 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8960 {
8961 char *p;
8962 unsigned int n;
8963
8964 for (n = 0; n < i.operands; n++)
8965 {
8966 if (operand_type_check (i.types[n], disp))
8967 {
8968 if (i.op[n].disps->X_op == O_constant)
8969 {
8970 int size = disp_size (n);
8971 offsetT val = i.op[n].disps->X_add_number;
8972
8973 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8974 size);
8975 p = frag_more (size);
8976 md_number_to_chars (p, val, size);
8977 }
8978 else
8979 {
8980 enum bfd_reloc_code_real reloc_type;
8981 int size = disp_size (n);
8982 int sign = i.types[n].bitfield.disp32s;
8983 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8984 fixS *fixP;
8985
8986 /* We can't have 8 bit displacement here. */
8987 gas_assert (!i.types[n].bitfield.disp8);
8988
8989 /* The PC relative address is computed relative
8990 to the instruction boundary, so in case immediate
8991 fields follows, we need to adjust the value. */
8992 if (pcrel && i.imm_operands)
8993 {
8994 unsigned int n1;
8995 int sz = 0;
8996
8997 for (n1 = 0; n1 < i.operands; n1++)
8998 if (operand_type_check (i.types[n1], imm))
8999 {
9000 /* Only one immediate is allowed for PC
9001 relative address. */
9002 gas_assert (sz == 0);
9003 sz = imm_size (n1);
9004 i.op[n].disps->X_add_number -= sz;
9005 }
9006 /* We should find the immediate. */
9007 gas_assert (sz != 0);
9008 }
9009
9010 p = frag_more (size);
9011 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9012 if (GOT_symbol
9013 && GOT_symbol == i.op[n].disps->X_add_symbol
9014 && (((reloc_type == BFD_RELOC_32
9015 || reloc_type == BFD_RELOC_X86_64_32S
9016 || (reloc_type == BFD_RELOC_64
9017 && object_64bit))
9018 && (i.op[n].disps->X_op == O_symbol
9019 || (i.op[n].disps->X_op == O_add
9020 && ((symbol_get_value_expression
9021 (i.op[n].disps->X_op_symbol)->X_op)
9022 == O_subtract))))
9023 || reloc_type == BFD_RELOC_32_PCREL))
9024 {
9025 if (!object_64bit)
9026 {
9027 reloc_type = BFD_RELOC_386_GOTPC;
9028 i.has_gotpc_tls_reloc = TRUE;
9029 i.op[n].imms->X_add_number +=
9030 encoding_length (insn_start_frag, insn_start_off, p);
9031 }
9032 else if (reloc_type == BFD_RELOC_64)
9033 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9034 else
9035 /* Don't do the adjustment for x86-64, as there
9036 the pcrel addressing is relative to the _next_
9037 insn, and that is taken care of in other code. */
9038 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9039 }
9040 else if (align_branch_power)
9041 {
9042 switch (reloc_type)
9043 {
9044 case BFD_RELOC_386_TLS_GD:
9045 case BFD_RELOC_386_TLS_LDM:
9046 case BFD_RELOC_386_TLS_IE:
9047 case BFD_RELOC_386_TLS_IE_32:
9048 case BFD_RELOC_386_TLS_GOTIE:
9049 case BFD_RELOC_386_TLS_GOTDESC:
9050 case BFD_RELOC_386_TLS_DESC_CALL:
9051 case BFD_RELOC_X86_64_TLSGD:
9052 case BFD_RELOC_X86_64_TLSLD:
9053 case BFD_RELOC_X86_64_GOTTPOFF:
9054 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9055 case BFD_RELOC_X86_64_TLSDESC_CALL:
9056 i.has_gotpc_tls_reloc = TRUE;
9057 default:
9058 break;
9059 }
9060 }
9061 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9062 size, i.op[n].disps, pcrel,
9063 reloc_type);
9064 /* Check for "call/jmp *mem", "mov mem, %reg",
9065 "test %reg, mem" and "binop mem, %reg" where binop
9066 is one of adc, add, and, cmp, or, sbb, sub, xor
9067 instructions without data prefix. Always generate
9068 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9069 if (i.prefix[DATA_PREFIX] == 0
9070 && (generate_relax_relocations
9071 || (!object_64bit
9072 && i.rm.mode == 0
9073 && i.rm.regmem == 5))
9074 && (i.rm.mode == 2
9075 || (i.rm.mode == 0 && i.rm.regmem == 5))
9076 && ((i.operands == 1
9077 && i.tm.base_opcode == 0xff
9078 && (i.rm.reg == 2 || i.rm.reg == 4))
9079 || (i.operands == 2
9080 && (i.tm.base_opcode == 0x8b
9081 || i.tm.base_opcode == 0x85
9082 || (i.tm.base_opcode & 0xc7) == 0x03))))
9083 {
9084 if (object_64bit)
9085 {
9086 fixP->fx_tcbit = i.rex != 0;
9087 if (i.base_reg
9088 && (i.base_reg->reg_num == RegIP))
9089 fixP->fx_tcbit2 = 1;
9090 }
9091 else
9092 fixP->fx_tcbit2 = 1;
9093 }
9094 }
9095 }
9096 }
9097 }
9098
9099 static void
9100 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9101 {
9102 char *p;
9103 unsigned int n;
9104
9105 for (n = 0; n < i.operands; n++)
9106 {
9107 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9108 if (i.rounding && (int) n == i.rounding->operand)
9109 continue;
9110
9111 if (operand_type_check (i.types[n], imm))
9112 {
9113 if (i.op[n].imms->X_op == O_constant)
9114 {
9115 int size = imm_size (n);
9116 offsetT val;
9117
9118 val = offset_in_range (i.op[n].imms->X_add_number,
9119 size);
9120 p = frag_more (size);
9121 md_number_to_chars (p, val, size);
9122 }
9123 else
9124 {
9125 /* Not absolute_section.
9126 Need a 32-bit fixup (don't support 8bit
9127 non-absolute imms). Try to support other
9128 sizes ... */
9129 enum bfd_reloc_code_real reloc_type;
9130 int size = imm_size (n);
9131 int sign;
9132
9133 if (i.types[n].bitfield.imm32s
9134 && (i.suffix == QWORD_MNEM_SUFFIX
9135 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9136 sign = 1;
9137 else
9138 sign = 0;
9139
9140 p = frag_more (size);
9141 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9142
9143 /* This is tough to explain. We end up with this one if we
9144 * have operands that look like
9145 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9146 * obtain the absolute address of the GOT, and it is strongly
9147 * preferable from a performance point of view to avoid using
9148 * a runtime relocation for this. The actual sequence of
9149 * instructions often look something like:
9150 *
9151 * call .L66
9152 * .L66:
9153 * popl %ebx
9154 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9155 *
9156 * The call and pop essentially return the absolute address
9157 * of the label .L66 and store it in %ebx. The linker itself
9158 * will ultimately change the first operand of the addl so
9159 * that %ebx points to the GOT, but to keep things simple, the
9160 * .o file must have this operand set so that it generates not
9161 * the absolute address of .L66, but the absolute address of
9162 * itself. This allows the linker itself simply treat a GOTPC
9163 * relocation as asking for a pcrel offset to the GOT to be
9164 * added in, and the addend of the relocation is stored in the
9165 * operand field for the instruction itself.
9166 *
9167 * Our job here is to fix the operand so that it would add
9168 * the correct offset so that %ebx would point to itself. The
9169 * thing that is tricky is that .-.L66 will point to the
9170 * beginning of the instruction, so we need to further modify
9171 * the operand so that it will point to itself. There are
9172 * other cases where you have something like:
9173 *
9174 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9175 *
9176 * and here no correction would be required. Internally in
9177 * the assembler we treat operands of this form as not being
9178 * pcrel since the '.' is explicitly mentioned, and I wonder
9179 * whether it would simplify matters to do it this way. Who
9180 * knows. In earlier versions of the PIC patches, the
9181 * pcrel_adjust field was used to store the correction, but
9182 * since the expression is not pcrel, I felt it would be
9183 * confusing to do it this way. */
9184
9185 if ((reloc_type == BFD_RELOC_32
9186 || reloc_type == BFD_RELOC_X86_64_32S
9187 || reloc_type == BFD_RELOC_64)
9188 && GOT_symbol
9189 && GOT_symbol == i.op[n].imms->X_add_symbol
9190 && (i.op[n].imms->X_op == O_symbol
9191 || (i.op[n].imms->X_op == O_add
9192 && ((symbol_get_value_expression
9193 (i.op[n].imms->X_op_symbol)->X_op)
9194 == O_subtract))))
9195 {
9196 if (!object_64bit)
9197 reloc_type = BFD_RELOC_386_GOTPC;
9198 else if (size == 4)
9199 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9200 else if (size == 8)
9201 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9202 i.has_gotpc_tls_reloc = TRUE;
9203 i.op[n].imms->X_add_number +=
9204 encoding_length (insn_start_frag, insn_start_off, p);
9205 }
9206 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9207 i.op[n].imms, 0, reloc_type);
9208 }
9209 }
9210 }
9211 }
9212 \f
9213 /* x86_cons_fix_new is called via the expression parsing code when a
9214 reloc is needed. We use this hook to get the correct .got reloc. */
9215 static int cons_sign = -1;
9216
9217 void
9218 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9219 expressionS *exp, bfd_reloc_code_real_type r)
9220 {
9221 r = reloc (len, 0, cons_sign, r);
9222
9223 #ifdef TE_PE
9224 if (exp->X_op == O_secrel)
9225 {
9226 exp->X_op = O_symbol;
9227 r = BFD_RELOC_32_SECREL;
9228 }
9229 #endif
9230
9231 fix_new_exp (frag, off, len, exp, 0, r);
9232 }
9233
9234 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9235 purpose of the `.dc.a' internal pseudo-op. */
9236
9237 int
9238 x86_address_bytes (void)
9239 {
9240 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9241 return 4;
9242 return stdoutput->arch_info->bits_per_address / 8;
9243 }
9244
9245 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9246 || defined (LEX_AT)
9247 # define lex_got(reloc, adjust, types) NULL
9248 #else
9249 /* Parse operands of the form
9250 <symbol>@GOTOFF+<nnn>
9251 and similar .plt or .got references.
9252
9253 If we find one, set up the correct relocation in RELOC and copy the
9254 input string, minus the `@GOTOFF' into a malloc'd buffer for
9255 parsing by the calling routine. Return this buffer, and if ADJUST
9256 is non-null set it to the length of the string we removed from the
9257 input line. Otherwise return NULL. */
9258 static char *
9259 lex_got (enum bfd_reloc_code_real *rel,
9260 int *adjust,
9261 i386_operand_type *types)
9262 {
9263 /* Some of the relocations depend on the size of what field is to
9264 be relocated. But in our callers i386_immediate and i386_displacement
9265 we don't yet know the operand size (this will be set by insn
9266 matching). Hence we record the word32 relocation here,
9267 and adjust the reloc according to the real size in reloc(). */
9268 static const struct {
9269 const char *str;
9270 int len;
9271 const enum bfd_reloc_code_real rel[2];
9272 const i386_operand_type types64;
9273 } gotrel[] = {
9274 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9275 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9276 BFD_RELOC_SIZE32 },
9277 OPERAND_TYPE_IMM32_64 },
9278 #endif
9279 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9280 BFD_RELOC_X86_64_PLTOFF64 },
9281 OPERAND_TYPE_IMM64 },
9282 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9283 BFD_RELOC_X86_64_PLT32 },
9284 OPERAND_TYPE_IMM32_32S_DISP32 },
9285 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9286 BFD_RELOC_X86_64_GOTPLT64 },
9287 OPERAND_TYPE_IMM64_DISP64 },
9288 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9289 BFD_RELOC_X86_64_GOTOFF64 },
9290 OPERAND_TYPE_IMM64_DISP64 },
9291 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9292 BFD_RELOC_X86_64_GOTPCREL },
9293 OPERAND_TYPE_IMM32_32S_DISP32 },
9294 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9295 BFD_RELOC_X86_64_TLSGD },
9296 OPERAND_TYPE_IMM32_32S_DISP32 },
9297 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9298 _dummy_first_bfd_reloc_code_real },
9299 OPERAND_TYPE_NONE },
9300 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9301 BFD_RELOC_X86_64_TLSLD },
9302 OPERAND_TYPE_IMM32_32S_DISP32 },
9303 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9304 BFD_RELOC_X86_64_GOTTPOFF },
9305 OPERAND_TYPE_IMM32_32S_DISP32 },
9306 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9307 BFD_RELOC_X86_64_TPOFF32 },
9308 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9309 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9310 _dummy_first_bfd_reloc_code_real },
9311 OPERAND_TYPE_NONE },
9312 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9313 BFD_RELOC_X86_64_DTPOFF32 },
9314 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9315 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9316 _dummy_first_bfd_reloc_code_real },
9317 OPERAND_TYPE_NONE },
9318 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9319 _dummy_first_bfd_reloc_code_real },
9320 OPERAND_TYPE_NONE },
9321 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9322 BFD_RELOC_X86_64_GOT32 },
9323 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9324 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9325 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9326 OPERAND_TYPE_IMM32_32S_DISP32 },
9327 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9328 BFD_RELOC_X86_64_TLSDESC_CALL },
9329 OPERAND_TYPE_IMM32_32S_DISP32 },
9330 };
9331 char *cp;
9332 unsigned int j;
9333
9334 #if defined (OBJ_MAYBE_ELF)
9335 if (!IS_ELF)
9336 return NULL;
9337 #endif
9338
9339 for (cp = input_line_pointer; *cp != '@'; cp++)
9340 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9341 return NULL;
9342
9343 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9344 {
9345 int len = gotrel[j].len;
9346 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9347 {
9348 if (gotrel[j].rel[object_64bit] != 0)
9349 {
9350 int first, second;
9351 char *tmpbuf, *past_reloc;
9352
9353 *rel = gotrel[j].rel[object_64bit];
9354
9355 if (types)
9356 {
9357 if (flag_code != CODE_64BIT)
9358 {
9359 types->bitfield.imm32 = 1;
9360 types->bitfield.disp32 = 1;
9361 }
9362 else
9363 *types = gotrel[j].types64;
9364 }
9365
9366 if (j != 0 && GOT_symbol == NULL)
9367 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9368
9369 /* The length of the first part of our input line. */
9370 first = cp - input_line_pointer;
9371
9372 /* The second part goes from after the reloc token until
9373 (and including) an end_of_line char or comma. */
9374 past_reloc = cp + 1 + len;
9375 cp = past_reloc;
9376 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9377 ++cp;
9378 second = cp + 1 - past_reloc;
9379
9380 /* Allocate and copy string. The trailing NUL shouldn't
9381 be necessary, but be safe. */
9382 tmpbuf = XNEWVEC (char, first + second + 2);
9383 memcpy (tmpbuf, input_line_pointer, first);
9384 if (second != 0 && *past_reloc != ' ')
9385 /* Replace the relocation token with ' ', so that
9386 errors like foo@GOTOFF1 will be detected. */
9387 tmpbuf[first++] = ' ';
9388 else
9389 /* Increment length by 1 if the relocation token is
9390 removed. */
9391 len++;
9392 if (adjust)
9393 *adjust = len;
9394 memcpy (tmpbuf + first, past_reloc, second);
9395 tmpbuf[first + second] = '\0';
9396 return tmpbuf;
9397 }
9398
9399 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9400 gotrel[j].str, 1 << (5 + object_64bit));
9401 return NULL;
9402 }
9403 }
9404
9405 /* Might be a symbol version string. Don't as_bad here. */
9406 return NULL;
9407 }
9408 #endif
9409
9410 #ifdef TE_PE
9411 #ifdef lex_got
9412 #undef lex_got
9413 #endif
9414 /* Parse operands of the form
9415 <symbol>@SECREL32+<nnn>
9416
9417 If we find one, set up the correct relocation in RELOC and copy the
9418 input string, minus the `@SECREL32' into a malloc'd buffer for
9419 parsing by the calling routine. Return this buffer, and if ADJUST
9420 is non-null set it to the length of the string we removed from the
9421 input line. Otherwise return NULL.
9422
9423 This function is copied from the ELF version above adjusted for PE targets. */
9424
9425 static char *
9426 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9427 int *adjust ATTRIBUTE_UNUSED,
9428 i386_operand_type *types)
9429 {
9430 static const struct
9431 {
9432 const char *str;
9433 int len;
9434 const enum bfd_reloc_code_real rel[2];
9435 const i386_operand_type types64;
9436 }
9437 gotrel[] =
9438 {
9439 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
9440 BFD_RELOC_32_SECREL },
9441 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9442 };
9443
9444 char *cp;
9445 unsigned j;
9446
9447 for (cp = input_line_pointer; *cp != '@'; cp++)
9448 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9449 return NULL;
9450
9451 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9452 {
9453 int len = gotrel[j].len;
9454
9455 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9456 {
9457 if (gotrel[j].rel[object_64bit] != 0)
9458 {
9459 int first, second;
9460 char *tmpbuf, *past_reloc;
9461
9462 *rel = gotrel[j].rel[object_64bit];
9463 if (adjust)
9464 *adjust = len;
9465
9466 if (types)
9467 {
9468 if (flag_code != CODE_64BIT)
9469 {
9470 types->bitfield.imm32 = 1;
9471 types->bitfield.disp32 = 1;
9472 }
9473 else
9474 *types = gotrel[j].types64;
9475 }
9476
9477 /* The length of the first part of our input line. */
9478 first = cp - input_line_pointer;
9479
9480 /* The second part goes from after the reloc token until
9481 (and including) an end_of_line char or comma. */
9482 past_reloc = cp + 1 + len;
9483 cp = past_reloc;
9484 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9485 ++cp;
9486 second = cp + 1 - past_reloc;
9487
9488 /* Allocate and copy string. The trailing NUL shouldn't
9489 be necessary, but be safe. */
9490 tmpbuf = XNEWVEC (char, first + second + 2);
9491 memcpy (tmpbuf, input_line_pointer, first);
9492 if (second != 0 && *past_reloc != ' ')
9493 /* Replace the relocation token with ' ', so that
9494 errors like foo@SECLREL321 will be detected. */
9495 tmpbuf[first++] = ' ';
9496 memcpy (tmpbuf + first, past_reloc, second);
9497 tmpbuf[first + second] = '\0';
9498 return tmpbuf;
9499 }
9500
9501 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9502 gotrel[j].str, 1 << (5 + object_64bit));
9503 return NULL;
9504 }
9505 }
9506
9507 /* Might be a symbol version string. Don't as_bad here. */
9508 return NULL;
9509 }
9510
9511 #endif /* TE_PE */
9512
9513 bfd_reloc_code_real_type
9514 x86_cons (expressionS *exp, int size)
9515 {
9516 bfd_reloc_code_real_type got_reloc = NO_RELOC;
9517
9518 intel_syntax = -intel_syntax;
9519
9520 exp->X_md = 0;
9521 if (size == 4 || (object_64bit && size == 8))
9522 {
9523 /* Handle @GOTOFF and the like in an expression. */
9524 char *save;
9525 char *gotfree_input_line;
9526 int adjust = 0;
9527
9528 save = input_line_pointer;
9529 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9530 if (gotfree_input_line)
9531 input_line_pointer = gotfree_input_line;
9532
9533 expression (exp);
9534
9535 if (gotfree_input_line)
9536 {
9537 /* expression () has merrily parsed up to the end of line,
9538 or a comma - in the wrong buffer. Transfer how far
9539 input_line_pointer has moved to the right buffer. */
9540 input_line_pointer = (save
9541 + (input_line_pointer - gotfree_input_line)
9542 + adjust);
9543 free (gotfree_input_line);
9544 if (exp->X_op == O_constant
9545 || exp->X_op == O_absent
9546 || exp->X_op == O_illegal
9547 || exp->X_op == O_register
9548 || exp->X_op == O_big)
9549 {
9550 char c = *input_line_pointer;
9551 *input_line_pointer = 0;
9552 as_bad (_("missing or invalid expression `%s'"), save);
9553 *input_line_pointer = c;
9554 }
9555 else if ((got_reloc == BFD_RELOC_386_PLT32
9556 || got_reloc == BFD_RELOC_X86_64_PLT32)
9557 && exp->X_op != O_symbol)
9558 {
9559 char c = *input_line_pointer;
9560 *input_line_pointer = 0;
9561 as_bad (_("invalid PLT expression `%s'"), save);
9562 *input_line_pointer = c;
9563 }
9564 }
9565 }
9566 else
9567 expression (exp);
9568
9569 intel_syntax = -intel_syntax;
9570
9571 if (intel_syntax)
9572 i386_intel_simplify (exp);
9573
9574 return got_reloc;
9575 }
9576
9577 static void
9578 signed_cons (int size)
9579 {
9580 if (flag_code == CODE_64BIT)
9581 cons_sign = 1;
9582 cons (size);
9583 cons_sign = -1;
9584 }
9585
9586 #ifdef TE_PE
9587 static void
9588 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9589 {
9590 expressionS exp;
9591
9592 do
9593 {
9594 expression (&exp);
9595 if (exp.X_op == O_symbol)
9596 exp.X_op = O_secrel;
9597
9598 emit_expr (&exp, 4);
9599 }
9600 while (*input_line_pointer++ == ',');
9601
9602 input_line_pointer--;
9603 demand_empty_rest_of_line ();
9604 }
9605 #endif
9606
9607 /* Handle Vector operations. */
9608
9609 static char *
9610 check_VecOperations (char *op_string, char *op_end)
9611 {
9612 const reg_entry *mask;
9613 const char *saved;
9614 char *end_op;
9615
9616 while (*op_string
9617 && (op_end == NULL || op_string < op_end))
9618 {
9619 saved = op_string;
9620 if (*op_string == '{')
9621 {
9622 op_string++;
9623
9624 /* Check broadcasts. */
9625 if (strncmp (op_string, "1to", 3) == 0)
9626 {
9627 int bcst_type;
9628
9629 if (i.broadcast)
9630 goto duplicated_vec_op;
9631
9632 op_string += 3;
9633 if (*op_string == '8')
9634 bcst_type = 8;
9635 else if (*op_string == '4')
9636 bcst_type = 4;
9637 else if (*op_string == '2')
9638 bcst_type = 2;
9639 else if (*op_string == '1'
9640 && *(op_string+1) == '6')
9641 {
9642 bcst_type = 16;
9643 op_string++;
9644 }
9645 else
9646 {
9647 as_bad (_("Unsupported broadcast: `%s'"), saved);
9648 return NULL;
9649 }
9650 op_string++;
9651
9652 broadcast_op.type = bcst_type;
9653 broadcast_op.operand = this_operand;
9654 broadcast_op.bytes = 0;
9655 i.broadcast = &broadcast_op;
9656 }
9657 /* Check masking operation. */
9658 else if ((mask = parse_register (op_string, &end_op)) != NULL)
9659 {
9660 /* k0 can't be used for write mask. */
9661 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9662 {
9663 as_bad (_("`%s%s' can't be used for write mask"),
9664 register_prefix, mask->reg_name);
9665 return NULL;
9666 }
9667
9668 if (!i.mask)
9669 {
9670 mask_op.mask = mask;
9671 mask_op.zeroing = 0;
9672 mask_op.operand = this_operand;
9673 i.mask = &mask_op;
9674 }
9675 else
9676 {
9677 if (i.mask->mask)
9678 goto duplicated_vec_op;
9679
9680 i.mask->mask = mask;
9681
9682 /* Only "{z}" is allowed here. No need to check
9683 zeroing mask explicitly. */
9684 if (i.mask->operand != this_operand)
9685 {
9686 as_bad (_("invalid write mask `%s'"), saved);
9687 return NULL;
9688 }
9689 }
9690
9691 op_string = end_op;
9692 }
9693 /* Check zeroing-flag for masking operation. */
9694 else if (*op_string == 'z')
9695 {
9696 if (!i.mask)
9697 {
9698 mask_op.mask = NULL;
9699 mask_op.zeroing = 1;
9700 mask_op.operand = this_operand;
9701 i.mask = &mask_op;
9702 }
9703 else
9704 {
9705 if (i.mask->zeroing)
9706 {
9707 duplicated_vec_op:
9708 as_bad (_("duplicated `%s'"), saved);
9709 return NULL;
9710 }
9711
9712 i.mask->zeroing = 1;
9713
9714 /* Only "{%k}" is allowed here. No need to check mask
9715 register explicitly. */
9716 if (i.mask->operand != this_operand)
9717 {
9718 as_bad (_("invalid zeroing-masking `%s'"),
9719 saved);
9720 return NULL;
9721 }
9722 }
9723
9724 op_string++;
9725 }
9726 else
9727 goto unknown_vec_op;
9728
9729 if (*op_string != '}')
9730 {
9731 as_bad (_("missing `}' in `%s'"), saved);
9732 return NULL;
9733 }
9734 op_string++;
9735
9736 /* Strip whitespace since the addition of pseudo prefixes
9737 changed how the scrubber treats '{'. */
9738 if (is_space_char (*op_string))
9739 ++op_string;
9740
9741 continue;
9742 }
9743 unknown_vec_op:
9744 /* We don't know this one. */
9745 as_bad (_("unknown vector operation: `%s'"), saved);
9746 return NULL;
9747 }
9748
9749 if (i.mask && i.mask->zeroing && !i.mask->mask)
9750 {
9751 as_bad (_("zeroing-masking only allowed with write mask"));
9752 return NULL;
9753 }
9754
9755 return op_string;
9756 }
9757
9758 static int
9759 i386_immediate (char *imm_start)
9760 {
9761 char *save_input_line_pointer;
9762 char *gotfree_input_line;
9763 segT exp_seg = 0;
9764 expressionS *exp;
9765 i386_operand_type types;
9766
9767 operand_type_set (&types, ~0);
9768
9769 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9770 {
9771 as_bad (_("at most %d immediate operands are allowed"),
9772 MAX_IMMEDIATE_OPERANDS);
9773 return 0;
9774 }
9775
9776 exp = &im_expressions[i.imm_operands++];
9777 i.op[this_operand].imms = exp;
9778
9779 if (is_space_char (*imm_start))
9780 ++imm_start;
9781
9782 save_input_line_pointer = input_line_pointer;
9783 input_line_pointer = imm_start;
9784
9785 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9786 if (gotfree_input_line)
9787 input_line_pointer = gotfree_input_line;
9788
9789 exp_seg = expression (exp);
9790
9791 SKIP_WHITESPACE ();
9792
9793 /* Handle vector operations. */
9794 if (*input_line_pointer == '{')
9795 {
9796 input_line_pointer = check_VecOperations (input_line_pointer,
9797 NULL);
9798 if (input_line_pointer == NULL)
9799 return 0;
9800 }
9801
9802 if (*input_line_pointer)
9803 as_bad (_("junk `%s' after expression"), input_line_pointer);
9804
9805 input_line_pointer = save_input_line_pointer;
9806 if (gotfree_input_line)
9807 {
9808 free (gotfree_input_line);
9809
9810 if (exp->X_op == O_constant || exp->X_op == O_register)
9811 exp->X_op = O_illegal;
9812 }
9813
9814 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9815 }
9816
9817 static int
9818 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9819 i386_operand_type types, const char *imm_start)
9820 {
9821 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9822 {
9823 if (imm_start)
9824 as_bad (_("missing or invalid immediate expression `%s'"),
9825 imm_start);
9826 return 0;
9827 }
9828 else if (exp->X_op == O_constant)
9829 {
9830 /* Size it properly later. */
9831 i.types[this_operand].bitfield.imm64 = 1;
9832 /* If not 64bit, sign extend val. */
9833 if (flag_code != CODE_64BIT
9834 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9835 exp->X_add_number
9836 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9837 }
9838 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9839 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9840 && exp_seg != absolute_section
9841 && exp_seg != text_section
9842 && exp_seg != data_section
9843 && exp_seg != bss_section
9844 && exp_seg != undefined_section
9845 && !bfd_is_com_section (exp_seg))
9846 {
9847 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9848 return 0;
9849 }
9850 #endif
9851 else if (!intel_syntax && exp_seg == reg_section)
9852 {
9853 if (imm_start)
9854 as_bad (_("illegal immediate register operand %s"), imm_start);
9855 return 0;
9856 }
9857 else
9858 {
9859 /* This is an address. The size of the address will be
9860 determined later, depending on destination register,
9861 suffix, or the default for the section. */
9862 i.types[this_operand].bitfield.imm8 = 1;
9863 i.types[this_operand].bitfield.imm16 = 1;
9864 i.types[this_operand].bitfield.imm32 = 1;
9865 i.types[this_operand].bitfield.imm32s = 1;
9866 i.types[this_operand].bitfield.imm64 = 1;
9867 i.types[this_operand] = operand_type_and (i.types[this_operand],
9868 types);
9869 }
9870
9871 return 1;
9872 }
9873
9874 static char *
9875 i386_scale (char *scale)
9876 {
9877 offsetT val;
9878 char *save = input_line_pointer;
9879
9880 input_line_pointer = scale;
9881 val = get_absolute_expression ();
9882
9883 switch (val)
9884 {
9885 case 1:
9886 i.log2_scale_factor = 0;
9887 break;
9888 case 2:
9889 i.log2_scale_factor = 1;
9890 break;
9891 case 4:
9892 i.log2_scale_factor = 2;
9893 break;
9894 case 8:
9895 i.log2_scale_factor = 3;
9896 break;
9897 default:
9898 {
9899 char sep = *input_line_pointer;
9900
9901 *input_line_pointer = '\0';
9902 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9903 scale);
9904 *input_line_pointer = sep;
9905 input_line_pointer = save;
9906 return NULL;
9907 }
9908 }
9909 if (i.log2_scale_factor != 0 && i.index_reg == 0)
9910 {
9911 as_warn (_("scale factor of %d without an index register"),
9912 1 << i.log2_scale_factor);
9913 i.log2_scale_factor = 0;
9914 }
9915 scale = input_line_pointer;
9916 input_line_pointer = save;
9917 return scale;
9918 }
9919
9920 static int
9921 i386_displacement (char *disp_start, char *disp_end)
9922 {
9923 expressionS *exp;
9924 segT exp_seg = 0;
9925 char *save_input_line_pointer;
9926 char *gotfree_input_line;
9927 int override;
9928 i386_operand_type bigdisp, types = anydisp;
9929 int ret;
9930
9931 if (i.disp_operands == MAX_MEMORY_OPERANDS)
9932 {
9933 as_bad (_("at most %d displacement operands are allowed"),
9934 MAX_MEMORY_OPERANDS);
9935 return 0;
9936 }
9937
9938 operand_type_set (&bigdisp, 0);
9939 if (i.jumpabsolute
9940 || (current_templates->start->opcode_modifier.jump != JUMP
9941 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
9942 {
9943 bigdisp.bitfield.disp32 = 1;
9944 override = (i.prefix[ADDR_PREFIX] != 0);
9945 if (flag_code == CODE_64BIT)
9946 {
9947 if (!override)
9948 {
9949 bigdisp.bitfield.disp32s = 1;
9950 bigdisp.bitfield.disp64 = 1;
9951 }
9952 }
9953 else if ((flag_code == CODE_16BIT) ^ override)
9954 {
9955 bigdisp.bitfield.disp32 = 0;
9956 bigdisp.bitfield.disp16 = 1;
9957 }
9958 }
9959 else
9960 {
9961 /* For PC-relative branches, the width of the displacement
9962 is dependent upon data size, not address size. */
9963 override = (i.prefix[DATA_PREFIX] != 0);
9964 if (flag_code == CODE_64BIT)
9965 {
9966 if (override || i.suffix == WORD_MNEM_SUFFIX)
9967 bigdisp.bitfield.disp16 = 1;
9968 else
9969 {
9970 bigdisp.bitfield.disp32 = 1;
9971 bigdisp.bitfield.disp32s = 1;
9972 }
9973 }
9974 else
9975 {
9976 if (!override)
9977 override = (i.suffix == (flag_code != CODE_16BIT
9978 ? WORD_MNEM_SUFFIX
9979 : LONG_MNEM_SUFFIX));
9980 bigdisp.bitfield.disp32 = 1;
9981 if ((flag_code == CODE_16BIT) ^ override)
9982 {
9983 bigdisp.bitfield.disp32 = 0;
9984 bigdisp.bitfield.disp16 = 1;
9985 }
9986 }
9987 }
9988 i.types[this_operand] = operand_type_or (i.types[this_operand],
9989 bigdisp);
9990
9991 exp = &disp_expressions[i.disp_operands];
9992 i.op[this_operand].disps = exp;
9993 i.disp_operands++;
9994 save_input_line_pointer = input_line_pointer;
9995 input_line_pointer = disp_start;
9996 END_STRING_AND_SAVE (disp_end);
9997
9998 #ifndef GCC_ASM_O_HACK
9999 #define GCC_ASM_O_HACK 0
10000 #endif
10001 #if GCC_ASM_O_HACK
10002 END_STRING_AND_SAVE (disp_end + 1);
10003 if (i.types[this_operand].bitfield.baseIndex
10004 && displacement_string_end[-1] == '+')
10005 {
10006 /* This hack is to avoid a warning when using the "o"
10007 constraint within gcc asm statements.
10008 For instance:
10009
10010 #define _set_tssldt_desc(n,addr,limit,type) \
10011 __asm__ __volatile__ ( \
10012 "movw %w2,%0\n\t" \
10013 "movw %w1,2+%0\n\t" \
10014 "rorl $16,%1\n\t" \
10015 "movb %b1,4+%0\n\t" \
10016 "movb %4,5+%0\n\t" \
10017 "movb $0,6+%0\n\t" \
10018 "movb %h1,7+%0\n\t" \
10019 "rorl $16,%1" \
10020 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10021
10022 This works great except that the output assembler ends
10023 up looking a bit weird if it turns out that there is
10024 no offset. You end up producing code that looks like:
10025
10026 #APP
10027 movw $235,(%eax)
10028 movw %dx,2+(%eax)
10029 rorl $16,%edx
10030 movb %dl,4+(%eax)
10031 movb $137,5+(%eax)
10032 movb $0,6+(%eax)
10033 movb %dh,7+(%eax)
10034 rorl $16,%edx
10035 #NO_APP
10036
10037 So here we provide the missing zero. */
10038
10039 *displacement_string_end = '0';
10040 }
10041 #endif
10042 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10043 if (gotfree_input_line)
10044 input_line_pointer = gotfree_input_line;
10045
10046 exp_seg = expression (exp);
10047
10048 SKIP_WHITESPACE ();
10049 if (*input_line_pointer)
10050 as_bad (_("junk `%s' after expression"), input_line_pointer);
10051 #if GCC_ASM_O_HACK
10052 RESTORE_END_STRING (disp_end + 1);
10053 #endif
10054 input_line_pointer = save_input_line_pointer;
10055 if (gotfree_input_line)
10056 {
10057 free (gotfree_input_line);
10058
10059 if (exp->X_op == O_constant || exp->X_op == O_register)
10060 exp->X_op = O_illegal;
10061 }
10062
10063 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10064
10065 RESTORE_END_STRING (disp_end);
10066
10067 return ret;
10068 }
10069
10070 static int
10071 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10072 i386_operand_type types, const char *disp_start)
10073 {
10074 i386_operand_type bigdisp;
10075 int ret = 1;
10076
10077 /* We do this to make sure that the section symbol is in
10078 the symbol table. We will ultimately change the relocation
10079 to be relative to the beginning of the section. */
10080 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10081 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10082 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10083 {
10084 if (exp->X_op != O_symbol)
10085 goto inv_disp;
10086
10087 if (S_IS_LOCAL (exp->X_add_symbol)
10088 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10089 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10090 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10091 exp->X_op = O_subtract;
10092 exp->X_op_symbol = GOT_symbol;
10093 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10094 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10095 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10096 i.reloc[this_operand] = BFD_RELOC_64;
10097 else
10098 i.reloc[this_operand] = BFD_RELOC_32;
10099 }
10100
10101 else if (exp->X_op == O_absent
10102 || exp->X_op == O_illegal
10103 || exp->X_op == O_big)
10104 {
10105 inv_disp:
10106 as_bad (_("missing or invalid displacement expression `%s'"),
10107 disp_start);
10108 ret = 0;
10109 }
10110
10111 else if (flag_code == CODE_64BIT
10112 && !i.prefix[ADDR_PREFIX]
10113 && exp->X_op == O_constant)
10114 {
10115 /* Since displacement is signed extended to 64bit, don't allow
10116 disp32 and turn off disp32s if they are out of range. */
10117 i.types[this_operand].bitfield.disp32 = 0;
10118 if (!fits_in_signed_long (exp->X_add_number))
10119 {
10120 i.types[this_operand].bitfield.disp32s = 0;
10121 if (i.types[this_operand].bitfield.baseindex)
10122 {
10123 as_bad (_("0x%lx out range of signed 32bit displacement"),
10124 (long) exp->X_add_number);
10125 ret = 0;
10126 }
10127 }
10128 }
10129
10130 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10131 else if (exp->X_op != O_constant
10132 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10133 && exp_seg != absolute_section
10134 && exp_seg != text_section
10135 && exp_seg != data_section
10136 && exp_seg != bss_section
10137 && exp_seg != undefined_section
10138 && !bfd_is_com_section (exp_seg))
10139 {
10140 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10141 ret = 0;
10142 }
10143 #endif
10144
10145 /* Check if this is a displacement only operand. */
10146 bigdisp = i.types[this_operand];
10147 bigdisp.bitfield.disp8 = 0;
10148 bigdisp.bitfield.disp16 = 0;
10149 bigdisp.bitfield.disp32 = 0;
10150 bigdisp.bitfield.disp32s = 0;
10151 bigdisp.bitfield.disp64 = 0;
10152 if (operand_type_all_zero (&bigdisp))
10153 i.types[this_operand] = operand_type_and (i.types[this_operand],
10154 types);
10155
10156 return ret;
10157 }
10158
10159 /* Return the active addressing mode, taking address override and
10160 registers forming the address into consideration. Update the
10161 address override prefix if necessary. */
10162
10163 static enum flag_code
10164 i386_addressing_mode (void)
10165 {
10166 enum flag_code addr_mode;
10167
10168 if (i.prefix[ADDR_PREFIX])
10169 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10170 else
10171 {
10172 addr_mode = flag_code;
10173
10174 #if INFER_ADDR_PREFIX
10175 if (i.mem_operands == 0)
10176 {
10177 /* Infer address prefix from the first memory operand. */
10178 const reg_entry *addr_reg = i.base_reg;
10179
10180 if (addr_reg == NULL)
10181 addr_reg = i.index_reg;
10182
10183 if (addr_reg)
10184 {
10185 if (addr_reg->reg_type.bitfield.dword)
10186 addr_mode = CODE_32BIT;
10187 else if (flag_code != CODE_64BIT
10188 && addr_reg->reg_type.bitfield.word)
10189 addr_mode = CODE_16BIT;
10190
10191 if (addr_mode != flag_code)
10192 {
10193 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10194 i.prefixes += 1;
10195 /* Change the size of any displacement too. At most one
10196 of Disp16 or Disp32 is set.
10197 FIXME. There doesn't seem to be any real need for
10198 separate Disp16 and Disp32 flags. The same goes for
10199 Imm16 and Imm32. Removing them would probably clean
10200 up the code quite a lot. */
10201 if (flag_code != CODE_64BIT
10202 && (i.types[this_operand].bitfield.disp16
10203 || i.types[this_operand].bitfield.disp32))
10204 i.types[this_operand]
10205 = operand_type_xor (i.types[this_operand], disp16_32);
10206 }
10207 }
10208 }
10209 #endif
10210 }
10211
10212 return addr_mode;
10213 }
10214
10215 /* Make sure the memory operand we've been dealt is valid.
10216 Return 1 on success, 0 on a failure. */
10217
10218 static int
10219 i386_index_check (const char *operand_string)
10220 {
10221 const char *kind = "base/index";
10222 enum flag_code addr_mode = i386_addressing_mode ();
10223
10224 if (current_templates->start->opcode_modifier.isstring
10225 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10226 && (current_templates->end[-1].opcode_modifier.isstring
10227 || i.mem_operands))
10228 {
10229 /* Memory operands of string insns are special in that they only allow
10230 a single register (rDI, rSI, or rBX) as their memory address. */
10231 const reg_entry *expected_reg;
10232 static const char *di_si[][2] =
10233 {
10234 { "esi", "edi" },
10235 { "si", "di" },
10236 { "rsi", "rdi" }
10237 };
10238 static const char *bx[] = { "ebx", "bx", "rbx" };
10239
10240 kind = "string address";
10241
10242 if (current_templates->start->opcode_modifier.repprefixok)
10243 {
10244 int es_op = current_templates->end[-1].opcode_modifier.isstring
10245 - IS_STRING_ES_OP0;
10246 int op = 0;
10247
10248 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10249 || ((!i.mem_operands != !intel_syntax)
10250 && current_templates->end[-1].operand_types[1]
10251 .bitfield.baseindex))
10252 op = 1;
10253 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10254 }
10255 else
10256 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10257
10258 if (i.base_reg != expected_reg
10259 || i.index_reg
10260 || operand_type_check (i.types[this_operand], disp))
10261 {
10262 /* The second memory operand must have the same size as
10263 the first one. */
10264 if (i.mem_operands
10265 && i.base_reg
10266 && !((addr_mode == CODE_64BIT
10267 && i.base_reg->reg_type.bitfield.qword)
10268 || (addr_mode == CODE_32BIT
10269 ? i.base_reg->reg_type.bitfield.dword
10270 : i.base_reg->reg_type.bitfield.word)))
10271 goto bad_address;
10272
10273 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10274 operand_string,
10275 intel_syntax ? '[' : '(',
10276 register_prefix,
10277 expected_reg->reg_name,
10278 intel_syntax ? ']' : ')');
10279 return 1;
10280 }
10281 else
10282 return 1;
10283
10284 bad_address:
10285 as_bad (_("`%s' is not a valid %s expression"),
10286 operand_string, kind);
10287 return 0;
10288 }
10289 else
10290 {
10291 if (addr_mode != CODE_16BIT)
10292 {
10293 /* 32-bit/64-bit checks. */
10294 if ((i.base_reg
10295 && ((addr_mode == CODE_64BIT
10296 ? !i.base_reg->reg_type.bitfield.qword
10297 : !i.base_reg->reg_type.bitfield.dword)
10298 || (i.index_reg && i.base_reg->reg_num == RegIP)
10299 || i.base_reg->reg_num == RegIZ))
10300 || (i.index_reg
10301 && !i.index_reg->reg_type.bitfield.xmmword
10302 && !i.index_reg->reg_type.bitfield.ymmword
10303 && !i.index_reg->reg_type.bitfield.zmmword
10304 && ((addr_mode == CODE_64BIT
10305 ? !i.index_reg->reg_type.bitfield.qword
10306 : !i.index_reg->reg_type.bitfield.dword)
10307 || !i.index_reg->reg_type.bitfield.baseindex)))
10308 goto bad_address;
10309
10310 /* bndmk, bndldx, and bndstx have special restrictions. */
10311 if (current_templates->start->base_opcode == 0xf30f1b
10312 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10313 {
10314 /* They cannot use RIP-relative addressing. */
10315 if (i.base_reg && i.base_reg->reg_num == RegIP)
10316 {
10317 as_bad (_("`%s' cannot be used here"), operand_string);
10318 return 0;
10319 }
10320
10321 /* bndldx and bndstx ignore their scale factor. */
10322 if (current_templates->start->base_opcode != 0xf30f1b
10323 && i.log2_scale_factor)
10324 as_warn (_("register scaling is being ignored here"));
10325 }
10326 }
10327 else
10328 {
10329 /* 16-bit checks. */
10330 if ((i.base_reg
10331 && (!i.base_reg->reg_type.bitfield.word
10332 || !i.base_reg->reg_type.bitfield.baseindex))
10333 || (i.index_reg
10334 && (!i.index_reg->reg_type.bitfield.word
10335 || !i.index_reg->reg_type.bitfield.baseindex
10336 || !(i.base_reg
10337 && i.base_reg->reg_num < 6
10338 && i.index_reg->reg_num >= 6
10339 && i.log2_scale_factor == 0))))
10340 goto bad_address;
10341 }
10342 }
10343 return 1;
10344 }
10345
10346 /* Handle vector immediates. */
10347
10348 static int
10349 RC_SAE_immediate (const char *imm_start)
10350 {
10351 unsigned int match_found, j;
10352 const char *pstr = imm_start;
10353 expressionS *exp;
10354
10355 if (*pstr != '{')
10356 return 0;
10357
10358 pstr++;
10359 match_found = 0;
10360 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10361 {
10362 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10363 {
10364 if (!i.rounding)
10365 {
10366 rc_op.type = RC_NamesTable[j].type;
10367 rc_op.operand = this_operand;
10368 i.rounding = &rc_op;
10369 }
10370 else
10371 {
10372 as_bad (_("duplicated `%s'"), imm_start);
10373 return 0;
10374 }
10375 pstr += RC_NamesTable[j].len;
10376 match_found = 1;
10377 break;
10378 }
10379 }
10380 if (!match_found)
10381 return 0;
10382
10383 if (*pstr++ != '}')
10384 {
10385 as_bad (_("Missing '}': '%s'"), imm_start);
10386 return 0;
10387 }
10388 /* RC/SAE immediate string should contain nothing more. */;
10389 if (*pstr != 0)
10390 {
10391 as_bad (_("Junk after '}': '%s'"), imm_start);
10392 return 0;
10393 }
10394
10395 exp = &im_expressions[i.imm_operands++];
10396 i.op[this_operand].imms = exp;
10397
10398 exp->X_op = O_constant;
10399 exp->X_add_number = 0;
10400 exp->X_add_symbol = (symbolS *) 0;
10401 exp->X_op_symbol = (symbolS *) 0;
10402
10403 i.types[this_operand].bitfield.imm8 = 1;
10404 return 1;
10405 }
10406
10407 /* Only string instructions can have a second memory operand, so
10408 reduce current_templates to just those if it contains any. */
10409 static int
10410 maybe_adjust_templates (void)
10411 {
10412 const insn_template *t;
10413
10414 gas_assert (i.mem_operands == 1);
10415
10416 for (t = current_templates->start; t < current_templates->end; ++t)
10417 if (t->opcode_modifier.isstring)
10418 break;
10419
10420 if (t < current_templates->end)
10421 {
10422 static templates aux_templates;
10423 bfd_boolean recheck;
10424
10425 aux_templates.start = t;
10426 for (; t < current_templates->end; ++t)
10427 if (!t->opcode_modifier.isstring)
10428 break;
10429 aux_templates.end = t;
10430
10431 /* Determine whether to re-check the first memory operand. */
10432 recheck = (aux_templates.start != current_templates->start
10433 || t != current_templates->end);
10434
10435 current_templates = &aux_templates;
10436
10437 if (recheck)
10438 {
10439 i.mem_operands = 0;
10440 if (i.memop1_string != NULL
10441 && i386_index_check (i.memop1_string) == 0)
10442 return 0;
10443 i.mem_operands = 1;
10444 }
10445 }
10446
10447 return 1;
10448 }
10449
10450 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
10451 on error. */
10452
10453 static int
10454 i386_att_operand (char *operand_string)
10455 {
10456 const reg_entry *r;
10457 char *end_op;
10458 char *op_string = operand_string;
10459
10460 if (is_space_char (*op_string))
10461 ++op_string;
10462
10463 /* We check for an absolute prefix (differentiating,
10464 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
10465 if (*op_string == ABSOLUTE_PREFIX)
10466 {
10467 ++op_string;
10468 if (is_space_char (*op_string))
10469 ++op_string;
10470 i.jumpabsolute = TRUE;
10471 }
10472
10473 /* Check if operand is a register. */
10474 if ((r = parse_register (op_string, &end_op)) != NULL)
10475 {
10476 i386_operand_type temp;
10477
10478 /* Check for a segment override by searching for ':' after a
10479 segment register. */
10480 op_string = end_op;
10481 if (is_space_char (*op_string))
10482 ++op_string;
10483 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10484 {
10485 switch (r->reg_num)
10486 {
10487 case 0:
10488 i.seg[i.mem_operands] = &es;
10489 break;
10490 case 1:
10491 i.seg[i.mem_operands] = &cs;
10492 break;
10493 case 2:
10494 i.seg[i.mem_operands] = &ss;
10495 break;
10496 case 3:
10497 i.seg[i.mem_operands] = &ds;
10498 break;
10499 case 4:
10500 i.seg[i.mem_operands] = &fs;
10501 break;
10502 case 5:
10503 i.seg[i.mem_operands] = &gs;
10504 break;
10505 }
10506
10507 /* Skip the ':' and whitespace. */
10508 ++op_string;
10509 if (is_space_char (*op_string))
10510 ++op_string;
10511
10512 if (!is_digit_char (*op_string)
10513 && !is_identifier_char (*op_string)
10514 && *op_string != '('
10515 && *op_string != ABSOLUTE_PREFIX)
10516 {
10517 as_bad (_("bad memory operand `%s'"), op_string);
10518 return 0;
10519 }
10520 /* Handle case of %es:*foo. */
10521 if (*op_string == ABSOLUTE_PREFIX)
10522 {
10523 ++op_string;
10524 if (is_space_char (*op_string))
10525 ++op_string;
10526 i.jumpabsolute = TRUE;
10527 }
10528 goto do_memory_reference;
10529 }
10530
10531 /* Handle vector operations. */
10532 if (*op_string == '{')
10533 {
10534 op_string = check_VecOperations (op_string, NULL);
10535 if (op_string == NULL)
10536 return 0;
10537 }
10538
10539 if (*op_string)
10540 {
10541 as_bad (_("junk `%s' after register"), op_string);
10542 return 0;
10543 }
10544 temp = r->reg_type;
10545 temp.bitfield.baseindex = 0;
10546 i.types[this_operand] = operand_type_or (i.types[this_operand],
10547 temp);
10548 i.types[this_operand].bitfield.unspecified = 0;
10549 i.op[this_operand].regs = r;
10550 i.reg_operands++;
10551 }
10552 else if (*op_string == REGISTER_PREFIX)
10553 {
10554 as_bad (_("bad register name `%s'"), op_string);
10555 return 0;
10556 }
10557 else if (*op_string == IMMEDIATE_PREFIX)
10558 {
10559 ++op_string;
10560 if (i.jumpabsolute)
10561 {
10562 as_bad (_("immediate operand illegal with absolute jump"));
10563 return 0;
10564 }
10565 if (!i386_immediate (op_string))
10566 return 0;
10567 }
10568 else if (RC_SAE_immediate (operand_string))
10569 {
10570 /* If it is a RC or SAE immediate, do nothing. */
10571 ;
10572 }
10573 else if (is_digit_char (*op_string)
10574 || is_identifier_char (*op_string)
10575 || *op_string == '"'
10576 || *op_string == '(')
10577 {
10578 /* This is a memory reference of some sort. */
10579 char *base_string;
10580
10581 /* Start and end of displacement string expression (if found). */
10582 char *displacement_string_start;
10583 char *displacement_string_end;
10584 char *vop_start;
10585
10586 do_memory_reference:
10587 if (i.mem_operands == 1 && !maybe_adjust_templates ())
10588 return 0;
10589 if ((i.mem_operands == 1
10590 && !current_templates->start->opcode_modifier.isstring)
10591 || i.mem_operands == 2)
10592 {
10593 as_bad (_("too many memory references for `%s'"),
10594 current_templates->start->name);
10595 return 0;
10596 }
10597
10598 /* Check for base index form. We detect the base index form by
10599 looking for an ')' at the end of the operand, searching
10600 for the '(' matching it, and finding a REGISTER_PREFIX or ','
10601 after the '('. */
10602 base_string = op_string + strlen (op_string);
10603
10604 /* Handle vector operations. */
10605 vop_start = strchr (op_string, '{');
10606 if (vop_start && vop_start < base_string)
10607 {
10608 if (check_VecOperations (vop_start, base_string) == NULL)
10609 return 0;
10610 base_string = vop_start;
10611 }
10612
10613 --base_string;
10614 if (is_space_char (*base_string))
10615 --base_string;
10616
10617 /* If we only have a displacement, set-up for it to be parsed later. */
10618 displacement_string_start = op_string;
10619 displacement_string_end = base_string + 1;
10620
10621 if (*base_string == ')')
10622 {
10623 char *temp_string;
10624 unsigned int parens_balanced = 1;
10625 /* We've already checked that the number of left & right ()'s are
10626 equal, so this loop will not be infinite. */
10627 do
10628 {
10629 base_string--;
10630 if (*base_string == ')')
10631 parens_balanced++;
10632 if (*base_string == '(')
10633 parens_balanced--;
10634 }
10635 while (parens_balanced);
10636
10637 temp_string = base_string;
10638
10639 /* Skip past '(' and whitespace. */
10640 ++base_string;
10641 if (is_space_char (*base_string))
10642 ++base_string;
10643
10644 if (*base_string == ','
10645 || ((i.base_reg = parse_register (base_string, &end_op))
10646 != NULL))
10647 {
10648 displacement_string_end = temp_string;
10649
10650 i.types[this_operand].bitfield.baseindex = 1;
10651
10652 if (i.base_reg)
10653 {
10654 base_string = end_op;
10655 if (is_space_char (*base_string))
10656 ++base_string;
10657 }
10658
10659 /* There may be an index reg or scale factor here. */
10660 if (*base_string == ',')
10661 {
10662 ++base_string;
10663 if (is_space_char (*base_string))
10664 ++base_string;
10665
10666 if ((i.index_reg = parse_register (base_string, &end_op))
10667 != NULL)
10668 {
10669 base_string = end_op;
10670 if (is_space_char (*base_string))
10671 ++base_string;
10672 if (*base_string == ',')
10673 {
10674 ++base_string;
10675 if (is_space_char (*base_string))
10676 ++base_string;
10677 }
10678 else if (*base_string != ')')
10679 {
10680 as_bad (_("expecting `,' or `)' "
10681 "after index register in `%s'"),
10682 operand_string);
10683 return 0;
10684 }
10685 }
10686 else if (*base_string == REGISTER_PREFIX)
10687 {
10688 end_op = strchr (base_string, ',');
10689 if (end_op)
10690 *end_op = '\0';
10691 as_bad (_("bad register name `%s'"), base_string);
10692 return 0;
10693 }
10694
10695 /* Check for scale factor. */
10696 if (*base_string != ')')
10697 {
10698 char *end_scale = i386_scale (base_string);
10699
10700 if (!end_scale)
10701 return 0;
10702
10703 base_string = end_scale;
10704 if (is_space_char (*base_string))
10705 ++base_string;
10706 if (*base_string != ')')
10707 {
10708 as_bad (_("expecting `)' "
10709 "after scale factor in `%s'"),
10710 operand_string);
10711 return 0;
10712 }
10713 }
10714 else if (!i.index_reg)
10715 {
10716 as_bad (_("expecting index register or scale factor "
10717 "after `,'; got '%c'"),
10718 *base_string);
10719 return 0;
10720 }
10721 }
10722 else if (*base_string != ')')
10723 {
10724 as_bad (_("expecting `,' or `)' "
10725 "after base register in `%s'"),
10726 operand_string);
10727 return 0;
10728 }
10729 }
10730 else if (*base_string == REGISTER_PREFIX)
10731 {
10732 end_op = strchr (base_string, ',');
10733 if (end_op)
10734 *end_op = '\0';
10735 as_bad (_("bad register name `%s'"), base_string);
10736 return 0;
10737 }
10738 }
10739
10740 /* If there's an expression beginning the operand, parse it,
10741 assuming displacement_string_start and
10742 displacement_string_end are meaningful. */
10743 if (displacement_string_start != displacement_string_end)
10744 {
10745 if (!i386_displacement (displacement_string_start,
10746 displacement_string_end))
10747 return 0;
10748 }
10749
10750 /* Special case for (%dx) while doing input/output op. */
10751 if (i.base_reg
10752 && i.base_reg->reg_type.bitfield.instance == RegD
10753 && i.base_reg->reg_type.bitfield.word
10754 && i.index_reg == 0
10755 && i.log2_scale_factor == 0
10756 && i.seg[i.mem_operands] == 0
10757 && !operand_type_check (i.types[this_operand], disp))
10758 {
10759 i.types[this_operand] = i.base_reg->reg_type;
10760 return 1;
10761 }
10762
10763 if (i386_index_check (operand_string) == 0)
10764 return 0;
10765 i.flags[this_operand] |= Operand_Mem;
10766 if (i.mem_operands == 0)
10767 i.memop1_string = xstrdup (operand_string);
10768 i.mem_operands++;
10769 }
10770 else
10771 {
10772 /* It's not a memory operand; argh! */
10773 as_bad (_("invalid char %s beginning operand %d `%s'"),
10774 output_invalid (*op_string),
10775 this_operand + 1,
10776 op_string);
10777 return 0;
10778 }
10779 return 1; /* Normal return. */
10780 }
10781 \f
10782 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10783 that an rs_machine_dependent frag may reach. */
10784
10785 unsigned int
10786 i386_frag_max_var (fragS *frag)
10787 {
10788 /* The only relaxable frags are for jumps.
10789 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
10790 gas_assert (frag->fr_type == rs_machine_dependent);
10791 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10792 }
10793
10794 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10795 static int
10796 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10797 {
10798 /* STT_GNU_IFUNC symbol must go through PLT. */
10799 if ((symbol_get_bfdsym (fr_symbol)->flags
10800 & BSF_GNU_INDIRECT_FUNCTION) != 0)
10801 return 0;
10802
10803 if (!S_IS_EXTERNAL (fr_symbol))
10804 /* Symbol may be weak or local. */
10805 return !S_IS_WEAK (fr_symbol);
10806
10807 /* Global symbols with non-default visibility can't be preempted. */
10808 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10809 return 1;
10810
10811 if (fr_var != NO_RELOC)
10812 switch ((enum bfd_reloc_code_real) fr_var)
10813 {
10814 case BFD_RELOC_386_PLT32:
10815 case BFD_RELOC_X86_64_PLT32:
10816 /* Symbol with PLT relocation may be preempted. */
10817 return 0;
10818 default:
10819 abort ();
10820 }
10821
10822 /* Global symbols with default visibility in a shared library may be
10823 preempted by another definition. */
10824 return !shared;
10825 }
10826 #endif
10827
10828 /* Return the next non-empty frag. */
10829
10830 static fragS *
10831 i386_next_non_empty_frag (fragS *fragP)
10832 {
10833 /* There may be a frag with a ".fill 0" when there is no room in
10834 the current frag for frag_grow in output_insn. */
10835 for (fragP = fragP->fr_next;
10836 (fragP != NULL
10837 && fragP->fr_type == rs_fill
10838 && fragP->fr_fix == 0);
10839 fragP = fragP->fr_next)
10840 ;
10841 return fragP;
10842 }
10843
10844 /* Return the next jcc frag after BRANCH_PADDING. */
10845
10846 static fragS *
10847 i386_next_jcc_frag (fragS *fragP)
10848 {
10849 if (!fragP)
10850 return NULL;
10851
10852 if (fragP->fr_type == rs_machine_dependent
10853 && (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10854 == BRANCH_PADDING))
10855 {
10856 fragP = i386_next_non_empty_frag (fragP);
10857 if (fragP->fr_type != rs_machine_dependent)
10858 return NULL;
10859 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == COND_JUMP)
10860 return fragP;
10861 }
10862
10863 return NULL;
10864 }
10865
10866 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
10867
10868 static void
10869 i386_classify_machine_dependent_frag (fragS *fragP)
10870 {
10871 fragS *cmp_fragP;
10872 fragS *pad_fragP;
10873 fragS *branch_fragP;
10874 fragS *next_fragP;
10875 unsigned int max_prefix_length;
10876
10877 if (fragP->tc_frag_data.classified)
10878 return;
10879
10880 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
10881 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
10882 for (next_fragP = fragP;
10883 next_fragP != NULL;
10884 next_fragP = next_fragP->fr_next)
10885 {
10886 next_fragP->tc_frag_data.classified = 1;
10887 if (next_fragP->fr_type == rs_machine_dependent)
10888 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
10889 {
10890 case BRANCH_PADDING:
10891 /* The BRANCH_PADDING frag must be followed by a branch
10892 frag. */
10893 branch_fragP = i386_next_non_empty_frag (next_fragP);
10894 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10895 break;
10896 case FUSED_JCC_PADDING:
10897 /* Check if this is a fused jcc:
10898 FUSED_JCC_PADDING
10899 CMP like instruction
10900 BRANCH_PADDING
10901 COND_JUMP
10902 */
10903 cmp_fragP = i386_next_non_empty_frag (next_fragP);
10904 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
10905 branch_fragP = i386_next_jcc_frag (pad_fragP);
10906 if (branch_fragP)
10907 {
10908 /* The BRANCH_PADDING frag is merged with the
10909 FUSED_JCC_PADDING frag. */
10910 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10911 /* CMP like instruction size. */
10912 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
10913 frag_wane (pad_fragP);
10914 /* Skip to branch_fragP. */
10915 next_fragP = branch_fragP;
10916 }
10917 else if (next_fragP->tc_frag_data.max_prefix_length)
10918 {
10919 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
10920 a fused jcc. */
10921 next_fragP->fr_subtype
10922 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
10923 next_fragP->tc_frag_data.max_bytes
10924 = next_fragP->tc_frag_data.max_prefix_length;
10925 /* This will be updated in the BRANCH_PREFIX scan. */
10926 next_fragP->tc_frag_data.max_prefix_length = 0;
10927 }
10928 else
10929 frag_wane (next_fragP);
10930 break;
10931 }
10932 }
10933
10934 /* Stop if there is no BRANCH_PREFIX. */
10935 if (!align_branch_prefix_size)
10936 return;
10937
10938 /* Scan for BRANCH_PREFIX. */
10939 for (; fragP != NULL; fragP = fragP->fr_next)
10940 {
10941 if (fragP->fr_type != rs_machine_dependent
10942 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10943 != BRANCH_PREFIX))
10944 continue;
10945
10946 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
10947 COND_JUMP_PREFIX. */
10948 max_prefix_length = 0;
10949 for (next_fragP = fragP;
10950 next_fragP != NULL;
10951 next_fragP = next_fragP->fr_next)
10952 {
10953 if (next_fragP->fr_type == rs_fill)
10954 /* Skip rs_fill frags. */
10955 continue;
10956 else if (next_fragP->fr_type != rs_machine_dependent)
10957 /* Stop for all other frags. */
10958 break;
10959
10960 /* rs_machine_dependent frags. */
10961 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
10962 == BRANCH_PREFIX)
10963 {
10964 /* Count BRANCH_PREFIX frags. */
10965 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
10966 {
10967 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
10968 frag_wane (next_fragP);
10969 }
10970 else
10971 max_prefix_length
10972 += next_fragP->tc_frag_data.max_bytes;
10973 }
10974 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
10975 == BRANCH_PADDING)
10976 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
10977 == FUSED_JCC_PADDING))
10978 {
10979 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
10980 fragP->tc_frag_data.u.padding_fragP = next_fragP;
10981 break;
10982 }
10983 else
10984 /* Stop for other rs_machine_dependent frags. */
10985 break;
10986 }
10987
10988 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
10989
10990 /* Skip to the next frag. */
10991 fragP = next_fragP;
10992 }
10993 }
10994
10995 /* Compute padding size for
10996
10997 FUSED_JCC_PADDING
10998 CMP like instruction
10999 BRANCH_PADDING
11000 COND_JUMP/UNCOND_JUMP
11001
11002 or
11003
11004 BRANCH_PADDING
11005 COND_JUMP/UNCOND_JUMP
11006 */
11007
11008 static int
11009 i386_branch_padding_size (fragS *fragP, offsetT address)
11010 {
11011 unsigned int offset, size, padding_size;
11012 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11013
11014 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11015 if (!address)
11016 address = fragP->fr_address;
11017 address += fragP->fr_fix;
11018
11019 /* CMP like instrunction size. */
11020 size = fragP->tc_frag_data.cmp_size;
11021
11022 /* The base size of the branch frag. */
11023 size += branch_fragP->fr_fix;
11024
11025 /* Add opcode and displacement bytes for the rs_machine_dependent
11026 branch frag. */
11027 if (branch_fragP->fr_type == rs_machine_dependent)
11028 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11029
11030 /* Check if branch is within boundary and doesn't end at the last
11031 byte. */
11032 offset = address & ((1U << align_branch_power) - 1);
11033 if ((offset + size) >= (1U << align_branch_power))
11034 /* Padding needed to avoid crossing boundary. */
11035 padding_size = (1U << align_branch_power) - offset;
11036 else
11037 /* No padding needed. */
11038 padding_size = 0;
11039
11040 /* The return value may be saved in tc_frag_data.length which is
11041 unsigned byte. */
11042 if (!fits_in_unsigned_byte (padding_size))
11043 abort ();
11044
11045 return padding_size;
11046 }
11047
11048 /* i386_generic_table_relax_frag()
11049
11050 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11051 grow/shrink padding to align branch frags. Hand others to
11052 relax_frag(). */
11053
11054 long
11055 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11056 {
11057 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11058 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11059 {
11060 long padding_size = i386_branch_padding_size (fragP, 0);
11061 long grow = padding_size - fragP->tc_frag_data.length;
11062
11063 /* When the BRANCH_PREFIX frag is used, the computed address
11064 must match the actual address and there should be no padding. */
11065 if (fragP->tc_frag_data.padding_address
11066 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11067 || padding_size))
11068 abort ();
11069
11070 /* Update the padding size. */
11071 if (grow)
11072 fragP->tc_frag_data.length = padding_size;
11073
11074 return grow;
11075 }
11076 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11077 {
11078 fragS *padding_fragP, *next_fragP;
11079 long padding_size, left_size, last_size;
11080
11081 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11082 if (!padding_fragP)
11083 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11084 return (fragP->tc_frag_data.length
11085 - fragP->tc_frag_data.last_length);
11086
11087 /* Compute the relative address of the padding frag in the very
11088 first time where the BRANCH_PREFIX frag sizes are zero. */
11089 if (!fragP->tc_frag_data.padding_address)
11090 fragP->tc_frag_data.padding_address
11091 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11092
11093 /* First update the last length from the previous interation. */
11094 left_size = fragP->tc_frag_data.prefix_length;
11095 for (next_fragP = fragP;
11096 next_fragP != padding_fragP;
11097 next_fragP = next_fragP->fr_next)
11098 if (next_fragP->fr_type == rs_machine_dependent
11099 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11100 == BRANCH_PREFIX))
11101 {
11102 if (left_size)
11103 {
11104 int max = next_fragP->tc_frag_data.max_bytes;
11105 if (max)
11106 {
11107 int size;
11108 if (max > left_size)
11109 size = left_size;
11110 else
11111 size = max;
11112 left_size -= size;
11113 next_fragP->tc_frag_data.last_length = size;
11114 }
11115 }
11116 else
11117 next_fragP->tc_frag_data.last_length = 0;
11118 }
11119
11120 /* Check the padding size for the padding frag. */
11121 padding_size = i386_branch_padding_size
11122 (padding_fragP, (fragP->fr_address
11123 + fragP->tc_frag_data.padding_address));
11124
11125 last_size = fragP->tc_frag_data.prefix_length;
11126 /* Check if there is change from the last interation. */
11127 if (padding_size == last_size)
11128 {
11129 /* Update the expected address of the padding frag. */
11130 padding_fragP->tc_frag_data.padding_address
11131 = (fragP->fr_address + padding_size
11132 + fragP->tc_frag_data.padding_address);
11133 return 0;
11134 }
11135
11136 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11137 {
11138 /* No padding if there is no sufficient room. Clear the
11139 expected address of the padding frag. */
11140 padding_fragP->tc_frag_data.padding_address = 0;
11141 padding_size = 0;
11142 }
11143 else
11144 /* Store the expected address of the padding frag. */
11145 padding_fragP->tc_frag_data.padding_address
11146 = (fragP->fr_address + padding_size
11147 + fragP->tc_frag_data.padding_address);
11148
11149 fragP->tc_frag_data.prefix_length = padding_size;
11150
11151 /* Update the length for the current interation. */
11152 left_size = padding_size;
11153 for (next_fragP = fragP;
11154 next_fragP != padding_fragP;
11155 next_fragP = next_fragP->fr_next)
11156 if (next_fragP->fr_type == rs_machine_dependent
11157 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11158 == BRANCH_PREFIX))
11159 {
11160 if (left_size)
11161 {
11162 int max = next_fragP->tc_frag_data.max_bytes;
11163 if (max)
11164 {
11165 int size;
11166 if (max > left_size)
11167 size = left_size;
11168 else
11169 size = max;
11170 left_size -= size;
11171 next_fragP->tc_frag_data.length = size;
11172 }
11173 }
11174 else
11175 next_fragP->tc_frag_data.length = 0;
11176 }
11177
11178 return (fragP->tc_frag_data.length
11179 - fragP->tc_frag_data.last_length);
11180 }
11181 return relax_frag (segment, fragP, stretch);
11182 }
11183
11184 /* md_estimate_size_before_relax()
11185
11186 Called just before relax() for rs_machine_dependent frags. The x86
11187 assembler uses these frags to handle variable size jump
11188 instructions.
11189
11190 Any symbol that is now undefined will not become defined.
11191 Return the correct fr_subtype in the frag.
11192 Return the initial "guess for variable size of frag" to caller.
11193 The guess is actually the growth beyond the fixed part. Whatever
11194 we do to grow the fixed or variable part contributes to our
11195 returned value. */
11196
11197 int
11198 md_estimate_size_before_relax (fragS *fragP, segT segment)
11199 {
11200 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11201 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11202 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11203 {
11204 i386_classify_machine_dependent_frag (fragP);
11205 return fragP->tc_frag_data.length;
11206 }
11207
11208 /* We've already got fragP->fr_subtype right; all we have to do is
11209 check for un-relaxable symbols. On an ELF system, we can't relax
11210 an externally visible symbol, because it may be overridden by a
11211 shared library. */
11212 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11213 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11214 || (IS_ELF
11215 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11216 fragP->fr_var))
11217 #endif
11218 #if defined (OBJ_COFF) && defined (TE_PE)
11219 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11220 && S_IS_WEAK (fragP->fr_symbol))
11221 #endif
11222 )
11223 {
11224 /* Symbol is undefined in this segment, or we need to keep a
11225 reloc so that weak symbols can be overridden. */
11226 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11227 enum bfd_reloc_code_real reloc_type;
11228 unsigned char *opcode;
11229 int old_fr_fix;
11230
11231 if (fragP->fr_var != NO_RELOC)
11232 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11233 else if (size == 2)
11234 reloc_type = BFD_RELOC_16_PCREL;
11235 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11236 else if (need_plt32_p (fragP->fr_symbol))
11237 reloc_type = BFD_RELOC_X86_64_PLT32;
11238 #endif
11239 else
11240 reloc_type = BFD_RELOC_32_PCREL;
11241
11242 old_fr_fix = fragP->fr_fix;
11243 opcode = (unsigned char *) fragP->fr_opcode;
11244
11245 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11246 {
11247 case UNCOND_JUMP:
11248 /* Make jmp (0xeb) a (d)word displacement jump. */
11249 opcode[0] = 0xe9;
11250 fragP->fr_fix += size;
11251 fix_new (fragP, old_fr_fix, size,
11252 fragP->fr_symbol,
11253 fragP->fr_offset, 1,
11254 reloc_type);
11255 break;
11256
11257 case COND_JUMP86:
11258 if (size == 2
11259 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11260 {
11261 /* Negate the condition, and branch past an
11262 unconditional jump. */
11263 opcode[0] ^= 1;
11264 opcode[1] = 3;
11265 /* Insert an unconditional jump. */
11266 opcode[2] = 0xe9;
11267 /* We added two extra opcode bytes, and have a two byte
11268 offset. */
11269 fragP->fr_fix += 2 + 2;
11270 fix_new (fragP, old_fr_fix + 2, 2,
11271 fragP->fr_symbol,
11272 fragP->fr_offset, 1,
11273 reloc_type);
11274 break;
11275 }
11276 /* Fall through. */
11277
11278 case COND_JUMP:
11279 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11280 {
11281 fixS *fixP;
11282
11283 fragP->fr_fix += 1;
11284 fixP = fix_new (fragP, old_fr_fix, 1,
11285 fragP->fr_symbol,
11286 fragP->fr_offset, 1,
11287 BFD_RELOC_8_PCREL);
11288 fixP->fx_signed = 1;
11289 break;
11290 }
11291
11292 /* This changes the byte-displacement jump 0x7N
11293 to the (d)word-displacement jump 0x0f,0x8N. */
11294 opcode[1] = opcode[0] + 0x10;
11295 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11296 /* We've added an opcode byte. */
11297 fragP->fr_fix += 1 + size;
11298 fix_new (fragP, old_fr_fix + 1, size,
11299 fragP->fr_symbol,
11300 fragP->fr_offset, 1,
11301 reloc_type);
11302 break;
11303
11304 default:
11305 BAD_CASE (fragP->fr_subtype);
11306 break;
11307 }
11308 frag_wane (fragP);
11309 return fragP->fr_fix - old_fr_fix;
11310 }
11311
11312 /* Guess size depending on current relax state. Initially the relax
11313 state will correspond to a short jump and we return 1, because
11314 the variable part of the frag (the branch offset) is one byte
11315 long. However, we can relax a section more than once and in that
11316 case we must either set fr_subtype back to the unrelaxed state,
11317 or return the value for the appropriate branch. */
11318 return md_relax_table[fragP->fr_subtype].rlx_length;
11319 }
11320
11321 /* Called after relax() is finished.
11322
11323 In: Address of frag.
11324 fr_type == rs_machine_dependent.
11325 fr_subtype is what the address relaxed to.
11326
11327 Out: Any fixSs and constants are set up.
11328 Caller will turn frag into a ".space 0". */
11329
11330 void
11331 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11332 fragS *fragP)
11333 {
11334 unsigned char *opcode;
11335 unsigned char *where_to_put_displacement = NULL;
11336 offsetT target_address;
11337 offsetT opcode_address;
11338 unsigned int extension = 0;
11339 offsetT displacement_from_opcode_start;
11340
11341 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11342 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11343 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11344 {
11345 /* Generate nop padding. */
11346 unsigned int size = fragP->tc_frag_data.length;
11347 if (size)
11348 {
11349 if (size > fragP->tc_frag_data.max_bytes)
11350 abort ();
11351
11352 if (flag_debug)
11353 {
11354 const char *msg;
11355 const char *branch = "branch";
11356 const char *prefix = "";
11357 fragS *padding_fragP;
11358 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11359 == BRANCH_PREFIX)
11360 {
11361 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11362 switch (fragP->tc_frag_data.default_prefix)
11363 {
11364 default:
11365 abort ();
11366 break;
11367 case CS_PREFIX_OPCODE:
11368 prefix = " cs";
11369 break;
11370 case DS_PREFIX_OPCODE:
11371 prefix = " ds";
11372 break;
11373 case ES_PREFIX_OPCODE:
11374 prefix = " es";
11375 break;
11376 case FS_PREFIX_OPCODE:
11377 prefix = " fs";
11378 break;
11379 case GS_PREFIX_OPCODE:
11380 prefix = " gs";
11381 break;
11382 case SS_PREFIX_OPCODE:
11383 prefix = " ss";
11384 break;
11385 }
11386 if (padding_fragP)
11387 msg = _("%s:%u: add %d%s at 0x%llx to align "
11388 "%s within %d-byte boundary\n");
11389 else
11390 msg = _("%s:%u: add additional %d%s at 0x%llx to "
11391 "align %s within %d-byte boundary\n");
11392 }
11393 else
11394 {
11395 padding_fragP = fragP;
11396 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11397 "%s within %d-byte boundary\n");
11398 }
11399
11400 if (padding_fragP)
11401 switch (padding_fragP->tc_frag_data.branch_type)
11402 {
11403 case align_branch_jcc:
11404 branch = "jcc";
11405 break;
11406 case align_branch_fused:
11407 branch = "fused jcc";
11408 break;
11409 case align_branch_jmp:
11410 branch = "jmp";
11411 break;
11412 case align_branch_call:
11413 branch = "call";
11414 break;
11415 case align_branch_indirect:
11416 branch = "indiret branch";
11417 break;
11418 case align_branch_ret:
11419 branch = "ret";
11420 break;
11421 default:
11422 break;
11423 }
11424
11425 fprintf (stdout, msg,
11426 fragP->fr_file, fragP->fr_line, size, prefix,
11427 (long long) fragP->fr_address, branch,
11428 1 << align_branch_power);
11429 }
11430 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11431 memset (fragP->fr_opcode,
11432 fragP->tc_frag_data.default_prefix, size);
11433 else
11434 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
11435 size, 0);
11436 fragP->fr_fix += size;
11437 }
11438 return;
11439 }
11440
11441 opcode = (unsigned char *) fragP->fr_opcode;
11442
11443 /* Address we want to reach in file space. */
11444 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
11445
11446 /* Address opcode resides at in file space. */
11447 opcode_address = fragP->fr_address + fragP->fr_fix;
11448
11449 /* Displacement from opcode start to fill into instruction. */
11450 displacement_from_opcode_start = target_address - opcode_address;
11451
11452 if ((fragP->fr_subtype & BIG) == 0)
11453 {
11454 /* Don't have to change opcode. */
11455 extension = 1; /* 1 opcode + 1 displacement */
11456 where_to_put_displacement = &opcode[1];
11457 }
11458 else
11459 {
11460 if (no_cond_jump_promotion
11461 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
11462 as_warn_where (fragP->fr_file, fragP->fr_line,
11463 _("long jump required"));
11464
11465 switch (fragP->fr_subtype)
11466 {
11467 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
11468 extension = 4; /* 1 opcode + 4 displacement */
11469 opcode[0] = 0xe9;
11470 where_to_put_displacement = &opcode[1];
11471 break;
11472
11473 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
11474 extension = 2; /* 1 opcode + 2 displacement */
11475 opcode[0] = 0xe9;
11476 where_to_put_displacement = &opcode[1];
11477 break;
11478
11479 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
11480 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
11481 extension = 5; /* 2 opcode + 4 displacement */
11482 opcode[1] = opcode[0] + 0x10;
11483 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11484 where_to_put_displacement = &opcode[2];
11485 break;
11486
11487 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
11488 extension = 3; /* 2 opcode + 2 displacement */
11489 opcode[1] = opcode[0] + 0x10;
11490 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11491 where_to_put_displacement = &opcode[2];
11492 break;
11493
11494 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
11495 extension = 4;
11496 opcode[0] ^= 1;
11497 opcode[1] = 3;
11498 opcode[2] = 0xe9;
11499 where_to_put_displacement = &opcode[3];
11500 break;
11501
11502 default:
11503 BAD_CASE (fragP->fr_subtype);
11504 break;
11505 }
11506 }
11507
11508 /* If size if less then four we are sure that the operand fits,
11509 but if it's 4, then it could be that the displacement is larger
11510 then -/+ 2GB. */
11511 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
11512 && object_64bit
11513 && ((addressT) (displacement_from_opcode_start - extension
11514 + ((addressT) 1 << 31))
11515 > (((addressT) 2 << 31) - 1)))
11516 {
11517 as_bad_where (fragP->fr_file, fragP->fr_line,
11518 _("jump target out of range"));
11519 /* Make us emit 0. */
11520 displacement_from_opcode_start = extension;
11521 }
11522 /* Now put displacement after opcode. */
11523 md_number_to_chars ((char *) where_to_put_displacement,
11524 (valueT) (displacement_from_opcode_start - extension),
11525 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
11526 fragP->fr_fix += extension;
11527 }
11528 \f
11529 /* Apply a fixup (fixP) to segment data, once it has been determined
11530 by our caller that we have all the info we need to fix it up.
11531
11532 Parameter valP is the pointer to the value of the bits.
11533
11534 On the 386, immediates, displacements, and data pointers are all in
11535 the same (little-endian) format, so we don't need to care about which
11536 we are handling. */
11537
11538 void
11539 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
11540 {
11541 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
11542 valueT value = *valP;
11543
11544 #if !defined (TE_Mach)
11545 if (fixP->fx_pcrel)
11546 {
11547 switch (fixP->fx_r_type)
11548 {
11549 default:
11550 break;
11551
11552 case BFD_RELOC_64:
11553 fixP->fx_r_type = BFD_RELOC_64_PCREL;
11554 break;
11555 case BFD_RELOC_32:
11556 case BFD_RELOC_X86_64_32S:
11557 fixP->fx_r_type = BFD_RELOC_32_PCREL;
11558 break;
11559 case BFD_RELOC_16:
11560 fixP->fx_r_type = BFD_RELOC_16_PCREL;
11561 break;
11562 case BFD_RELOC_8:
11563 fixP->fx_r_type = BFD_RELOC_8_PCREL;
11564 break;
11565 }
11566 }
11567
11568 if (fixP->fx_addsy != NULL
11569 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
11570 || fixP->fx_r_type == BFD_RELOC_64_PCREL
11571 || fixP->fx_r_type == BFD_RELOC_16_PCREL
11572 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
11573 && !use_rela_relocations)
11574 {
11575 /* This is a hack. There should be a better way to handle this.
11576 This covers for the fact that bfd_install_relocation will
11577 subtract the current location (for partial_inplace, PC relative
11578 relocations); see more below. */
11579 #ifndef OBJ_AOUT
11580 if (IS_ELF
11581 #ifdef TE_PE
11582 || OUTPUT_FLAVOR == bfd_target_coff_flavour
11583 #endif
11584 )
11585 value += fixP->fx_where + fixP->fx_frag->fr_address;
11586 #endif
11587 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11588 if (IS_ELF)
11589 {
11590 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
11591
11592 if ((sym_seg == seg
11593 || (symbol_section_p (fixP->fx_addsy)
11594 && sym_seg != absolute_section))
11595 && !generic_force_reloc (fixP))
11596 {
11597 /* Yes, we add the values in twice. This is because
11598 bfd_install_relocation subtracts them out again. I think
11599 bfd_install_relocation is broken, but I don't dare change
11600 it. FIXME. */
11601 value += fixP->fx_where + fixP->fx_frag->fr_address;
11602 }
11603 }
11604 #endif
11605 #if defined (OBJ_COFF) && defined (TE_PE)
11606 /* For some reason, the PE format does not store a
11607 section address offset for a PC relative symbol. */
11608 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
11609 || S_IS_WEAK (fixP->fx_addsy))
11610 value += md_pcrel_from (fixP);
11611 #endif
11612 }
11613 #if defined (OBJ_COFF) && defined (TE_PE)
11614 if (fixP->fx_addsy != NULL
11615 && S_IS_WEAK (fixP->fx_addsy)
11616 /* PR 16858: Do not modify weak function references. */
11617 && ! fixP->fx_pcrel)
11618 {
11619 #if !defined (TE_PEP)
11620 /* For x86 PE weak function symbols are neither PC-relative
11621 nor do they set S_IS_FUNCTION. So the only reliable way
11622 to detect them is to check the flags of their containing
11623 section. */
11624 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
11625 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
11626 ;
11627 else
11628 #endif
11629 value -= S_GET_VALUE (fixP->fx_addsy);
11630 }
11631 #endif
11632
11633 /* Fix a few things - the dynamic linker expects certain values here,
11634 and we must not disappoint it. */
11635 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11636 if (IS_ELF && fixP->fx_addsy)
11637 switch (fixP->fx_r_type)
11638 {
11639 case BFD_RELOC_386_PLT32:
11640 case BFD_RELOC_X86_64_PLT32:
11641 /* Make the jump instruction point to the address of the operand.
11642 At runtime we merely add the offset to the actual PLT entry.
11643 NB: Subtract the offset size only for jump instructions. */
11644 if (fixP->fx_pcrel)
11645 value = -4;
11646 break;
11647
11648 case BFD_RELOC_386_TLS_GD:
11649 case BFD_RELOC_386_TLS_LDM:
11650 case BFD_RELOC_386_TLS_IE_32:
11651 case BFD_RELOC_386_TLS_IE:
11652 case BFD_RELOC_386_TLS_GOTIE:
11653 case BFD_RELOC_386_TLS_GOTDESC:
11654 case BFD_RELOC_X86_64_TLSGD:
11655 case BFD_RELOC_X86_64_TLSLD:
11656 case BFD_RELOC_X86_64_GOTTPOFF:
11657 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11658 value = 0; /* Fully resolved at runtime. No addend. */
11659 /* Fallthrough */
11660 case BFD_RELOC_386_TLS_LE:
11661 case BFD_RELOC_386_TLS_LDO_32:
11662 case BFD_RELOC_386_TLS_LE_32:
11663 case BFD_RELOC_X86_64_DTPOFF32:
11664 case BFD_RELOC_X86_64_DTPOFF64:
11665 case BFD_RELOC_X86_64_TPOFF32:
11666 case BFD_RELOC_X86_64_TPOFF64:
11667 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11668 break;
11669
11670 case BFD_RELOC_386_TLS_DESC_CALL:
11671 case BFD_RELOC_X86_64_TLSDESC_CALL:
11672 value = 0; /* Fully resolved at runtime. No addend. */
11673 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11674 fixP->fx_done = 0;
11675 return;
11676
11677 case BFD_RELOC_VTABLE_INHERIT:
11678 case BFD_RELOC_VTABLE_ENTRY:
11679 fixP->fx_done = 0;
11680 return;
11681
11682 default:
11683 break;
11684 }
11685 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
11686 *valP = value;
11687 #endif /* !defined (TE_Mach) */
11688
11689 /* Are we finished with this relocation now? */
11690 if (fixP->fx_addsy == NULL)
11691 fixP->fx_done = 1;
11692 #if defined (OBJ_COFF) && defined (TE_PE)
11693 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
11694 {
11695 fixP->fx_done = 0;
11696 /* Remember value for tc_gen_reloc. */
11697 fixP->fx_addnumber = value;
11698 /* Clear out the frag for now. */
11699 value = 0;
11700 }
11701 #endif
11702 else if (use_rela_relocations)
11703 {
11704 fixP->fx_no_overflow = 1;
11705 /* Remember value for tc_gen_reloc. */
11706 fixP->fx_addnumber = value;
11707 value = 0;
11708 }
11709
11710 md_number_to_chars (p, value, fixP->fx_size);
11711 }
11712 \f
11713 const char *
11714 md_atof (int type, char *litP, int *sizeP)
11715 {
11716 /* This outputs the LITTLENUMs in REVERSE order;
11717 in accord with the bigendian 386. */
11718 return ieee_md_atof (type, litP, sizeP, FALSE);
11719 }
11720 \f
11721 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
11722
11723 static char *
11724 output_invalid (int c)
11725 {
11726 if (ISPRINT (c))
11727 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11728 "'%c'", c);
11729 else
11730 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11731 "(0x%x)", (unsigned char) c);
11732 return output_invalid_buf;
11733 }
11734
11735 /* REG_STRING starts *before* REGISTER_PREFIX. */
11736
11737 static const reg_entry *
11738 parse_real_register (char *reg_string, char **end_op)
11739 {
11740 char *s = reg_string;
11741 char *p;
11742 char reg_name_given[MAX_REG_NAME_SIZE + 1];
11743 const reg_entry *r;
11744
11745 /* Skip possible REGISTER_PREFIX and possible whitespace. */
11746 if (*s == REGISTER_PREFIX)
11747 ++s;
11748
11749 if (is_space_char (*s))
11750 ++s;
11751
11752 p = reg_name_given;
11753 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
11754 {
11755 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
11756 return (const reg_entry *) NULL;
11757 s++;
11758 }
11759
11760 /* For naked regs, make sure that we are not dealing with an identifier.
11761 This prevents confusing an identifier like `eax_var' with register
11762 `eax'. */
11763 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
11764 return (const reg_entry *) NULL;
11765
11766 *end_op = s;
11767
11768 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
11769
11770 /* Handle floating point regs, allowing spaces in the (i) part. */
11771 if (r == i386_regtab /* %st is first entry of table */)
11772 {
11773 if (!cpu_arch_flags.bitfield.cpu8087
11774 && !cpu_arch_flags.bitfield.cpu287
11775 && !cpu_arch_flags.bitfield.cpu387)
11776 return (const reg_entry *) NULL;
11777
11778 if (is_space_char (*s))
11779 ++s;
11780 if (*s == '(')
11781 {
11782 ++s;
11783 if (is_space_char (*s))
11784 ++s;
11785 if (*s >= '0' && *s <= '7')
11786 {
11787 int fpr = *s - '0';
11788 ++s;
11789 if (is_space_char (*s))
11790 ++s;
11791 if (*s == ')')
11792 {
11793 *end_op = s + 1;
11794 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
11795 know (r);
11796 return r + fpr;
11797 }
11798 }
11799 /* We have "%st(" then garbage. */
11800 return (const reg_entry *) NULL;
11801 }
11802 }
11803
11804 if (r == NULL || allow_pseudo_reg)
11805 return r;
11806
11807 if (operand_type_all_zero (&r->reg_type))
11808 return (const reg_entry *) NULL;
11809
11810 if ((r->reg_type.bitfield.dword
11811 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
11812 || r->reg_type.bitfield.class == RegCR
11813 || r->reg_type.bitfield.class == RegDR
11814 || r->reg_type.bitfield.class == RegTR)
11815 && !cpu_arch_flags.bitfield.cpui386)
11816 return (const reg_entry *) NULL;
11817
11818 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
11819 return (const reg_entry *) NULL;
11820
11821 if (!cpu_arch_flags.bitfield.cpuavx512f)
11822 {
11823 if (r->reg_type.bitfield.zmmword
11824 || r->reg_type.bitfield.class == RegMask)
11825 return (const reg_entry *) NULL;
11826
11827 if (!cpu_arch_flags.bitfield.cpuavx)
11828 {
11829 if (r->reg_type.bitfield.ymmword)
11830 return (const reg_entry *) NULL;
11831
11832 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
11833 return (const reg_entry *) NULL;
11834 }
11835 }
11836
11837 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
11838 return (const reg_entry *) NULL;
11839
11840 /* Don't allow fake index register unless allow_index_reg isn't 0. */
11841 if (!allow_index_reg && r->reg_num == RegIZ)
11842 return (const reg_entry *) NULL;
11843
11844 /* Upper 16 vector registers are only available with VREX in 64bit
11845 mode, and require EVEX encoding. */
11846 if (r->reg_flags & RegVRex)
11847 {
11848 if (!cpu_arch_flags.bitfield.cpuavx512f
11849 || flag_code != CODE_64BIT)
11850 return (const reg_entry *) NULL;
11851
11852 i.vec_encoding = vex_encoding_evex;
11853 }
11854
11855 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
11856 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
11857 && flag_code != CODE_64BIT)
11858 return (const reg_entry *) NULL;
11859
11860 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
11861 && !intel_syntax)
11862 return (const reg_entry *) NULL;
11863
11864 return r;
11865 }
11866
11867 /* REG_STRING starts *before* REGISTER_PREFIX. */
11868
11869 static const reg_entry *
11870 parse_register (char *reg_string, char **end_op)
11871 {
11872 const reg_entry *r;
11873
11874 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
11875 r = parse_real_register (reg_string, end_op);
11876 else
11877 r = NULL;
11878 if (!r)
11879 {
11880 char *save = input_line_pointer;
11881 char c;
11882 symbolS *symbolP;
11883
11884 input_line_pointer = reg_string;
11885 c = get_symbol_name (&reg_string);
11886 symbolP = symbol_find (reg_string);
11887 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
11888 {
11889 const expressionS *e = symbol_get_value_expression (symbolP);
11890
11891 know (e->X_op == O_register);
11892 know (e->X_add_number >= 0
11893 && (valueT) e->X_add_number < i386_regtab_size);
11894 r = i386_regtab + e->X_add_number;
11895 if ((r->reg_flags & RegVRex))
11896 i.vec_encoding = vex_encoding_evex;
11897 *end_op = input_line_pointer;
11898 }
11899 *input_line_pointer = c;
11900 input_line_pointer = save;
11901 }
11902 return r;
11903 }
11904
11905 int
11906 i386_parse_name (char *name, expressionS *e, char *nextcharP)
11907 {
11908 const reg_entry *r;
11909 char *end = input_line_pointer;
11910
11911 *end = *nextcharP;
11912 r = parse_register (name, &input_line_pointer);
11913 if (r && end <= input_line_pointer)
11914 {
11915 *nextcharP = *input_line_pointer;
11916 *input_line_pointer = 0;
11917 e->X_op = O_register;
11918 e->X_add_number = r - i386_regtab;
11919 return 1;
11920 }
11921 input_line_pointer = end;
11922 *end = 0;
11923 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
11924 }
11925
11926 void
11927 md_operand (expressionS *e)
11928 {
11929 char *end;
11930 const reg_entry *r;
11931
11932 switch (*input_line_pointer)
11933 {
11934 case REGISTER_PREFIX:
11935 r = parse_real_register (input_line_pointer, &end);
11936 if (r)
11937 {
11938 e->X_op = O_register;
11939 e->X_add_number = r - i386_regtab;
11940 input_line_pointer = end;
11941 }
11942 break;
11943
11944 case '[':
11945 gas_assert (intel_syntax);
11946 end = input_line_pointer++;
11947 expression (e);
11948 if (*input_line_pointer == ']')
11949 {
11950 ++input_line_pointer;
11951 e->X_op_symbol = make_expr_symbol (e);
11952 e->X_add_symbol = NULL;
11953 e->X_add_number = 0;
11954 e->X_op = O_index;
11955 }
11956 else
11957 {
11958 e->X_op = O_absent;
11959 input_line_pointer = end;
11960 }
11961 break;
11962 }
11963 }
11964
11965 \f
11966 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11967 const char *md_shortopts = "kVQ:sqnO::";
11968 #else
11969 const char *md_shortopts = "qnO::";
11970 #endif
11971
11972 #define OPTION_32 (OPTION_MD_BASE + 0)
11973 #define OPTION_64 (OPTION_MD_BASE + 1)
11974 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
11975 #define OPTION_MARCH (OPTION_MD_BASE + 3)
11976 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
11977 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
11978 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
11979 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
11980 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
11981 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
11982 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
11983 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
11984 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
11985 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
11986 #define OPTION_X32 (OPTION_MD_BASE + 14)
11987 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
11988 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
11989 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
11990 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
11991 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
11992 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
11993 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
11994 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
11995 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
11996 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
11997 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
11998 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
11999 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12000 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12001 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12002 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12003
12004 struct option md_longopts[] =
12005 {
12006 {"32", no_argument, NULL, OPTION_32},
12007 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12008 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12009 {"64", no_argument, NULL, OPTION_64},
12010 #endif
12011 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12012 {"x32", no_argument, NULL, OPTION_X32},
12013 {"mshared", no_argument, NULL, OPTION_MSHARED},
12014 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12015 #endif
12016 {"divide", no_argument, NULL, OPTION_DIVIDE},
12017 {"march", required_argument, NULL, OPTION_MARCH},
12018 {"mtune", required_argument, NULL, OPTION_MTUNE},
12019 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12020 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12021 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12022 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12023 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12024 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12025 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12026 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12027 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12028 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12029 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12030 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12031 # if defined (TE_PE) || defined (TE_PEP)
12032 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12033 #endif
12034 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12035 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12036 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12037 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12038 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12039 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12040 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12041 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12042 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12043 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12044 {NULL, no_argument, NULL, 0}
12045 };
12046 size_t md_longopts_size = sizeof (md_longopts);
12047
12048 int
12049 md_parse_option (int c, const char *arg)
12050 {
12051 unsigned int j;
12052 char *arch, *next, *saved, *type;
12053
12054 switch (c)
12055 {
12056 case 'n':
12057 optimize_align_code = 0;
12058 break;
12059
12060 case 'q':
12061 quiet_warnings = 1;
12062 break;
12063
12064 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12065 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12066 should be emitted or not. FIXME: Not implemented. */
12067 case 'Q':
12068 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12069 return 0;
12070 break;
12071
12072 /* -V: SVR4 argument to print version ID. */
12073 case 'V':
12074 print_version_id ();
12075 break;
12076
12077 /* -k: Ignore for FreeBSD compatibility. */
12078 case 'k':
12079 break;
12080
12081 case 's':
12082 /* -s: On i386 Solaris, this tells the native assembler to use
12083 .stab instead of .stab.excl. We always use .stab anyhow. */
12084 break;
12085
12086 case OPTION_MSHARED:
12087 shared = 1;
12088 break;
12089
12090 case OPTION_X86_USED_NOTE:
12091 if (strcasecmp (arg, "yes") == 0)
12092 x86_used_note = 1;
12093 else if (strcasecmp (arg, "no") == 0)
12094 x86_used_note = 0;
12095 else
12096 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12097 break;
12098
12099
12100 #endif
12101 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12102 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12103 case OPTION_64:
12104 {
12105 const char **list, **l;
12106
12107 list = bfd_target_list ();
12108 for (l = list; *l != NULL; l++)
12109 if (CONST_STRNEQ (*l, "elf64-x86-64")
12110 || strcmp (*l, "coff-x86-64") == 0
12111 || strcmp (*l, "pe-x86-64") == 0
12112 || strcmp (*l, "pei-x86-64") == 0
12113 || strcmp (*l, "mach-o-x86-64") == 0)
12114 {
12115 default_arch = "x86_64";
12116 break;
12117 }
12118 if (*l == NULL)
12119 as_fatal (_("no compiled in support for x86_64"));
12120 free (list);
12121 }
12122 break;
12123 #endif
12124
12125 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12126 case OPTION_X32:
12127 if (IS_ELF)
12128 {
12129 const char **list, **l;
12130
12131 list = bfd_target_list ();
12132 for (l = list; *l != NULL; l++)
12133 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12134 {
12135 default_arch = "x86_64:32";
12136 break;
12137 }
12138 if (*l == NULL)
12139 as_fatal (_("no compiled in support for 32bit x86_64"));
12140 free (list);
12141 }
12142 else
12143 as_fatal (_("32bit x86_64 is only supported for ELF"));
12144 break;
12145 #endif
12146
12147 case OPTION_32:
12148 default_arch = "i386";
12149 break;
12150
12151 case OPTION_DIVIDE:
12152 #ifdef SVR4_COMMENT_CHARS
12153 {
12154 char *n, *t;
12155 const char *s;
12156
12157 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12158 t = n;
12159 for (s = i386_comment_chars; *s != '\0'; s++)
12160 if (*s != '/')
12161 *t++ = *s;
12162 *t = '\0';
12163 i386_comment_chars = n;
12164 }
12165 #endif
12166 break;
12167
12168 case OPTION_MARCH:
12169 saved = xstrdup (arg);
12170 arch = saved;
12171 /* Allow -march=+nosse. */
12172 if (*arch == '+')
12173 arch++;
12174 do
12175 {
12176 if (*arch == '.')
12177 as_fatal (_("invalid -march= option: `%s'"), arg);
12178 next = strchr (arch, '+');
12179 if (next)
12180 *next++ = '\0';
12181 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12182 {
12183 if (strcmp (arch, cpu_arch [j].name) == 0)
12184 {
12185 /* Processor. */
12186 if (! cpu_arch[j].flags.bitfield.cpui386)
12187 continue;
12188
12189 cpu_arch_name = cpu_arch[j].name;
12190 cpu_sub_arch_name = NULL;
12191 cpu_arch_flags = cpu_arch[j].flags;
12192 cpu_arch_isa = cpu_arch[j].type;
12193 cpu_arch_isa_flags = cpu_arch[j].flags;
12194 if (!cpu_arch_tune_set)
12195 {
12196 cpu_arch_tune = cpu_arch_isa;
12197 cpu_arch_tune_flags = cpu_arch_isa_flags;
12198 }
12199 break;
12200 }
12201 else if (*cpu_arch [j].name == '.'
12202 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12203 {
12204 /* ISA extension. */
12205 i386_cpu_flags flags;
12206
12207 flags = cpu_flags_or (cpu_arch_flags,
12208 cpu_arch[j].flags);
12209
12210 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12211 {
12212 if (cpu_sub_arch_name)
12213 {
12214 char *name = cpu_sub_arch_name;
12215 cpu_sub_arch_name = concat (name,
12216 cpu_arch[j].name,
12217 (const char *) NULL);
12218 free (name);
12219 }
12220 else
12221 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12222 cpu_arch_flags = flags;
12223 cpu_arch_isa_flags = flags;
12224 }
12225 else
12226 cpu_arch_isa_flags
12227 = cpu_flags_or (cpu_arch_isa_flags,
12228 cpu_arch[j].flags);
12229 break;
12230 }
12231 }
12232
12233 if (j >= ARRAY_SIZE (cpu_arch))
12234 {
12235 /* Disable an ISA extension. */
12236 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12237 if (strcmp (arch, cpu_noarch [j].name) == 0)
12238 {
12239 i386_cpu_flags flags;
12240
12241 flags = cpu_flags_and_not (cpu_arch_flags,
12242 cpu_noarch[j].flags);
12243 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12244 {
12245 if (cpu_sub_arch_name)
12246 {
12247 char *name = cpu_sub_arch_name;
12248 cpu_sub_arch_name = concat (arch,
12249 (const char *) NULL);
12250 free (name);
12251 }
12252 else
12253 cpu_sub_arch_name = xstrdup (arch);
12254 cpu_arch_flags = flags;
12255 cpu_arch_isa_flags = flags;
12256 }
12257 break;
12258 }
12259
12260 if (j >= ARRAY_SIZE (cpu_noarch))
12261 j = ARRAY_SIZE (cpu_arch);
12262 }
12263
12264 if (j >= ARRAY_SIZE (cpu_arch))
12265 as_fatal (_("invalid -march= option: `%s'"), arg);
12266
12267 arch = next;
12268 }
12269 while (next != NULL);
12270 free (saved);
12271 break;
12272
12273 case OPTION_MTUNE:
12274 if (*arg == '.')
12275 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12276 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12277 {
12278 if (strcmp (arg, cpu_arch [j].name) == 0)
12279 {
12280 cpu_arch_tune_set = 1;
12281 cpu_arch_tune = cpu_arch [j].type;
12282 cpu_arch_tune_flags = cpu_arch[j].flags;
12283 break;
12284 }
12285 }
12286 if (j >= ARRAY_SIZE (cpu_arch))
12287 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12288 break;
12289
12290 case OPTION_MMNEMONIC:
12291 if (strcasecmp (arg, "att") == 0)
12292 intel_mnemonic = 0;
12293 else if (strcasecmp (arg, "intel") == 0)
12294 intel_mnemonic = 1;
12295 else
12296 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12297 break;
12298
12299 case OPTION_MSYNTAX:
12300 if (strcasecmp (arg, "att") == 0)
12301 intel_syntax = 0;
12302 else if (strcasecmp (arg, "intel") == 0)
12303 intel_syntax = 1;
12304 else
12305 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12306 break;
12307
12308 case OPTION_MINDEX_REG:
12309 allow_index_reg = 1;
12310 break;
12311
12312 case OPTION_MNAKED_REG:
12313 allow_naked_reg = 1;
12314 break;
12315
12316 case OPTION_MSSE2AVX:
12317 sse2avx = 1;
12318 break;
12319
12320 case OPTION_MSSE_CHECK:
12321 if (strcasecmp (arg, "error") == 0)
12322 sse_check = check_error;
12323 else if (strcasecmp (arg, "warning") == 0)
12324 sse_check = check_warning;
12325 else if (strcasecmp (arg, "none") == 0)
12326 sse_check = check_none;
12327 else
12328 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12329 break;
12330
12331 case OPTION_MOPERAND_CHECK:
12332 if (strcasecmp (arg, "error") == 0)
12333 operand_check = check_error;
12334 else if (strcasecmp (arg, "warning") == 0)
12335 operand_check = check_warning;
12336 else if (strcasecmp (arg, "none") == 0)
12337 operand_check = check_none;
12338 else
12339 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12340 break;
12341
12342 case OPTION_MAVXSCALAR:
12343 if (strcasecmp (arg, "128") == 0)
12344 avxscalar = vex128;
12345 else if (strcasecmp (arg, "256") == 0)
12346 avxscalar = vex256;
12347 else
12348 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12349 break;
12350
12351 case OPTION_MVEXWIG:
12352 if (strcmp (arg, "0") == 0)
12353 vexwig = vexw0;
12354 else if (strcmp (arg, "1") == 0)
12355 vexwig = vexw1;
12356 else
12357 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12358 break;
12359
12360 case OPTION_MADD_BND_PREFIX:
12361 add_bnd_prefix = 1;
12362 break;
12363
12364 case OPTION_MEVEXLIG:
12365 if (strcmp (arg, "128") == 0)
12366 evexlig = evexl128;
12367 else if (strcmp (arg, "256") == 0)
12368 evexlig = evexl256;
12369 else if (strcmp (arg, "512") == 0)
12370 evexlig = evexl512;
12371 else
12372 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
12373 break;
12374
12375 case OPTION_MEVEXRCIG:
12376 if (strcmp (arg, "rne") == 0)
12377 evexrcig = rne;
12378 else if (strcmp (arg, "rd") == 0)
12379 evexrcig = rd;
12380 else if (strcmp (arg, "ru") == 0)
12381 evexrcig = ru;
12382 else if (strcmp (arg, "rz") == 0)
12383 evexrcig = rz;
12384 else
12385 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
12386 break;
12387
12388 case OPTION_MEVEXWIG:
12389 if (strcmp (arg, "0") == 0)
12390 evexwig = evexw0;
12391 else if (strcmp (arg, "1") == 0)
12392 evexwig = evexw1;
12393 else
12394 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
12395 break;
12396
12397 # if defined (TE_PE) || defined (TE_PEP)
12398 case OPTION_MBIG_OBJ:
12399 use_big_obj = 1;
12400 break;
12401 #endif
12402
12403 case OPTION_MOMIT_LOCK_PREFIX:
12404 if (strcasecmp (arg, "yes") == 0)
12405 omit_lock_prefix = 1;
12406 else if (strcasecmp (arg, "no") == 0)
12407 omit_lock_prefix = 0;
12408 else
12409 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
12410 break;
12411
12412 case OPTION_MFENCE_AS_LOCK_ADD:
12413 if (strcasecmp (arg, "yes") == 0)
12414 avoid_fence = 1;
12415 else if (strcasecmp (arg, "no") == 0)
12416 avoid_fence = 0;
12417 else
12418 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
12419 break;
12420
12421 case OPTION_MRELAX_RELOCATIONS:
12422 if (strcasecmp (arg, "yes") == 0)
12423 generate_relax_relocations = 1;
12424 else if (strcasecmp (arg, "no") == 0)
12425 generate_relax_relocations = 0;
12426 else
12427 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
12428 break;
12429
12430 case OPTION_MALIGN_BRANCH_BOUNDARY:
12431 {
12432 char *end;
12433 long int align = strtoul (arg, &end, 0);
12434 if (*end == '\0')
12435 {
12436 if (align == 0)
12437 {
12438 align_branch_power = 0;
12439 break;
12440 }
12441 else if (align >= 16)
12442 {
12443 int align_power;
12444 for (align_power = 0;
12445 (align & 1) == 0;
12446 align >>= 1, align_power++)
12447 continue;
12448 /* Limit alignment power to 31. */
12449 if (align == 1 && align_power < 32)
12450 {
12451 align_branch_power = align_power;
12452 break;
12453 }
12454 }
12455 }
12456 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
12457 }
12458 break;
12459
12460 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
12461 {
12462 char *end;
12463 int align = strtoul (arg, &end, 0);
12464 /* Some processors only support 5 prefixes. */
12465 if (*end == '\0' && align >= 0 && align < 6)
12466 {
12467 align_branch_prefix_size = align;
12468 break;
12469 }
12470 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
12471 arg);
12472 }
12473 break;
12474
12475 case OPTION_MALIGN_BRANCH:
12476 align_branch = 0;
12477 saved = xstrdup (arg);
12478 type = saved;
12479 do
12480 {
12481 next = strchr (type, '+');
12482 if (next)
12483 *next++ = '\0';
12484 if (strcasecmp (type, "jcc") == 0)
12485 align_branch |= align_branch_jcc_bit;
12486 else if (strcasecmp (type, "fused") == 0)
12487 align_branch |= align_branch_fused_bit;
12488 else if (strcasecmp (type, "jmp") == 0)
12489 align_branch |= align_branch_jmp_bit;
12490 else if (strcasecmp (type, "call") == 0)
12491 align_branch |= align_branch_call_bit;
12492 else if (strcasecmp (type, "ret") == 0)
12493 align_branch |= align_branch_ret_bit;
12494 else if (strcasecmp (type, "indirect") == 0)
12495 align_branch |= align_branch_indirect_bit;
12496 else
12497 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
12498 type = next;
12499 }
12500 while (next != NULL);
12501 free (saved);
12502 break;
12503
12504 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
12505 align_branch_power = 5;
12506 align_branch_prefix_size = 5;
12507 align_branch = (align_branch_jcc_bit
12508 | align_branch_fused_bit
12509 | align_branch_jmp_bit);
12510 break;
12511
12512 case OPTION_MAMD64:
12513 intel64 = 0;
12514 break;
12515
12516 case OPTION_MINTEL64:
12517 intel64 = 1;
12518 break;
12519
12520 case 'O':
12521 if (arg == NULL)
12522 {
12523 optimize = 1;
12524 /* Turn off -Os. */
12525 optimize_for_space = 0;
12526 }
12527 else if (*arg == 's')
12528 {
12529 optimize_for_space = 1;
12530 /* Turn on all encoding optimizations. */
12531 optimize = INT_MAX;
12532 }
12533 else
12534 {
12535 optimize = atoi (arg);
12536 /* Turn off -Os. */
12537 optimize_for_space = 0;
12538 }
12539 break;
12540
12541 default:
12542 return 0;
12543 }
12544 return 1;
12545 }
12546
12547 #define MESSAGE_TEMPLATE \
12548 " "
12549
12550 static char *
12551 output_message (FILE *stream, char *p, char *message, char *start,
12552 int *left_p, const char *name, int len)
12553 {
12554 int size = sizeof (MESSAGE_TEMPLATE);
12555 int left = *left_p;
12556
12557 /* Reserve 2 spaces for ", " or ",\0" */
12558 left -= len + 2;
12559
12560 /* Check if there is any room. */
12561 if (left >= 0)
12562 {
12563 if (p != start)
12564 {
12565 *p++ = ',';
12566 *p++ = ' ';
12567 }
12568 p = mempcpy (p, name, len);
12569 }
12570 else
12571 {
12572 /* Output the current message now and start a new one. */
12573 *p++ = ',';
12574 *p = '\0';
12575 fprintf (stream, "%s\n", message);
12576 p = start;
12577 left = size - (start - message) - len - 2;
12578
12579 gas_assert (left >= 0);
12580
12581 p = mempcpy (p, name, len);
12582 }
12583
12584 *left_p = left;
12585 return p;
12586 }
12587
12588 static void
12589 show_arch (FILE *stream, int ext, int check)
12590 {
12591 static char message[] = MESSAGE_TEMPLATE;
12592 char *start = message + 27;
12593 char *p;
12594 int size = sizeof (MESSAGE_TEMPLATE);
12595 int left;
12596 const char *name;
12597 int len;
12598 unsigned int j;
12599
12600 p = start;
12601 left = size - (start - message);
12602 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12603 {
12604 /* Should it be skipped? */
12605 if (cpu_arch [j].skip)
12606 continue;
12607
12608 name = cpu_arch [j].name;
12609 len = cpu_arch [j].len;
12610 if (*name == '.')
12611 {
12612 /* It is an extension. Skip if we aren't asked to show it. */
12613 if (ext)
12614 {
12615 name++;
12616 len--;
12617 }
12618 else
12619 continue;
12620 }
12621 else if (ext)
12622 {
12623 /* It is an processor. Skip if we show only extension. */
12624 continue;
12625 }
12626 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
12627 {
12628 /* It is an impossible processor - skip. */
12629 continue;
12630 }
12631
12632 p = output_message (stream, p, message, start, &left, name, len);
12633 }
12634
12635 /* Display disabled extensions. */
12636 if (ext)
12637 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12638 {
12639 name = cpu_noarch [j].name;
12640 len = cpu_noarch [j].len;
12641 p = output_message (stream, p, message, start, &left, name,
12642 len);
12643 }
12644
12645 *p = '\0';
12646 fprintf (stream, "%s\n", message);
12647 }
12648
12649 void
12650 md_show_usage (FILE *stream)
12651 {
12652 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12653 fprintf (stream, _("\
12654 -Qy, -Qn ignored\n\
12655 -V print assembler version number\n\
12656 -k ignored\n"));
12657 #endif
12658 fprintf (stream, _("\
12659 -n Do not optimize code alignment\n\
12660 -q quieten some warnings\n"));
12661 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12662 fprintf (stream, _("\
12663 -s ignored\n"));
12664 #endif
12665 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12666 || defined (TE_PE) || defined (TE_PEP))
12667 fprintf (stream, _("\
12668 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
12669 #endif
12670 #ifdef SVR4_COMMENT_CHARS
12671 fprintf (stream, _("\
12672 --divide do not treat `/' as a comment character\n"));
12673 #else
12674 fprintf (stream, _("\
12675 --divide ignored\n"));
12676 #endif
12677 fprintf (stream, _("\
12678 -march=CPU[,+EXTENSION...]\n\
12679 generate code for CPU and EXTENSION, CPU is one of:\n"));
12680 show_arch (stream, 0, 1);
12681 fprintf (stream, _("\
12682 EXTENSION is combination of:\n"));
12683 show_arch (stream, 1, 0);
12684 fprintf (stream, _("\
12685 -mtune=CPU optimize for CPU, CPU is one of:\n"));
12686 show_arch (stream, 0, 0);
12687 fprintf (stream, _("\
12688 -msse2avx encode SSE instructions with VEX prefix\n"));
12689 fprintf (stream, _("\
12690 -msse-check=[none|error|warning] (default: warning)\n\
12691 check SSE instructions\n"));
12692 fprintf (stream, _("\
12693 -moperand-check=[none|error|warning] (default: warning)\n\
12694 check operand combinations for validity\n"));
12695 fprintf (stream, _("\
12696 -mavxscalar=[128|256] (default: 128)\n\
12697 encode scalar AVX instructions with specific vector\n\
12698 length\n"));
12699 fprintf (stream, _("\
12700 -mvexwig=[0|1] (default: 0)\n\
12701 encode VEX instructions with specific VEX.W value\n\
12702 for VEX.W bit ignored instructions\n"));
12703 fprintf (stream, _("\
12704 -mevexlig=[128|256|512] (default: 128)\n\
12705 encode scalar EVEX instructions with specific vector\n\
12706 length\n"));
12707 fprintf (stream, _("\
12708 -mevexwig=[0|1] (default: 0)\n\
12709 encode EVEX instructions with specific EVEX.W value\n\
12710 for EVEX.W bit ignored instructions\n"));
12711 fprintf (stream, _("\
12712 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
12713 encode EVEX instructions with specific EVEX.RC value\n\
12714 for SAE-only ignored instructions\n"));
12715 fprintf (stream, _("\
12716 -mmnemonic=[att|intel] "));
12717 if (SYSV386_COMPAT)
12718 fprintf (stream, _("(default: att)\n"));
12719 else
12720 fprintf (stream, _("(default: intel)\n"));
12721 fprintf (stream, _("\
12722 use AT&T/Intel mnemonic\n"));
12723 fprintf (stream, _("\
12724 -msyntax=[att|intel] (default: att)\n\
12725 use AT&T/Intel syntax\n"));
12726 fprintf (stream, _("\
12727 -mindex-reg support pseudo index registers\n"));
12728 fprintf (stream, _("\
12729 -mnaked-reg don't require `%%' prefix for registers\n"));
12730 fprintf (stream, _("\
12731 -madd-bnd-prefix add BND prefix for all valid branches\n"));
12732 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12733 fprintf (stream, _("\
12734 -mshared disable branch optimization for shared code\n"));
12735 fprintf (stream, _("\
12736 -mx86-used-note=[no|yes] "));
12737 if (DEFAULT_X86_USED_NOTE)
12738 fprintf (stream, _("(default: yes)\n"));
12739 else
12740 fprintf (stream, _("(default: no)\n"));
12741 fprintf (stream, _("\
12742 generate x86 used ISA and feature properties\n"));
12743 #endif
12744 #if defined (TE_PE) || defined (TE_PEP)
12745 fprintf (stream, _("\
12746 -mbig-obj generate big object files\n"));
12747 #endif
12748 fprintf (stream, _("\
12749 -momit-lock-prefix=[no|yes] (default: no)\n\
12750 strip all lock prefixes\n"));
12751 fprintf (stream, _("\
12752 -mfence-as-lock-add=[no|yes] (default: no)\n\
12753 encode lfence, mfence and sfence as\n\
12754 lock addl $0x0, (%%{re}sp)\n"));
12755 fprintf (stream, _("\
12756 -mrelax-relocations=[no|yes] "));
12757 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
12758 fprintf (stream, _("(default: yes)\n"));
12759 else
12760 fprintf (stream, _("(default: no)\n"));
12761 fprintf (stream, _("\
12762 generate relax relocations\n"));
12763 fprintf (stream, _("\
12764 -malign-branch-boundary=NUM (default: 0)\n\
12765 align branches within NUM byte boundary\n"));
12766 fprintf (stream, _("\
12767 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
12768 TYPE is combination of jcc, fused, jmp, call, ret,\n\
12769 indirect\n\
12770 specify types of branches to align\n"));
12771 fprintf (stream, _("\
12772 -malign-branch-prefix-size=NUM (default: 5)\n\
12773 align branches with NUM prefixes per instruction\n"));
12774 fprintf (stream, _("\
12775 -mbranches-within-32B-boundaries\n\
12776 align branches within 32 byte boundary\n"));
12777 fprintf (stream, _("\
12778 -mamd64 accept only AMD64 ISA [default]\n"));
12779 fprintf (stream, _("\
12780 -mintel64 accept only Intel64 ISA\n"));
12781 }
12782
12783 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
12784 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12785 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12786
12787 /* Pick the target format to use. */
12788
12789 const char *
12790 i386_target_format (void)
12791 {
12792 if (!strncmp (default_arch, "x86_64", 6))
12793 {
12794 update_code_flag (CODE_64BIT, 1);
12795 if (default_arch[6] == '\0')
12796 x86_elf_abi = X86_64_ABI;
12797 else
12798 x86_elf_abi = X86_64_X32_ABI;
12799 }
12800 else if (!strcmp (default_arch, "i386"))
12801 update_code_flag (CODE_32BIT, 1);
12802 else if (!strcmp (default_arch, "iamcu"))
12803 {
12804 update_code_flag (CODE_32BIT, 1);
12805 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
12806 {
12807 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
12808 cpu_arch_name = "iamcu";
12809 cpu_sub_arch_name = NULL;
12810 cpu_arch_flags = iamcu_flags;
12811 cpu_arch_isa = PROCESSOR_IAMCU;
12812 cpu_arch_isa_flags = iamcu_flags;
12813 if (!cpu_arch_tune_set)
12814 {
12815 cpu_arch_tune = cpu_arch_isa;
12816 cpu_arch_tune_flags = cpu_arch_isa_flags;
12817 }
12818 }
12819 else if (cpu_arch_isa != PROCESSOR_IAMCU)
12820 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
12821 cpu_arch_name);
12822 }
12823 else
12824 as_fatal (_("unknown architecture"));
12825
12826 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
12827 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12828 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
12829 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12830
12831 switch (OUTPUT_FLAVOR)
12832 {
12833 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
12834 case bfd_target_aout_flavour:
12835 return AOUT_TARGET_FORMAT;
12836 #endif
12837 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
12838 # if defined (TE_PE) || defined (TE_PEP)
12839 case bfd_target_coff_flavour:
12840 if (flag_code == CODE_64BIT)
12841 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
12842 else
12843 return "pe-i386";
12844 # elif defined (TE_GO32)
12845 case bfd_target_coff_flavour:
12846 return "coff-go32";
12847 # else
12848 case bfd_target_coff_flavour:
12849 return "coff-i386";
12850 # endif
12851 #endif
12852 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12853 case bfd_target_elf_flavour:
12854 {
12855 const char *format;
12856
12857 switch (x86_elf_abi)
12858 {
12859 default:
12860 format = ELF_TARGET_FORMAT;
12861 #ifndef TE_SOLARIS
12862 tls_get_addr = "___tls_get_addr";
12863 #endif
12864 break;
12865 case X86_64_ABI:
12866 use_rela_relocations = 1;
12867 object_64bit = 1;
12868 #ifndef TE_SOLARIS
12869 tls_get_addr = "__tls_get_addr";
12870 #endif
12871 format = ELF_TARGET_FORMAT64;
12872 break;
12873 case X86_64_X32_ABI:
12874 use_rela_relocations = 1;
12875 object_64bit = 1;
12876 #ifndef TE_SOLARIS
12877 tls_get_addr = "__tls_get_addr";
12878 #endif
12879 disallow_64bit_reloc = 1;
12880 format = ELF_TARGET_FORMAT32;
12881 break;
12882 }
12883 if (cpu_arch_isa == PROCESSOR_L1OM)
12884 {
12885 if (x86_elf_abi != X86_64_ABI)
12886 as_fatal (_("Intel L1OM is 64bit only"));
12887 return ELF_TARGET_L1OM_FORMAT;
12888 }
12889 else if (cpu_arch_isa == PROCESSOR_K1OM)
12890 {
12891 if (x86_elf_abi != X86_64_ABI)
12892 as_fatal (_("Intel K1OM is 64bit only"));
12893 return ELF_TARGET_K1OM_FORMAT;
12894 }
12895 else if (cpu_arch_isa == PROCESSOR_IAMCU)
12896 {
12897 if (x86_elf_abi != I386_ABI)
12898 as_fatal (_("Intel MCU is 32bit only"));
12899 return ELF_TARGET_IAMCU_FORMAT;
12900 }
12901 else
12902 return format;
12903 }
12904 #endif
12905 #if defined (OBJ_MACH_O)
12906 case bfd_target_mach_o_flavour:
12907 if (flag_code == CODE_64BIT)
12908 {
12909 use_rela_relocations = 1;
12910 object_64bit = 1;
12911 return "mach-o-x86-64";
12912 }
12913 else
12914 return "mach-o-i386";
12915 #endif
12916 default:
12917 abort ();
12918 return NULL;
12919 }
12920 }
12921
12922 #endif /* OBJ_MAYBE_ more than one */
12923 \f
12924 symbolS *
12925 md_undefined_symbol (char *name)
12926 {
12927 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
12928 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
12929 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
12930 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
12931 {
12932 if (!GOT_symbol)
12933 {
12934 if (symbol_find (name))
12935 as_bad (_("GOT already in symbol table"));
12936 GOT_symbol = symbol_new (name, undefined_section,
12937 (valueT) 0, &zero_address_frag);
12938 };
12939 return GOT_symbol;
12940 }
12941 return 0;
12942 }
12943
12944 /* Round up a section size to the appropriate boundary. */
12945
12946 valueT
12947 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
12948 {
12949 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
12950 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
12951 {
12952 /* For a.out, force the section size to be aligned. If we don't do
12953 this, BFD will align it for us, but it will not write out the
12954 final bytes of the section. This may be a bug in BFD, but it is
12955 easier to fix it here since that is how the other a.out targets
12956 work. */
12957 int align;
12958
12959 align = bfd_section_alignment (segment);
12960 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
12961 }
12962 #endif
12963
12964 return size;
12965 }
12966
12967 /* On the i386, PC-relative offsets are relative to the start of the
12968 next instruction. That is, the address of the offset, plus its
12969 size, since the offset is always the last part of the insn. */
12970
12971 long
12972 md_pcrel_from (fixS *fixP)
12973 {
12974 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
12975 }
12976
12977 #ifndef I386COFF
12978
12979 static void
12980 s_bss (int ignore ATTRIBUTE_UNUSED)
12981 {
12982 int temp;
12983
12984 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12985 if (IS_ELF)
12986 obj_elf_section_change_hook ();
12987 #endif
12988 temp = get_absolute_expression ();
12989 subseg_set (bss_section, (subsegT) temp);
12990 demand_empty_rest_of_line ();
12991 }
12992
12993 #endif
12994
12995 /* Remember constant directive. */
12996
12997 void
12998 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
12999 {
13000 if (last_insn.kind != last_insn_directive
13001 && (bfd_section_flags (now_seg) & SEC_CODE))
13002 {
13003 last_insn.seg = now_seg;
13004 last_insn.kind = last_insn_directive;
13005 last_insn.name = "constant directive";
13006 last_insn.file = as_where (&last_insn.line);
13007 }
13008 }
13009
13010 void
13011 i386_validate_fix (fixS *fixp)
13012 {
13013 if (fixp->fx_subsy)
13014 {
13015 if (fixp->fx_subsy == GOT_symbol)
13016 {
13017 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13018 {
13019 if (!object_64bit)
13020 abort ();
13021 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13022 if (fixp->fx_tcbit2)
13023 fixp->fx_r_type = (fixp->fx_tcbit
13024 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13025 : BFD_RELOC_X86_64_GOTPCRELX);
13026 else
13027 #endif
13028 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13029 }
13030 else
13031 {
13032 if (!object_64bit)
13033 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13034 else
13035 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13036 }
13037 fixp->fx_subsy = 0;
13038 }
13039 }
13040 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13041 else if (!object_64bit)
13042 {
13043 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13044 && fixp->fx_tcbit2)
13045 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13046 }
13047 #endif
13048 }
13049
13050 arelent *
13051 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13052 {
13053 arelent *rel;
13054 bfd_reloc_code_real_type code;
13055
13056 switch (fixp->fx_r_type)
13057 {
13058 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13059 case BFD_RELOC_SIZE32:
13060 case BFD_RELOC_SIZE64:
13061 if (S_IS_DEFINED (fixp->fx_addsy)
13062 && !S_IS_EXTERNAL (fixp->fx_addsy))
13063 {
13064 /* Resolve size relocation against local symbol to size of
13065 the symbol plus addend. */
13066 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13067 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13068 && !fits_in_unsigned_long (value))
13069 as_bad_where (fixp->fx_file, fixp->fx_line,
13070 _("symbol size computation overflow"));
13071 fixp->fx_addsy = NULL;
13072 fixp->fx_subsy = NULL;
13073 md_apply_fix (fixp, (valueT *) &value, NULL);
13074 return NULL;
13075 }
13076 #endif
13077 /* Fall through. */
13078
13079 case BFD_RELOC_X86_64_PLT32:
13080 case BFD_RELOC_X86_64_GOT32:
13081 case BFD_RELOC_X86_64_GOTPCREL:
13082 case BFD_RELOC_X86_64_GOTPCRELX:
13083 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13084 case BFD_RELOC_386_PLT32:
13085 case BFD_RELOC_386_GOT32:
13086 case BFD_RELOC_386_GOT32X:
13087 case BFD_RELOC_386_GOTOFF:
13088 case BFD_RELOC_386_GOTPC:
13089 case BFD_RELOC_386_TLS_GD:
13090 case BFD_RELOC_386_TLS_LDM:
13091 case BFD_RELOC_386_TLS_LDO_32:
13092 case BFD_RELOC_386_TLS_IE_32:
13093 case BFD_RELOC_386_TLS_IE:
13094 case BFD_RELOC_386_TLS_GOTIE:
13095 case BFD_RELOC_386_TLS_LE_32:
13096 case BFD_RELOC_386_TLS_LE:
13097 case BFD_RELOC_386_TLS_GOTDESC:
13098 case BFD_RELOC_386_TLS_DESC_CALL:
13099 case BFD_RELOC_X86_64_TLSGD:
13100 case BFD_RELOC_X86_64_TLSLD:
13101 case BFD_RELOC_X86_64_DTPOFF32:
13102 case BFD_RELOC_X86_64_DTPOFF64:
13103 case BFD_RELOC_X86_64_GOTTPOFF:
13104 case BFD_RELOC_X86_64_TPOFF32:
13105 case BFD_RELOC_X86_64_TPOFF64:
13106 case BFD_RELOC_X86_64_GOTOFF64:
13107 case BFD_RELOC_X86_64_GOTPC32:
13108 case BFD_RELOC_X86_64_GOT64:
13109 case BFD_RELOC_X86_64_GOTPCREL64:
13110 case BFD_RELOC_X86_64_GOTPC64:
13111 case BFD_RELOC_X86_64_GOTPLT64:
13112 case BFD_RELOC_X86_64_PLTOFF64:
13113 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13114 case BFD_RELOC_X86_64_TLSDESC_CALL:
13115 case BFD_RELOC_RVA:
13116 case BFD_RELOC_VTABLE_ENTRY:
13117 case BFD_RELOC_VTABLE_INHERIT:
13118 #ifdef TE_PE
13119 case BFD_RELOC_32_SECREL:
13120 #endif
13121 code = fixp->fx_r_type;
13122 break;
13123 case BFD_RELOC_X86_64_32S:
13124 if (!fixp->fx_pcrel)
13125 {
13126 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13127 code = fixp->fx_r_type;
13128 break;
13129 }
13130 /* Fall through. */
13131 default:
13132 if (fixp->fx_pcrel)
13133 {
13134 switch (fixp->fx_size)
13135 {
13136 default:
13137 as_bad_where (fixp->fx_file, fixp->fx_line,
13138 _("can not do %d byte pc-relative relocation"),
13139 fixp->fx_size);
13140 code = BFD_RELOC_32_PCREL;
13141 break;
13142 case 1: code = BFD_RELOC_8_PCREL; break;
13143 case 2: code = BFD_RELOC_16_PCREL; break;
13144 case 4: code = BFD_RELOC_32_PCREL; break;
13145 #ifdef BFD64
13146 case 8: code = BFD_RELOC_64_PCREL; break;
13147 #endif
13148 }
13149 }
13150 else
13151 {
13152 switch (fixp->fx_size)
13153 {
13154 default:
13155 as_bad_where (fixp->fx_file, fixp->fx_line,
13156 _("can not do %d byte relocation"),
13157 fixp->fx_size);
13158 code = BFD_RELOC_32;
13159 break;
13160 case 1: code = BFD_RELOC_8; break;
13161 case 2: code = BFD_RELOC_16; break;
13162 case 4: code = BFD_RELOC_32; break;
13163 #ifdef BFD64
13164 case 8: code = BFD_RELOC_64; break;
13165 #endif
13166 }
13167 }
13168 break;
13169 }
13170
13171 if ((code == BFD_RELOC_32
13172 || code == BFD_RELOC_32_PCREL
13173 || code == BFD_RELOC_X86_64_32S)
13174 && GOT_symbol
13175 && fixp->fx_addsy == GOT_symbol)
13176 {
13177 if (!object_64bit)
13178 code = BFD_RELOC_386_GOTPC;
13179 else
13180 code = BFD_RELOC_X86_64_GOTPC32;
13181 }
13182 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13183 && GOT_symbol
13184 && fixp->fx_addsy == GOT_symbol)
13185 {
13186 code = BFD_RELOC_X86_64_GOTPC64;
13187 }
13188
13189 rel = XNEW (arelent);
13190 rel->sym_ptr_ptr = XNEW (asymbol *);
13191 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13192
13193 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13194
13195 if (!use_rela_relocations)
13196 {
13197 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13198 vtable entry to be used in the relocation's section offset. */
13199 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13200 rel->address = fixp->fx_offset;
13201 #if defined (OBJ_COFF) && defined (TE_PE)
13202 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13203 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13204 else
13205 #endif
13206 rel->addend = 0;
13207 }
13208 /* Use the rela in 64bit mode. */
13209 else
13210 {
13211 if (disallow_64bit_reloc)
13212 switch (code)
13213 {
13214 case BFD_RELOC_X86_64_DTPOFF64:
13215 case BFD_RELOC_X86_64_TPOFF64:
13216 case BFD_RELOC_64_PCREL:
13217 case BFD_RELOC_X86_64_GOTOFF64:
13218 case BFD_RELOC_X86_64_GOT64:
13219 case BFD_RELOC_X86_64_GOTPCREL64:
13220 case BFD_RELOC_X86_64_GOTPC64:
13221 case BFD_RELOC_X86_64_GOTPLT64:
13222 case BFD_RELOC_X86_64_PLTOFF64:
13223 as_bad_where (fixp->fx_file, fixp->fx_line,
13224 _("cannot represent relocation type %s in x32 mode"),
13225 bfd_get_reloc_code_name (code));
13226 break;
13227 default:
13228 break;
13229 }
13230
13231 if (!fixp->fx_pcrel)
13232 rel->addend = fixp->fx_offset;
13233 else
13234 switch (code)
13235 {
13236 case BFD_RELOC_X86_64_PLT32:
13237 case BFD_RELOC_X86_64_GOT32:
13238 case BFD_RELOC_X86_64_GOTPCREL:
13239 case BFD_RELOC_X86_64_GOTPCRELX:
13240 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13241 case BFD_RELOC_X86_64_TLSGD:
13242 case BFD_RELOC_X86_64_TLSLD:
13243 case BFD_RELOC_X86_64_GOTTPOFF:
13244 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13245 case BFD_RELOC_X86_64_TLSDESC_CALL:
13246 rel->addend = fixp->fx_offset - fixp->fx_size;
13247 break;
13248 default:
13249 rel->addend = (section->vma
13250 - fixp->fx_size
13251 + fixp->fx_addnumber
13252 + md_pcrel_from (fixp));
13253 break;
13254 }
13255 }
13256
13257 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13258 if (rel->howto == NULL)
13259 {
13260 as_bad_where (fixp->fx_file, fixp->fx_line,
13261 _("cannot represent relocation type %s"),
13262 bfd_get_reloc_code_name (code));
13263 /* Set howto to a garbage value so that we can keep going. */
13264 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13265 gas_assert (rel->howto != NULL);
13266 }
13267
13268 return rel;
13269 }
13270
13271 #include "tc-i386-intel.c"
13272
13273 void
13274 tc_x86_parse_to_dw2regnum (expressionS *exp)
13275 {
13276 int saved_naked_reg;
13277 char saved_register_dot;
13278
13279 saved_naked_reg = allow_naked_reg;
13280 allow_naked_reg = 1;
13281 saved_register_dot = register_chars['.'];
13282 register_chars['.'] = '.';
13283 allow_pseudo_reg = 1;
13284 expression_and_evaluate (exp);
13285 allow_pseudo_reg = 0;
13286 register_chars['.'] = saved_register_dot;
13287 allow_naked_reg = saved_naked_reg;
13288
13289 if (exp->X_op == O_register && exp->X_add_number >= 0)
13290 {
13291 if ((addressT) exp->X_add_number < i386_regtab_size)
13292 {
13293 exp->X_op = O_constant;
13294 exp->X_add_number = i386_regtab[exp->X_add_number]
13295 .dw2_regnum[flag_code >> 1];
13296 }
13297 else
13298 exp->X_op = O_illegal;
13299 }
13300 }
13301
13302 void
13303 tc_x86_frame_initial_instructions (void)
13304 {
13305 static unsigned int sp_regno[2];
13306
13307 if (!sp_regno[flag_code >> 1])
13308 {
13309 char *saved_input = input_line_pointer;
13310 char sp[][4] = {"esp", "rsp"};
13311 expressionS exp;
13312
13313 input_line_pointer = sp[flag_code >> 1];
13314 tc_x86_parse_to_dw2regnum (&exp);
13315 gas_assert (exp.X_op == O_constant);
13316 sp_regno[flag_code >> 1] = exp.X_add_number;
13317 input_line_pointer = saved_input;
13318 }
13319
13320 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
13321 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
13322 }
13323
13324 int
13325 x86_dwarf2_addr_size (void)
13326 {
13327 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13328 if (x86_elf_abi == X86_64_X32_ABI)
13329 return 4;
13330 #endif
13331 return bfd_arch_bits_per_address (stdoutput) / 8;
13332 }
13333
13334 int
13335 i386_elf_section_type (const char *str, size_t len)
13336 {
13337 if (flag_code == CODE_64BIT
13338 && len == sizeof ("unwind") - 1
13339 && strncmp (str, "unwind", 6) == 0)
13340 return SHT_X86_64_UNWIND;
13341
13342 return -1;
13343 }
13344
13345 #ifdef TE_SOLARIS
13346 void
13347 i386_solaris_fix_up_eh_frame (segT sec)
13348 {
13349 if (flag_code == CODE_64BIT)
13350 elf_section_type (sec) = SHT_X86_64_UNWIND;
13351 }
13352 #endif
13353
13354 #ifdef TE_PE
13355 void
13356 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
13357 {
13358 expressionS exp;
13359
13360 exp.X_op = O_secrel;
13361 exp.X_add_symbol = symbol;
13362 exp.X_add_number = 0;
13363 emit_expr (&exp, size);
13364 }
13365 #endif
13366
13367 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13368 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
13369
13370 bfd_vma
13371 x86_64_section_letter (int letter, const char **ptr_msg)
13372 {
13373 if (flag_code == CODE_64BIT)
13374 {
13375 if (letter == 'l')
13376 return SHF_X86_64_LARGE;
13377
13378 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
13379 }
13380 else
13381 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
13382 return -1;
13383 }
13384
13385 bfd_vma
13386 x86_64_section_word (char *str, size_t len)
13387 {
13388 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
13389 return SHF_X86_64_LARGE;
13390
13391 return -1;
13392 }
13393
13394 static void
13395 handle_large_common (int small ATTRIBUTE_UNUSED)
13396 {
13397 if (flag_code != CODE_64BIT)
13398 {
13399 s_comm_internal (0, elf_common_parse);
13400 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
13401 }
13402 else
13403 {
13404 static segT lbss_section;
13405 asection *saved_com_section_ptr = elf_com_section_ptr;
13406 asection *saved_bss_section = bss_section;
13407
13408 if (lbss_section == NULL)
13409 {
13410 flagword applicable;
13411 segT seg = now_seg;
13412 subsegT subseg = now_subseg;
13413
13414 /* The .lbss section is for local .largecomm symbols. */
13415 lbss_section = subseg_new (".lbss", 0);
13416 applicable = bfd_applicable_section_flags (stdoutput);
13417 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
13418 seg_info (lbss_section)->bss = 1;
13419
13420 subseg_set (seg, subseg);
13421 }
13422
13423 elf_com_section_ptr = &_bfd_elf_large_com_section;
13424 bss_section = lbss_section;
13425
13426 s_comm_internal (0, elf_common_parse);
13427
13428 elf_com_section_ptr = saved_com_section_ptr;
13429 bss_section = saved_bss_section;
13430 }
13431 }
13432 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 0.313578 seconds and 4 git commands to generate.