d9305fbfa5cded6c1479ec393958239bce23e8f8
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2018 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifndef REGISTER_WARNINGS
37 #define REGISTER_WARNINGS 1
38 #endif
39
40 #ifndef INFER_ADDR_PREFIX
41 #define INFER_ADDR_PREFIX 1
42 #endif
43
44 #ifndef DEFAULT_ARCH
45 #define DEFAULT_ARCH "i386"
46 #endif
47
48 #ifndef INLINE
49 #if __GNUC__ >= 2
50 #define INLINE __inline__
51 #else
52 #define INLINE
53 #endif
54 #endif
55
56 /* Prefixes will be emitted in the order defined below.
57 WAIT_PREFIX must be the first prefix since FWAIT is really is an
58 instruction, and so must come before any prefixes.
59 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
60 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
61 #define WAIT_PREFIX 0
62 #define SEG_PREFIX 1
63 #define ADDR_PREFIX 2
64 #define DATA_PREFIX 3
65 #define REP_PREFIX 4
66 #define HLE_PREFIX REP_PREFIX
67 #define BND_PREFIX REP_PREFIX
68 #define LOCK_PREFIX 5
69 #define REX_PREFIX 6 /* must come last. */
70 #define MAX_PREFIXES 7 /* max prefixes per opcode */
71
72 /* we define the syntax here (modulo base,index,scale syntax) */
73 #define REGISTER_PREFIX '%'
74 #define IMMEDIATE_PREFIX '$'
75 #define ABSOLUTE_PREFIX '*'
76
77 /* these are the instruction mnemonic suffixes in AT&T syntax or
78 memory operand size in Intel syntax. */
79 #define WORD_MNEM_SUFFIX 'w'
80 #define BYTE_MNEM_SUFFIX 'b'
81 #define SHORT_MNEM_SUFFIX 's'
82 #define LONG_MNEM_SUFFIX 'l'
83 #define QWORD_MNEM_SUFFIX 'q'
84 /* Intel Syntax. Use a non-ascii letter since since it never appears
85 in instructions. */
86 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
87
88 #define END_OF_INSN '\0'
89
90 /*
91 'templates' is for grouping together 'template' structures for opcodes
92 of the same name. This is only used for storing the insns in the grand
93 ole hash table of insns.
94 The templates themselves start at START and range up to (but not including)
95 END.
96 */
97 typedef struct
98 {
99 const insn_template *start;
100 const insn_template *end;
101 }
102 templates;
103
104 /* 386 operand encoding bytes: see 386 book for details of this. */
105 typedef struct
106 {
107 unsigned int regmem; /* codes register or memory operand */
108 unsigned int reg; /* codes register operand (or extended opcode) */
109 unsigned int mode; /* how to interpret regmem & reg */
110 }
111 modrm_byte;
112
113 /* x86-64 extension prefix. */
114 typedef int rex_byte;
115
116 /* 386 opcode byte to code indirect addressing. */
117 typedef struct
118 {
119 unsigned base;
120 unsigned index;
121 unsigned scale;
122 }
123 sib_byte;
124
125 /* x86 arch names, types and features */
126 typedef struct
127 {
128 const char *name; /* arch name */
129 unsigned int len; /* arch string length */
130 enum processor_type type; /* arch type */
131 i386_cpu_flags flags; /* cpu feature flags */
132 unsigned int skip; /* show_arch should skip this. */
133 }
134 arch_entry;
135
136 /* Used to turn off indicated flags. */
137 typedef struct
138 {
139 const char *name; /* arch name */
140 unsigned int len; /* arch string length */
141 i386_cpu_flags flags; /* cpu feature flags */
142 }
143 noarch_entry;
144
145 static void update_code_flag (int, int);
146 static void set_code_flag (int);
147 static void set_16bit_gcc_code_flag (int);
148 static void set_intel_syntax (int);
149 static void set_intel_mnemonic (int);
150 static void set_allow_index_reg (int);
151 static void set_check (int);
152 static void set_cpu_arch (int);
153 #ifdef TE_PE
154 static void pe_directive_secrel (int);
155 #endif
156 static void signed_cons (int);
157 static char *output_invalid (int c);
158 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
159 const char *);
160 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
161 const char *);
162 static int i386_att_operand (char *);
163 static int i386_intel_operand (char *, int);
164 static int i386_intel_simplify (expressionS *);
165 static int i386_intel_parse_name (const char *, expressionS *);
166 static const reg_entry *parse_register (char *, char **);
167 static char *parse_insn (char *, char *);
168 static char *parse_operands (char *, const char *);
169 static void swap_operands (void);
170 static void swap_2_operands (int, int);
171 static void optimize_imm (void);
172 static void optimize_disp (void);
173 static const insn_template *match_template (char);
174 static int check_string (void);
175 static int process_suffix (void);
176 static int check_byte_reg (void);
177 static int check_long_reg (void);
178 static int check_qword_reg (void);
179 static int check_word_reg (void);
180 static int finalize_imm (void);
181 static int process_operands (void);
182 static const seg_entry *build_modrm_byte (void);
183 static void output_insn (void);
184 static void output_imm (fragS *, offsetT);
185 static void output_disp (fragS *, offsetT);
186 #ifndef I386COFF
187 static void s_bss (int);
188 #endif
189 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
190 static void handle_large_common (int small ATTRIBUTE_UNUSED);
191 #endif
192
193 static const char *default_arch = DEFAULT_ARCH;
194
195 /* This struct describes rounding control and SAE in the instruction. */
196 struct RC_Operation
197 {
198 enum rc_type
199 {
200 rne = 0,
201 rd,
202 ru,
203 rz,
204 saeonly
205 } type;
206 int operand;
207 };
208
209 static struct RC_Operation rc_op;
210
211 /* The struct describes masking, applied to OPERAND in the instruction.
212 MASK is a pointer to the corresponding mask register. ZEROING tells
213 whether merging or zeroing mask is used. */
214 struct Mask_Operation
215 {
216 const reg_entry *mask;
217 unsigned int zeroing;
218 /* The operand where this operation is associated. */
219 int operand;
220 };
221
222 static struct Mask_Operation mask_op;
223
224 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
225 broadcast factor. */
226 struct Broadcast_Operation
227 {
228 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
229 int type;
230
231 /* Index of broadcasted operand. */
232 int operand;
233 };
234
235 static struct Broadcast_Operation broadcast_op;
236
237 /* VEX prefix. */
238 typedef struct
239 {
240 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
241 unsigned char bytes[4];
242 unsigned int length;
243 /* Destination or source register specifier. */
244 const reg_entry *register_specifier;
245 } vex_prefix;
246
247 /* 'md_assemble ()' gathers together information and puts it into a
248 i386_insn. */
249
250 union i386_op
251 {
252 expressionS *disps;
253 expressionS *imms;
254 const reg_entry *regs;
255 };
256
257 enum i386_error
258 {
259 operand_size_mismatch,
260 operand_type_mismatch,
261 register_type_mismatch,
262 number_of_operands_mismatch,
263 invalid_instruction_suffix,
264 bad_imm4,
265 unsupported_with_intel_mnemonic,
266 unsupported_syntax,
267 unsupported,
268 invalid_vsib_address,
269 invalid_vector_register_set,
270 unsupported_vector_index_register,
271 unsupported_broadcast,
272 broadcast_not_on_src_operand,
273 broadcast_needed,
274 unsupported_masking,
275 mask_not_on_destination,
276 no_default_mask,
277 unsupported_rc_sae,
278 rc_sae_operand_not_last_imm,
279 invalid_register_operand,
280 };
281
282 struct _i386_insn
283 {
284 /* TM holds the template for the insn were currently assembling. */
285 insn_template tm;
286
287 /* SUFFIX holds the instruction size suffix for byte, word, dword
288 or qword, if given. */
289 char suffix;
290
291 /* OPERANDS gives the number of given operands. */
292 unsigned int operands;
293
294 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
295 of given register, displacement, memory operands and immediate
296 operands. */
297 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
298
299 /* TYPES [i] is the type (see above #defines) which tells us how to
300 use OP[i] for the corresponding operand. */
301 i386_operand_type types[MAX_OPERANDS];
302
303 /* Displacement expression, immediate expression, or register for each
304 operand. */
305 union i386_op op[MAX_OPERANDS];
306
307 /* Flags for operands. */
308 unsigned int flags[MAX_OPERANDS];
309 #define Operand_PCrel 1
310
311 /* Relocation type for operand */
312 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
313
314 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
315 the base index byte below. */
316 const reg_entry *base_reg;
317 const reg_entry *index_reg;
318 unsigned int log2_scale_factor;
319
320 /* SEG gives the seg_entries of this insn. They are zero unless
321 explicit segment overrides are given. */
322 const seg_entry *seg[2];
323
324 /* Copied first memory operand string, for re-checking. */
325 char *memop1_string;
326
327 /* PREFIX holds all the given prefix opcodes (usually null).
328 PREFIXES is the number of prefix opcodes. */
329 unsigned int prefixes;
330 unsigned char prefix[MAX_PREFIXES];
331
332 /* RM and SIB are the modrm byte and the sib byte where the
333 addressing modes of this insn are encoded. */
334 modrm_byte rm;
335 rex_byte rex;
336 rex_byte vrex;
337 sib_byte sib;
338 vex_prefix vex;
339
340 /* Masking attributes. */
341 struct Mask_Operation *mask;
342
343 /* Rounding control and SAE attributes. */
344 struct RC_Operation *rounding;
345
346 /* Broadcasting attributes. */
347 struct Broadcast_Operation *broadcast;
348
349 /* Compressed disp8*N attribute. */
350 unsigned int memshift;
351
352 /* Prefer load or store in encoding. */
353 enum
354 {
355 dir_encoding_default = 0,
356 dir_encoding_load,
357 dir_encoding_store
358 } dir_encoding;
359
360 /* Prefer 8bit or 32bit displacement in encoding. */
361 enum
362 {
363 disp_encoding_default = 0,
364 disp_encoding_8bit,
365 disp_encoding_32bit
366 } disp_encoding;
367
368 /* Prefer the REX byte in encoding. */
369 bfd_boolean rex_encoding;
370
371 /* Disable instruction size optimization. */
372 bfd_boolean no_optimize;
373
374 /* How to encode vector instructions. */
375 enum
376 {
377 vex_encoding_default = 0,
378 vex_encoding_vex2,
379 vex_encoding_vex3,
380 vex_encoding_evex
381 } vec_encoding;
382
383 /* REP prefix. */
384 const char *rep_prefix;
385
386 /* HLE prefix. */
387 const char *hle_prefix;
388
389 /* Have BND prefix. */
390 const char *bnd_prefix;
391
392 /* Have NOTRACK prefix. */
393 const char *notrack_prefix;
394
395 /* Error message. */
396 enum i386_error error;
397 };
398
399 typedef struct _i386_insn i386_insn;
400
401 /* Link RC type with corresponding string, that'll be looked for in
402 asm. */
403 struct RC_name
404 {
405 enum rc_type type;
406 const char *name;
407 unsigned int len;
408 };
409
410 static const struct RC_name RC_NamesTable[] =
411 {
412 { rne, STRING_COMMA_LEN ("rn-sae") },
413 { rd, STRING_COMMA_LEN ("rd-sae") },
414 { ru, STRING_COMMA_LEN ("ru-sae") },
415 { rz, STRING_COMMA_LEN ("rz-sae") },
416 { saeonly, STRING_COMMA_LEN ("sae") },
417 };
418
419 /* List of chars besides those in app.c:symbol_chars that can start an
420 operand. Used to prevent the scrubber eating vital white-space. */
421 const char extra_symbol_chars[] = "*%-([{}"
422 #ifdef LEX_AT
423 "@"
424 #endif
425 #ifdef LEX_QM
426 "?"
427 #endif
428 ;
429
430 #if (defined (TE_I386AIX) \
431 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
432 && !defined (TE_GNU) \
433 && !defined (TE_LINUX) \
434 && !defined (TE_NACL) \
435 && !defined (TE_FreeBSD) \
436 && !defined (TE_DragonFly) \
437 && !defined (TE_NetBSD)))
438 /* This array holds the chars that always start a comment. If the
439 pre-processor is disabled, these aren't very useful. The option
440 --divide will remove '/' from this list. */
441 const char *i386_comment_chars = "#/";
442 #define SVR4_COMMENT_CHARS 1
443 #define PREFIX_SEPARATOR '\\'
444
445 #else
446 const char *i386_comment_chars = "#";
447 #define PREFIX_SEPARATOR '/'
448 #endif
449
450 /* This array holds the chars that only start a comment at the beginning of
451 a line. If the line seems to have the form '# 123 filename'
452 .line and .file directives will appear in the pre-processed output.
453 Note that input_file.c hand checks for '#' at the beginning of the
454 first line of the input file. This is because the compiler outputs
455 #NO_APP at the beginning of its output.
456 Also note that comments started like this one will always work if
457 '/' isn't otherwise defined. */
458 const char line_comment_chars[] = "#/";
459
460 const char line_separator_chars[] = ";";
461
462 /* Chars that can be used to separate mant from exp in floating point
463 nums. */
464 const char EXP_CHARS[] = "eE";
465
466 /* Chars that mean this number is a floating point constant
467 As in 0f12.456
468 or 0d1.2345e12. */
469 const char FLT_CHARS[] = "fFdDxX";
470
471 /* Tables for lexical analysis. */
472 static char mnemonic_chars[256];
473 static char register_chars[256];
474 static char operand_chars[256];
475 static char identifier_chars[256];
476 static char digit_chars[256];
477
478 /* Lexical macros. */
479 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
480 #define is_operand_char(x) (operand_chars[(unsigned char) x])
481 #define is_register_char(x) (register_chars[(unsigned char) x])
482 #define is_space_char(x) ((x) == ' ')
483 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
484 #define is_digit_char(x) (digit_chars[(unsigned char) x])
485
486 /* All non-digit non-letter characters that may occur in an operand. */
487 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
488
489 /* md_assemble() always leaves the strings it's passed unaltered. To
490 effect this we maintain a stack of saved characters that we've smashed
491 with '\0's (indicating end of strings for various sub-fields of the
492 assembler instruction). */
493 static char save_stack[32];
494 static char *save_stack_p;
495 #define END_STRING_AND_SAVE(s) \
496 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
497 #define RESTORE_END_STRING(s) \
498 do { *(s) = *--save_stack_p; } while (0)
499
500 /* The instruction we're assembling. */
501 static i386_insn i;
502
503 /* Possible templates for current insn. */
504 static const templates *current_templates;
505
506 /* Per instruction expressionS buffers: max displacements & immediates. */
507 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
508 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
509
510 /* Current operand we are working on. */
511 static int this_operand = -1;
512
513 /* We support four different modes. FLAG_CODE variable is used to distinguish
514 these. */
515
516 enum flag_code {
517 CODE_32BIT,
518 CODE_16BIT,
519 CODE_64BIT };
520
521 static enum flag_code flag_code;
522 static unsigned int object_64bit;
523 static unsigned int disallow_64bit_reloc;
524 static int use_rela_relocations = 0;
525
526 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
527 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
528 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
529
530 /* The ELF ABI to use. */
531 enum x86_elf_abi
532 {
533 I386_ABI,
534 X86_64_ABI,
535 X86_64_X32_ABI
536 };
537
538 static enum x86_elf_abi x86_elf_abi = I386_ABI;
539 #endif
540
541 #if defined (TE_PE) || defined (TE_PEP)
542 /* Use big object file format. */
543 static int use_big_obj = 0;
544 #endif
545
546 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
547 /* 1 if generating code for a shared library. */
548 static int shared = 0;
549 #endif
550
551 /* 1 for intel syntax,
552 0 if att syntax. */
553 static int intel_syntax = 0;
554
555 /* 1 for Intel64 ISA,
556 0 if AMD64 ISA. */
557 static int intel64;
558
559 /* 1 for intel mnemonic,
560 0 if att mnemonic. */
561 static int intel_mnemonic = !SYSV386_COMPAT;
562
563 /* 1 if pseudo registers are permitted. */
564 static int allow_pseudo_reg = 0;
565
566 /* 1 if register prefix % not required. */
567 static int allow_naked_reg = 0;
568
569 /* 1 if the assembler should add BND prefix for all control-transferring
570 instructions supporting it, even if this prefix wasn't specified
571 explicitly. */
572 static int add_bnd_prefix = 0;
573
574 /* 1 if pseudo index register, eiz/riz, is allowed . */
575 static int allow_index_reg = 0;
576
577 /* 1 if the assembler should ignore LOCK prefix, even if it was
578 specified explicitly. */
579 static int omit_lock_prefix = 0;
580
581 /* 1 if the assembler should encode lfence, mfence, and sfence as
582 "lock addl $0, (%{re}sp)". */
583 static int avoid_fence = 0;
584
585 /* 1 if the assembler should generate relax relocations. */
586
587 static int generate_relax_relocations
588 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
589
590 static enum check_kind
591 {
592 check_none = 0,
593 check_warning,
594 check_error
595 }
596 sse_check, operand_check = check_warning;
597
598 /* Optimization:
599 1. Clear the REX_W bit with register operand if possible.
600 2. Above plus use 128bit vector instruction to clear the full vector
601 register.
602 */
603 static int optimize = 0;
604
605 /* Optimization:
606 1. Clear the REX_W bit with register operand if possible.
607 2. Above plus use 128bit vector instruction to clear the full vector
608 register.
609 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
610 "testb $imm7,%r8".
611 */
612 static int optimize_for_space = 0;
613
614 /* Register prefix used for error message. */
615 static const char *register_prefix = "%";
616
617 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
618 leave, push, and pop instructions so that gcc has the same stack
619 frame as in 32 bit mode. */
620 static char stackop_size = '\0';
621
622 /* Non-zero to optimize code alignment. */
623 int optimize_align_code = 1;
624
625 /* Non-zero to quieten some warnings. */
626 static int quiet_warnings = 0;
627
628 /* CPU name. */
629 static const char *cpu_arch_name = NULL;
630 static char *cpu_sub_arch_name = NULL;
631
632 /* CPU feature flags. */
633 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
634
635 /* If we have selected a cpu we are generating instructions for. */
636 static int cpu_arch_tune_set = 0;
637
638 /* Cpu we are generating instructions for. */
639 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
640
641 /* CPU feature flags of cpu we are generating instructions for. */
642 static i386_cpu_flags cpu_arch_tune_flags;
643
644 /* CPU instruction set architecture used. */
645 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
646
647 /* CPU feature flags of instruction set architecture used. */
648 i386_cpu_flags cpu_arch_isa_flags;
649
650 /* If set, conditional jumps are not automatically promoted to handle
651 larger than a byte offset. */
652 static unsigned int no_cond_jump_promotion = 0;
653
654 /* Encode SSE instructions with VEX prefix. */
655 static unsigned int sse2avx;
656
657 /* Encode scalar AVX instructions with specific vector length. */
658 static enum
659 {
660 vex128 = 0,
661 vex256
662 } avxscalar;
663
664 /* Encode scalar EVEX LIG instructions with specific vector length. */
665 static enum
666 {
667 evexl128 = 0,
668 evexl256,
669 evexl512
670 } evexlig;
671
672 /* Encode EVEX WIG instructions with specific evex.w. */
673 static enum
674 {
675 evexw0 = 0,
676 evexw1
677 } evexwig;
678
679 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
680 static enum rc_type evexrcig = rne;
681
682 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
683 static symbolS *GOT_symbol;
684
685 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
686 unsigned int x86_dwarf2_return_column;
687
688 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
689 int x86_cie_data_alignment;
690
691 /* Interface to relax_segment.
692 There are 3 major relax states for 386 jump insns because the
693 different types of jumps add different sizes to frags when we're
694 figuring out what sort of jump to choose to reach a given label. */
695
696 /* Types. */
697 #define UNCOND_JUMP 0
698 #define COND_JUMP 1
699 #define COND_JUMP86 2
700
701 /* Sizes. */
702 #define CODE16 1
703 #define SMALL 0
704 #define SMALL16 (SMALL | CODE16)
705 #define BIG 2
706 #define BIG16 (BIG | CODE16)
707
708 #ifndef INLINE
709 #ifdef __GNUC__
710 #define INLINE __inline__
711 #else
712 #define INLINE
713 #endif
714 #endif
715
716 #define ENCODE_RELAX_STATE(type, size) \
717 ((relax_substateT) (((type) << 2) | (size)))
718 #define TYPE_FROM_RELAX_STATE(s) \
719 ((s) >> 2)
720 #define DISP_SIZE_FROM_RELAX_STATE(s) \
721 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
722
723 /* This table is used by relax_frag to promote short jumps to long
724 ones where necessary. SMALL (short) jumps may be promoted to BIG
725 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
726 don't allow a short jump in a 32 bit code segment to be promoted to
727 a 16 bit offset jump because it's slower (requires data size
728 prefix), and doesn't work, unless the destination is in the bottom
729 64k of the code segment (The top 16 bits of eip are zeroed). */
730
731 const relax_typeS md_relax_table[] =
732 {
733 /* The fields are:
734 1) most positive reach of this state,
735 2) most negative reach of this state,
736 3) how many bytes this mode will have in the variable part of the frag
737 4) which index into the table to try if we can't fit into this one. */
738
739 /* UNCOND_JUMP states. */
740 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
741 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
742 /* dword jmp adds 4 bytes to frag:
743 0 extra opcode bytes, 4 displacement bytes. */
744 {0, 0, 4, 0},
745 /* word jmp adds 2 byte2 to frag:
746 0 extra opcode bytes, 2 displacement bytes. */
747 {0, 0, 2, 0},
748
749 /* COND_JUMP states. */
750 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
751 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
752 /* dword conditionals adds 5 bytes to frag:
753 1 extra opcode byte, 4 displacement bytes. */
754 {0, 0, 5, 0},
755 /* word conditionals add 3 bytes to frag:
756 1 extra opcode byte, 2 displacement bytes. */
757 {0, 0, 3, 0},
758
759 /* COND_JUMP86 states. */
760 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
761 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
762 /* dword conditionals adds 5 bytes to frag:
763 1 extra opcode byte, 4 displacement bytes. */
764 {0, 0, 5, 0},
765 /* word conditionals add 4 bytes to frag:
766 1 displacement byte and a 3 byte long branch insn. */
767 {0, 0, 4, 0}
768 };
769
770 static const arch_entry cpu_arch[] =
771 {
772 /* Do not replace the first two entries - i386_target_format()
773 relies on them being there in this order. */
774 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
775 CPU_GENERIC32_FLAGS, 0 },
776 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
777 CPU_GENERIC64_FLAGS, 0 },
778 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
779 CPU_NONE_FLAGS, 0 },
780 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
781 CPU_I186_FLAGS, 0 },
782 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
783 CPU_I286_FLAGS, 0 },
784 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
785 CPU_I386_FLAGS, 0 },
786 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
787 CPU_I486_FLAGS, 0 },
788 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
789 CPU_I586_FLAGS, 0 },
790 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
791 CPU_I686_FLAGS, 0 },
792 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
793 CPU_I586_FLAGS, 0 },
794 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
795 CPU_PENTIUMPRO_FLAGS, 0 },
796 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
797 CPU_P2_FLAGS, 0 },
798 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
799 CPU_P3_FLAGS, 0 },
800 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
801 CPU_P4_FLAGS, 0 },
802 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
803 CPU_CORE_FLAGS, 0 },
804 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
805 CPU_NOCONA_FLAGS, 0 },
806 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
807 CPU_CORE_FLAGS, 1 },
808 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
809 CPU_CORE_FLAGS, 0 },
810 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
811 CPU_CORE2_FLAGS, 1 },
812 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
813 CPU_CORE2_FLAGS, 0 },
814 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
815 CPU_COREI7_FLAGS, 0 },
816 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
817 CPU_L1OM_FLAGS, 0 },
818 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
819 CPU_K1OM_FLAGS, 0 },
820 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
821 CPU_IAMCU_FLAGS, 0 },
822 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
823 CPU_K6_FLAGS, 0 },
824 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
825 CPU_K6_2_FLAGS, 0 },
826 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
827 CPU_ATHLON_FLAGS, 0 },
828 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
829 CPU_K8_FLAGS, 1 },
830 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
831 CPU_K8_FLAGS, 0 },
832 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
833 CPU_K8_FLAGS, 0 },
834 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
835 CPU_AMDFAM10_FLAGS, 0 },
836 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
837 CPU_BDVER1_FLAGS, 0 },
838 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
839 CPU_BDVER2_FLAGS, 0 },
840 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
841 CPU_BDVER3_FLAGS, 0 },
842 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
843 CPU_BDVER4_FLAGS, 0 },
844 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
845 CPU_ZNVER1_FLAGS, 0 },
846 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
847 CPU_ZNVER2_FLAGS, 0 },
848 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
849 CPU_BTVER1_FLAGS, 0 },
850 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
851 CPU_BTVER2_FLAGS, 0 },
852 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
853 CPU_8087_FLAGS, 0 },
854 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
855 CPU_287_FLAGS, 0 },
856 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
857 CPU_387_FLAGS, 0 },
858 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
859 CPU_687_FLAGS, 0 },
860 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
861 CPU_MMX_FLAGS, 0 },
862 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
863 CPU_SSE_FLAGS, 0 },
864 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
865 CPU_SSE2_FLAGS, 0 },
866 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
867 CPU_SSE3_FLAGS, 0 },
868 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
869 CPU_SSSE3_FLAGS, 0 },
870 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
871 CPU_SSE4_1_FLAGS, 0 },
872 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
873 CPU_SSE4_2_FLAGS, 0 },
874 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
875 CPU_SSE4_2_FLAGS, 0 },
876 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
877 CPU_AVX_FLAGS, 0 },
878 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
879 CPU_AVX2_FLAGS, 0 },
880 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
881 CPU_AVX512F_FLAGS, 0 },
882 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
883 CPU_AVX512CD_FLAGS, 0 },
884 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
885 CPU_AVX512ER_FLAGS, 0 },
886 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
887 CPU_AVX512PF_FLAGS, 0 },
888 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
889 CPU_AVX512DQ_FLAGS, 0 },
890 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
891 CPU_AVX512BW_FLAGS, 0 },
892 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
893 CPU_AVX512VL_FLAGS, 0 },
894 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
895 CPU_VMX_FLAGS, 0 },
896 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
897 CPU_VMFUNC_FLAGS, 0 },
898 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
899 CPU_SMX_FLAGS, 0 },
900 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
901 CPU_XSAVE_FLAGS, 0 },
902 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
903 CPU_XSAVEOPT_FLAGS, 0 },
904 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
905 CPU_XSAVEC_FLAGS, 0 },
906 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
907 CPU_XSAVES_FLAGS, 0 },
908 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
909 CPU_AES_FLAGS, 0 },
910 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
911 CPU_PCLMUL_FLAGS, 0 },
912 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
913 CPU_PCLMUL_FLAGS, 1 },
914 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
915 CPU_FSGSBASE_FLAGS, 0 },
916 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
917 CPU_RDRND_FLAGS, 0 },
918 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
919 CPU_F16C_FLAGS, 0 },
920 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
921 CPU_BMI2_FLAGS, 0 },
922 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
923 CPU_FMA_FLAGS, 0 },
924 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
925 CPU_FMA4_FLAGS, 0 },
926 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
927 CPU_XOP_FLAGS, 0 },
928 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
929 CPU_LWP_FLAGS, 0 },
930 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
931 CPU_MOVBE_FLAGS, 0 },
932 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
933 CPU_CX16_FLAGS, 0 },
934 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
935 CPU_EPT_FLAGS, 0 },
936 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
937 CPU_LZCNT_FLAGS, 0 },
938 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
939 CPU_HLE_FLAGS, 0 },
940 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
941 CPU_RTM_FLAGS, 0 },
942 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
943 CPU_INVPCID_FLAGS, 0 },
944 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
945 CPU_CLFLUSH_FLAGS, 0 },
946 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
947 CPU_NOP_FLAGS, 0 },
948 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
949 CPU_SYSCALL_FLAGS, 0 },
950 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
951 CPU_RDTSCP_FLAGS, 0 },
952 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
953 CPU_3DNOW_FLAGS, 0 },
954 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
955 CPU_3DNOWA_FLAGS, 0 },
956 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
957 CPU_PADLOCK_FLAGS, 0 },
958 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
959 CPU_SVME_FLAGS, 1 },
960 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
961 CPU_SVME_FLAGS, 0 },
962 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
963 CPU_SSE4A_FLAGS, 0 },
964 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
965 CPU_ABM_FLAGS, 0 },
966 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
967 CPU_BMI_FLAGS, 0 },
968 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
969 CPU_TBM_FLAGS, 0 },
970 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
971 CPU_ADX_FLAGS, 0 },
972 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
973 CPU_RDSEED_FLAGS, 0 },
974 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
975 CPU_PRFCHW_FLAGS, 0 },
976 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
977 CPU_SMAP_FLAGS, 0 },
978 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
979 CPU_MPX_FLAGS, 0 },
980 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
981 CPU_SHA_FLAGS, 0 },
982 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
983 CPU_CLFLUSHOPT_FLAGS, 0 },
984 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
985 CPU_PREFETCHWT1_FLAGS, 0 },
986 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
987 CPU_SE1_FLAGS, 0 },
988 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
989 CPU_CLWB_FLAGS, 0 },
990 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
991 CPU_AVX512IFMA_FLAGS, 0 },
992 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
993 CPU_AVX512VBMI_FLAGS, 0 },
994 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
995 CPU_AVX512_4FMAPS_FLAGS, 0 },
996 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
997 CPU_AVX512_4VNNIW_FLAGS, 0 },
998 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
999 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1000 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1001 CPU_AVX512_VBMI2_FLAGS, 0 },
1002 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1003 CPU_AVX512_VNNI_FLAGS, 0 },
1004 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1005 CPU_AVX512_BITALG_FLAGS, 0 },
1006 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1007 CPU_CLZERO_FLAGS, 0 },
1008 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1009 CPU_MWAITX_FLAGS, 0 },
1010 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1011 CPU_OSPKE_FLAGS, 0 },
1012 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1013 CPU_RDPID_FLAGS, 0 },
1014 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1015 CPU_PTWRITE_FLAGS, 0 },
1016 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1017 CPU_IBT_FLAGS, 0 },
1018 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1019 CPU_SHSTK_FLAGS, 0 },
1020 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1021 CPU_GFNI_FLAGS, 0 },
1022 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1023 CPU_VAES_FLAGS, 0 },
1024 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1025 CPU_VPCLMULQDQ_FLAGS, 0 },
1026 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1027 CPU_WBNOINVD_FLAGS, 0 },
1028 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1029 CPU_PCONFIG_FLAGS, 0 },
1030 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1031 CPU_WAITPKG_FLAGS, 0 },
1032 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1033 CPU_CLDEMOTE_FLAGS, 0 },
1034 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1035 CPU_MOVDIRI_FLAGS, 0 },
1036 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1037 CPU_MOVDIR64B_FLAGS, 0 },
1038 };
1039
1040 static const noarch_entry cpu_noarch[] =
1041 {
1042 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1043 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1044 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1045 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1046 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1047 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1048 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1049 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1050 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1051 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1052 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1053 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1054 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1055 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1056 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1057 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1058 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1059 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1060 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1061 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1062 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1063 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1064 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1065 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1066 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1067 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1068 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1069 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1070 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1071 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1072 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1073 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1074 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1075 };
1076
1077 #ifdef I386COFF
1078 /* Like s_lcomm_internal in gas/read.c but the alignment string
1079 is allowed to be optional. */
1080
1081 static symbolS *
1082 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1083 {
1084 addressT align = 0;
1085
1086 SKIP_WHITESPACE ();
1087
1088 if (needs_align
1089 && *input_line_pointer == ',')
1090 {
1091 align = parse_align (needs_align - 1);
1092
1093 if (align == (addressT) -1)
1094 return NULL;
1095 }
1096 else
1097 {
1098 if (size >= 8)
1099 align = 3;
1100 else if (size >= 4)
1101 align = 2;
1102 else if (size >= 2)
1103 align = 1;
1104 else
1105 align = 0;
1106 }
1107
1108 bss_alloc (symbolP, size, align);
1109 return symbolP;
1110 }
1111
1112 static void
1113 pe_lcomm (int needs_align)
1114 {
1115 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1116 }
1117 #endif
1118
1119 const pseudo_typeS md_pseudo_table[] =
1120 {
1121 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1122 {"align", s_align_bytes, 0},
1123 #else
1124 {"align", s_align_ptwo, 0},
1125 #endif
1126 {"arch", set_cpu_arch, 0},
1127 #ifndef I386COFF
1128 {"bss", s_bss, 0},
1129 #else
1130 {"lcomm", pe_lcomm, 1},
1131 #endif
1132 {"ffloat", float_cons, 'f'},
1133 {"dfloat", float_cons, 'd'},
1134 {"tfloat", float_cons, 'x'},
1135 {"value", cons, 2},
1136 {"slong", signed_cons, 4},
1137 {"noopt", s_ignore, 0},
1138 {"optim", s_ignore, 0},
1139 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1140 {"code16", set_code_flag, CODE_16BIT},
1141 {"code32", set_code_flag, CODE_32BIT},
1142 #ifdef BFD64
1143 {"code64", set_code_flag, CODE_64BIT},
1144 #endif
1145 {"intel_syntax", set_intel_syntax, 1},
1146 {"att_syntax", set_intel_syntax, 0},
1147 {"intel_mnemonic", set_intel_mnemonic, 1},
1148 {"att_mnemonic", set_intel_mnemonic, 0},
1149 {"allow_index_reg", set_allow_index_reg, 1},
1150 {"disallow_index_reg", set_allow_index_reg, 0},
1151 {"sse_check", set_check, 0},
1152 {"operand_check", set_check, 1},
1153 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1154 {"largecomm", handle_large_common, 0},
1155 #else
1156 {"file", dwarf2_directive_file, 0},
1157 {"loc", dwarf2_directive_loc, 0},
1158 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1159 #endif
1160 #ifdef TE_PE
1161 {"secrel32", pe_directive_secrel, 0},
1162 #endif
1163 {0, 0, 0}
1164 };
1165
1166 /* For interface with expression (). */
1167 extern char *input_line_pointer;
1168
1169 /* Hash table for instruction mnemonic lookup. */
1170 static struct hash_control *op_hash;
1171
1172 /* Hash table for register lookup. */
1173 static struct hash_control *reg_hash;
1174 \f
1175 /* Various efficient no-op patterns for aligning code labels.
1176 Note: Don't try to assemble the instructions in the comments.
1177 0L and 0w are not legal. */
1178 static const unsigned char f32_1[] =
1179 {0x90}; /* nop */
1180 static const unsigned char f32_2[] =
1181 {0x66,0x90}; /* xchg %ax,%ax */
1182 static const unsigned char f32_3[] =
1183 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1184 static const unsigned char f32_4[] =
1185 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1186 static const unsigned char f32_6[] =
1187 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1188 static const unsigned char f32_7[] =
1189 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1190 static const unsigned char f16_3[] =
1191 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1192 static const unsigned char f16_4[] =
1193 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1194 static const unsigned char jump_disp8[] =
1195 {0xeb}; /* jmp disp8 */
1196 static const unsigned char jump32_disp32[] =
1197 {0xe9}; /* jmp disp32 */
1198 static const unsigned char jump16_disp32[] =
1199 {0x66,0xe9}; /* jmp disp32 */
1200 /* 32-bit NOPs patterns. */
1201 static const unsigned char *const f32_patt[] = {
1202 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1203 };
1204 /* 16-bit NOPs patterns. */
1205 static const unsigned char *const f16_patt[] = {
1206 f32_1, f32_2, f16_3, f16_4
1207 };
1208 /* nopl (%[re]ax) */
1209 static const unsigned char alt_3[] =
1210 {0x0f,0x1f,0x00};
1211 /* nopl 0(%[re]ax) */
1212 static const unsigned char alt_4[] =
1213 {0x0f,0x1f,0x40,0x00};
1214 /* nopl 0(%[re]ax,%[re]ax,1) */
1215 static const unsigned char alt_5[] =
1216 {0x0f,0x1f,0x44,0x00,0x00};
1217 /* nopw 0(%[re]ax,%[re]ax,1) */
1218 static const unsigned char alt_6[] =
1219 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1220 /* nopl 0L(%[re]ax) */
1221 static const unsigned char alt_7[] =
1222 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1223 /* nopl 0L(%[re]ax,%[re]ax,1) */
1224 static const unsigned char alt_8[] =
1225 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1226 /* nopw 0L(%[re]ax,%[re]ax,1) */
1227 static const unsigned char alt_9[] =
1228 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1229 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1230 static const unsigned char alt_10[] =
1231 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1232 /* data16 nopw %cs:0L(%eax,%eax,1) */
1233 static const unsigned char alt_11[] =
1234 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1235 /* 32-bit and 64-bit NOPs patterns. */
1236 static const unsigned char *const alt_patt[] = {
1237 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1238 alt_9, alt_10, alt_11
1239 };
1240
1241 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1242 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1243
1244 static void
1245 i386_output_nops (char *where, const unsigned char *const *patt,
1246 int count, int max_single_nop_size)
1247
1248 {
1249 /* Place the longer NOP first. */
1250 int last;
1251 int offset;
1252 const unsigned char *nops = patt[max_single_nop_size - 1];
1253
1254 /* Use the smaller one if the requsted one isn't available. */
1255 if (nops == NULL)
1256 {
1257 max_single_nop_size--;
1258 nops = patt[max_single_nop_size - 1];
1259 }
1260
1261 last = count % max_single_nop_size;
1262
1263 count -= last;
1264 for (offset = 0; offset < count; offset += max_single_nop_size)
1265 memcpy (where + offset, nops, max_single_nop_size);
1266
1267 if (last)
1268 {
1269 nops = patt[last - 1];
1270 if (nops == NULL)
1271 {
1272 /* Use the smaller one plus one-byte NOP if the needed one
1273 isn't available. */
1274 last--;
1275 nops = patt[last - 1];
1276 memcpy (where + offset, nops, last);
1277 where[offset + last] = *patt[0];
1278 }
1279 else
1280 memcpy (where + offset, nops, last);
1281 }
1282 }
1283
1284 static INLINE int
1285 fits_in_imm7 (offsetT num)
1286 {
1287 return (num & 0x7f) == num;
1288 }
1289
1290 static INLINE int
1291 fits_in_imm31 (offsetT num)
1292 {
1293 return (num & 0x7fffffff) == num;
1294 }
1295
1296 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1297 single NOP instruction LIMIT. */
1298
1299 void
1300 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1301 {
1302 const unsigned char *const *patt = NULL;
1303 int max_single_nop_size;
1304 /* Maximum number of NOPs before switching to jump over NOPs. */
1305 int max_number_of_nops;
1306
1307 switch (fragP->fr_type)
1308 {
1309 case rs_fill_nop:
1310 case rs_align_code:
1311 break;
1312 default:
1313 return;
1314 }
1315
1316 /* We need to decide which NOP sequence to use for 32bit and
1317 64bit. When -mtune= is used:
1318
1319 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1320 PROCESSOR_GENERIC32, f32_patt will be used.
1321 2. For the rest, alt_patt will be used.
1322
1323 When -mtune= isn't used, alt_patt will be used if
1324 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1325 be used.
1326
1327 When -march= or .arch is used, we can't use anything beyond
1328 cpu_arch_isa_flags. */
1329
1330 if (flag_code == CODE_16BIT)
1331 {
1332 patt = f16_patt;
1333 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1334 /* Limit number of NOPs to 2 in 16-bit mode. */
1335 max_number_of_nops = 2;
1336 }
1337 else
1338 {
1339 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1340 {
1341 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1342 switch (cpu_arch_tune)
1343 {
1344 case PROCESSOR_UNKNOWN:
1345 /* We use cpu_arch_isa_flags to check if we SHOULD
1346 optimize with nops. */
1347 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1348 patt = alt_patt;
1349 else
1350 patt = f32_patt;
1351 break;
1352 case PROCESSOR_PENTIUM4:
1353 case PROCESSOR_NOCONA:
1354 case PROCESSOR_CORE:
1355 case PROCESSOR_CORE2:
1356 case PROCESSOR_COREI7:
1357 case PROCESSOR_L1OM:
1358 case PROCESSOR_K1OM:
1359 case PROCESSOR_GENERIC64:
1360 case PROCESSOR_K6:
1361 case PROCESSOR_ATHLON:
1362 case PROCESSOR_K8:
1363 case PROCESSOR_AMDFAM10:
1364 case PROCESSOR_BD:
1365 case PROCESSOR_ZNVER:
1366 case PROCESSOR_BT:
1367 patt = alt_patt;
1368 break;
1369 case PROCESSOR_I386:
1370 case PROCESSOR_I486:
1371 case PROCESSOR_PENTIUM:
1372 case PROCESSOR_PENTIUMPRO:
1373 case PROCESSOR_IAMCU:
1374 case PROCESSOR_GENERIC32:
1375 patt = f32_patt;
1376 break;
1377 }
1378 }
1379 else
1380 {
1381 switch (fragP->tc_frag_data.tune)
1382 {
1383 case PROCESSOR_UNKNOWN:
1384 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1385 PROCESSOR_UNKNOWN. */
1386 abort ();
1387 break;
1388
1389 case PROCESSOR_I386:
1390 case PROCESSOR_I486:
1391 case PROCESSOR_PENTIUM:
1392 case PROCESSOR_IAMCU:
1393 case PROCESSOR_K6:
1394 case PROCESSOR_ATHLON:
1395 case PROCESSOR_K8:
1396 case PROCESSOR_AMDFAM10:
1397 case PROCESSOR_BD:
1398 case PROCESSOR_ZNVER:
1399 case PROCESSOR_BT:
1400 case PROCESSOR_GENERIC32:
1401 /* We use cpu_arch_isa_flags to check if we CAN optimize
1402 with nops. */
1403 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1404 patt = alt_patt;
1405 else
1406 patt = f32_patt;
1407 break;
1408 case PROCESSOR_PENTIUMPRO:
1409 case PROCESSOR_PENTIUM4:
1410 case PROCESSOR_NOCONA:
1411 case PROCESSOR_CORE:
1412 case PROCESSOR_CORE2:
1413 case PROCESSOR_COREI7:
1414 case PROCESSOR_L1OM:
1415 case PROCESSOR_K1OM:
1416 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1417 patt = alt_patt;
1418 else
1419 patt = f32_patt;
1420 break;
1421 case PROCESSOR_GENERIC64:
1422 patt = alt_patt;
1423 break;
1424 }
1425 }
1426
1427 if (patt == f32_patt)
1428 {
1429 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1430 /* Limit number of NOPs to 2 for older processors. */
1431 max_number_of_nops = 2;
1432 }
1433 else
1434 {
1435 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1436 /* Limit number of NOPs to 7 for newer processors. */
1437 max_number_of_nops = 7;
1438 }
1439 }
1440
1441 if (limit == 0)
1442 limit = max_single_nop_size;
1443
1444 if (fragP->fr_type == rs_fill_nop)
1445 {
1446 /* Output NOPs for .nop directive. */
1447 if (limit > max_single_nop_size)
1448 {
1449 as_bad_where (fragP->fr_file, fragP->fr_line,
1450 _("invalid single nop size: %d "
1451 "(expect within [0, %d])"),
1452 limit, max_single_nop_size);
1453 return;
1454 }
1455 }
1456 else
1457 fragP->fr_var = count;
1458
1459 if ((count / max_single_nop_size) > max_number_of_nops)
1460 {
1461 /* Generate jump over NOPs. */
1462 offsetT disp = count - 2;
1463 if (fits_in_imm7 (disp))
1464 {
1465 /* Use "jmp disp8" if possible. */
1466 count = disp;
1467 where[0] = jump_disp8[0];
1468 where[1] = count;
1469 where += 2;
1470 }
1471 else
1472 {
1473 unsigned int size_of_jump;
1474
1475 if (flag_code == CODE_16BIT)
1476 {
1477 where[0] = jump16_disp32[0];
1478 where[1] = jump16_disp32[1];
1479 size_of_jump = 2;
1480 }
1481 else
1482 {
1483 where[0] = jump32_disp32[0];
1484 size_of_jump = 1;
1485 }
1486
1487 count -= size_of_jump + 4;
1488 if (!fits_in_imm31 (count))
1489 {
1490 as_bad_where (fragP->fr_file, fragP->fr_line,
1491 _("jump over nop padding out of range"));
1492 return;
1493 }
1494
1495 md_number_to_chars (where + size_of_jump, count, 4);
1496 where += size_of_jump + 4;
1497 }
1498 }
1499
1500 /* Generate multiple NOPs. */
1501 i386_output_nops (where, patt, count, limit);
1502 }
1503
1504 static INLINE int
1505 operand_type_all_zero (const union i386_operand_type *x)
1506 {
1507 switch (ARRAY_SIZE(x->array))
1508 {
1509 case 3:
1510 if (x->array[2])
1511 return 0;
1512 /* Fall through. */
1513 case 2:
1514 if (x->array[1])
1515 return 0;
1516 /* Fall through. */
1517 case 1:
1518 return !x->array[0];
1519 default:
1520 abort ();
1521 }
1522 }
1523
1524 static INLINE void
1525 operand_type_set (union i386_operand_type *x, unsigned int v)
1526 {
1527 switch (ARRAY_SIZE(x->array))
1528 {
1529 case 3:
1530 x->array[2] = v;
1531 /* Fall through. */
1532 case 2:
1533 x->array[1] = v;
1534 /* Fall through. */
1535 case 1:
1536 x->array[0] = v;
1537 /* Fall through. */
1538 break;
1539 default:
1540 abort ();
1541 }
1542 }
1543
1544 static INLINE int
1545 operand_type_equal (const union i386_operand_type *x,
1546 const union i386_operand_type *y)
1547 {
1548 switch (ARRAY_SIZE(x->array))
1549 {
1550 case 3:
1551 if (x->array[2] != y->array[2])
1552 return 0;
1553 /* Fall through. */
1554 case 2:
1555 if (x->array[1] != y->array[1])
1556 return 0;
1557 /* Fall through. */
1558 case 1:
1559 return x->array[0] == y->array[0];
1560 break;
1561 default:
1562 abort ();
1563 }
1564 }
1565
1566 static INLINE int
1567 cpu_flags_all_zero (const union i386_cpu_flags *x)
1568 {
1569 switch (ARRAY_SIZE(x->array))
1570 {
1571 case 4:
1572 if (x->array[3])
1573 return 0;
1574 /* Fall through. */
1575 case 3:
1576 if (x->array[2])
1577 return 0;
1578 /* Fall through. */
1579 case 2:
1580 if (x->array[1])
1581 return 0;
1582 /* Fall through. */
1583 case 1:
1584 return !x->array[0];
1585 default:
1586 abort ();
1587 }
1588 }
1589
1590 static INLINE int
1591 cpu_flags_equal (const union i386_cpu_flags *x,
1592 const union i386_cpu_flags *y)
1593 {
1594 switch (ARRAY_SIZE(x->array))
1595 {
1596 case 4:
1597 if (x->array[3] != y->array[3])
1598 return 0;
1599 /* Fall through. */
1600 case 3:
1601 if (x->array[2] != y->array[2])
1602 return 0;
1603 /* Fall through. */
1604 case 2:
1605 if (x->array[1] != y->array[1])
1606 return 0;
1607 /* Fall through. */
1608 case 1:
1609 return x->array[0] == y->array[0];
1610 break;
1611 default:
1612 abort ();
1613 }
1614 }
1615
1616 static INLINE int
1617 cpu_flags_check_cpu64 (i386_cpu_flags f)
1618 {
1619 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1620 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1621 }
1622
1623 static INLINE i386_cpu_flags
1624 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1625 {
1626 switch (ARRAY_SIZE (x.array))
1627 {
1628 case 4:
1629 x.array [3] &= y.array [3];
1630 /* Fall through. */
1631 case 3:
1632 x.array [2] &= y.array [2];
1633 /* Fall through. */
1634 case 2:
1635 x.array [1] &= y.array [1];
1636 /* Fall through. */
1637 case 1:
1638 x.array [0] &= y.array [0];
1639 break;
1640 default:
1641 abort ();
1642 }
1643 return x;
1644 }
1645
1646 static INLINE i386_cpu_flags
1647 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1648 {
1649 switch (ARRAY_SIZE (x.array))
1650 {
1651 case 4:
1652 x.array [3] |= y.array [3];
1653 /* Fall through. */
1654 case 3:
1655 x.array [2] |= y.array [2];
1656 /* Fall through. */
1657 case 2:
1658 x.array [1] |= y.array [1];
1659 /* Fall through. */
1660 case 1:
1661 x.array [0] |= y.array [0];
1662 break;
1663 default:
1664 abort ();
1665 }
1666 return x;
1667 }
1668
1669 static INLINE i386_cpu_flags
1670 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1671 {
1672 switch (ARRAY_SIZE (x.array))
1673 {
1674 case 4:
1675 x.array [3] &= ~y.array [3];
1676 /* Fall through. */
1677 case 3:
1678 x.array [2] &= ~y.array [2];
1679 /* Fall through. */
1680 case 2:
1681 x.array [1] &= ~y.array [1];
1682 /* Fall through. */
1683 case 1:
1684 x.array [0] &= ~y.array [0];
1685 break;
1686 default:
1687 abort ();
1688 }
1689 return x;
1690 }
1691
1692 #define CPU_FLAGS_ARCH_MATCH 0x1
1693 #define CPU_FLAGS_64BIT_MATCH 0x2
1694
1695 #define CPU_FLAGS_PERFECT_MATCH \
1696 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1697
1698 /* Return CPU flags match bits. */
1699
1700 static int
1701 cpu_flags_match (const insn_template *t)
1702 {
1703 i386_cpu_flags x = t->cpu_flags;
1704 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1705
1706 x.bitfield.cpu64 = 0;
1707 x.bitfield.cpuno64 = 0;
1708
1709 if (cpu_flags_all_zero (&x))
1710 {
1711 /* This instruction is available on all archs. */
1712 match |= CPU_FLAGS_ARCH_MATCH;
1713 }
1714 else
1715 {
1716 /* This instruction is available only on some archs. */
1717 i386_cpu_flags cpu = cpu_arch_flags;
1718
1719 /* AVX512VL is no standalone feature - match it and then strip it. */
1720 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1721 return match;
1722 x.bitfield.cpuavx512vl = 0;
1723
1724 cpu = cpu_flags_and (x, cpu);
1725 if (!cpu_flags_all_zero (&cpu))
1726 {
1727 if (x.bitfield.cpuavx)
1728 {
1729 /* We need to check a few extra flags with AVX. */
1730 if (cpu.bitfield.cpuavx
1731 && (!t->opcode_modifier.sse2avx || sse2avx)
1732 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1733 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1734 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1735 match |= CPU_FLAGS_ARCH_MATCH;
1736 }
1737 else if (x.bitfield.cpuavx512f)
1738 {
1739 /* We need to check a few extra flags with AVX512F. */
1740 if (cpu.bitfield.cpuavx512f
1741 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1742 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1743 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1744 match |= CPU_FLAGS_ARCH_MATCH;
1745 }
1746 else
1747 match |= CPU_FLAGS_ARCH_MATCH;
1748 }
1749 }
1750 return match;
1751 }
1752
1753 static INLINE i386_operand_type
1754 operand_type_and (i386_operand_type x, i386_operand_type y)
1755 {
1756 switch (ARRAY_SIZE (x.array))
1757 {
1758 case 3:
1759 x.array [2] &= y.array [2];
1760 /* Fall through. */
1761 case 2:
1762 x.array [1] &= y.array [1];
1763 /* Fall through. */
1764 case 1:
1765 x.array [0] &= y.array [0];
1766 break;
1767 default:
1768 abort ();
1769 }
1770 return x;
1771 }
1772
1773 static INLINE i386_operand_type
1774 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1775 {
1776 switch (ARRAY_SIZE (x.array))
1777 {
1778 case 3:
1779 x.array [2] &= ~y.array [2];
1780 /* Fall through. */
1781 case 2:
1782 x.array [1] &= ~y.array [1];
1783 /* Fall through. */
1784 case 1:
1785 x.array [0] &= ~y.array [0];
1786 break;
1787 default:
1788 abort ();
1789 }
1790 return x;
1791 }
1792
1793 static INLINE i386_operand_type
1794 operand_type_or (i386_operand_type x, i386_operand_type y)
1795 {
1796 switch (ARRAY_SIZE (x.array))
1797 {
1798 case 3:
1799 x.array [2] |= y.array [2];
1800 /* Fall through. */
1801 case 2:
1802 x.array [1] |= y.array [1];
1803 /* Fall through. */
1804 case 1:
1805 x.array [0] |= y.array [0];
1806 break;
1807 default:
1808 abort ();
1809 }
1810 return x;
1811 }
1812
1813 static INLINE i386_operand_type
1814 operand_type_xor (i386_operand_type x, i386_operand_type y)
1815 {
1816 switch (ARRAY_SIZE (x.array))
1817 {
1818 case 3:
1819 x.array [2] ^= y.array [2];
1820 /* Fall through. */
1821 case 2:
1822 x.array [1] ^= y.array [1];
1823 /* Fall through. */
1824 case 1:
1825 x.array [0] ^= y.array [0];
1826 break;
1827 default:
1828 abort ();
1829 }
1830 return x;
1831 }
1832
1833 static const i386_operand_type acc32 = OPERAND_TYPE_ACC32;
1834 static const i386_operand_type acc64 = OPERAND_TYPE_ACC64;
1835 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1836 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1837 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1838 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1839 static const i386_operand_type anydisp
1840 = OPERAND_TYPE_ANYDISP;
1841 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1842 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1843 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1844 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1845 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1846 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1847 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1848 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1849 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1850 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1851 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1852 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
1853
1854 enum operand_type
1855 {
1856 reg,
1857 imm,
1858 disp,
1859 anymem
1860 };
1861
1862 static INLINE int
1863 operand_type_check (i386_operand_type t, enum operand_type c)
1864 {
1865 switch (c)
1866 {
1867 case reg:
1868 return t.bitfield.reg;
1869
1870 case imm:
1871 return (t.bitfield.imm8
1872 || t.bitfield.imm8s
1873 || t.bitfield.imm16
1874 || t.bitfield.imm32
1875 || t.bitfield.imm32s
1876 || t.bitfield.imm64);
1877
1878 case disp:
1879 return (t.bitfield.disp8
1880 || t.bitfield.disp16
1881 || t.bitfield.disp32
1882 || t.bitfield.disp32s
1883 || t.bitfield.disp64);
1884
1885 case anymem:
1886 return (t.bitfield.disp8
1887 || t.bitfield.disp16
1888 || t.bitfield.disp32
1889 || t.bitfield.disp32s
1890 || t.bitfield.disp64
1891 || t.bitfield.baseindex);
1892
1893 default:
1894 abort ();
1895 }
1896
1897 return 0;
1898 }
1899
1900 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit on
1901 operand J for instruction template T. */
1902
1903 static INLINE int
1904 match_reg_size (const insn_template *t, unsigned int wanted, unsigned int given)
1905 {
1906 return !((i.types[given].bitfield.byte
1907 && !t->operand_types[wanted].bitfield.byte)
1908 || (i.types[given].bitfield.word
1909 && !t->operand_types[wanted].bitfield.word)
1910 || (i.types[given].bitfield.dword
1911 && !t->operand_types[wanted].bitfield.dword)
1912 || (i.types[given].bitfield.qword
1913 && !t->operand_types[wanted].bitfield.qword)
1914 || (i.types[given].bitfield.tbyte
1915 && !t->operand_types[wanted].bitfield.tbyte));
1916 }
1917
1918 /* Return 1 if there is no conflict in SIMD register on
1919 operand J for instruction template T. */
1920
1921 static INLINE int
1922 match_simd_size (const insn_template *t, unsigned int wanted, unsigned int given)
1923 {
1924 return !((i.types[given].bitfield.xmmword
1925 && !t->operand_types[wanted].bitfield.xmmword)
1926 || (i.types[given].bitfield.ymmword
1927 && !t->operand_types[wanted].bitfield.ymmword)
1928 || (i.types[given].bitfield.zmmword
1929 && !t->operand_types[wanted].bitfield.zmmword));
1930 }
1931
1932 /* Return 1 if there is no conflict in any size on operand J for
1933 instruction template T. */
1934
1935 static INLINE int
1936 match_mem_size (const insn_template *t, unsigned int wanted, unsigned int given)
1937 {
1938 return (match_reg_size (t, wanted, given)
1939 && !((i.types[given].bitfield.unspecified
1940 && !i.broadcast
1941 && !t->operand_types[wanted].bitfield.unspecified)
1942 || (i.types[given].bitfield.fword
1943 && !t->operand_types[wanted].bitfield.fword)
1944 /* For scalar opcode templates to allow register and memory
1945 operands at the same time, some special casing is needed
1946 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
1947 down-conversion vpmov*. */
1948 || ((t->operand_types[wanted].bitfield.regsimd
1949 && !t->opcode_modifier.broadcast
1950 && (t->operand_types[wanted].bitfield.byte
1951 || t->operand_types[wanted].bitfield.word
1952 || t->operand_types[wanted].bitfield.dword
1953 || t->operand_types[wanted].bitfield.qword))
1954 ? (i.types[given].bitfield.xmmword
1955 || i.types[given].bitfield.ymmword
1956 || i.types[given].bitfield.zmmword)
1957 : !match_simd_size(t, wanted, given))));
1958 }
1959
1960 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
1961 operands for instruction template T, and it has MATCH_REVERSE set if there
1962 is no size conflict on any operands for the template with operands reversed
1963 (and the template allows for reversing in the first place). */
1964
1965 #define MATCH_STRAIGHT 1
1966 #define MATCH_REVERSE 2
1967
1968 static INLINE unsigned int
1969 operand_size_match (const insn_template *t)
1970 {
1971 unsigned int j, match = MATCH_STRAIGHT;
1972
1973 /* Don't check jump instructions. */
1974 if (t->opcode_modifier.jump
1975 || t->opcode_modifier.jumpbyte
1976 || t->opcode_modifier.jumpdword
1977 || t->opcode_modifier.jumpintersegment)
1978 return match;
1979
1980 /* Check memory and accumulator operand size. */
1981 for (j = 0; j < i.operands; j++)
1982 {
1983 if (!i.types[j].bitfield.reg && !i.types[j].bitfield.regsimd
1984 && t->operand_types[j].bitfield.anysize)
1985 continue;
1986
1987 if (t->operand_types[j].bitfield.reg
1988 && !match_reg_size (t, j, j))
1989 {
1990 match = 0;
1991 break;
1992 }
1993
1994 if (t->operand_types[j].bitfield.regsimd
1995 && !match_simd_size (t, j, j))
1996 {
1997 match = 0;
1998 break;
1999 }
2000
2001 if (t->operand_types[j].bitfield.acc
2002 && (!match_reg_size (t, j, j) || !match_simd_size (t, j, j)))
2003 {
2004 match = 0;
2005 break;
2006 }
2007
2008 if (i.types[j].bitfield.mem && !match_mem_size (t, j, j))
2009 {
2010 match = 0;
2011 break;
2012 }
2013 }
2014
2015 if (!t->opcode_modifier.d)
2016 {
2017 mismatch:
2018 if (!match)
2019 i.error = operand_size_mismatch;
2020 return match;
2021 }
2022
2023 /* Check reverse. */
2024 gas_assert (i.operands == 2);
2025
2026 for (j = 0; j < 2; j++)
2027 {
2028 if ((t->operand_types[j].bitfield.reg
2029 || t->operand_types[j].bitfield.acc)
2030 && !match_reg_size (t, j, !j))
2031 goto mismatch;
2032
2033 if (i.types[!j].bitfield.mem
2034 && !match_mem_size (t, j, !j))
2035 goto mismatch;
2036 }
2037
2038 return match | MATCH_REVERSE;
2039 }
2040
2041 static INLINE int
2042 operand_type_match (i386_operand_type overlap,
2043 i386_operand_type given)
2044 {
2045 i386_operand_type temp = overlap;
2046
2047 temp.bitfield.jumpabsolute = 0;
2048 temp.bitfield.unspecified = 0;
2049 temp.bitfield.byte = 0;
2050 temp.bitfield.word = 0;
2051 temp.bitfield.dword = 0;
2052 temp.bitfield.fword = 0;
2053 temp.bitfield.qword = 0;
2054 temp.bitfield.tbyte = 0;
2055 temp.bitfield.xmmword = 0;
2056 temp.bitfield.ymmword = 0;
2057 temp.bitfield.zmmword = 0;
2058 if (operand_type_all_zero (&temp))
2059 goto mismatch;
2060
2061 if (given.bitfield.baseindex == overlap.bitfield.baseindex
2062 && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
2063 return 1;
2064
2065 mismatch:
2066 i.error = operand_type_mismatch;
2067 return 0;
2068 }
2069
2070 /* If given types g0 and g1 are registers they must be of the same type
2071 unless the expected operand type register overlap is null.
2072 Memory operand size of certain SIMD instructions is also being checked
2073 here. */
2074
2075 static INLINE int
2076 operand_type_register_match (i386_operand_type g0,
2077 i386_operand_type t0,
2078 i386_operand_type g1,
2079 i386_operand_type t1)
2080 {
2081 if (!g0.bitfield.reg
2082 && !g0.bitfield.regsimd
2083 && (!operand_type_check (g0, anymem)
2084 || g0.bitfield.unspecified
2085 || !t0.bitfield.regsimd))
2086 return 1;
2087
2088 if (!g1.bitfield.reg
2089 && !g1.bitfield.regsimd
2090 && (!operand_type_check (g1, anymem)
2091 || g1.bitfield.unspecified
2092 || !t1.bitfield.regsimd))
2093 return 1;
2094
2095 if (g0.bitfield.byte == g1.bitfield.byte
2096 && g0.bitfield.word == g1.bitfield.word
2097 && g0.bitfield.dword == g1.bitfield.dword
2098 && g0.bitfield.qword == g1.bitfield.qword
2099 && g0.bitfield.xmmword == g1.bitfield.xmmword
2100 && g0.bitfield.ymmword == g1.bitfield.ymmword
2101 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2102 return 1;
2103
2104 if (!(t0.bitfield.byte & t1.bitfield.byte)
2105 && !(t0.bitfield.word & t1.bitfield.word)
2106 && !(t0.bitfield.dword & t1.bitfield.dword)
2107 && !(t0.bitfield.qword & t1.bitfield.qword)
2108 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2109 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2110 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2111 return 1;
2112
2113 i.error = register_type_mismatch;
2114
2115 return 0;
2116 }
2117
2118 static INLINE unsigned int
2119 register_number (const reg_entry *r)
2120 {
2121 unsigned int nr = r->reg_num;
2122
2123 if (r->reg_flags & RegRex)
2124 nr += 8;
2125
2126 if (r->reg_flags & RegVRex)
2127 nr += 16;
2128
2129 return nr;
2130 }
2131
2132 static INLINE unsigned int
2133 mode_from_disp_size (i386_operand_type t)
2134 {
2135 if (t.bitfield.disp8)
2136 return 1;
2137 else if (t.bitfield.disp16
2138 || t.bitfield.disp32
2139 || t.bitfield.disp32s)
2140 return 2;
2141 else
2142 return 0;
2143 }
2144
2145 static INLINE int
2146 fits_in_signed_byte (addressT num)
2147 {
2148 return num + 0x80 <= 0xff;
2149 }
2150
2151 static INLINE int
2152 fits_in_unsigned_byte (addressT num)
2153 {
2154 return num <= 0xff;
2155 }
2156
2157 static INLINE int
2158 fits_in_unsigned_word (addressT num)
2159 {
2160 return num <= 0xffff;
2161 }
2162
2163 static INLINE int
2164 fits_in_signed_word (addressT num)
2165 {
2166 return num + 0x8000 <= 0xffff;
2167 }
2168
2169 static INLINE int
2170 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2171 {
2172 #ifndef BFD64
2173 return 1;
2174 #else
2175 return num + 0x80000000 <= 0xffffffff;
2176 #endif
2177 } /* fits_in_signed_long() */
2178
2179 static INLINE int
2180 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2181 {
2182 #ifndef BFD64
2183 return 1;
2184 #else
2185 return num <= 0xffffffff;
2186 #endif
2187 } /* fits_in_unsigned_long() */
2188
2189 static INLINE int
2190 fits_in_disp8 (offsetT num)
2191 {
2192 int shift = i.memshift;
2193 unsigned int mask;
2194
2195 if (shift == -1)
2196 abort ();
2197
2198 mask = (1 << shift) - 1;
2199
2200 /* Return 0 if NUM isn't properly aligned. */
2201 if ((num & mask))
2202 return 0;
2203
2204 /* Check if NUM will fit in 8bit after shift. */
2205 return fits_in_signed_byte (num >> shift);
2206 }
2207
2208 static INLINE int
2209 fits_in_imm4 (offsetT num)
2210 {
2211 return (num & 0xf) == num;
2212 }
2213
2214 static i386_operand_type
2215 smallest_imm_type (offsetT num)
2216 {
2217 i386_operand_type t;
2218
2219 operand_type_set (&t, 0);
2220 t.bitfield.imm64 = 1;
2221
2222 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2223 {
2224 /* This code is disabled on the 486 because all the Imm1 forms
2225 in the opcode table are slower on the i486. They're the
2226 versions with the implicitly specified single-position
2227 displacement, which has another syntax if you really want to
2228 use that form. */
2229 t.bitfield.imm1 = 1;
2230 t.bitfield.imm8 = 1;
2231 t.bitfield.imm8s = 1;
2232 t.bitfield.imm16 = 1;
2233 t.bitfield.imm32 = 1;
2234 t.bitfield.imm32s = 1;
2235 }
2236 else if (fits_in_signed_byte (num))
2237 {
2238 t.bitfield.imm8 = 1;
2239 t.bitfield.imm8s = 1;
2240 t.bitfield.imm16 = 1;
2241 t.bitfield.imm32 = 1;
2242 t.bitfield.imm32s = 1;
2243 }
2244 else if (fits_in_unsigned_byte (num))
2245 {
2246 t.bitfield.imm8 = 1;
2247 t.bitfield.imm16 = 1;
2248 t.bitfield.imm32 = 1;
2249 t.bitfield.imm32s = 1;
2250 }
2251 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2252 {
2253 t.bitfield.imm16 = 1;
2254 t.bitfield.imm32 = 1;
2255 t.bitfield.imm32s = 1;
2256 }
2257 else if (fits_in_signed_long (num))
2258 {
2259 t.bitfield.imm32 = 1;
2260 t.bitfield.imm32s = 1;
2261 }
2262 else if (fits_in_unsigned_long (num))
2263 t.bitfield.imm32 = 1;
2264
2265 return t;
2266 }
2267
2268 static offsetT
2269 offset_in_range (offsetT val, int size)
2270 {
2271 addressT mask;
2272
2273 switch (size)
2274 {
2275 case 1: mask = ((addressT) 1 << 8) - 1; break;
2276 case 2: mask = ((addressT) 1 << 16) - 1; break;
2277 case 4: mask = ((addressT) 2 << 31) - 1; break;
2278 #ifdef BFD64
2279 case 8: mask = ((addressT) 2 << 63) - 1; break;
2280 #endif
2281 default: abort ();
2282 }
2283
2284 #ifdef BFD64
2285 /* If BFD64, sign extend val for 32bit address mode. */
2286 if (flag_code != CODE_64BIT
2287 || i.prefix[ADDR_PREFIX])
2288 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2289 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2290 #endif
2291
2292 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2293 {
2294 char buf1[40], buf2[40];
2295
2296 sprint_value (buf1, val);
2297 sprint_value (buf2, val & mask);
2298 as_warn (_("%s shortened to %s"), buf1, buf2);
2299 }
2300 return val & mask;
2301 }
2302
2303 enum PREFIX_GROUP
2304 {
2305 PREFIX_EXIST = 0,
2306 PREFIX_LOCK,
2307 PREFIX_REP,
2308 PREFIX_DS,
2309 PREFIX_OTHER
2310 };
2311
2312 /* Returns
2313 a. PREFIX_EXIST if attempting to add a prefix where one from the
2314 same class already exists.
2315 b. PREFIX_LOCK if lock prefix is added.
2316 c. PREFIX_REP if rep/repne prefix is added.
2317 d. PREFIX_DS if ds prefix is added.
2318 e. PREFIX_OTHER if other prefix is added.
2319 */
2320
2321 static enum PREFIX_GROUP
2322 add_prefix (unsigned int prefix)
2323 {
2324 enum PREFIX_GROUP ret = PREFIX_OTHER;
2325 unsigned int q;
2326
2327 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2328 && flag_code == CODE_64BIT)
2329 {
2330 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2331 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2332 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2333 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2334 ret = PREFIX_EXIST;
2335 q = REX_PREFIX;
2336 }
2337 else
2338 {
2339 switch (prefix)
2340 {
2341 default:
2342 abort ();
2343
2344 case DS_PREFIX_OPCODE:
2345 ret = PREFIX_DS;
2346 /* Fall through. */
2347 case CS_PREFIX_OPCODE:
2348 case ES_PREFIX_OPCODE:
2349 case FS_PREFIX_OPCODE:
2350 case GS_PREFIX_OPCODE:
2351 case SS_PREFIX_OPCODE:
2352 q = SEG_PREFIX;
2353 break;
2354
2355 case REPNE_PREFIX_OPCODE:
2356 case REPE_PREFIX_OPCODE:
2357 q = REP_PREFIX;
2358 ret = PREFIX_REP;
2359 break;
2360
2361 case LOCK_PREFIX_OPCODE:
2362 q = LOCK_PREFIX;
2363 ret = PREFIX_LOCK;
2364 break;
2365
2366 case FWAIT_OPCODE:
2367 q = WAIT_PREFIX;
2368 break;
2369
2370 case ADDR_PREFIX_OPCODE:
2371 q = ADDR_PREFIX;
2372 break;
2373
2374 case DATA_PREFIX_OPCODE:
2375 q = DATA_PREFIX;
2376 break;
2377 }
2378 if (i.prefix[q] != 0)
2379 ret = PREFIX_EXIST;
2380 }
2381
2382 if (ret)
2383 {
2384 if (!i.prefix[q])
2385 ++i.prefixes;
2386 i.prefix[q] |= prefix;
2387 }
2388 else
2389 as_bad (_("same type of prefix used twice"));
2390
2391 return ret;
2392 }
2393
2394 static void
2395 update_code_flag (int value, int check)
2396 {
2397 PRINTF_LIKE ((*as_error));
2398
2399 flag_code = (enum flag_code) value;
2400 if (flag_code == CODE_64BIT)
2401 {
2402 cpu_arch_flags.bitfield.cpu64 = 1;
2403 cpu_arch_flags.bitfield.cpuno64 = 0;
2404 }
2405 else
2406 {
2407 cpu_arch_flags.bitfield.cpu64 = 0;
2408 cpu_arch_flags.bitfield.cpuno64 = 1;
2409 }
2410 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2411 {
2412 if (check)
2413 as_error = as_fatal;
2414 else
2415 as_error = as_bad;
2416 (*as_error) (_("64bit mode not supported on `%s'."),
2417 cpu_arch_name ? cpu_arch_name : default_arch);
2418 }
2419 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2420 {
2421 if (check)
2422 as_error = as_fatal;
2423 else
2424 as_error = as_bad;
2425 (*as_error) (_("32bit mode not supported on `%s'."),
2426 cpu_arch_name ? cpu_arch_name : default_arch);
2427 }
2428 stackop_size = '\0';
2429 }
2430
2431 static void
2432 set_code_flag (int value)
2433 {
2434 update_code_flag (value, 0);
2435 }
2436
2437 static void
2438 set_16bit_gcc_code_flag (int new_code_flag)
2439 {
2440 flag_code = (enum flag_code) new_code_flag;
2441 if (flag_code != CODE_16BIT)
2442 abort ();
2443 cpu_arch_flags.bitfield.cpu64 = 0;
2444 cpu_arch_flags.bitfield.cpuno64 = 1;
2445 stackop_size = LONG_MNEM_SUFFIX;
2446 }
2447
2448 static void
2449 set_intel_syntax (int syntax_flag)
2450 {
2451 /* Find out if register prefixing is specified. */
2452 int ask_naked_reg = 0;
2453
2454 SKIP_WHITESPACE ();
2455 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2456 {
2457 char *string;
2458 int e = get_symbol_name (&string);
2459
2460 if (strcmp (string, "prefix") == 0)
2461 ask_naked_reg = 1;
2462 else if (strcmp (string, "noprefix") == 0)
2463 ask_naked_reg = -1;
2464 else
2465 as_bad (_("bad argument to syntax directive."));
2466 (void) restore_line_pointer (e);
2467 }
2468 demand_empty_rest_of_line ();
2469
2470 intel_syntax = syntax_flag;
2471
2472 if (ask_naked_reg == 0)
2473 allow_naked_reg = (intel_syntax
2474 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2475 else
2476 allow_naked_reg = (ask_naked_reg < 0);
2477
2478 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2479
2480 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2481 identifier_chars['$'] = intel_syntax ? '$' : 0;
2482 register_prefix = allow_naked_reg ? "" : "%";
2483 }
2484
2485 static void
2486 set_intel_mnemonic (int mnemonic_flag)
2487 {
2488 intel_mnemonic = mnemonic_flag;
2489 }
2490
2491 static void
2492 set_allow_index_reg (int flag)
2493 {
2494 allow_index_reg = flag;
2495 }
2496
2497 static void
2498 set_check (int what)
2499 {
2500 enum check_kind *kind;
2501 const char *str;
2502
2503 if (what)
2504 {
2505 kind = &operand_check;
2506 str = "operand";
2507 }
2508 else
2509 {
2510 kind = &sse_check;
2511 str = "sse";
2512 }
2513
2514 SKIP_WHITESPACE ();
2515
2516 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2517 {
2518 char *string;
2519 int e = get_symbol_name (&string);
2520
2521 if (strcmp (string, "none") == 0)
2522 *kind = check_none;
2523 else if (strcmp (string, "warning") == 0)
2524 *kind = check_warning;
2525 else if (strcmp (string, "error") == 0)
2526 *kind = check_error;
2527 else
2528 as_bad (_("bad argument to %s_check directive."), str);
2529 (void) restore_line_pointer (e);
2530 }
2531 else
2532 as_bad (_("missing argument for %s_check directive"), str);
2533
2534 demand_empty_rest_of_line ();
2535 }
2536
2537 static void
2538 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2539 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2540 {
2541 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2542 static const char *arch;
2543
2544 /* Intel LIOM is only supported on ELF. */
2545 if (!IS_ELF)
2546 return;
2547
2548 if (!arch)
2549 {
2550 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2551 use default_arch. */
2552 arch = cpu_arch_name;
2553 if (!arch)
2554 arch = default_arch;
2555 }
2556
2557 /* If we are targeting Intel MCU, we must enable it. */
2558 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2559 || new_flag.bitfield.cpuiamcu)
2560 return;
2561
2562 /* If we are targeting Intel L1OM, we must enable it. */
2563 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2564 || new_flag.bitfield.cpul1om)
2565 return;
2566
2567 /* If we are targeting Intel K1OM, we must enable it. */
2568 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2569 || new_flag.bitfield.cpuk1om)
2570 return;
2571
2572 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2573 #endif
2574 }
2575
2576 static void
2577 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2578 {
2579 SKIP_WHITESPACE ();
2580
2581 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2582 {
2583 char *string;
2584 int e = get_symbol_name (&string);
2585 unsigned int j;
2586 i386_cpu_flags flags;
2587
2588 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2589 {
2590 if (strcmp (string, cpu_arch[j].name) == 0)
2591 {
2592 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2593
2594 if (*string != '.')
2595 {
2596 cpu_arch_name = cpu_arch[j].name;
2597 cpu_sub_arch_name = NULL;
2598 cpu_arch_flags = cpu_arch[j].flags;
2599 if (flag_code == CODE_64BIT)
2600 {
2601 cpu_arch_flags.bitfield.cpu64 = 1;
2602 cpu_arch_flags.bitfield.cpuno64 = 0;
2603 }
2604 else
2605 {
2606 cpu_arch_flags.bitfield.cpu64 = 0;
2607 cpu_arch_flags.bitfield.cpuno64 = 1;
2608 }
2609 cpu_arch_isa = cpu_arch[j].type;
2610 cpu_arch_isa_flags = cpu_arch[j].flags;
2611 if (!cpu_arch_tune_set)
2612 {
2613 cpu_arch_tune = cpu_arch_isa;
2614 cpu_arch_tune_flags = cpu_arch_isa_flags;
2615 }
2616 break;
2617 }
2618
2619 flags = cpu_flags_or (cpu_arch_flags,
2620 cpu_arch[j].flags);
2621
2622 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2623 {
2624 if (cpu_sub_arch_name)
2625 {
2626 char *name = cpu_sub_arch_name;
2627 cpu_sub_arch_name = concat (name,
2628 cpu_arch[j].name,
2629 (const char *) NULL);
2630 free (name);
2631 }
2632 else
2633 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2634 cpu_arch_flags = flags;
2635 cpu_arch_isa_flags = flags;
2636 }
2637 else
2638 cpu_arch_isa_flags
2639 = cpu_flags_or (cpu_arch_isa_flags,
2640 cpu_arch[j].flags);
2641 (void) restore_line_pointer (e);
2642 demand_empty_rest_of_line ();
2643 return;
2644 }
2645 }
2646
2647 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2648 {
2649 /* Disable an ISA extension. */
2650 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2651 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2652 {
2653 flags = cpu_flags_and_not (cpu_arch_flags,
2654 cpu_noarch[j].flags);
2655 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2656 {
2657 if (cpu_sub_arch_name)
2658 {
2659 char *name = cpu_sub_arch_name;
2660 cpu_sub_arch_name = concat (name, string,
2661 (const char *) NULL);
2662 free (name);
2663 }
2664 else
2665 cpu_sub_arch_name = xstrdup (string);
2666 cpu_arch_flags = flags;
2667 cpu_arch_isa_flags = flags;
2668 }
2669 (void) restore_line_pointer (e);
2670 demand_empty_rest_of_line ();
2671 return;
2672 }
2673
2674 j = ARRAY_SIZE (cpu_arch);
2675 }
2676
2677 if (j >= ARRAY_SIZE (cpu_arch))
2678 as_bad (_("no such architecture: `%s'"), string);
2679
2680 *input_line_pointer = e;
2681 }
2682 else
2683 as_bad (_("missing cpu architecture"));
2684
2685 no_cond_jump_promotion = 0;
2686 if (*input_line_pointer == ','
2687 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2688 {
2689 char *string;
2690 char e;
2691
2692 ++input_line_pointer;
2693 e = get_symbol_name (&string);
2694
2695 if (strcmp (string, "nojumps") == 0)
2696 no_cond_jump_promotion = 1;
2697 else if (strcmp (string, "jumps") == 0)
2698 ;
2699 else
2700 as_bad (_("no such architecture modifier: `%s'"), string);
2701
2702 (void) restore_line_pointer (e);
2703 }
2704
2705 demand_empty_rest_of_line ();
2706 }
2707
2708 enum bfd_architecture
2709 i386_arch (void)
2710 {
2711 if (cpu_arch_isa == PROCESSOR_L1OM)
2712 {
2713 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2714 || flag_code != CODE_64BIT)
2715 as_fatal (_("Intel L1OM is 64bit ELF only"));
2716 return bfd_arch_l1om;
2717 }
2718 else if (cpu_arch_isa == PROCESSOR_K1OM)
2719 {
2720 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2721 || flag_code != CODE_64BIT)
2722 as_fatal (_("Intel K1OM is 64bit ELF only"));
2723 return bfd_arch_k1om;
2724 }
2725 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2726 {
2727 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2728 || flag_code == CODE_64BIT)
2729 as_fatal (_("Intel MCU is 32bit ELF only"));
2730 return bfd_arch_iamcu;
2731 }
2732 else
2733 return bfd_arch_i386;
2734 }
2735
2736 unsigned long
2737 i386_mach (void)
2738 {
2739 if (!strncmp (default_arch, "x86_64", 6))
2740 {
2741 if (cpu_arch_isa == PROCESSOR_L1OM)
2742 {
2743 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2744 || default_arch[6] != '\0')
2745 as_fatal (_("Intel L1OM is 64bit ELF only"));
2746 return bfd_mach_l1om;
2747 }
2748 else if (cpu_arch_isa == PROCESSOR_K1OM)
2749 {
2750 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2751 || default_arch[6] != '\0')
2752 as_fatal (_("Intel K1OM is 64bit ELF only"));
2753 return bfd_mach_k1om;
2754 }
2755 else if (default_arch[6] == '\0')
2756 return bfd_mach_x86_64;
2757 else
2758 return bfd_mach_x64_32;
2759 }
2760 else if (!strcmp (default_arch, "i386")
2761 || !strcmp (default_arch, "iamcu"))
2762 {
2763 if (cpu_arch_isa == PROCESSOR_IAMCU)
2764 {
2765 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2766 as_fatal (_("Intel MCU is 32bit ELF only"));
2767 return bfd_mach_i386_iamcu;
2768 }
2769 else
2770 return bfd_mach_i386_i386;
2771 }
2772 else
2773 as_fatal (_("unknown architecture"));
2774 }
2775 \f
2776 void
2777 md_begin (void)
2778 {
2779 const char *hash_err;
2780
2781 /* Support pseudo prefixes like {disp32}. */
2782 lex_type ['{'] = LEX_BEGIN_NAME;
2783
2784 /* Initialize op_hash hash table. */
2785 op_hash = hash_new ();
2786
2787 {
2788 const insn_template *optab;
2789 templates *core_optab;
2790
2791 /* Setup for loop. */
2792 optab = i386_optab;
2793 core_optab = XNEW (templates);
2794 core_optab->start = optab;
2795
2796 while (1)
2797 {
2798 ++optab;
2799 if (optab->name == NULL
2800 || strcmp (optab->name, (optab - 1)->name) != 0)
2801 {
2802 /* different name --> ship out current template list;
2803 add to hash table; & begin anew. */
2804 core_optab->end = optab;
2805 hash_err = hash_insert (op_hash,
2806 (optab - 1)->name,
2807 (void *) core_optab);
2808 if (hash_err)
2809 {
2810 as_fatal (_("can't hash %s: %s"),
2811 (optab - 1)->name,
2812 hash_err);
2813 }
2814 if (optab->name == NULL)
2815 break;
2816 core_optab = XNEW (templates);
2817 core_optab->start = optab;
2818 }
2819 }
2820 }
2821
2822 /* Initialize reg_hash hash table. */
2823 reg_hash = hash_new ();
2824 {
2825 const reg_entry *regtab;
2826 unsigned int regtab_size = i386_regtab_size;
2827
2828 for (regtab = i386_regtab; regtab_size--; regtab++)
2829 {
2830 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2831 if (hash_err)
2832 as_fatal (_("can't hash %s: %s"),
2833 regtab->reg_name,
2834 hash_err);
2835 }
2836 }
2837
2838 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
2839 {
2840 int c;
2841 char *p;
2842
2843 for (c = 0; c < 256; c++)
2844 {
2845 if (ISDIGIT (c))
2846 {
2847 digit_chars[c] = c;
2848 mnemonic_chars[c] = c;
2849 register_chars[c] = c;
2850 operand_chars[c] = c;
2851 }
2852 else if (ISLOWER (c))
2853 {
2854 mnemonic_chars[c] = c;
2855 register_chars[c] = c;
2856 operand_chars[c] = c;
2857 }
2858 else if (ISUPPER (c))
2859 {
2860 mnemonic_chars[c] = TOLOWER (c);
2861 register_chars[c] = mnemonic_chars[c];
2862 operand_chars[c] = c;
2863 }
2864 else if (c == '{' || c == '}')
2865 {
2866 mnemonic_chars[c] = c;
2867 operand_chars[c] = c;
2868 }
2869
2870 if (ISALPHA (c) || ISDIGIT (c))
2871 identifier_chars[c] = c;
2872 else if (c >= 128)
2873 {
2874 identifier_chars[c] = c;
2875 operand_chars[c] = c;
2876 }
2877 }
2878
2879 #ifdef LEX_AT
2880 identifier_chars['@'] = '@';
2881 #endif
2882 #ifdef LEX_QM
2883 identifier_chars['?'] = '?';
2884 operand_chars['?'] = '?';
2885 #endif
2886 digit_chars['-'] = '-';
2887 mnemonic_chars['_'] = '_';
2888 mnemonic_chars['-'] = '-';
2889 mnemonic_chars['.'] = '.';
2890 identifier_chars['_'] = '_';
2891 identifier_chars['.'] = '.';
2892
2893 for (p = operand_special_chars; *p != '\0'; p++)
2894 operand_chars[(unsigned char) *p] = *p;
2895 }
2896
2897 if (flag_code == CODE_64BIT)
2898 {
2899 #if defined (OBJ_COFF) && defined (TE_PE)
2900 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2901 ? 32 : 16);
2902 #else
2903 x86_dwarf2_return_column = 16;
2904 #endif
2905 x86_cie_data_alignment = -8;
2906 }
2907 else
2908 {
2909 x86_dwarf2_return_column = 8;
2910 x86_cie_data_alignment = -4;
2911 }
2912 }
2913
2914 void
2915 i386_print_statistics (FILE *file)
2916 {
2917 hash_print_statistics (file, "i386 opcode", op_hash);
2918 hash_print_statistics (file, "i386 register", reg_hash);
2919 }
2920 \f
2921 #ifdef DEBUG386
2922
2923 /* Debugging routines for md_assemble. */
2924 static void pte (insn_template *);
2925 static void pt (i386_operand_type);
2926 static void pe (expressionS *);
2927 static void ps (symbolS *);
2928
2929 static void
2930 pi (char *line, i386_insn *x)
2931 {
2932 unsigned int j;
2933
2934 fprintf (stdout, "%s: template ", line);
2935 pte (&x->tm);
2936 fprintf (stdout, " address: base %s index %s scale %x\n",
2937 x->base_reg ? x->base_reg->reg_name : "none",
2938 x->index_reg ? x->index_reg->reg_name : "none",
2939 x->log2_scale_factor);
2940 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
2941 x->rm.mode, x->rm.reg, x->rm.regmem);
2942 fprintf (stdout, " sib: base %x index %x scale %x\n",
2943 x->sib.base, x->sib.index, x->sib.scale);
2944 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
2945 (x->rex & REX_W) != 0,
2946 (x->rex & REX_R) != 0,
2947 (x->rex & REX_X) != 0,
2948 (x->rex & REX_B) != 0);
2949 for (j = 0; j < x->operands; j++)
2950 {
2951 fprintf (stdout, " #%d: ", j + 1);
2952 pt (x->types[j]);
2953 fprintf (stdout, "\n");
2954 if (x->types[j].bitfield.reg
2955 || x->types[j].bitfield.regmmx
2956 || x->types[j].bitfield.regsimd
2957 || x->types[j].bitfield.sreg2
2958 || x->types[j].bitfield.sreg3
2959 || x->types[j].bitfield.control
2960 || x->types[j].bitfield.debug
2961 || x->types[j].bitfield.test)
2962 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
2963 if (operand_type_check (x->types[j], imm))
2964 pe (x->op[j].imms);
2965 if (operand_type_check (x->types[j], disp))
2966 pe (x->op[j].disps);
2967 }
2968 }
2969
2970 static void
2971 pte (insn_template *t)
2972 {
2973 unsigned int j;
2974 fprintf (stdout, " %d operands ", t->operands);
2975 fprintf (stdout, "opcode %x ", t->base_opcode);
2976 if (t->extension_opcode != None)
2977 fprintf (stdout, "ext %x ", t->extension_opcode);
2978 if (t->opcode_modifier.d)
2979 fprintf (stdout, "D");
2980 if (t->opcode_modifier.w)
2981 fprintf (stdout, "W");
2982 fprintf (stdout, "\n");
2983 for (j = 0; j < t->operands; j++)
2984 {
2985 fprintf (stdout, " #%d type ", j + 1);
2986 pt (t->operand_types[j]);
2987 fprintf (stdout, "\n");
2988 }
2989 }
2990
2991 static void
2992 pe (expressionS *e)
2993 {
2994 fprintf (stdout, " operation %d\n", e->X_op);
2995 fprintf (stdout, " add_number %ld (%lx)\n",
2996 (long) e->X_add_number, (long) e->X_add_number);
2997 if (e->X_add_symbol)
2998 {
2999 fprintf (stdout, " add_symbol ");
3000 ps (e->X_add_symbol);
3001 fprintf (stdout, "\n");
3002 }
3003 if (e->X_op_symbol)
3004 {
3005 fprintf (stdout, " op_symbol ");
3006 ps (e->X_op_symbol);
3007 fprintf (stdout, "\n");
3008 }
3009 }
3010
3011 static void
3012 ps (symbolS *s)
3013 {
3014 fprintf (stdout, "%s type %s%s",
3015 S_GET_NAME (s),
3016 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3017 segment_name (S_GET_SEGMENT (s)));
3018 }
3019
3020 static struct type_name
3021 {
3022 i386_operand_type mask;
3023 const char *name;
3024 }
3025 const type_names[] =
3026 {
3027 { OPERAND_TYPE_REG8, "r8" },
3028 { OPERAND_TYPE_REG16, "r16" },
3029 { OPERAND_TYPE_REG32, "r32" },
3030 { OPERAND_TYPE_REG64, "r64" },
3031 { OPERAND_TYPE_IMM8, "i8" },
3032 { OPERAND_TYPE_IMM8, "i8s" },
3033 { OPERAND_TYPE_IMM16, "i16" },
3034 { OPERAND_TYPE_IMM32, "i32" },
3035 { OPERAND_TYPE_IMM32S, "i32s" },
3036 { OPERAND_TYPE_IMM64, "i64" },
3037 { OPERAND_TYPE_IMM1, "i1" },
3038 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3039 { OPERAND_TYPE_DISP8, "d8" },
3040 { OPERAND_TYPE_DISP16, "d16" },
3041 { OPERAND_TYPE_DISP32, "d32" },
3042 { OPERAND_TYPE_DISP32S, "d32s" },
3043 { OPERAND_TYPE_DISP64, "d64" },
3044 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3045 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3046 { OPERAND_TYPE_CONTROL, "control reg" },
3047 { OPERAND_TYPE_TEST, "test reg" },
3048 { OPERAND_TYPE_DEBUG, "debug reg" },
3049 { OPERAND_TYPE_FLOATREG, "FReg" },
3050 { OPERAND_TYPE_FLOATACC, "FAcc" },
3051 { OPERAND_TYPE_SREG2, "SReg2" },
3052 { OPERAND_TYPE_SREG3, "SReg3" },
3053 { OPERAND_TYPE_ACC, "Acc" },
3054 { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
3055 { OPERAND_TYPE_REGMMX, "rMMX" },
3056 { OPERAND_TYPE_REGXMM, "rXMM" },
3057 { OPERAND_TYPE_REGYMM, "rYMM" },
3058 { OPERAND_TYPE_REGZMM, "rZMM" },
3059 { OPERAND_TYPE_REGMASK, "Mask reg" },
3060 { OPERAND_TYPE_ESSEG, "es" },
3061 };
3062
3063 static void
3064 pt (i386_operand_type t)
3065 {
3066 unsigned int j;
3067 i386_operand_type a;
3068
3069 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3070 {
3071 a = operand_type_and (t, type_names[j].mask);
3072 if (!operand_type_all_zero (&a))
3073 fprintf (stdout, "%s, ", type_names[j].name);
3074 }
3075 fflush (stdout);
3076 }
3077
3078 #endif /* DEBUG386 */
3079 \f
3080 static bfd_reloc_code_real_type
3081 reloc (unsigned int size,
3082 int pcrel,
3083 int sign,
3084 bfd_reloc_code_real_type other)
3085 {
3086 if (other != NO_RELOC)
3087 {
3088 reloc_howto_type *rel;
3089
3090 if (size == 8)
3091 switch (other)
3092 {
3093 case BFD_RELOC_X86_64_GOT32:
3094 return BFD_RELOC_X86_64_GOT64;
3095 break;
3096 case BFD_RELOC_X86_64_GOTPLT64:
3097 return BFD_RELOC_X86_64_GOTPLT64;
3098 break;
3099 case BFD_RELOC_X86_64_PLTOFF64:
3100 return BFD_RELOC_X86_64_PLTOFF64;
3101 break;
3102 case BFD_RELOC_X86_64_GOTPC32:
3103 other = BFD_RELOC_X86_64_GOTPC64;
3104 break;
3105 case BFD_RELOC_X86_64_GOTPCREL:
3106 other = BFD_RELOC_X86_64_GOTPCREL64;
3107 break;
3108 case BFD_RELOC_X86_64_TPOFF32:
3109 other = BFD_RELOC_X86_64_TPOFF64;
3110 break;
3111 case BFD_RELOC_X86_64_DTPOFF32:
3112 other = BFD_RELOC_X86_64_DTPOFF64;
3113 break;
3114 default:
3115 break;
3116 }
3117
3118 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3119 if (other == BFD_RELOC_SIZE32)
3120 {
3121 if (size == 8)
3122 other = BFD_RELOC_SIZE64;
3123 if (pcrel)
3124 {
3125 as_bad (_("there are no pc-relative size relocations"));
3126 return NO_RELOC;
3127 }
3128 }
3129 #endif
3130
3131 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3132 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3133 sign = -1;
3134
3135 rel = bfd_reloc_type_lookup (stdoutput, other);
3136 if (!rel)
3137 as_bad (_("unknown relocation (%u)"), other);
3138 else if (size != bfd_get_reloc_size (rel))
3139 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3140 bfd_get_reloc_size (rel),
3141 size);
3142 else if (pcrel && !rel->pc_relative)
3143 as_bad (_("non-pc-relative relocation for pc-relative field"));
3144 else if ((rel->complain_on_overflow == complain_overflow_signed
3145 && !sign)
3146 || (rel->complain_on_overflow == complain_overflow_unsigned
3147 && sign > 0))
3148 as_bad (_("relocated field and relocation type differ in signedness"));
3149 else
3150 return other;
3151 return NO_RELOC;
3152 }
3153
3154 if (pcrel)
3155 {
3156 if (!sign)
3157 as_bad (_("there are no unsigned pc-relative relocations"));
3158 switch (size)
3159 {
3160 case 1: return BFD_RELOC_8_PCREL;
3161 case 2: return BFD_RELOC_16_PCREL;
3162 case 4: return BFD_RELOC_32_PCREL;
3163 case 8: return BFD_RELOC_64_PCREL;
3164 }
3165 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3166 }
3167 else
3168 {
3169 if (sign > 0)
3170 switch (size)
3171 {
3172 case 4: return BFD_RELOC_X86_64_32S;
3173 }
3174 else
3175 switch (size)
3176 {
3177 case 1: return BFD_RELOC_8;
3178 case 2: return BFD_RELOC_16;
3179 case 4: return BFD_RELOC_32;
3180 case 8: return BFD_RELOC_64;
3181 }
3182 as_bad (_("cannot do %s %u byte relocation"),
3183 sign > 0 ? "signed" : "unsigned", size);
3184 }
3185
3186 return NO_RELOC;
3187 }
3188
3189 /* Here we decide which fixups can be adjusted to make them relative to
3190 the beginning of the section instead of the symbol. Basically we need
3191 to make sure that the dynamic relocations are done correctly, so in
3192 some cases we force the original symbol to be used. */
3193
3194 int
3195 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3196 {
3197 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3198 if (!IS_ELF)
3199 return 1;
3200
3201 /* Don't adjust pc-relative references to merge sections in 64-bit
3202 mode. */
3203 if (use_rela_relocations
3204 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3205 && fixP->fx_pcrel)
3206 return 0;
3207
3208 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3209 and changed later by validate_fix. */
3210 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3211 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3212 return 0;
3213
3214 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3215 for size relocations. */
3216 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3217 || fixP->fx_r_type == BFD_RELOC_SIZE64
3218 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3219 || fixP->fx_r_type == BFD_RELOC_386_PLT32
3220 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3221 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3222 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3223 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3224 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3225 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3226 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3227 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3228 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3229 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3230 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3231 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3232 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3233 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3234 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3235 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3236 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3237 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3238 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3239 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3240 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3241 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3242 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3243 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3244 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3245 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3246 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3247 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3248 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3249 return 0;
3250 #endif
3251 return 1;
3252 }
3253
3254 static int
3255 intel_float_operand (const char *mnemonic)
3256 {
3257 /* Note that the value returned is meaningful only for opcodes with (memory)
3258 operands, hence the code here is free to improperly handle opcodes that
3259 have no operands (for better performance and smaller code). */
3260
3261 if (mnemonic[0] != 'f')
3262 return 0; /* non-math */
3263
3264 switch (mnemonic[1])
3265 {
3266 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3267 the fs segment override prefix not currently handled because no
3268 call path can make opcodes without operands get here */
3269 case 'i':
3270 return 2 /* integer op */;
3271 case 'l':
3272 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3273 return 3; /* fldcw/fldenv */
3274 break;
3275 case 'n':
3276 if (mnemonic[2] != 'o' /* fnop */)
3277 return 3; /* non-waiting control op */
3278 break;
3279 case 'r':
3280 if (mnemonic[2] == 's')
3281 return 3; /* frstor/frstpm */
3282 break;
3283 case 's':
3284 if (mnemonic[2] == 'a')
3285 return 3; /* fsave */
3286 if (mnemonic[2] == 't')
3287 {
3288 switch (mnemonic[3])
3289 {
3290 case 'c': /* fstcw */
3291 case 'd': /* fstdw */
3292 case 'e': /* fstenv */
3293 case 's': /* fsts[gw] */
3294 return 3;
3295 }
3296 }
3297 break;
3298 case 'x':
3299 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3300 return 0; /* fxsave/fxrstor are not really math ops */
3301 break;
3302 }
3303
3304 return 1;
3305 }
3306
3307 /* Build the VEX prefix. */
3308
3309 static void
3310 build_vex_prefix (const insn_template *t)
3311 {
3312 unsigned int register_specifier;
3313 unsigned int implied_prefix;
3314 unsigned int vector_length;
3315
3316 /* Check register specifier. */
3317 if (i.vex.register_specifier)
3318 {
3319 register_specifier =
3320 ~register_number (i.vex.register_specifier) & 0xf;
3321 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3322 }
3323 else
3324 register_specifier = 0xf;
3325
3326 /* Use 2-byte VEX prefix by swapping destination and source
3327 operand. */
3328 if (i.vec_encoding != vex_encoding_vex3
3329 && i.dir_encoding == dir_encoding_default
3330 && i.operands == i.reg_operands
3331 && i.tm.opcode_modifier.vexopcode == VEX0F
3332 && i.tm.opcode_modifier.load
3333 && i.rex == REX_B)
3334 {
3335 unsigned int xchg = i.operands - 1;
3336 union i386_op temp_op;
3337 i386_operand_type temp_type;
3338
3339 temp_type = i.types[xchg];
3340 i.types[xchg] = i.types[0];
3341 i.types[0] = temp_type;
3342 temp_op = i.op[xchg];
3343 i.op[xchg] = i.op[0];
3344 i.op[0] = temp_op;
3345
3346 gas_assert (i.rm.mode == 3);
3347
3348 i.rex = REX_R;
3349 xchg = i.rm.regmem;
3350 i.rm.regmem = i.rm.reg;
3351 i.rm.reg = xchg;
3352
3353 /* Use the next insn. */
3354 i.tm = t[1];
3355 }
3356
3357 if (i.tm.opcode_modifier.vex == VEXScalar)
3358 vector_length = avxscalar;
3359 else if (i.tm.opcode_modifier.vex == VEX256)
3360 vector_length = 1;
3361 else
3362 {
3363 unsigned int op;
3364
3365 vector_length = 0;
3366 for (op = 0; op < t->operands; ++op)
3367 if (t->operand_types[op].bitfield.xmmword
3368 && t->operand_types[op].bitfield.ymmword
3369 && i.types[op].bitfield.ymmword)
3370 {
3371 vector_length = 1;
3372 break;
3373 }
3374 }
3375
3376 switch ((i.tm.base_opcode >> 8) & 0xff)
3377 {
3378 case 0:
3379 implied_prefix = 0;
3380 break;
3381 case DATA_PREFIX_OPCODE:
3382 implied_prefix = 1;
3383 break;
3384 case REPE_PREFIX_OPCODE:
3385 implied_prefix = 2;
3386 break;
3387 case REPNE_PREFIX_OPCODE:
3388 implied_prefix = 3;
3389 break;
3390 default:
3391 abort ();
3392 }
3393
3394 /* Use 2-byte VEX prefix if possible. */
3395 if (i.vec_encoding != vex_encoding_vex3
3396 && i.tm.opcode_modifier.vexopcode == VEX0F
3397 && i.tm.opcode_modifier.vexw != VEXW1
3398 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3399 {
3400 /* 2-byte VEX prefix. */
3401 unsigned int r;
3402
3403 i.vex.length = 2;
3404 i.vex.bytes[0] = 0xc5;
3405
3406 /* Check the REX.R bit. */
3407 r = (i.rex & REX_R) ? 0 : 1;
3408 i.vex.bytes[1] = (r << 7
3409 | register_specifier << 3
3410 | vector_length << 2
3411 | implied_prefix);
3412 }
3413 else
3414 {
3415 /* 3-byte VEX prefix. */
3416 unsigned int m, w;
3417
3418 i.vex.length = 3;
3419
3420 switch (i.tm.opcode_modifier.vexopcode)
3421 {
3422 case VEX0F:
3423 m = 0x1;
3424 i.vex.bytes[0] = 0xc4;
3425 break;
3426 case VEX0F38:
3427 m = 0x2;
3428 i.vex.bytes[0] = 0xc4;
3429 break;
3430 case VEX0F3A:
3431 m = 0x3;
3432 i.vex.bytes[0] = 0xc4;
3433 break;
3434 case XOP08:
3435 m = 0x8;
3436 i.vex.bytes[0] = 0x8f;
3437 break;
3438 case XOP09:
3439 m = 0x9;
3440 i.vex.bytes[0] = 0x8f;
3441 break;
3442 case XOP0A:
3443 m = 0xa;
3444 i.vex.bytes[0] = 0x8f;
3445 break;
3446 default:
3447 abort ();
3448 }
3449
3450 /* The high 3 bits of the second VEX byte are 1's compliment
3451 of RXB bits from REX. */
3452 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3453
3454 /* Check the REX.W bit. */
3455 w = (i.rex & REX_W) ? 1 : 0;
3456 if (i.tm.opcode_modifier.vexw == VEXW1)
3457 w = 1;
3458
3459 i.vex.bytes[2] = (w << 7
3460 | register_specifier << 3
3461 | vector_length << 2
3462 | implied_prefix);
3463 }
3464 }
3465
3466 static INLINE bfd_boolean
3467 is_evex_encoding (const insn_template *t)
3468 {
3469 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3470 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3471 || t->opcode_modifier.staticrounding || t->opcode_modifier.sae;
3472 }
3473
3474 /* Build the EVEX prefix. */
3475
3476 static void
3477 build_evex_prefix (void)
3478 {
3479 unsigned int register_specifier;
3480 unsigned int implied_prefix;
3481 unsigned int m, w;
3482 rex_byte vrex_used = 0;
3483
3484 /* Check register specifier. */
3485 if (i.vex.register_specifier)
3486 {
3487 gas_assert ((i.vrex & REX_X) == 0);
3488
3489 register_specifier = i.vex.register_specifier->reg_num;
3490 if ((i.vex.register_specifier->reg_flags & RegRex))
3491 register_specifier += 8;
3492 /* The upper 16 registers are encoded in the fourth byte of the
3493 EVEX prefix. */
3494 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3495 i.vex.bytes[3] = 0x8;
3496 register_specifier = ~register_specifier & 0xf;
3497 }
3498 else
3499 {
3500 register_specifier = 0xf;
3501
3502 /* Encode upper 16 vector index register in the fourth byte of
3503 the EVEX prefix. */
3504 if (!(i.vrex & REX_X))
3505 i.vex.bytes[3] = 0x8;
3506 else
3507 vrex_used |= REX_X;
3508 }
3509
3510 switch ((i.tm.base_opcode >> 8) & 0xff)
3511 {
3512 case 0:
3513 implied_prefix = 0;
3514 break;
3515 case DATA_PREFIX_OPCODE:
3516 implied_prefix = 1;
3517 break;
3518 case REPE_PREFIX_OPCODE:
3519 implied_prefix = 2;
3520 break;
3521 case REPNE_PREFIX_OPCODE:
3522 implied_prefix = 3;
3523 break;
3524 default:
3525 abort ();
3526 }
3527
3528 /* 4 byte EVEX prefix. */
3529 i.vex.length = 4;
3530 i.vex.bytes[0] = 0x62;
3531
3532 /* mmmm bits. */
3533 switch (i.tm.opcode_modifier.vexopcode)
3534 {
3535 case VEX0F:
3536 m = 1;
3537 break;
3538 case VEX0F38:
3539 m = 2;
3540 break;
3541 case VEX0F3A:
3542 m = 3;
3543 break;
3544 default:
3545 abort ();
3546 break;
3547 }
3548
3549 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3550 bits from REX. */
3551 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3552
3553 /* The fifth bit of the second EVEX byte is 1's compliment of the
3554 REX_R bit in VREX. */
3555 if (!(i.vrex & REX_R))
3556 i.vex.bytes[1] |= 0x10;
3557 else
3558 vrex_used |= REX_R;
3559
3560 if ((i.reg_operands + i.imm_operands) == i.operands)
3561 {
3562 /* When all operands are registers, the REX_X bit in REX is not
3563 used. We reuse it to encode the upper 16 registers, which is
3564 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3565 as 1's compliment. */
3566 if ((i.vrex & REX_B))
3567 {
3568 vrex_used |= REX_B;
3569 i.vex.bytes[1] &= ~0x40;
3570 }
3571 }
3572
3573 /* EVEX instructions shouldn't need the REX prefix. */
3574 i.vrex &= ~vrex_used;
3575 gas_assert (i.vrex == 0);
3576
3577 /* Check the REX.W bit. */
3578 w = (i.rex & REX_W) ? 1 : 0;
3579 if (i.tm.opcode_modifier.vexw)
3580 {
3581 if (i.tm.opcode_modifier.vexw == VEXW1)
3582 w = 1;
3583 }
3584 /* If w is not set it means we are dealing with WIG instruction. */
3585 else if (!w)
3586 {
3587 if (evexwig == evexw1)
3588 w = 1;
3589 }
3590
3591 /* Encode the U bit. */
3592 implied_prefix |= 0x4;
3593
3594 /* The third byte of the EVEX prefix. */
3595 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3596
3597 /* The fourth byte of the EVEX prefix. */
3598 /* The zeroing-masking bit. */
3599 if (i.mask && i.mask->zeroing)
3600 i.vex.bytes[3] |= 0x80;
3601
3602 /* Don't always set the broadcast bit if there is no RC. */
3603 if (!i.rounding)
3604 {
3605 /* Encode the vector length. */
3606 unsigned int vec_length;
3607
3608 if (!i.tm.opcode_modifier.evex
3609 || i.tm.opcode_modifier.evex == EVEXDYN)
3610 {
3611 unsigned int op;
3612
3613 vec_length = 0;
3614 for (op = 0; op < i.tm.operands; ++op)
3615 if (i.tm.operand_types[op].bitfield.xmmword
3616 + i.tm.operand_types[op].bitfield.ymmword
3617 + i.tm.operand_types[op].bitfield.zmmword > 1)
3618 {
3619 if (i.types[op].bitfield.zmmword)
3620 i.tm.opcode_modifier.evex = EVEX512;
3621 else if (i.types[op].bitfield.ymmword)
3622 i.tm.opcode_modifier.evex = EVEX256;
3623 else if (i.types[op].bitfield.xmmword)
3624 i.tm.opcode_modifier.evex = EVEX128;
3625 else
3626 continue;
3627 break;
3628 }
3629 }
3630
3631 switch (i.tm.opcode_modifier.evex)
3632 {
3633 case EVEXLIG: /* LL' is ignored */
3634 vec_length = evexlig << 5;
3635 break;
3636 case EVEX128:
3637 vec_length = 0 << 5;
3638 break;
3639 case EVEX256:
3640 vec_length = 1 << 5;
3641 break;
3642 case EVEX512:
3643 vec_length = 2 << 5;
3644 break;
3645 default:
3646 abort ();
3647 break;
3648 }
3649 i.vex.bytes[3] |= vec_length;
3650 /* Encode the broadcast bit. */
3651 if (i.broadcast)
3652 i.vex.bytes[3] |= 0x10;
3653 }
3654 else
3655 {
3656 if (i.rounding->type != saeonly)
3657 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3658 else
3659 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3660 }
3661
3662 if (i.mask && i.mask->mask)
3663 i.vex.bytes[3] |= i.mask->mask->reg_num;
3664 }
3665
3666 static void
3667 process_immext (void)
3668 {
3669 expressionS *exp;
3670
3671 if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3672 && i.operands > 0)
3673 {
3674 /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3675 with an opcode suffix which is coded in the same place as an
3676 8-bit immediate field would be.
3677 Here we check those operands and remove them afterwards. */
3678 unsigned int x;
3679
3680 for (x = 0; x < i.operands; x++)
3681 if (register_number (i.op[x].regs) != x)
3682 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3683 register_prefix, i.op[x].regs->reg_name, x + 1,
3684 i.tm.name);
3685
3686 i.operands = 0;
3687 }
3688
3689 if (i.tm.cpu_flags.bitfield.cpumwaitx && i.operands > 0)
3690 {
3691 /* MONITORX/MWAITX instructions have fixed operands with an opcode
3692 suffix which is coded in the same place as an 8-bit immediate
3693 field would be.
3694 Here we check those operands and remove them afterwards. */
3695 unsigned int x;
3696
3697 if (i.operands != 3)
3698 abort();
3699
3700 for (x = 0; x < 2; x++)
3701 if (register_number (i.op[x].regs) != x)
3702 goto bad_register_operand;
3703
3704 /* Check for third operand for mwaitx/monitorx insn. */
3705 if (register_number (i.op[x].regs)
3706 != (x + (i.tm.extension_opcode == 0xfb)))
3707 {
3708 bad_register_operand:
3709 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3710 register_prefix, i.op[x].regs->reg_name, x+1,
3711 i.tm.name);
3712 }
3713
3714 i.operands = 0;
3715 }
3716
3717 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3718 which is coded in the same place as an 8-bit immediate field
3719 would be. Here we fake an 8-bit immediate operand from the
3720 opcode suffix stored in tm.extension_opcode.
3721
3722 AVX instructions also use this encoding, for some of
3723 3 argument instructions. */
3724
3725 gas_assert (i.imm_operands <= 1
3726 && (i.operands <= 2
3727 || ((i.tm.opcode_modifier.vex
3728 || i.tm.opcode_modifier.vexopcode
3729 || is_evex_encoding (&i.tm))
3730 && i.operands <= 4)));
3731
3732 exp = &im_expressions[i.imm_operands++];
3733 i.op[i.operands].imms = exp;
3734 i.types[i.operands] = imm8;
3735 i.operands++;
3736 exp->X_op = O_constant;
3737 exp->X_add_number = i.tm.extension_opcode;
3738 i.tm.extension_opcode = None;
3739 }
3740
3741
3742 static int
3743 check_hle (void)
3744 {
3745 switch (i.tm.opcode_modifier.hleprefixok)
3746 {
3747 default:
3748 abort ();
3749 case HLEPrefixNone:
3750 as_bad (_("invalid instruction `%s' after `%s'"),
3751 i.tm.name, i.hle_prefix);
3752 return 0;
3753 case HLEPrefixLock:
3754 if (i.prefix[LOCK_PREFIX])
3755 return 1;
3756 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3757 return 0;
3758 case HLEPrefixAny:
3759 return 1;
3760 case HLEPrefixRelease:
3761 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3762 {
3763 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3764 i.tm.name);
3765 return 0;
3766 }
3767 if (i.mem_operands == 0
3768 || !operand_type_check (i.types[i.operands - 1], anymem))
3769 {
3770 as_bad (_("memory destination needed for instruction `%s'"
3771 " after `xrelease'"), i.tm.name);
3772 return 0;
3773 }
3774 return 1;
3775 }
3776 }
3777
3778 /* Try the shortest encoding by shortening operand size. */
3779
3780 static void
3781 optimize_encoding (void)
3782 {
3783 int j;
3784
3785 if (optimize_for_space
3786 && i.reg_operands == 1
3787 && i.imm_operands == 1
3788 && !i.types[1].bitfield.byte
3789 && i.op[0].imms->X_op == O_constant
3790 && fits_in_imm7 (i.op[0].imms->X_add_number)
3791 && ((i.tm.base_opcode == 0xa8
3792 && i.tm.extension_opcode == None)
3793 || (i.tm.base_opcode == 0xf6
3794 && i.tm.extension_opcode == 0x0)))
3795 {
3796 /* Optimize: -Os:
3797 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
3798 */
3799 unsigned int base_regnum = i.op[1].regs->reg_num;
3800 if (flag_code == CODE_64BIT || base_regnum < 4)
3801 {
3802 i.types[1].bitfield.byte = 1;
3803 /* Ignore the suffix. */
3804 i.suffix = 0;
3805 if (base_regnum >= 4
3806 && !(i.op[1].regs->reg_flags & RegRex))
3807 {
3808 /* Handle SP, BP, SI and DI registers. */
3809 if (i.types[1].bitfield.word)
3810 j = 16;
3811 else if (i.types[1].bitfield.dword)
3812 j = 32;
3813 else
3814 j = 48;
3815 i.op[1].regs -= j;
3816 }
3817 }
3818 }
3819 else if (flag_code == CODE_64BIT
3820 && ((i.types[1].bitfield.qword
3821 && i.reg_operands == 1
3822 && i.imm_operands == 1
3823 && i.op[0].imms->X_op == O_constant
3824 && ((i.tm.base_opcode == 0xb0
3825 && i.tm.extension_opcode == None
3826 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
3827 || (fits_in_imm31 (i.op[0].imms->X_add_number)
3828 && (((i.tm.base_opcode == 0x24
3829 || i.tm.base_opcode == 0xa8)
3830 && i.tm.extension_opcode == None)
3831 || (i.tm.base_opcode == 0x80
3832 && i.tm.extension_opcode == 0x4)
3833 || ((i.tm.base_opcode == 0xf6
3834 || i.tm.base_opcode == 0xc6)
3835 && i.tm.extension_opcode == 0x0)))))
3836 || (i.types[0].bitfield.qword
3837 && ((i.reg_operands == 2
3838 && i.op[0].regs == i.op[1].regs
3839 && ((i.tm.base_opcode == 0x30
3840 || i.tm.base_opcode == 0x28)
3841 && i.tm.extension_opcode == None))
3842 || (i.reg_operands == 1
3843 && i.operands == 1
3844 && i.tm.base_opcode == 0x30
3845 && i.tm.extension_opcode == None)))))
3846 {
3847 /* Optimize: -O:
3848 andq $imm31, %r64 -> andl $imm31, %r32
3849 testq $imm31, %r64 -> testl $imm31, %r32
3850 xorq %r64, %r64 -> xorl %r32, %r32
3851 subq %r64, %r64 -> subl %r32, %r32
3852 movq $imm31, %r64 -> movl $imm31, %r32
3853 movq $imm32, %r64 -> movl $imm32, %r32
3854 */
3855 i.tm.opcode_modifier.norex64 = 1;
3856 if (i.tm.base_opcode == 0xb0 || i.tm.base_opcode == 0xc6)
3857 {
3858 /* Handle
3859 movq $imm31, %r64 -> movl $imm31, %r32
3860 movq $imm32, %r64 -> movl $imm32, %r32
3861 */
3862 i.tm.operand_types[0].bitfield.imm32 = 1;
3863 i.tm.operand_types[0].bitfield.imm32s = 0;
3864 i.tm.operand_types[0].bitfield.imm64 = 0;
3865 i.types[0].bitfield.imm32 = 1;
3866 i.types[0].bitfield.imm32s = 0;
3867 i.types[0].bitfield.imm64 = 0;
3868 i.types[1].bitfield.dword = 1;
3869 i.types[1].bitfield.qword = 0;
3870 if (i.tm.base_opcode == 0xc6)
3871 {
3872 /* Handle
3873 movq $imm31, %r64 -> movl $imm31, %r32
3874 */
3875 i.tm.base_opcode = 0xb0;
3876 i.tm.extension_opcode = None;
3877 i.tm.opcode_modifier.shortform = 1;
3878 i.tm.opcode_modifier.modrm = 0;
3879 }
3880 }
3881 }
3882 else if (optimize > 1
3883 && i.reg_operands == 3
3884 && i.op[0].regs == i.op[1].regs
3885 && !i.types[2].bitfield.xmmword
3886 && (i.tm.opcode_modifier.vex
3887 || ((!i.mask || i.mask->zeroing)
3888 && !i.rounding
3889 && is_evex_encoding (&i.tm)
3890 && (i.vec_encoding != vex_encoding_evex
3891 || i.tm.cpu_flags.bitfield.cpuavx512vl
3892 || (i.tm.operand_types[2].bitfield.zmmword
3893 && i.types[2].bitfield.ymmword)
3894 || cpu_arch_isa_flags.bitfield.cpuavx512vl)))
3895 && ((i.tm.base_opcode == 0x55
3896 || i.tm.base_opcode == 0x6655
3897 || i.tm.base_opcode == 0x66df
3898 || i.tm.base_opcode == 0x57
3899 || i.tm.base_opcode == 0x6657
3900 || i.tm.base_opcode == 0x66ef
3901 || i.tm.base_opcode == 0x66f8
3902 || i.tm.base_opcode == 0x66f9
3903 || i.tm.base_opcode == 0x66fa
3904 || i.tm.base_opcode == 0x66fb)
3905 && i.tm.extension_opcode == None))
3906 {
3907 /* Optimize: -O2:
3908 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
3909 vpsubq and vpsubw:
3910 EVEX VOP %zmmM, %zmmM, %zmmN
3911 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
3912 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3913 EVEX VOP %ymmM, %ymmM, %ymmN
3914 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
3915 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3916 VEX VOP %ymmM, %ymmM, %ymmN
3917 -> VEX VOP %xmmM, %xmmM, %xmmN
3918 VOP, one of vpandn and vpxor:
3919 VEX VOP %ymmM, %ymmM, %ymmN
3920 -> VEX VOP %xmmM, %xmmM, %xmmN
3921 VOP, one of vpandnd and vpandnq:
3922 EVEX VOP %zmmM, %zmmM, %zmmN
3923 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
3924 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3925 EVEX VOP %ymmM, %ymmM, %ymmN
3926 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
3927 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3928 VOP, one of vpxord and vpxorq:
3929 EVEX VOP %zmmM, %zmmM, %zmmN
3930 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
3931 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3932 EVEX VOP %ymmM, %ymmM, %ymmN
3933 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
3934 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3935 */
3936 if (is_evex_encoding (&i.tm))
3937 {
3938 if (i.vec_encoding == vex_encoding_evex)
3939 i.tm.opcode_modifier.evex = EVEX128;
3940 else
3941 {
3942 i.tm.opcode_modifier.vex = VEX128;
3943 i.tm.opcode_modifier.vexw = VEXW0;
3944 i.tm.opcode_modifier.evex = 0;
3945 }
3946 }
3947 else
3948 i.tm.opcode_modifier.vex = VEX128;
3949
3950 if (i.tm.opcode_modifier.vex)
3951 for (j = 0; j < 3; j++)
3952 {
3953 i.types[j].bitfield.xmmword = 1;
3954 i.types[j].bitfield.ymmword = 0;
3955 }
3956 }
3957 }
3958
3959 /* This is the guts of the machine-dependent assembler. LINE points to a
3960 machine dependent instruction. This function is supposed to emit
3961 the frags/bytes it assembles to. */
3962
3963 void
3964 md_assemble (char *line)
3965 {
3966 unsigned int j;
3967 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
3968 const insn_template *t;
3969
3970 /* Initialize globals. */
3971 memset (&i, '\0', sizeof (i));
3972 for (j = 0; j < MAX_OPERANDS; j++)
3973 i.reloc[j] = NO_RELOC;
3974 memset (disp_expressions, '\0', sizeof (disp_expressions));
3975 memset (im_expressions, '\0', sizeof (im_expressions));
3976 save_stack_p = save_stack;
3977
3978 /* First parse an instruction mnemonic & call i386_operand for the operands.
3979 We assume that the scrubber has arranged it so that line[0] is the valid
3980 start of a (possibly prefixed) mnemonic. */
3981
3982 line = parse_insn (line, mnemonic);
3983 if (line == NULL)
3984 return;
3985 mnem_suffix = i.suffix;
3986
3987 line = parse_operands (line, mnemonic);
3988 this_operand = -1;
3989 xfree (i.memop1_string);
3990 i.memop1_string = NULL;
3991 if (line == NULL)
3992 return;
3993
3994 /* Now we've parsed the mnemonic into a set of templates, and have the
3995 operands at hand. */
3996
3997 /* All intel opcodes have reversed operands except for "bound" and
3998 "enter". We also don't reverse intersegment "jmp" and "call"
3999 instructions with 2 immediate operands so that the immediate segment
4000 precedes the offset, as it does when in AT&T mode. */
4001 if (intel_syntax
4002 && i.operands > 1
4003 && (strcmp (mnemonic, "bound") != 0)
4004 && (strcmp (mnemonic, "invlpga") != 0)
4005 && !(operand_type_check (i.types[0], imm)
4006 && operand_type_check (i.types[1], imm)))
4007 swap_operands ();
4008
4009 /* The order of the immediates should be reversed
4010 for 2 immediates extrq and insertq instructions */
4011 if (i.imm_operands == 2
4012 && (strcmp (mnemonic, "extrq") == 0
4013 || strcmp (mnemonic, "insertq") == 0))
4014 swap_2_operands (0, 1);
4015
4016 if (i.imm_operands)
4017 optimize_imm ();
4018
4019 /* Don't optimize displacement for movabs since it only takes 64bit
4020 displacement. */
4021 if (i.disp_operands
4022 && i.disp_encoding != disp_encoding_32bit
4023 && (flag_code != CODE_64BIT
4024 || strcmp (mnemonic, "movabs") != 0))
4025 optimize_disp ();
4026
4027 /* Next, we find a template that matches the given insn,
4028 making sure the overlap of the given operands types is consistent
4029 with the template operand types. */
4030
4031 if (!(t = match_template (mnem_suffix)))
4032 return;
4033
4034 if (sse_check != check_none
4035 && !i.tm.opcode_modifier.noavx
4036 && !i.tm.cpu_flags.bitfield.cpuavx
4037 && (i.tm.cpu_flags.bitfield.cpusse
4038 || i.tm.cpu_flags.bitfield.cpusse2
4039 || i.tm.cpu_flags.bitfield.cpusse3
4040 || i.tm.cpu_flags.bitfield.cpussse3
4041 || i.tm.cpu_flags.bitfield.cpusse4_1
4042 || i.tm.cpu_flags.bitfield.cpusse4_2
4043 || i.tm.cpu_flags.bitfield.cpupclmul
4044 || i.tm.cpu_flags.bitfield.cpuaes
4045 || i.tm.cpu_flags.bitfield.cpugfni))
4046 {
4047 (sse_check == check_warning
4048 ? as_warn
4049 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4050 }
4051
4052 /* Zap movzx and movsx suffix. The suffix has been set from
4053 "word ptr" or "byte ptr" on the source operand in Intel syntax
4054 or extracted from mnemonic in AT&T syntax. But we'll use
4055 the destination register to choose the suffix for encoding. */
4056 if ((i.tm.base_opcode & ~9) == 0x0fb6)
4057 {
4058 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
4059 there is no suffix, the default will be byte extension. */
4060 if (i.reg_operands != 2
4061 && !i.suffix
4062 && intel_syntax)
4063 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4064
4065 i.suffix = 0;
4066 }
4067
4068 if (i.tm.opcode_modifier.fwait)
4069 if (!add_prefix (FWAIT_OPCODE))
4070 return;
4071
4072 /* Check if REP prefix is OK. */
4073 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4074 {
4075 as_bad (_("invalid instruction `%s' after `%s'"),
4076 i.tm.name, i.rep_prefix);
4077 return;
4078 }
4079
4080 /* Check for lock without a lockable instruction. Destination operand
4081 must be memory unless it is xchg (0x86). */
4082 if (i.prefix[LOCK_PREFIX]
4083 && (!i.tm.opcode_modifier.islockable
4084 || i.mem_operands == 0
4085 || (i.tm.base_opcode != 0x86
4086 && !operand_type_check (i.types[i.operands - 1], anymem))))
4087 {
4088 as_bad (_("expecting lockable instruction after `lock'"));
4089 return;
4090 }
4091
4092 /* Check if HLE prefix is OK. */
4093 if (i.hle_prefix && !check_hle ())
4094 return;
4095
4096 /* Check BND prefix. */
4097 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4098 as_bad (_("expecting valid branch instruction after `bnd'"));
4099
4100 /* Check NOTRACK prefix. */
4101 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4102 as_bad (_("expecting indirect branch instruction after `notrack'"));
4103
4104 if (i.tm.cpu_flags.bitfield.cpumpx)
4105 {
4106 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4107 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4108 else if (flag_code != CODE_16BIT
4109 ? i.prefix[ADDR_PREFIX]
4110 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4111 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4112 }
4113
4114 /* Insert BND prefix. */
4115 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4116 {
4117 if (!i.prefix[BND_PREFIX])
4118 add_prefix (BND_PREFIX_OPCODE);
4119 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4120 {
4121 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4122 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4123 }
4124 }
4125
4126 /* Check string instruction segment overrides. */
4127 if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
4128 {
4129 if (!check_string ())
4130 return;
4131 i.disp_operands = 0;
4132 }
4133
4134 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4135 optimize_encoding ();
4136
4137 if (!process_suffix ())
4138 return;
4139
4140 /* Update operand types. */
4141 for (j = 0; j < i.operands; j++)
4142 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4143
4144 /* Make still unresolved immediate matches conform to size of immediate
4145 given in i.suffix. */
4146 if (!finalize_imm ())
4147 return;
4148
4149 if (i.types[0].bitfield.imm1)
4150 i.imm_operands = 0; /* kludge for shift insns. */
4151
4152 /* We only need to check those implicit registers for instructions
4153 with 3 operands or less. */
4154 if (i.operands <= 3)
4155 for (j = 0; j < i.operands; j++)
4156 if (i.types[j].bitfield.inoutportreg
4157 || i.types[j].bitfield.shiftcount
4158 || (i.types[j].bitfield.acc && !i.types[j].bitfield.xmmword))
4159 i.reg_operands--;
4160
4161 /* ImmExt should be processed after SSE2AVX. */
4162 if (!i.tm.opcode_modifier.sse2avx
4163 && i.tm.opcode_modifier.immext)
4164 process_immext ();
4165
4166 /* For insns with operands there are more diddles to do to the opcode. */
4167 if (i.operands)
4168 {
4169 if (!process_operands ())
4170 return;
4171 }
4172 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4173 {
4174 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4175 as_warn (_("translating to `%sp'"), i.tm.name);
4176 }
4177
4178 if (i.tm.opcode_modifier.vex || i.tm.opcode_modifier.vexopcode
4179 || is_evex_encoding (&i.tm))
4180 {
4181 if (flag_code == CODE_16BIT)
4182 {
4183 as_bad (_("instruction `%s' isn't supported in 16-bit mode."),
4184 i.tm.name);
4185 return;
4186 }
4187
4188 if (i.tm.opcode_modifier.vex)
4189 build_vex_prefix (t);
4190 else
4191 build_evex_prefix ();
4192 }
4193
4194 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4195 instructions may define INT_OPCODE as well, so avoid this corner
4196 case for those instructions that use MODRM. */
4197 if (i.tm.base_opcode == INT_OPCODE
4198 && !i.tm.opcode_modifier.modrm
4199 && i.op[0].imms->X_add_number == 3)
4200 {
4201 i.tm.base_opcode = INT3_OPCODE;
4202 i.imm_operands = 0;
4203 }
4204
4205 if ((i.tm.opcode_modifier.jump
4206 || i.tm.opcode_modifier.jumpbyte
4207 || i.tm.opcode_modifier.jumpdword)
4208 && i.op[0].disps->X_op == O_constant)
4209 {
4210 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4211 the absolute address given by the constant. Since ix86 jumps and
4212 calls are pc relative, we need to generate a reloc. */
4213 i.op[0].disps->X_add_symbol = &abs_symbol;
4214 i.op[0].disps->X_op = O_symbol;
4215 }
4216
4217 if (i.tm.opcode_modifier.rex64)
4218 i.rex |= REX_W;
4219
4220 /* For 8 bit registers we need an empty rex prefix. Also if the
4221 instruction already has a prefix, we need to convert old
4222 registers to new ones. */
4223
4224 if ((i.types[0].bitfield.reg && i.types[0].bitfield.byte
4225 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4226 || (i.types[1].bitfield.reg && i.types[1].bitfield.byte
4227 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4228 || (((i.types[0].bitfield.reg && i.types[0].bitfield.byte)
4229 || (i.types[1].bitfield.reg && i.types[1].bitfield.byte))
4230 && i.rex != 0))
4231 {
4232 int x;
4233
4234 i.rex |= REX_OPCODE;
4235 for (x = 0; x < 2; x++)
4236 {
4237 /* Look for 8 bit operand that uses old registers. */
4238 if (i.types[x].bitfield.reg && i.types[x].bitfield.byte
4239 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4240 {
4241 /* In case it is "hi" register, give up. */
4242 if (i.op[x].regs->reg_num > 3)
4243 as_bad (_("can't encode register '%s%s' in an "
4244 "instruction requiring REX prefix."),
4245 register_prefix, i.op[x].regs->reg_name);
4246
4247 /* Otherwise it is equivalent to the extended register.
4248 Since the encoding doesn't change this is merely
4249 cosmetic cleanup for debug output. */
4250
4251 i.op[x].regs = i.op[x].regs + 8;
4252 }
4253 }
4254 }
4255
4256 if (i.rex == 0 && i.rex_encoding)
4257 {
4258 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4259 that uses legacy register. If it is "hi" register, don't add
4260 the REX_OPCODE byte. */
4261 int x;
4262 for (x = 0; x < 2; x++)
4263 if (i.types[x].bitfield.reg
4264 && i.types[x].bitfield.byte
4265 && (i.op[x].regs->reg_flags & RegRex64) == 0
4266 && i.op[x].regs->reg_num > 3)
4267 {
4268 i.rex_encoding = FALSE;
4269 break;
4270 }
4271
4272 if (i.rex_encoding)
4273 i.rex = REX_OPCODE;
4274 }
4275
4276 if (i.rex != 0)
4277 add_prefix (REX_OPCODE | i.rex);
4278
4279 /* We are ready to output the insn. */
4280 output_insn ();
4281 }
4282
4283 static char *
4284 parse_insn (char *line, char *mnemonic)
4285 {
4286 char *l = line;
4287 char *token_start = l;
4288 char *mnem_p;
4289 int supported;
4290 const insn_template *t;
4291 char *dot_p = NULL;
4292
4293 while (1)
4294 {
4295 mnem_p = mnemonic;
4296 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4297 {
4298 if (*mnem_p == '.')
4299 dot_p = mnem_p;
4300 mnem_p++;
4301 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4302 {
4303 as_bad (_("no such instruction: `%s'"), token_start);
4304 return NULL;
4305 }
4306 l++;
4307 }
4308 if (!is_space_char (*l)
4309 && *l != END_OF_INSN
4310 && (intel_syntax
4311 || (*l != PREFIX_SEPARATOR
4312 && *l != ',')))
4313 {
4314 as_bad (_("invalid character %s in mnemonic"),
4315 output_invalid (*l));
4316 return NULL;
4317 }
4318 if (token_start == l)
4319 {
4320 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4321 as_bad (_("expecting prefix; got nothing"));
4322 else
4323 as_bad (_("expecting mnemonic; got nothing"));
4324 return NULL;
4325 }
4326
4327 /* Look up instruction (or prefix) via hash table. */
4328 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4329
4330 if (*l != END_OF_INSN
4331 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4332 && current_templates
4333 && current_templates->start->opcode_modifier.isprefix)
4334 {
4335 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4336 {
4337 as_bad ((flag_code != CODE_64BIT
4338 ? _("`%s' is only supported in 64-bit mode")
4339 : _("`%s' is not supported in 64-bit mode")),
4340 current_templates->start->name);
4341 return NULL;
4342 }
4343 /* If we are in 16-bit mode, do not allow addr16 or data16.
4344 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4345 if ((current_templates->start->opcode_modifier.size16
4346 || current_templates->start->opcode_modifier.size32)
4347 && flag_code != CODE_64BIT
4348 && (current_templates->start->opcode_modifier.size32
4349 ^ (flag_code == CODE_16BIT)))
4350 {
4351 as_bad (_("redundant %s prefix"),
4352 current_templates->start->name);
4353 return NULL;
4354 }
4355 if (current_templates->start->opcode_length == 0)
4356 {
4357 /* Handle pseudo prefixes. */
4358 switch (current_templates->start->base_opcode)
4359 {
4360 case 0x0:
4361 /* {disp8} */
4362 i.disp_encoding = disp_encoding_8bit;
4363 break;
4364 case 0x1:
4365 /* {disp32} */
4366 i.disp_encoding = disp_encoding_32bit;
4367 break;
4368 case 0x2:
4369 /* {load} */
4370 i.dir_encoding = dir_encoding_load;
4371 break;
4372 case 0x3:
4373 /* {store} */
4374 i.dir_encoding = dir_encoding_store;
4375 break;
4376 case 0x4:
4377 /* {vex2} */
4378 i.vec_encoding = vex_encoding_vex2;
4379 break;
4380 case 0x5:
4381 /* {vex3} */
4382 i.vec_encoding = vex_encoding_vex3;
4383 break;
4384 case 0x6:
4385 /* {evex} */
4386 i.vec_encoding = vex_encoding_evex;
4387 break;
4388 case 0x7:
4389 /* {rex} */
4390 i.rex_encoding = TRUE;
4391 break;
4392 case 0x8:
4393 /* {nooptimize} */
4394 i.no_optimize = TRUE;
4395 break;
4396 default:
4397 abort ();
4398 }
4399 }
4400 else
4401 {
4402 /* Add prefix, checking for repeated prefixes. */
4403 switch (add_prefix (current_templates->start->base_opcode))
4404 {
4405 case PREFIX_EXIST:
4406 return NULL;
4407 case PREFIX_DS:
4408 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4409 i.notrack_prefix = current_templates->start->name;
4410 break;
4411 case PREFIX_REP:
4412 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4413 i.hle_prefix = current_templates->start->name;
4414 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4415 i.bnd_prefix = current_templates->start->name;
4416 else
4417 i.rep_prefix = current_templates->start->name;
4418 break;
4419 default:
4420 break;
4421 }
4422 }
4423 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4424 token_start = ++l;
4425 }
4426 else
4427 break;
4428 }
4429
4430 if (!current_templates)
4431 {
4432 /* Check if we should swap operand or force 32bit displacement in
4433 encoding. */
4434 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4435 i.dir_encoding = dir_encoding_store;
4436 else if (mnem_p - 3 == dot_p
4437 && dot_p[1] == 'd'
4438 && dot_p[2] == '8')
4439 i.disp_encoding = disp_encoding_8bit;
4440 else if (mnem_p - 4 == dot_p
4441 && dot_p[1] == 'd'
4442 && dot_p[2] == '3'
4443 && dot_p[3] == '2')
4444 i.disp_encoding = disp_encoding_32bit;
4445 else
4446 goto check_suffix;
4447 mnem_p = dot_p;
4448 *dot_p = '\0';
4449 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4450 }
4451
4452 if (!current_templates)
4453 {
4454 check_suffix:
4455 /* See if we can get a match by trimming off a suffix. */
4456 switch (mnem_p[-1])
4457 {
4458 case WORD_MNEM_SUFFIX:
4459 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4460 i.suffix = SHORT_MNEM_SUFFIX;
4461 else
4462 /* Fall through. */
4463 case BYTE_MNEM_SUFFIX:
4464 case QWORD_MNEM_SUFFIX:
4465 i.suffix = mnem_p[-1];
4466 mnem_p[-1] = '\0';
4467 current_templates = (const templates *) hash_find (op_hash,
4468 mnemonic);
4469 break;
4470 case SHORT_MNEM_SUFFIX:
4471 case LONG_MNEM_SUFFIX:
4472 if (!intel_syntax)
4473 {
4474 i.suffix = mnem_p[-1];
4475 mnem_p[-1] = '\0';
4476 current_templates = (const templates *) hash_find (op_hash,
4477 mnemonic);
4478 }
4479 break;
4480
4481 /* Intel Syntax. */
4482 case 'd':
4483 if (intel_syntax)
4484 {
4485 if (intel_float_operand (mnemonic) == 1)
4486 i.suffix = SHORT_MNEM_SUFFIX;
4487 else
4488 i.suffix = LONG_MNEM_SUFFIX;
4489 mnem_p[-1] = '\0';
4490 current_templates = (const templates *) hash_find (op_hash,
4491 mnemonic);
4492 }
4493 break;
4494 }
4495 if (!current_templates)
4496 {
4497 as_bad (_("no such instruction: `%s'"), token_start);
4498 return NULL;
4499 }
4500 }
4501
4502 if (current_templates->start->opcode_modifier.jump
4503 || current_templates->start->opcode_modifier.jumpbyte)
4504 {
4505 /* Check for a branch hint. We allow ",pt" and ",pn" for
4506 predict taken and predict not taken respectively.
4507 I'm not sure that branch hints actually do anything on loop
4508 and jcxz insns (JumpByte) for current Pentium4 chips. They
4509 may work in the future and it doesn't hurt to accept them
4510 now. */
4511 if (l[0] == ',' && l[1] == 'p')
4512 {
4513 if (l[2] == 't')
4514 {
4515 if (!add_prefix (DS_PREFIX_OPCODE))
4516 return NULL;
4517 l += 3;
4518 }
4519 else if (l[2] == 'n')
4520 {
4521 if (!add_prefix (CS_PREFIX_OPCODE))
4522 return NULL;
4523 l += 3;
4524 }
4525 }
4526 }
4527 /* Any other comma loses. */
4528 if (*l == ',')
4529 {
4530 as_bad (_("invalid character %s in mnemonic"),
4531 output_invalid (*l));
4532 return NULL;
4533 }
4534
4535 /* Check if instruction is supported on specified architecture. */
4536 supported = 0;
4537 for (t = current_templates->start; t < current_templates->end; ++t)
4538 {
4539 supported |= cpu_flags_match (t);
4540 if (supported == CPU_FLAGS_PERFECT_MATCH)
4541 {
4542 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4543 as_warn (_("use .code16 to ensure correct addressing mode"));
4544
4545 return l;
4546 }
4547 }
4548
4549 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4550 as_bad (flag_code == CODE_64BIT
4551 ? _("`%s' is not supported in 64-bit mode")
4552 : _("`%s' is only supported in 64-bit mode"),
4553 current_templates->start->name);
4554 else
4555 as_bad (_("`%s' is not supported on `%s%s'"),
4556 current_templates->start->name,
4557 cpu_arch_name ? cpu_arch_name : default_arch,
4558 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4559
4560 return NULL;
4561 }
4562
4563 static char *
4564 parse_operands (char *l, const char *mnemonic)
4565 {
4566 char *token_start;
4567
4568 /* 1 if operand is pending after ','. */
4569 unsigned int expecting_operand = 0;
4570
4571 /* Non-zero if operand parens not balanced. */
4572 unsigned int paren_not_balanced;
4573
4574 while (*l != END_OF_INSN)
4575 {
4576 /* Skip optional white space before operand. */
4577 if (is_space_char (*l))
4578 ++l;
4579 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4580 {
4581 as_bad (_("invalid character %s before operand %d"),
4582 output_invalid (*l),
4583 i.operands + 1);
4584 return NULL;
4585 }
4586 token_start = l; /* After white space. */
4587 paren_not_balanced = 0;
4588 while (paren_not_balanced || *l != ',')
4589 {
4590 if (*l == END_OF_INSN)
4591 {
4592 if (paren_not_balanced)
4593 {
4594 if (!intel_syntax)
4595 as_bad (_("unbalanced parenthesis in operand %d."),
4596 i.operands + 1);
4597 else
4598 as_bad (_("unbalanced brackets in operand %d."),
4599 i.operands + 1);
4600 return NULL;
4601 }
4602 else
4603 break; /* we are done */
4604 }
4605 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4606 {
4607 as_bad (_("invalid character %s in operand %d"),
4608 output_invalid (*l),
4609 i.operands + 1);
4610 return NULL;
4611 }
4612 if (!intel_syntax)
4613 {
4614 if (*l == '(')
4615 ++paren_not_balanced;
4616 if (*l == ')')
4617 --paren_not_balanced;
4618 }
4619 else
4620 {
4621 if (*l == '[')
4622 ++paren_not_balanced;
4623 if (*l == ']')
4624 --paren_not_balanced;
4625 }
4626 l++;
4627 }
4628 if (l != token_start)
4629 { /* Yes, we've read in another operand. */
4630 unsigned int operand_ok;
4631 this_operand = i.operands++;
4632 if (i.operands > MAX_OPERANDS)
4633 {
4634 as_bad (_("spurious operands; (%d operands/instruction max)"),
4635 MAX_OPERANDS);
4636 return NULL;
4637 }
4638 i.types[this_operand].bitfield.unspecified = 1;
4639 /* Now parse operand adding info to 'i' as we go along. */
4640 END_STRING_AND_SAVE (l);
4641
4642 if (intel_syntax)
4643 operand_ok =
4644 i386_intel_operand (token_start,
4645 intel_float_operand (mnemonic));
4646 else
4647 operand_ok = i386_att_operand (token_start);
4648
4649 RESTORE_END_STRING (l);
4650 if (!operand_ok)
4651 return NULL;
4652 }
4653 else
4654 {
4655 if (expecting_operand)
4656 {
4657 expecting_operand_after_comma:
4658 as_bad (_("expecting operand after ','; got nothing"));
4659 return NULL;
4660 }
4661 if (*l == ',')
4662 {
4663 as_bad (_("expecting operand before ','; got nothing"));
4664 return NULL;
4665 }
4666 }
4667
4668 /* Now *l must be either ',' or END_OF_INSN. */
4669 if (*l == ',')
4670 {
4671 if (*++l == END_OF_INSN)
4672 {
4673 /* Just skip it, if it's \n complain. */
4674 goto expecting_operand_after_comma;
4675 }
4676 expecting_operand = 1;
4677 }
4678 }
4679 return l;
4680 }
4681
4682 static void
4683 swap_2_operands (int xchg1, int xchg2)
4684 {
4685 union i386_op temp_op;
4686 i386_operand_type temp_type;
4687 enum bfd_reloc_code_real temp_reloc;
4688
4689 temp_type = i.types[xchg2];
4690 i.types[xchg2] = i.types[xchg1];
4691 i.types[xchg1] = temp_type;
4692 temp_op = i.op[xchg2];
4693 i.op[xchg2] = i.op[xchg1];
4694 i.op[xchg1] = temp_op;
4695 temp_reloc = i.reloc[xchg2];
4696 i.reloc[xchg2] = i.reloc[xchg1];
4697 i.reloc[xchg1] = temp_reloc;
4698
4699 if (i.mask)
4700 {
4701 if (i.mask->operand == xchg1)
4702 i.mask->operand = xchg2;
4703 else if (i.mask->operand == xchg2)
4704 i.mask->operand = xchg1;
4705 }
4706 if (i.broadcast)
4707 {
4708 if (i.broadcast->operand == xchg1)
4709 i.broadcast->operand = xchg2;
4710 else if (i.broadcast->operand == xchg2)
4711 i.broadcast->operand = xchg1;
4712 }
4713 if (i.rounding)
4714 {
4715 if (i.rounding->operand == xchg1)
4716 i.rounding->operand = xchg2;
4717 else if (i.rounding->operand == xchg2)
4718 i.rounding->operand = xchg1;
4719 }
4720 }
4721
4722 static void
4723 swap_operands (void)
4724 {
4725 switch (i.operands)
4726 {
4727 case 5:
4728 case 4:
4729 swap_2_operands (1, i.operands - 2);
4730 /* Fall through. */
4731 case 3:
4732 case 2:
4733 swap_2_operands (0, i.operands - 1);
4734 break;
4735 default:
4736 abort ();
4737 }
4738
4739 if (i.mem_operands == 2)
4740 {
4741 const seg_entry *temp_seg;
4742 temp_seg = i.seg[0];
4743 i.seg[0] = i.seg[1];
4744 i.seg[1] = temp_seg;
4745 }
4746 }
4747
4748 /* Try to ensure constant immediates are represented in the smallest
4749 opcode possible. */
4750 static void
4751 optimize_imm (void)
4752 {
4753 char guess_suffix = 0;
4754 int op;
4755
4756 if (i.suffix)
4757 guess_suffix = i.suffix;
4758 else if (i.reg_operands)
4759 {
4760 /* Figure out a suffix from the last register operand specified.
4761 We can't do this properly yet, ie. excluding InOutPortReg,
4762 but the following works for instructions with immediates.
4763 In any case, we can't set i.suffix yet. */
4764 for (op = i.operands; --op >= 0;)
4765 if (i.types[op].bitfield.reg && i.types[op].bitfield.byte)
4766 {
4767 guess_suffix = BYTE_MNEM_SUFFIX;
4768 break;
4769 }
4770 else if (i.types[op].bitfield.reg && i.types[op].bitfield.word)
4771 {
4772 guess_suffix = WORD_MNEM_SUFFIX;
4773 break;
4774 }
4775 else if (i.types[op].bitfield.reg && i.types[op].bitfield.dword)
4776 {
4777 guess_suffix = LONG_MNEM_SUFFIX;
4778 break;
4779 }
4780 else if (i.types[op].bitfield.reg && i.types[op].bitfield.qword)
4781 {
4782 guess_suffix = QWORD_MNEM_SUFFIX;
4783 break;
4784 }
4785 }
4786 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
4787 guess_suffix = WORD_MNEM_SUFFIX;
4788
4789 for (op = i.operands; --op >= 0;)
4790 if (operand_type_check (i.types[op], imm))
4791 {
4792 switch (i.op[op].imms->X_op)
4793 {
4794 case O_constant:
4795 /* If a suffix is given, this operand may be shortened. */
4796 switch (guess_suffix)
4797 {
4798 case LONG_MNEM_SUFFIX:
4799 i.types[op].bitfield.imm32 = 1;
4800 i.types[op].bitfield.imm64 = 1;
4801 break;
4802 case WORD_MNEM_SUFFIX:
4803 i.types[op].bitfield.imm16 = 1;
4804 i.types[op].bitfield.imm32 = 1;
4805 i.types[op].bitfield.imm32s = 1;
4806 i.types[op].bitfield.imm64 = 1;
4807 break;
4808 case BYTE_MNEM_SUFFIX:
4809 i.types[op].bitfield.imm8 = 1;
4810 i.types[op].bitfield.imm8s = 1;
4811 i.types[op].bitfield.imm16 = 1;
4812 i.types[op].bitfield.imm32 = 1;
4813 i.types[op].bitfield.imm32s = 1;
4814 i.types[op].bitfield.imm64 = 1;
4815 break;
4816 }
4817
4818 /* If this operand is at most 16 bits, convert it
4819 to a signed 16 bit number before trying to see
4820 whether it will fit in an even smaller size.
4821 This allows a 16-bit operand such as $0xffe0 to
4822 be recognised as within Imm8S range. */
4823 if ((i.types[op].bitfield.imm16)
4824 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
4825 {
4826 i.op[op].imms->X_add_number =
4827 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
4828 }
4829 #ifdef BFD64
4830 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
4831 if ((i.types[op].bitfield.imm32)
4832 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
4833 == 0))
4834 {
4835 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
4836 ^ ((offsetT) 1 << 31))
4837 - ((offsetT) 1 << 31));
4838 }
4839 #endif
4840 i.types[op]
4841 = operand_type_or (i.types[op],
4842 smallest_imm_type (i.op[op].imms->X_add_number));
4843
4844 /* We must avoid matching of Imm32 templates when 64bit
4845 only immediate is available. */
4846 if (guess_suffix == QWORD_MNEM_SUFFIX)
4847 i.types[op].bitfield.imm32 = 0;
4848 break;
4849
4850 case O_absent:
4851 case O_register:
4852 abort ();
4853
4854 /* Symbols and expressions. */
4855 default:
4856 /* Convert symbolic operand to proper sizes for matching, but don't
4857 prevent matching a set of insns that only supports sizes other
4858 than those matching the insn suffix. */
4859 {
4860 i386_operand_type mask, allowed;
4861 const insn_template *t;
4862
4863 operand_type_set (&mask, 0);
4864 operand_type_set (&allowed, 0);
4865
4866 for (t = current_templates->start;
4867 t < current_templates->end;
4868 ++t)
4869 allowed = operand_type_or (allowed,
4870 t->operand_types[op]);
4871 switch (guess_suffix)
4872 {
4873 case QWORD_MNEM_SUFFIX:
4874 mask.bitfield.imm64 = 1;
4875 mask.bitfield.imm32s = 1;
4876 break;
4877 case LONG_MNEM_SUFFIX:
4878 mask.bitfield.imm32 = 1;
4879 break;
4880 case WORD_MNEM_SUFFIX:
4881 mask.bitfield.imm16 = 1;
4882 break;
4883 case BYTE_MNEM_SUFFIX:
4884 mask.bitfield.imm8 = 1;
4885 break;
4886 default:
4887 break;
4888 }
4889 allowed = operand_type_and (mask, allowed);
4890 if (!operand_type_all_zero (&allowed))
4891 i.types[op] = operand_type_and (i.types[op], mask);
4892 }
4893 break;
4894 }
4895 }
4896 }
4897
4898 /* Try to use the smallest displacement type too. */
4899 static void
4900 optimize_disp (void)
4901 {
4902 int op;
4903
4904 for (op = i.operands; --op >= 0;)
4905 if (operand_type_check (i.types[op], disp))
4906 {
4907 if (i.op[op].disps->X_op == O_constant)
4908 {
4909 offsetT op_disp = i.op[op].disps->X_add_number;
4910
4911 if (i.types[op].bitfield.disp16
4912 && (op_disp & ~(offsetT) 0xffff) == 0)
4913 {
4914 /* If this operand is at most 16 bits, convert
4915 to a signed 16 bit number and don't use 64bit
4916 displacement. */
4917 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
4918 i.types[op].bitfield.disp64 = 0;
4919 }
4920 #ifdef BFD64
4921 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
4922 if (i.types[op].bitfield.disp32
4923 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
4924 {
4925 /* If this operand is at most 32 bits, convert
4926 to a signed 32 bit number and don't use 64bit
4927 displacement. */
4928 op_disp &= (((offsetT) 2 << 31) - 1);
4929 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
4930 i.types[op].bitfield.disp64 = 0;
4931 }
4932 #endif
4933 if (!op_disp && i.types[op].bitfield.baseindex)
4934 {
4935 i.types[op].bitfield.disp8 = 0;
4936 i.types[op].bitfield.disp16 = 0;
4937 i.types[op].bitfield.disp32 = 0;
4938 i.types[op].bitfield.disp32s = 0;
4939 i.types[op].bitfield.disp64 = 0;
4940 i.op[op].disps = 0;
4941 i.disp_operands--;
4942 }
4943 else if (flag_code == CODE_64BIT)
4944 {
4945 if (fits_in_signed_long (op_disp))
4946 {
4947 i.types[op].bitfield.disp64 = 0;
4948 i.types[op].bitfield.disp32s = 1;
4949 }
4950 if (i.prefix[ADDR_PREFIX]
4951 && fits_in_unsigned_long (op_disp))
4952 i.types[op].bitfield.disp32 = 1;
4953 }
4954 if ((i.types[op].bitfield.disp32
4955 || i.types[op].bitfield.disp32s
4956 || i.types[op].bitfield.disp16)
4957 && fits_in_disp8 (op_disp))
4958 i.types[op].bitfield.disp8 = 1;
4959 }
4960 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
4961 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
4962 {
4963 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
4964 i.op[op].disps, 0, i.reloc[op]);
4965 i.types[op].bitfield.disp8 = 0;
4966 i.types[op].bitfield.disp16 = 0;
4967 i.types[op].bitfield.disp32 = 0;
4968 i.types[op].bitfield.disp32s = 0;
4969 i.types[op].bitfield.disp64 = 0;
4970 }
4971 else
4972 /* We only support 64bit displacement on constants. */
4973 i.types[op].bitfield.disp64 = 0;
4974 }
4975 }
4976
4977 /* Check if operands are valid for the instruction. */
4978
4979 static int
4980 check_VecOperands (const insn_template *t)
4981 {
4982 unsigned int op;
4983 i386_cpu_flags cpu;
4984 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
4985
4986 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
4987 any one operand are implicity requiring AVX512VL support if the actual
4988 operand size is YMMword or XMMword. Since this function runs after
4989 template matching, there's no need to check for YMMword/XMMword in
4990 the template. */
4991 cpu = cpu_flags_and (t->cpu_flags, avx512);
4992 if (!cpu_flags_all_zero (&cpu)
4993 && !t->cpu_flags.bitfield.cpuavx512vl
4994 && !cpu_arch_flags.bitfield.cpuavx512vl)
4995 {
4996 for (op = 0; op < t->operands; ++op)
4997 {
4998 if (t->operand_types[op].bitfield.zmmword
4999 && (i.types[op].bitfield.ymmword
5000 || i.types[op].bitfield.xmmword))
5001 {
5002 i.error = unsupported;
5003 return 1;
5004 }
5005 }
5006 }
5007
5008 /* Without VSIB byte, we can't have a vector register for index. */
5009 if (!t->opcode_modifier.vecsib
5010 && i.index_reg
5011 && (i.index_reg->reg_type.bitfield.xmmword
5012 || i.index_reg->reg_type.bitfield.ymmword
5013 || i.index_reg->reg_type.bitfield.zmmword))
5014 {
5015 i.error = unsupported_vector_index_register;
5016 return 1;
5017 }
5018
5019 /* Check if default mask is allowed. */
5020 if (t->opcode_modifier.nodefmask
5021 && (!i.mask || i.mask->mask->reg_num == 0))
5022 {
5023 i.error = no_default_mask;
5024 return 1;
5025 }
5026
5027 /* For VSIB byte, we need a vector register for index, and all vector
5028 registers must be distinct. */
5029 if (t->opcode_modifier.vecsib)
5030 {
5031 if (!i.index_reg
5032 || !((t->opcode_modifier.vecsib == VecSIB128
5033 && i.index_reg->reg_type.bitfield.xmmword)
5034 || (t->opcode_modifier.vecsib == VecSIB256
5035 && i.index_reg->reg_type.bitfield.ymmword)
5036 || (t->opcode_modifier.vecsib == VecSIB512
5037 && i.index_reg->reg_type.bitfield.zmmword)))
5038 {
5039 i.error = invalid_vsib_address;
5040 return 1;
5041 }
5042
5043 gas_assert (i.reg_operands == 2 || i.mask);
5044 if (i.reg_operands == 2 && !i.mask)
5045 {
5046 gas_assert (i.types[0].bitfield.regsimd);
5047 gas_assert (i.types[0].bitfield.xmmword
5048 || i.types[0].bitfield.ymmword);
5049 gas_assert (i.types[2].bitfield.regsimd);
5050 gas_assert (i.types[2].bitfield.xmmword
5051 || i.types[2].bitfield.ymmword);
5052 if (operand_check == check_none)
5053 return 0;
5054 if (register_number (i.op[0].regs)
5055 != register_number (i.index_reg)
5056 && register_number (i.op[2].regs)
5057 != register_number (i.index_reg)
5058 && register_number (i.op[0].regs)
5059 != register_number (i.op[2].regs))
5060 return 0;
5061 if (operand_check == check_error)
5062 {
5063 i.error = invalid_vector_register_set;
5064 return 1;
5065 }
5066 as_warn (_("mask, index, and destination registers should be distinct"));
5067 }
5068 else if (i.reg_operands == 1 && i.mask)
5069 {
5070 if (i.types[1].bitfield.regsimd
5071 && (i.types[1].bitfield.xmmword
5072 || i.types[1].bitfield.ymmword
5073 || i.types[1].bitfield.zmmword)
5074 && (register_number (i.op[1].regs)
5075 == register_number (i.index_reg)))
5076 {
5077 if (operand_check == check_error)
5078 {
5079 i.error = invalid_vector_register_set;
5080 return 1;
5081 }
5082 if (operand_check != check_none)
5083 as_warn (_("index and destination registers should be distinct"));
5084 }
5085 }
5086 }
5087
5088 /* Check if broadcast is supported by the instruction and is applied
5089 to the memory operand. */
5090 if (i.broadcast)
5091 {
5092 i386_operand_type type, overlap;
5093
5094 /* Check if specified broadcast is supported in this instruction,
5095 and it's applied to memory operand of DWORD or QWORD type. */
5096 op = i.broadcast->operand;
5097 if (!t->opcode_modifier.broadcast
5098 || !i.types[op].bitfield.mem
5099 || (!i.types[op].bitfield.unspecified
5100 && (t->operand_types[op].bitfield.dword
5101 ? !i.types[op].bitfield.dword
5102 : !i.types[op].bitfield.qword)))
5103 {
5104 bad_broadcast:
5105 i.error = unsupported_broadcast;
5106 return 1;
5107 }
5108
5109 operand_type_set (&type, 0);
5110 switch ((t->operand_types[op].bitfield.dword ? 4 : 8) * i.broadcast->type)
5111 {
5112 case 8:
5113 type.bitfield.qword = 1;
5114 break;
5115 case 16:
5116 type.bitfield.xmmword = 1;
5117 break;
5118 case 32:
5119 type.bitfield.ymmword = 1;
5120 break;
5121 case 64:
5122 type.bitfield.zmmword = 1;
5123 break;
5124 default:
5125 goto bad_broadcast;
5126 }
5127
5128 overlap = operand_type_and (type, t->operand_types[op]);
5129 if (operand_type_all_zero (&overlap))
5130 goto bad_broadcast;
5131
5132 if (t->opcode_modifier.checkregsize)
5133 {
5134 unsigned int j;
5135
5136 type.bitfield.baseindex = 1;
5137 for (j = 0; j < i.operands; ++j)
5138 {
5139 if (j != op
5140 && !operand_type_register_match(i.types[j],
5141 t->operand_types[j],
5142 type,
5143 t->operand_types[op]))
5144 goto bad_broadcast;
5145 }
5146 }
5147 }
5148 /* If broadcast is supported in this instruction, we need to check if
5149 operand of one-element size isn't specified without broadcast. */
5150 else if (t->opcode_modifier.broadcast && i.mem_operands)
5151 {
5152 /* Find memory operand. */
5153 for (op = 0; op < i.operands; op++)
5154 if (operand_type_check (i.types[op], anymem))
5155 break;
5156 gas_assert (op < i.operands);
5157 /* Check size of the memory operand. */
5158 if (t->operand_types[op].bitfield.dword
5159 ? i.types[op].bitfield.dword
5160 : i.types[op].bitfield.qword)
5161 {
5162 i.error = broadcast_needed;
5163 return 1;
5164 }
5165 }
5166 else
5167 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5168
5169 /* Check if requested masking is supported. */
5170 if (i.mask
5171 && (!t->opcode_modifier.masking
5172 || (i.mask->zeroing
5173 && t->opcode_modifier.masking == MERGING_MASKING)))
5174 {
5175 i.error = unsupported_masking;
5176 return 1;
5177 }
5178
5179 /* Check if masking is applied to dest operand. */
5180 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5181 {
5182 i.error = mask_not_on_destination;
5183 return 1;
5184 }
5185
5186 /* Check RC/SAE. */
5187 if (i.rounding)
5188 {
5189 if ((i.rounding->type != saeonly
5190 && !t->opcode_modifier.staticrounding)
5191 || (i.rounding->type == saeonly
5192 && (t->opcode_modifier.staticrounding
5193 || !t->opcode_modifier.sae)))
5194 {
5195 i.error = unsupported_rc_sae;
5196 return 1;
5197 }
5198 /* If the instruction has several immediate operands and one of
5199 them is rounding, the rounding operand should be the last
5200 immediate operand. */
5201 if (i.imm_operands > 1
5202 && i.rounding->operand != (int) (i.imm_operands - 1))
5203 {
5204 i.error = rc_sae_operand_not_last_imm;
5205 return 1;
5206 }
5207 }
5208
5209 /* Check vector Disp8 operand. */
5210 if (t->opcode_modifier.disp8memshift
5211 && i.disp_encoding != disp_encoding_32bit)
5212 {
5213 if (i.broadcast)
5214 i.memshift = t->operand_types[op].bitfield.dword ? 2 : 3;
5215 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5216 i.memshift = t->opcode_modifier.disp8memshift;
5217 else
5218 {
5219 const i386_operand_type *type = NULL;
5220
5221 i.memshift = 0;
5222 for (op = 0; op < i.operands; op++)
5223 if (operand_type_check (i.types[op], anymem))
5224 {
5225 if (t->operand_types[op].bitfield.xmmword
5226 + t->operand_types[op].bitfield.ymmword
5227 + t->operand_types[op].bitfield.zmmword <= 1)
5228 type = &t->operand_types[op];
5229 else if (!i.types[op].bitfield.unspecified)
5230 type = &i.types[op];
5231 }
5232 else if (i.types[op].bitfield.regsimd)
5233 {
5234 if (i.types[op].bitfield.zmmword)
5235 i.memshift = 6;
5236 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5237 i.memshift = 5;
5238 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5239 i.memshift = 4;
5240 }
5241
5242 if (type)
5243 {
5244 if (type->bitfield.zmmword)
5245 i.memshift = 6;
5246 else if (type->bitfield.ymmword)
5247 i.memshift = 5;
5248 else if (type->bitfield.xmmword)
5249 i.memshift = 4;
5250 }
5251
5252 /* For the check in fits_in_disp8(). */
5253 if (i.memshift == 0)
5254 i.memshift = -1;
5255 }
5256
5257 for (op = 0; op < i.operands; op++)
5258 if (operand_type_check (i.types[op], disp)
5259 && i.op[op].disps->X_op == O_constant)
5260 {
5261 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5262 {
5263 i.types[op].bitfield.disp8 = 1;
5264 return 0;
5265 }
5266 i.types[op].bitfield.disp8 = 0;
5267 }
5268 }
5269
5270 i.memshift = 0;
5271
5272 return 0;
5273 }
5274
5275 /* Check if operands are valid for the instruction. Update VEX
5276 operand types. */
5277
5278 static int
5279 VEX_check_operands (const insn_template *t)
5280 {
5281 if (i.vec_encoding == vex_encoding_evex)
5282 {
5283 /* This instruction must be encoded with EVEX prefix. */
5284 if (!is_evex_encoding (t))
5285 {
5286 i.error = unsupported;
5287 return 1;
5288 }
5289 return 0;
5290 }
5291
5292 if (!t->opcode_modifier.vex)
5293 {
5294 /* This instruction template doesn't have VEX prefix. */
5295 if (i.vec_encoding != vex_encoding_default)
5296 {
5297 i.error = unsupported;
5298 return 1;
5299 }
5300 return 0;
5301 }
5302
5303 /* Only check VEX_Imm4, which must be the first operand. */
5304 if (t->operand_types[0].bitfield.vec_imm4)
5305 {
5306 if (i.op[0].imms->X_op != O_constant
5307 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5308 {
5309 i.error = bad_imm4;
5310 return 1;
5311 }
5312
5313 /* Turn off Imm8 so that update_imm won't complain. */
5314 i.types[0] = vec_imm4;
5315 }
5316
5317 return 0;
5318 }
5319
5320 static const insn_template *
5321 match_template (char mnem_suffix)
5322 {
5323 /* Points to template once we've found it. */
5324 const insn_template *t;
5325 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5326 i386_operand_type overlap4;
5327 unsigned int found_reverse_match;
5328 i386_opcode_modifier suffix_check, mnemsuf_check;
5329 i386_operand_type operand_types [MAX_OPERANDS];
5330 int addr_prefix_disp;
5331 unsigned int j;
5332 unsigned int found_cpu_match, size_match;
5333 unsigned int check_register;
5334 enum i386_error specific_error = 0;
5335
5336 #if MAX_OPERANDS != 5
5337 # error "MAX_OPERANDS must be 5."
5338 #endif
5339
5340 found_reverse_match = 0;
5341 addr_prefix_disp = -1;
5342
5343 memset (&suffix_check, 0, sizeof (suffix_check));
5344 if (intel_syntax && i.broadcast)
5345 /* nothing */;
5346 else if (i.suffix == BYTE_MNEM_SUFFIX)
5347 suffix_check.no_bsuf = 1;
5348 else if (i.suffix == WORD_MNEM_SUFFIX)
5349 suffix_check.no_wsuf = 1;
5350 else if (i.suffix == SHORT_MNEM_SUFFIX)
5351 suffix_check.no_ssuf = 1;
5352 else if (i.suffix == LONG_MNEM_SUFFIX)
5353 suffix_check.no_lsuf = 1;
5354 else if (i.suffix == QWORD_MNEM_SUFFIX)
5355 suffix_check.no_qsuf = 1;
5356 else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5357 suffix_check.no_ldsuf = 1;
5358
5359 memset (&mnemsuf_check, 0, sizeof (mnemsuf_check));
5360 if (intel_syntax)
5361 {
5362 switch (mnem_suffix)
5363 {
5364 case BYTE_MNEM_SUFFIX: mnemsuf_check.no_bsuf = 1; break;
5365 case WORD_MNEM_SUFFIX: mnemsuf_check.no_wsuf = 1; break;
5366 case SHORT_MNEM_SUFFIX: mnemsuf_check.no_ssuf = 1; break;
5367 case LONG_MNEM_SUFFIX: mnemsuf_check.no_lsuf = 1; break;
5368 case QWORD_MNEM_SUFFIX: mnemsuf_check.no_qsuf = 1; break;
5369 }
5370 }
5371
5372 /* Must have right number of operands. */
5373 i.error = number_of_operands_mismatch;
5374
5375 for (t = current_templates->start; t < current_templates->end; t++)
5376 {
5377 addr_prefix_disp = -1;
5378
5379 if (i.operands != t->operands)
5380 continue;
5381
5382 /* Check processor support. */
5383 i.error = unsupported;
5384 found_cpu_match = (cpu_flags_match (t)
5385 == CPU_FLAGS_PERFECT_MATCH);
5386 if (!found_cpu_match)
5387 continue;
5388
5389 /* Check AT&T mnemonic. */
5390 i.error = unsupported_with_intel_mnemonic;
5391 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5392 continue;
5393
5394 /* Check AT&T/Intel syntax and Intel64/AMD64 ISA. */
5395 i.error = unsupported_syntax;
5396 if ((intel_syntax && t->opcode_modifier.attsyntax)
5397 || (!intel_syntax && t->opcode_modifier.intelsyntax)
5398 || (intel64 && t->opcode_modifier.amd64)
5399 || (!intel64 && t->opcode_modifier.intel64))
5400 continue;
5401
5402 /* Check the suffix, except for some instructions in intel mode. */
5403 i.error = invalid_instruction_suffix;
5404 if ((!intel_syntax || !t->opcode_modifier.ignoresize)
5405 && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5406 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5407 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5408 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5409 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5410 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
5411 continue;
5412 /* In Intel mode all mnemonic suffixes must be explicitly allowed. */
5413 if ((t->opcode_modifier.no_bsuf && mnemsuf_check.no_bsuf)
5414 || (t->opcode_modifier.no_wsuf && mnemsuf_check.no_wsuf)
5415 || (t->opcode_modifier.no_lsuf && mnemsuf_check.no_lsuf)
5416 || (t->opcode_modifier.no_ssuf && mnemsuf_check.no_ssuf)
5417 || (t->opcode_modifier.no_qsuf && mnemsuf_check.no_qsuf)
5418 || (t->opcode_modifier.no_ldsuf && mnemsuf_check.no_ldsuf))
5419 continue;
5420
5421 size_match = operand_size_match (t);
5422 if (!size_match)
5423 continue;
5424
5425 for (j = 0; j < MAX_OPERANDS; j++)
5426 operand_types[j] = t->operand_types[j];
5427
5428 /* In general, don't allow 64-bit operands in 32-bit mode. */
5429 if (i.suffix == QWORD_MNEM_SUFFIX
5430 && flag_code != CODE_64BIT
5431 && (intel_syntax
5432 ? (!t->opcode_modifier.ignoresize
5433 && !intel_float_operand (t->name))
5434 : intel_float_operand (t->name) != 2)
5435 && ((!operand_types[0].bitfield.regmmx
5436 && !operand_types[0].bitfield.regsimd)
5437 || (!operand_types[t->operands > 1].bitfield.regmmx
5438 && !operand_types[t->operands > 1].bitfield.regsimd))
5439 && (t->base_opcode != 0x0fc7
5440 || t->extension_opcode != 1 /* cmpxchg8b */))
5441 continue;
5442
5443 /* In general, don't allow 32-bit operands on pre-386. */
5444 else if (i.suffix == LONG_MNEM_SUFFIX
5445 && !cpu_arch_flags.bitfield.cpui386
5446 && (intel_syntax
5447 ? (!t->opcode_modifier.ignoresize
5448 && !intel_float_operand (t->name))
5449 : intel_float_operand (t->name) != 2)
5450 && ((!operand_types[0].bitfield.regmmx
5451 && !operand_types[0].bitfield.regsimd)
5452 || (!operand_types[t->operands > 1].bitfield.regmmx
5453 && !operand_types[t->operands > 1].bitfield.regsimd)))
5454 continue;
5455
5456 /* Do not verify operands when there are none. */
5457 else
5458 {
5459 if (!t->operands)
5460 /* We've found a match; break out of loop. */
5461 break;
5462 }
5463
5464 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
5465 into Disp32/Disp16/Disp32 operand. */
5466 if (i.prefix[ADDR_PREFIX] != 0)
5467 {
5468 /* There should be only one Disp operand. */
5469 switch (flag_code)
5470 {
5471 case CODE_16BIT:
5472 for (j = 0; j < MAX_OPERANDS; j++)
5473 {
5474 if (operand_types[j].bitfield.disp16)
5475 {
5476 addr_prefix_disp = j;
5477 operand_types[j].bitfield.disp32 = 1;
5478 operand_types[j].bitfield.disp16 = 0;
5479 break;
5480 }
5481 }
5482 break;
5483 case CODE_32BIT:
5484 for (j = 0; j < MAX_OPERANDS; j++)
5485 {
5486 if (operand_types[j].bitfield.disp32)
5487 {
5488 addr_prefix_disp = j;
5489 operand_types[j].bitfield.disp32 = 0;
5490 operand_types[j].bitfield.disp16 = 1;
5491 break;
5492 }
5493 }
5494 break;
5495 case CODE_64BIT:
5496 for (j = 0; j < MAX_OPERANDS; j++)
5497 {
5498 if (operand_types[j].bitfield.disp64)
5499 {
5500 addr_prefix_disp = j;
5501 operand_types[j].bitfield.disp64 = 0;
5502 operand_types[j].bitfield.disp32 = 1;
5503 break;
5504 }
5505 }
5506 break;
5507 }
5508 }
5509
5510 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5511 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5512 continue;
5513
5514 /* We check register size if needed. */
5515 if (t->opcode_modifier.checkregsize)
5516 {
5517 check_register = (1 << t->operands) - 1;
5518 if (i.broadcast)
5519 check_register &= ~(1 << i.broadcast->operand);
5520 }
5521 else
5522 check_register = 0;
5523
5524 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5525 switch (t->operands)
5526 {
5527 case 1:
5528 if (!operand_type_match (overlap0, i.types[0]))
5529 continue;
5530 break;
5531 case 2:
5532 /* xchg %eax, %eax is a special case. It is an alias for nop
5533 only in 32bit mode and we can use opcode 0x90. In 64bit
5534 mode, we can't use 0x90 for xchg %eax, %eax since it should
5535 zero-extend %eax to %rax. */
5536 if (flag_code == CODE_64BIT
5537 && t->base_opcode == 0x90
5538 && operand_type_equal (&i.types [0], &acc32)
5539 && operand_type_equal (&i.types [1], &acc32))
5540 continue;
5541 /* xrelease mov %eax, <disp> is another special case. It must not
5542 match the accumulator-only encoding of mov. */
5543 if (flag_code != CODE_64BIT
5544 && i.hle_prefix
5545 && t->base_opcode == 0xa0
5546 && i.types[0].bitfield.acc
5547 && operand_type_check (i.types[1], anymem))
5548 continue;
5549 if (!(size_match & MATCH_STRAIGHT))
5550 goto check_reverse;
5551 /* If we want store form, we reverse direction of operands. */
5552 if (i.dir_encoding == dir_encoding_store
5553 && t->opcode_modifier.d)
5554 goto check_reverse;
5555 /* Fall through. */
5556
5557 case 3:
5558 /* If we want store form, we skip the current load. */
5559 if (i.dir_encoding == dir_encoding_store
5560 && i.mem_operands == 0
5561 && t->opcode_modifier.load)
5562 continue;
5563 /* Fall through. */
5564 case 4:
5565 case 5:
5566 overlap1 = operand_type_and (i.types[1], operand_types[1]);
5567 if (!operand_type_match (overlap0, i.types[0])
5568 || !operand_type_match (overlap1, i.types[1])
5569 || ((check_register & 3) == 3
5570 && !operand_type_register_match (i.types[0],
5571 operand_types[0],
5572 i.types[1],
5573 operand_types[1])))
5574 {
5575 /* Check if other direction is valid ... */
5576 if (!t->opcode_modifier.d)
5577 continue;
5578
5579 check_reverse:
5580 if (!(size_match & MATCH_REVERSE))
5581 continue;
5582 /* Try reversing direction of operands. */
5583 overlap0 = operand_type_and (i.types[0], operand_types[1]);
5584 overlap1 = operand_type_and (i.types[1], operand_types[0]);
5585 if (!operand_type_match (overlap0, i.types[0])
5586 || !operand_type_match (overlap1, i.types[1])
5587 || (check_register
5588 && !operand_type_register_match (i.types[0],
5589 operand_types[1],
5590 i.types[1],
5591 operand_types[0])))
5592 {
5593 /* Does not match either direction. */
5594 continue;
5595 }
5596 /* found_reverse_match holds which of D or FloatR
5597 we've found. */
5598 if (!t->opcode_modifier.d)
5599 found_reverse_match = 0;
5600 else if (operand_types[0].bitfield.tbyte)
5601 found_reverse_match = Opcode_FloatD;
5602 else
5603 found_reverse_match = Opcode_D;
5604 if (t->opcode_modifier.floatr)
5605 found_reverse_match |= Opcode_FloatR;
5606 }
5607 else
5608 {
5609 /* Found a forward 2 operand match here. */
5610 switch (t->operands)
5611 {
5612 case 5:
5613 overlap4 = operand_type_and (i.types[4],
5614 operand_types[4]);
5615 /* Fall through. */
5616 case 4:
5617 overlap3 = operand_type_and (i.types[3],
5618 operand_types[3]);
5619 /* Fall through. */
5620 case 3:
5621 overlap2 = operand_type_and (i.types[2],
5622 operand_types[2]);
5623 break;
5624 }
5625
5626 switch (t->operands)
5627 {
5628 case 5:
5629 if (!operand_type_match (overlap4, i.types[4])
5630 || !operand_type_register_match (i.types[3],
5631 operand_types[3],
5632 i.types[4],
5633 operand_types[4]))
5634 continue;
5635 /* Fall through. */
5636 case 4:
5637 if (!operand_type_match (overlap3, i.types[3])
5638 || ((check_register & 0xa) == 0xa
5639 && !operand_type_register_match (i.types[1],
5640 operand_types[1],
5641 i.types[3],
5642 operand_types[3]))
5643 || ((check_register & 0xc) == 0xc
5644 && !operand_type_register_match (i.types[2],
5645 operand_types[2],
5646 i.types[3],
5647 operand_types[3])))
5648 continue;
5649 /* Fall through. */
5650 case 3:
5651 /* Here we make use of the fact that there are no
5652 reverse match 3 operand instructions. */
5653 if (!operand_type_match (overlap2, i.types[2])
5654 || ((check_register & 5) == 5
5655 && !operand_type_register_match (i.types[0],
5656 operand_types[0],
5657 i.types[2],
5658 operand_types[2]))
5659 || ((check_register & 6) == 6
5660 && !operand_type_register_match (i.types[1],
5661 operand_types[1],
5662 i.types[2],
5663 operand_types[2])))
5664 continue;
5665 break;
5666 }
5667 }
5668 /* Found either forward/reverse 2, 3 or 4 operand match here:
5669 slip through to break. */
5670 }
5671 if (!found_cpu_match)
5672 {
5673 found_reverse_match = 0;
5674 continue;
5675 }
5676
5677 /* Check if vector and VEX operands are valid. */
5678 if (check_VecOperands (t) || VEX_check_operands (t))
5679 {
5680 specific_error = i.error;
5681 continue;
5682 }
5683
5684 /* We've found a match; break out of loop. */
5685 break;
5686 }
5687
5688 if (t == current_templates->end)
5689 {
5690 /* We found no match. */
5691 const char *err_msg;
5692 switch (specific_error ? specific_error : i.error)
5693 {
5694 default:
5695 abort ();
5696 case operand_size_mismatch:
5697 err_msg = _("operand size mismatch");
5698 break;
5699 case operand_type_mismatch:
5700 err_msg = _("operand type mismatch");
5701 break;
5702 case register_type_mismatch:
5703 err_msg = _("register type mismatch");
5704 break;
5705 case number_of_operands_mismatch:
5706 err_msg = _("number of operands mismatch");
5707 break;
5708 case invalid_instruction_suffix:
5709 err_msg = _("invalid instruction suffix");
5710 break;
5711 case bad_imm4:
5712 err_msg = _("constant doesn't fit in 4 bits");
5713 break;
5714 case unsupported_with_intel_mnemonic:
5715 err_msg = _("unsupported with Intel mnemonic");
5716 break;
5717 case unsupported_syntax:
5718 err_msg = _("unsupported syntax");
5719 break;
5720 case unsupported:
5721 as_bad (_("unsupported instruction `%s'"),
5722 current_templates->start->name);
5723 return NULL;
5724 case invalid_vsib_address:
5725 err_msg = _("invalid VSIB address");
5726 break;
5727 case invalid_vector_register_set:
5728 err_msg = _("mask, index, and destination registers must be distinct");
5729 break;
5730 case unsupported_vector_index_register:
5731 err_msg = _("unsupported vector index register");
5732 break;
5733 case unsupported_broadcast:
5734 err_msg = _("unsupported broadcast");
5735 break;
5736 case broadcast_not_on_src_operand:
5737 err_msg = _("broadcast not on source memory operand");
5738 break;
5739 case broadcast_needed:
5740 err_msg = _("broadcast is needed for operand of such type");
5741 break;
5742 case unsupported_masking:
5743 err_msg = _("unsupported masking");
5744 break;
5745 case mask_not_on_destination:
5746 err_msg = _("mask not on destination operand");
5747 break;
5748 case no_default_mask:
5749 err_msg = _("default mask isn't allowed");
5750 break;
5751 case unsupported_rc_sae:
5752 err_msg = _("unsupported static rounding/sae");
5753 break;
5754 case rc_sae_operand_not_last_imm:
5755 if (intel_syntax)
5756 err_msg = _("RC/SAE operand must precede immediate operands");
5757 else
5758 err_msg = _("RC/SAE operand must follow immediate operands");
5759 break;
5760 case invalid_register_operand:
5761 err_msg = _("invalid register operand");
5762 break;
5763 }
5764 as_bad (_("%s for `%s'"), err_msg,
5765 current_templates->start->name);
5766 return NULL;
5767 }
5768
5769 if (!quiet_warnings)
5770 {
5771 if (!intel_syntax
5772 && (i.types[0].bitfield.jumpabsolute
5773 != operand_types[0].bitfield.jumpabsolute))
5774 {
5775 as_warn (_("indirect %s without `*'"), t->name);
5776 }
5777
5778 if (t->opcode_modifier.isprefix
5779 && t->opcode_modifier.ignoresize)
5780 {
5781 /* Warn them that a data or address size prefix doesn't
5782 affect assembly of the next line of code. */
5783 as_warn (_("stand-alone `%s' prefix"), t->name);
5784 }
5785 }
5786
5787 /* Copy the template we found. */
5788 i.tm = *t;
5789
5790 if (addr_prefix_disp != -1)
5791 i.tm.operand_types[addr_prefix_disp]
5792 = operand_types[addr_prefix_disp];
5793
5794 if (found_reverse_match)
5795 {
5796 /* If we found a reverse match we must alter the opcode
5797 direction bit. found_reverse_match holds bits to change
5798 (different for int & float insns). */
5799
5800 i.tm.base_opcode ^= found_reverse_match;
5801
5802 i.tm.operand_types[0] = operand_types[1];
5803 i.tm.operand_types[1] = operand_types[0];
5804 }
5805
5806 return t;
5807 }
5808
5809 static int
5810 check_string (void)
5811 {
5812 int mem_op = operand_type_check (i.types[0], anymem) ? 0 : 1;
5813 if (i.tm.operand_types[mem_op].bitfield.esseg)
5814 {
5815 if (i.seg[0] != NULL && i.seg[0] != &es)
5816 {
5817 as_bad (_("`%s' operand %d must use `%ses' segment"),
5818 i.tm.name,
5819 mem_op + 1,
5820 register_prefix);
5821 return 0;
5822 }
5823 /* There's only ever one segment override allowed per instruction.
5824 This instruction possibly has a legal segment override on the
5825 second operand, so copy the segment to where non-string
5826 instructions store it, allowing common code. */
5827 i.seg[0] = i.seg[1];
5828 }
5829 else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
5830 {
5831 if (i.seg[1] != NULL && i.seg[1] != &es)
5832 {
5833 as_bad (_("`%s' operand %d must use `%ses' segment"),
5834 i.tm.name,
5835 mem_op + 2,
5836 register_prefix);
5837 return 0;
5838 }
5839 }
5840 return 1;
5841 }
5842
5843 static int
5844 process_suffix (void)
5845 {
5846 /* If matched instruction specifies an explicit instruction mnemonic
5847 suffix, use it. */
5848 if (i.tm.opcode_modifier.size16)
5849 i.suffix = WORD_MNEM_SUFFIX;
5850 else if (i.tm.opcode_modifier.size32)
5851 i.suffix = LONG_MNEM_SUFFIX;
5852 else if (i.tm.opcode_modifier.size64)
5853 i.suffix = QWORD_MNEM_SUFFIX;
5854 else if (i.reg_operands)
5855 {
5856 /* If there's no instruction mnemonic suffix we try to invent one
5857 based on register operands. */
5858 if (!i.suffix)
5859 {
5860 /* We take i.suffix from the last register operand specified,
5861 Destination register type is more significant than source
5862 register type. crc32 in SSE4.2 prefers source register
5863 type. */
5864 if (i.tm.base_opcode == 0xf20f38f1)
5865 {
5866 if (i.types[0].bitfield.reg && i.types[0].bitfield.word)
5867 i.suffix = WORD_MNEM_SUFFIX;
5868 else if (i.types[0].bitfield.reg && i.types[0].bitfield.dword)
5869 i.suffix = LONG_MNEM_SUFFIX;
5870 else if (i.types[0].bitfield.reg && i.types[0].bitfield.qword)
5871 i.suffix = QWORD_MNEM_SUFFIX;
5872 }
5873 else if (i.tm.base_opcode == 0xf20f38f0)
5874 {
5875 if (i.types[0].bitfield.reg && i.types[0].bitfield.byte)
5876 i.suffix = BYTE_MNEM_SUFFIX;
5877 }
5878
5879 if (!i.suffix)
5880 {
5881 int op;
5882
5883 if (i.tm.base_opcode == 0xf20f38f1
5884 || i.tm.base_opcode == 0xf20f38f0)
5885 {
5886 /* We have to know the operand size for crc32. */
5887 as_bad (_("ambiguous memory operand size for `%s`"),
5888 i.tm.name);
5889 return 0;
5890 }
5891
5892 for (op = i.operands; --op >= 0;)
5893 if (!i.tm.operand_types[op].bitfield.inoutportreg
5894 && !i.tm.operand_types[op].bitfield.shiftcount)
5895 {
5896 if (!i.types[op].bitfield.reg)
5897 continue;
5898 if (i.types[op].bitfield.byte)
5899 i.suffix = BYTE_MNEM_SUFFIX;
5900 else if (i.types[op].bitfield.word)
5901 i.suffix = WORD_MNEM_SUFFIX;
5902 else if (i.types[op].bitfield.dword)
5903 i.suffix = LONG_MNEM_SUFFIX;
5904 else if (i.types[op].bitfield.qword)
5905 i.suffix = QWORD_MNEM_SUFFIX;
5906 else
5907 continue;
5908 break;
5909 }
5910 }
5911 }
5912 else if (i.suffix == BYTE_MNEM_SUFFIX)
5913 {
5914 if (intel_syntax
5915 && i.tm.opcode_modifier.ignoresize
5916 && i.tm.opcode_modifier.no_bsuf)
5917 i.suffix = 0;
5918 else if (!check_byte_reg ())
5919 return 0;
5920 }
5921 else if (i.suffix == LONG_MNEM_SUFFIX)
5922 {
5923 if (intel_syntax
5924 && i.tm.opcode_modifier.ignoresize
5925 && i.tm.opcode_modifier.no_lsuf
5926 && !i.tm.opcode_modifier.todword
5927 && !i.tm.opcode_modifier.toqword)
5928 i.suffix = 0;
5929 else if (!check_long_reg ())
5930 return 0;
5931 }
5932 else if (i.suffix == QWORD_MNEM_SUFFIX)
5933 {
5934 if (intel_syntax
5935 && i.tm.opcode_modifier.ignoresize
5936 && i.tm.opcode_modifier.no_qsuf
5937 && !i.tm.opcode_modifier.todword
5938 && !i.tm.opcode_modifier.toqword)
5939 i.suffix = 0;
5940 else if (!check_qword_reg ())
5941 return 0;
5942 }
5943 else if (i.suffix == WORD_MNEM_SUFFIX)
5944 {
5945 if (intel_syntax
5946 && i.tm.opcode_modifier.ignoresize
5947 && i.tm.opcode_modifier.no_wsuf)
5948 i.suffix = 0;
5949 else if (!check_word_reg ())
5950 return 0;
5951 }
5952 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
5953 /* Do nothing if the instruction is going to ignore the prefix. */
5954 ;
5955 else
5956 abort ();
5957 }
5958 else if (i.tm.opcode_modifier.defaultsize
5959 && !i.suffix
5960 /* exclude fldenv/frstor/fsave/fstenv */
5961 && i.tm.opcode_modifier.no_ssuf)
5962 {
5963 i.suffix = stackop_size;
5964 }
5965 else if (intel_syntax
5966 && !i.suffix
5967 && (i.tm.operand_types[0].bitfield.jumpabsolute
5968 || i.tm.opcode_modifier.jumpbyte
5969 || i.tm.opcode_modifier.jumpintersegment
5970 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
5971 && i.tm.extension_opcode <= 3)))
5972 {
5973 switch (flag_code)
5974 {
5975 case CODE_64BIT:
5976 if (!i.tm.opcode_modifier.no_qsuf)
5977 {
5978 i.suffix = QWORD_MNEM_SUFFIX;
5979 break;
5980 }
5981 /* Fall through. */
5982 case CODE_32BIT:
5983 if (!i.tm.opcode_modifier.no_lsuf)
5984 i.suffix = LONG_MNEM_SUFFIX;
5985 break;
5986 case CODE_16BIT:
5987 if (!i.tm.opcode_modifier.no_wsuf)
5988 i.suffix = WORD_MNEM_SUFFIX;
5989 break;
5990 }
5991 }
5992
5993 if (!i.suffix)
5994 {
5995 if (!intel_syntax)
5996 {
5997 if (i.tm.opcode_modifier.w)
5998 {
5999 as_bad (_("no instruction mnemonic suffix given and "
6000 "no register operands; can't size instruction"));
6001 return 0;
6002 }
6003 }
6004 else
6005 {
6006 unsigned int suffixes;
6007
6008 suffixes = !i.tm.opcode_modifier.no_bsuf;
6009 if (!i.tm.opcode_modifier.no_wsuf)
6010 suffixes |= 1 << 1;
6011 if (!i.tm.opcode_modifier.no_lsuf)
6012 suffixes |= 1 << 2;
6013 if (!i.tm.opcode_modifier.no_ldsuf)
6014 suffixes |= 1 << 3;
6015 if (!i.tm.opcode_modifier.no_ssuf)
6016 suffixes |= 1 << 4;
6017 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6018 suffixes |= 1 << 5;
6019
6020 /* There are more than suffix matches. */
6021 if (i.tm.opcode_modifier.w
6022 || ((suffixes & (suffixes - 1))
6023 && !i.tm.opcode_modifier.defaultsize
6024 && !i.tm.opcode_modifier.ignoresize))
6025 {
6026 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6027 return 0;
6028 }
6029 }
6030 }
6031
6032 /* Change the opcode based on the operand size given by i.suffix. */
6033 switch (i.suffix)
6034 {
6035 /* Size floating point instruction. */
6036 case LONG_MNEM_SUFFIX:
6037 if (i.tm.opcode_modifier.floatmf)
6038 {
6039 i.tm.base_opcode ^= 4;
6040 break;
6041 }
6042 /* fall through */
6043 case WORD_MNEM_SUFFIX:
6044 case QWORD_MNEM_SUFFIX:
6045 /* It's not a byte, select word/dword operation. */
6046 if (i.tm.opcode_modifier.w)
6047 {
6048 if (i.tm.opcode_modifier.shortform)
6049 i.tm.base_opcode |= 8;
6050 else
6051 i.tm.base_opcode |= 1;
6052 }
6053 /* fall through */
6054 case SHORT_MNEM_SUFFIX:
6055 /* Now select between word & dword operations via the operand
6056 size prefix, except for instructions that will ignore this
6057 prefix anyway. */
6058 if (i.reg_operands > 0
6059 && i.types[0].bitfield.reg
6060 && i.tm.opcode_modifier.addrprefixopreg
6061 && (i.tm.opcode_modifier.immext
6062 || i.operands == 1))
6063 {
6064 /* The address size override prefix changes the size of the
6065 first operand. */
6066 if ((flag_code == CODE_32BIT
6067 && i.op[0].regs->reg_type.bitfield.word)
6068 || (flag_code != CODE_32BIT
6069 && i.op[0].regs->reg_type.bitfield.dword))
6070 if (!add_prefix (ADDR_PREFIX_OPCODE))
6071 return 0;
6072 }
6073 else if (i.suffix != QWORD_MNEM_SUFFIX
6074 && !i.tm.opcode_modifier.ignoresize
6075 && !i.tm.opcode_modifier.floatmf
6076 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6077 || (flag_code == CODE_64BIT
6078 && i.tm.opcode_modifier.jumpbyte)))
6079 {
6080 unsigned int prefix = DATA_PREFIX_OPCODE;
6081
6082 if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
6083 prefix = ADDR_PREFIX_OPCODE;
6084
6085 if (!add_prefix (prefix))
6086 return 0;
6087 }
6088
6089 /* Set mode64 for an operand. */
6090 if (i.suffix == QWORD_MNEM_SUFFIX
6091 && flag_code == CODE_64BIT
6092 && !i.tm.opcode_modifier.norex64
6093 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6094 need rex64. */
6095 && ! (i.operands == 2
6096 && i.tm.base_opcode == 0x90
6097 && i.tm.extension_opcode == None
6098 && operand_type_equal (&i.types [0], &acc64)
6099 && operand_type_equal (&i.types [1], &acc64)))
6100 i.rex |= REX_W;
6101
6102 break;
6103 }
6104
6105 if (i.reg_operands != 0
6106 && i.operands > 1
6107 && i.tm.opcode_modifier.addrprefixopreg
6108 && !i.tm.opcode_modifier.immext)
6109 {
6110 /* Check invalid register operand when the address size override
6111 prefix changes the size of register operands. */
6112 unsigned int op;
6113 enum { need_word, need_dword, need_qword } need;
6114
6115 if (flag_code == CODE_32BIT)
6116 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6117 else
6118 {
6119 if (i.prefix[ADDR_PREFIX])
6120 need = need_dword;
6121 else
6122 need = flag_code == CODE_64BIT ? need_qword : need_word;
6123 }
6124
6125 for (op = 0; op < i.operands; op++)
6126 if (i.types[op].bitfield.reg
6127 && ((need == need_word
6128 && !i.op[op].regs->reg_type.bitfield.word)
6129 || (need == need_dword
6130 && !i.op[op].regs->reg_type.bitfield.dword)
6131 || (need == need_qword
6132 && !i.op[op].regs->reg_type.bitfield.qword)))
6133 {
6134 as_bad (_("invalid register operand size for `%s'"),
6135 i.tm.name);
6136 return 0;
6137 }
6138 }
6139
6140 return 1;
6141 }
6142
6143 static int
6144 check_byte_reg (void)
6145 {
6146 int op;
6147
6148 for (op = i.operands; --op >= 0;)
6149 {
6150 /* Skip non-register operands. */
6151 if (!i.types[op].bitfield.reg)
6152 continue;
6153
6154 /* If this is an eight bit register, it's OK. If it's the 16 or
6155 32 bit version of an eight bit register, we will just use the
6156 low portion, and that's OK too. */
6157 if (i.types[op].bitfield.byte)
6158 continue;
6159
6160 /* I/O port address operands are OK too. */
6161 if (i.tm.operand_types[op].bitfield.inoutportreg)
6162 continue;
6163
6164 /* crc32 doesn't generate this warning. */
6165 if (i.tm.base_opcode == 0xf20f38f0)
6166 continue;
6167
6168 if ((i.types[op].bitfield.word
6169 || i.types[op].bitfield.dword
6170 || i.types[op].bitfield.qword)
6171 && i.op[op].regs->reg_num < 4
6172 /* Prohibit these changes in 64bit mode, since the lowering
6173 would be more complicated. */
6174 && flag_code != CODE_64BIT)
6175 {
6176 #if REGISTER_WARNINGS
6177 if (!quiet_warnings)
6178 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6179 register_prefix,
6180 (i.op[op].regs + (i.types[op].bitfield.word
6181 ? REGNAM_AL - REGNAM_AX
6182 : REGNAM_AL - REGNAM_EAX))->reg_name,
6183 register_prefix,
6184 i.op[op].regs->reg_name,
6185 i.suffix);
6186 #endif
6187 continue;
6188 }
6189 /* Any other register is bad. */
6190 if (i.types[op].bitfield.reg
6191 || i.types[op].bitfield.regmmx
6192 || i.types[op].bitfield.regsimd
6193 || i.types[op].bitfield.sreg2
6194 || i.types[op].bitfield.sreg3
6195 || i.types[op].bitfield.control
6196 || i.types[op].bitfield.debug
6197 || i.types[op].bitfield.test)
6198 {
6199 as_bad (_("`%s%s' not allowed with `%s%c'"),
6200 register_prefix,
6201 i.op[op].regs->reg_name,
6202 i.tm.name,
6203 i.suffix);
6204 return 0;
6205 }
6206 }
6207 return 1;
6208 }
6209
6210 static int
6211 check_long_reg (void)
6212 {
6213 int op;
6214
6215 for (op = i.operands; --op >= 0;)
6216 /* Skip non-register operands. */
6217 if (!i.types[op].bitfield.reg)
6218 continue;
6219 /* Reject eight bit registers, except where the template requires
6220 them. (eg. movzb) */
6221 else if (i.types[op].bitfield.byte
6222 && (i.tm.operand_types[op].bitfield.reg
6223 || i.tm.operand_types[op].bitfield.acc)
6224 && (i.tm.operand_types[op].bitfield.word
6225 || i.tm.operand_types[op].bitfield.dword))
6226 {
6227 as_bad (_("`%s%s' not allowed with `%s%c'"),
6228 register_prefix,
6229 i.op[op].regs->reg_name,
6230 i.tm.name,
6231 i.suffix);
6232 return 0;
6233 }
6234 /* Warn if the e prefix on a general reg is missing. */
6235 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6236 && i.types[op].bitfield.word
6237 && (i.tm.operand_types[op].bitfield.reg
6238 || i.tm.operand_types[op].bitfield.acc)
6239 && i.tm.operand_types[op].bitfield.dword)
6240 {
6241 /* Prohibit these changes in the 64bit mode, since the
6242 lowering is more complicated. */
6243 if (flag_code == CODE_64BIT)
6244 {
6245 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6246 register_prefix, i.op[op].regs->reg_name,
6247 i.suffix);
6248 return 0;
6249 }
6250 #if REGISTER_WARNINGS
6251 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6252 register_prefix,
6253 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6254 register_prefix, i.op[op].regs->reg_name, i.suffix);
6255 #endif
6256 }
6257 /* Warn if the r prefix on a general reg is present. */
6258 else if (i.types[op].bitfield.qword
6259 && (i.tm.operand_types[op].bitfield.reg
6260 || i.tm.operand_types[op].bitfield.acc)
6261 && i.tm.operand_types[op].bitfield.dword)
6262 {
6263 if (intel_syntax
6264 && i.tm.opcode_modifier.toqword
6265 && !i.types[0].bitfield.regsimd)
6266 {
6267 /* Convert to QWORD. We want REX byte. */
6268 i.suffix = QWORD_MNEM_SUFFIX;
6269 }
6270 else
6271 {
6272 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6273 register_prefix, i.op[op].regs->reg_name,
6274 i.suffix);
6275 return 0;
6276 }
6277 }
6278 return 1;
6279 }
6280
6281 static int
6282 check_qword_reg (void)
6283 {
6284 int op;
6285
6286 for (op = i.operands; --op >= 0; )
6287 /* Skip non-register operands. */
6288 if (!i.types[op].bitfield.reg)
6289 continue;
6290 /* Reject eight bit registers, except where the template requires
6291 them. (eg. movzb) */
6292 else if (i.types[op].bitfield.byte
6293 && (i.tm.operand_types[op].bitfield.reg
6294 || i.tm.operand_types[op].bitfield.acc)
6295 && (i.tm.operand_types[op].bitfield.word
6296 || i.tm.operand_types[op].bitfield.dword))
6297 {
6298 as_bad (_("`%s%s' not allowed with `%s%c'"),
6299 register_prefix,
6300 i.op[op].regs->reg_name,
6301 i.tm.name,
6302 i.suffix);
6303 return 0;
6304 }
6305 /* Warn if the r prefix on a general reg is missing. */
6306 else if ((i.types[op].bitfield.word
6307 || i.types[op].bitfield.dword)
6308 && (i.tm.operand_types[op].bitfield.reg
6309 || i.tm.operand_types[op].bitfield.acc)
6310 && i.tm.operand_types[op].bitfield.qword)
6311 {
6312 /* Prohibit these changes in the 64bit mode, since the
6313 lowering is more complicated. */
6314 if (intel_syntax
6315 && i.tm.opcode_modifier.todword
6316 && !i.types[0].bitfield.regsimd)
6317 {
6318 /* Convert to DWORD. We don't want REX byte. */
6319 i.suffix = LONG_MNEM_SUFFIX;
6320 }
6321 else
6322 {
6323 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6324 register_prefix, i.op[op].regs->reg_name,
6325 i.suffix);
6326 return 0;
6327 }
6328 }
6329 return 1;
6330 }
6331
6332 static int
6333 check_word_reg (void)
6334 {
6335 int op;
6336 for (op = i.operands; --op >= 0;)
6337 /* Skip non-register operands. */
6338 if (!i.types[op].bitfield.reg)
6339 continue;
6340 /* Reject eight bit registers, except where the template requires
6341 them. (eg. movzb) */
6342 else if (i.types[op].bitfield.byte
6343 && (i.tm.operand_types[op].bitfield.reg
6344 || i.tm.operand_types[op].bitfield.acc)
6345 && (i.tm.operand_types[op].bitfield.word
6346 || i.tm.operand_types[op].bitfield.dword))
6347 {
6348 as_bad (_("`%s%s' not allowed with `%s%c'"),
6349 register_prefix,
6350 i.op[op].regs->reg_name,
6351 i.tm.name,
6352 i.suffix);
6353 return 0;
6354 }
6355 /* Warn if the e or r prefix on a general reg is present. */
6356 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6357 && (i.types[op].bitfield.dword
6358 || i.types[op].bitfield.qword)
6359 && (i.tm.operand_types[op].bitfield.reg
6360 || i.tm.operand_types[op].bitfield.acc)
6361 && i.tm.operand_types[op].bitfield.word)
6362 {
6363 /* Prohibit these changes in the 64bit mode, since the
6364 lowering is more complicated. */
6365 if (flag_code == CODE_64BIT)
6366 {
6367 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6368 register_prefix, i.op[op].regs->reg_name,
6369 i.suffix);
6370 return 0;
6371 }
6372 #if REGISTER_WARNINGS
6373 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6374 register_prefix,
6375 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6376 register_prefix, i.op[op].regs->reg_name, i.suffix);
6377 #endif
6378 }
6379 return 1;
6380 }
6381
6382 static int
6383 update_imm (unsigned int j)
6384 {
6385 i386_operand_type overlap = i.types[j];
6386 if ((overlap.bitfield.imm8
6387 || overlap.bitfield.imm8s
6388 || overlap.bitfield.imm16
6389 || overlap.bitfield.imm32
6390 || overlap.bitfield.imm32s
6391 || overlap.bitfield.imm64)
6392 && !operand_type_equal (&overlap, &imm8)
6393 && !operand_type_equal (&overlap, &imm8s)
6394 && !operand_type_equal (&overlap, &imm16)
6395 && !operand_type_equal (&overlap, &imm32)
6396 && !operand_type_equal (&overlap, &imm32s)
6397 && !operand_type_equal (&overlap, &imm64))
6398 {
6399 if (i.suffix)
6400 {
6401 i386_operand_type temp;
6402
6403 operand_type_set (&temp, 0);
6404 if (i.suffix == BYTE_MNEM_SUFFIX)
6405 {
6406 temp.bitfield.imm8 = overlap.bitfield.imm8;
6407 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6408 }
6409 else if (i.suffix == WORD_MNEM_SUFFIX)
6410 temp.bitfield.imm16 = overlap.bitfield.imm16;
6411 else if (i.suffix == QWORD_MNEM_SUFFIX)
6412 {
6413 temp.bitfield.imm64 = overlap.bitfield.imm64;
6414 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6415 }
6416 else
6417 temp.bitfield.imm32 = overlap.bitfield.imm32;
6418 overlap = temp;
6419 }
6420 else if (operand_type_equal (&overlap, &imm16_32_32s)
6421 || operand_type_equal (&overlap, &imm16_32)
6422 || operand_type_equal (&overlap, &imm16_32s))
6423 {
6424 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6425 overlap = imm16;
6426 else
6427 overlap = imm32s;
6428 }
6429 if (!operand_type_equal (&overlap, &imm8)
6430 && !operand_type_equal (&overlap, &imm8s)
6431 && !operand_type_equal (&overlap, &imm16)
6432 && !operand_type_equal (&overlap, &imm32)
6433 && !operand_type_equal (&overlap, &imm32s)
6434 && !operand_type_equal (&overlap, &imm64))
6435 {
6436 as_bad (_("no instruction mnemonic suffix given; "
6437 "can't determine immediate size"));
6438 return 0;
6439 }
6440 }
6441 i.types[j] = overlap;
6442
6443 return 1;
6444 }
6445
6446 static int
6447 finalize_imm (void)
6448 {
6449 unsigned int j, n;
6450
6451 /* Update the first 2 immediate operands. */
6452 n = i.operands > 2 ? 2 : i.operands;
6453 if (n)
6454 {
6455 for (j = 0; j < n; j++)
6456 if (update_imm (j) == 0)
6457 return 0;
6458
6459 /* The 3rd operand can't be immediate operand. */
6460 gas_assert (operand_type_check (i.types[2], imm) == 0);
6461 }
6462
6463 return 1;
6464 }
6465
6466 static int
6467 process_operands (void)
6468 {
6469 /* Default segment register this instruction will use for memory
6470 accesses. 0 means unknown. This is only for optimizing out
6471 unnecessary segment overrides. */
6472 const seg_entry *default_seg = 0;
6473
6474 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6475 {
6476 unsigned int dupl = i.operands;
6477 unsigned int dest = dupl - 1;
6478 unsigned int j;
6479
6480 /* The destination must be an xmm register. */
6481 gas_assert (i.reg_operands
6482 && MAX_OPERANDS > dupl
6483 && operand_type_equal (&i.types[dest], &regxmm));
6484
6485 if (i.tm.operand_types[0].bitfield.acc
6486 && i.tm.operand_types[0].bitfield.xmmword)
6487 {
6488 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6489 {
6490 /* Keep xmm0 for instructions with VEX prefix and 3
6491 sources. */
6492 i.tm.operand_types[0].bitfield.acc = 0;
6493 i.tm.operand_types[0].bitfield.regsimd = 1;
6494 goto duplicate;
6495 }
6496 else
6497 {
6498 /* We remove the first xmm0 and keep the number of
6499 operands unchanged, which in fact duplicates the
6500 destination. */
6501 for (j = 1; j < i.operands; j++)
6502 {
6503 i.op[j - 1] = i.op[j];
6504 i.types[j - 1] = i.types[j];
6505 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6506 }
6507 }
6508 }
6509 else if (i.tm.opcode_modifier.implicit1stxmm0)
6510 {
6511 gas_assert ((MAX_OPERANDS - 1) > dupl
6512 && (i.tm.opcode_modifier.vexsources
6513 == VEX3SOURCES));
6514
6515 /* Add the implicit xmm0 for instructions with VEX prefix
6516 and 3 sources. */
6517 for (j = i.operands; j > 0; j--)
6518 {
6519 i.op[j] = i.op[j - 1];
6520 i.types[j] = i.types[j - 1];
6521 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6522 }
6523 i.op[0].regs
6524 = (const reg_entry *) hash_find (reg_hash, "xmm0");
6525 i.types[0] = regxmm;
6526 i.tm.operand_types[0] = regxmm;
6527
6528 i.operands += 2;
6529 i.reg_operands += 2;
6530 i.tm.operands += 2;
6531
6532 dupl++;
6533 dest++;
6534 i.op[dupl] = i.op[dest];
6535 i.types[dupl] = i.types[dest];
6536 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6537 }
6538 else
6539 {
6540 duplicate:
6541 i.operands++;
6542 i.reg_operands++;
6543 i.tm.operands++;
6544
6545 i.op[dupl] = i.op[dest];
6546 i.types[dupl] = i.types[dest];
6547 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6548 }
6549
6550 if (i.tm.opcode_modifier.immext)
6551 process_immext ();
6552 }
6553 else if (i.tm.operand_types[0].bitfield.acc
6554 && i.tm.operand_types[0].bitfield.xmmword)
6555 {
6556 unsigned int j;
6557
6558 for (j = 1; j < i.operands; j++)
6559 {
6560 i.op[j - 1] = i.op[j];
6561 i.types[j - 1] = i.types[j];
6562
6563 /* We need to adjust fields in i.tm since they are used by
6564 build_modrm_byte. */
6565 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
6566 }
6567
6568 i.operands--;
6569 i.reg_operands--;
6570 i.tm.operands--;
6571 }
6572 else if (i.tm.opcode_modifier.implicitquadgroup)
6573 {
6574 unsigned int regnum, first_reg_in_group, last_reg_in_group;
6575
6576 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
6577 gas_assert (i.operands >= 2 && i.types[1].bitfield.regsimd);
6578 regnum = register_number (i.op[1].regs);
6579 first_reg_in_group = regnum & ~3;
6580 last_reg_in_group = first_reg_in_group + 3;
6581 if (regnum != first_reg_in_group)
6582 as_warn (_("source register `%s%s' implicitly denotes"
6583 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
6584 register_prefix, i.op[1].regs->reg_name,
6585 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
6586 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
6587 i.tm.name);
6588 }
6589 else if (i.tm.opcode_modifier.regkludge)
6590 {
6591 /* The imul $imm, %reg instruction is converted into
6592 imul $imm, %reg, %reg, and the clr %reg instruction
6593 is converted into xor %reg, %reg. */
6594
6595 unsigned int first_reg_op;
6596
6597 if (operand_type_check (i.types[0], reg))
6598 first_reg_op = 0;
6599 else
6600 first_reg_op = 1;
6601 /* Pretend we saw the extra register operand. */
6602 gas_assert (i.reg_operands == 1
6603 && i.op[first_reg_op + 1].regs == 0);
6604 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
6605 i.types[first_reg_op + 1] = i.types[first_reg_op];
6606 i.operands++;
6607 i.reg_operands++;
6608 }
6609
6610 if (i.tm.opcode_modifier.shortform)
6611 {
6612 if (i.types[0].bitfield.sreg2
6613 || i.types[0].bitfield.sreg3)
6614 {
6615 if (i.tm.base_opcode == POP_SEG_SHORT
6616 && i.op[0].regs->reg_num == 1)
6617 {
6618 as_bad (_("you can't `pop %scs'"), register_prefix);
6619 return 0;
6620 }
6621 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
6622 if ((i.op[0].regs->reg_flags & RegRex) != 0)
6623 i.rex |= REX_B;
6624 }
6625 else
6626 {
6627 /* The register or float register operand is in operand
6628 0 or 1. */
6629 unsigned int op;
6630
6631 if ((i.types[0].bitfield.reg && i.types[0].bitfield.tbyte)
6632 || operand_type_check (i.types[0], reg))
6633 op = 0;
6634 else
6635 op = 1;
6636 /* Register goes in low 3 bits of opcode. */
6637 i.tm.base_opcode |= i.op[op].regs->reg_num;
6638 if ((i.op[op].regs->reg_flags & RegRex) != 0)
6639 i.rex |= REX_B;
6640 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
6641 {
6642 /* Warn about some common errors, but press on regardless.
6643 The first case can be generated by gcc (<= 2.8.1). */
6644 if (i.operands == 2)
6645 {
6646 /* Reversed arguments on faddp, fsubp, etc. */
6647 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
6648 register_prefix, i.op[!intel_syntax].regs->reg_name,
6649 register_prefix, i.op[intel_syntax].regs->reg_name);
6650 }
6651 else
6652 {
6653 /* Extraneous `l' suffix on fp insn. */
6654 as_warn (_("translating to `%s %s%s'"), i.tm.name,
6655 register_prefix, i.op[0].regs->reg_name);
6656 }
6657 }
6658 }
6659 }
6660 else if (i.tm.opcode_modifier.modrm)
6661 {
6662 /* The opcode is completed (modulo i.tm.extension_opcode which
6663 must be put into the modrm byte). Now, we make the modrm and
6664 index base bytes based on all the info we've collected. */
6665
6666 default_seg = build_modrm_byte ();
6667 }
6668 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
6669 {
6670 default_seg = &ds;
6671 }
6672 else if (i.tm.opcode_modifier.isstring)
6673 {
6674 /* For the string instructions that allow a segment override
6675 on one of their operands, the default segment is ds. */
6676 default_seg = &ds;
6677 }
6678
6679 if (i.tm.base_opcode == 0x8d /* lea */
6680 && i.seg[0]
6681 && !quiet_warnings)
6682 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
6683
6684 /* If a segment was explicitly specified, and the specified segment
6685 is not the default, use an opcode prefix to select it. If we
6686 never figured out what the default segment is, then default_seg
6687 will be zero at this point, and the specified segment prefix will
6688 always be used. */
6689 if ((i.seg[0]) && (i.seg[0] != default_seg))
6690 {
6691 if (!add_prefix (i.seg[0]->seg_prefix))
6692 return 0;
6693 }
6694 return 1;
6695 }
6696
6697 static const seg_entry *
6698 build_modrm_byte (void)
6699 {
6700 const seg_entry *default_seg = 0;
6701 unsigned int source, dest;
6702 int vex_3_sources;
6703
6704 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
6705 if (vex_3_sources)
6706 {
6707 unsigned int nds, reg_slot;
6708 expressionS *exp;
6709
6710 dest = i.operands - 1;
6711 nds = dest - 1;
6712
6713 /* There are 2 kinds of instructions:
6714 1. 5 operands: 4 register operands or 3 register operands
6715 plus 1 memory operand plus one Vec_Imm4 operand, VexXDS, and
6716 VexW0 or VexW1. The destination must be either XMM, YMM or
6717 ZMM register.
6718 2. 4 operands: 4 register operands or 3 register operands
6719 plus 1 memory operand, with VexXDS. */
6720 gas_assert ((i.reg_operands == 4
6721 || (i.reg_operands == 3 && i.mem_operands == 1))
6722 && i.tm.opcode_modifier.vexvvvv == VEXXDS
6723 && i.tm.opcode_modifier.vexw
6724 && i.tm.operand_types[dest].bitfield.regsimd);
6725
6726 /* If VexW1 is set, the first non-immediate operand is the source and
6727 the second non-immediate one is encoded in the immediate operand. */
6728 if (i.tm.opcode_modifier.vexw == VEXW1)
6729 {
6730 source = i.imm_operands;
6731 reg_slot = i.imm_operands + 1;
6732 }
6733 else
6734 {
6735 source = i.imm_operands + 1;
6736 reg_slot = i.imm_operands;
6737 }
6738
6739 if (i.imm_operands == 0)
6740 {
6741 /* When there is no immediate operand, generate an 8bit
6742 immediate operand to encode the first operand. */
6743 exp = &im_expressions[i.imm_operands++];
6744 i.op[i.operands].imms = exp;
6745 i.types[i.operands] = imm8;
6746 i.operands++;
6747
6748 gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
6749 exp->X_op = O_constant;
6750 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
6751 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6752 }
6753 else
6754 {
6755 unsigned int imm_slot;
6756
6757 gas_assert (i.imm_operands == 1 && i.types[0].bitfield.vec_imm4);
6758
6759 if (i.tm.opcode_modifier.immext)
6760 {
6761 /* When ImmExt is set, the immediate byte is the last
6762 operand. */
6763 imm_slot = i.operands - 1;
6764 source--;
6765 reg_slot--;
6766 }
6767 else
6768 {
6769 imm_slot = 0;
6770
6771 /* Turn on Imm8 so that output_imm will generate it. */
6772 i.types[imm_slot].bitfield.imm8 = 1;
6773 }
6774
6775 gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
6776 i.op[imm_slot].imms->X_add_number
6777 |= register_number (i.op[reg_slot].regs) << 4;
6778 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6779 }
6780
6781 gas_assert (i.tm.operand_types[nds].bitfield.regsimd);
6782 i.vex.register_specifier = i.op[nds].regs;
6783 }
6784 else
6785 source = dest = 0;
6786
6787 /* i.reg_operands MUST be the number of real register operands;
6788 implicit registers do not count. If there are 3 register
6789 operands, it must be a instruction with VexNDS. For a
6790 instruction with VexNDD, the destination register is encoded
6791 in VEX prefix. If there are 4 register operands, it must be
6792 a instruction with VEX prefix and 3 sources. */
6793 if (i.mem_operands == 0
6794 && ((i.reg_operands == 2
6795 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
6796 || (i.reg_operands == 3
6797 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
6798 || (i.reg_operands == 4 && vex_3_sources)))
6799 {
6800 switch (i.operands)
6801 {
6802 case 2:
6803 source = 0;
6804 break;
6805 case 3:
6806 /* When there are 3 operands, one of them may be immediate,
6807 which may be the first or the last operand. Otherwise,
6808 the first operand must be shift count register (cl) or it
6809 is an instruction with VexNDS. */
6810 gas_assert (i.imm_operands == 1
6811 || (i.imm_operands == 0
6812 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
6813 || i.types[0].bitfield.shiftcount)));
6814 if (operand_type_check (i.types[0], imm)
6815 || i.types[0].bitfield.shiftcount)
6816 source = 1;
6817 else
6818 source = 0;
6819 break;
6820 case 4:
6821 /* When there are 4 operands, the first two must be 8bit
6822 immediate operands. The source operand will be the 3rd
6823 one.
6824
6825 For instructions with VexNDS, if the first operand
6826 an imm8, the source operand is the 2nd one. If the last
6827 operand is imm8, the source operand is the first one. */
6828 gas_assert ((i.imm_operands == 2
6829 && i.types[0].bitfield.imm8
6830 && i.types[1].bitfield.imm8)
6831 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
6832 && i.imm_operands == 1
6833 && (i.types[0].bitfield.imm8
6834 || i.types[i.operands - 1].bitfield.imm8
6835 || i.rounding)));
6836 if (i.imm_operands == 2)
6837 source = 2;
6838 else
6839 {
6840 if (i.types[0].bitfield.imm8)
6841 source = 1;
6842 else
6843 source = 0;
6844 }
6845 break;
6846 case 5:
6847 if (is_evex_encoding (&i.tm))
6848 {
6849 /* For EVEX instructions, when there are 5 operands, the
6850 first one must be immediate operand. If the second one
6851 is immediate operand, the source operand is the 3th
6852 one. If the last one is immediate operand, the source
6853 operand is the 2nd one. */
6854 gas_assert (i.imm_operands == 2
6855 && i.tm.opcode_modifier.sae
6856 && operand_type_check (i.types[0], imm));
6857 if (operand_type_check (i.types[1], imm))
6858 source = 2;
6859 else if (operand_type_check (i.types[4], imm))
6860 source = 1;
6861 else
6862 abort ();
6863 }
6864 break;
6865 default:
6866 abort ();
6867 }
6868
6869 if (!vex_3_sources)
6870 {
6871 dest = source + 1;
6872
6873 /* RC/SAE operand could be between DEST and SRC. That happens
6874 when one operand is GPR and the other one is XMM/YMM/ZMM
6875 register. */
6876 if (i.rounding && i.rounding->operand == (int) dest)
6877 dest++;
6878
6879 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6880 {
6881 /* For instructions with VexNDS, the register-only source
6882 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
6883 register. It is encoded in VEX prefix. We need to
6884 clear RegMem bit before calling operand_type_equal. */
6885
6886 i386_operand_type op;
6887 unsigned int vvvv;
6888
6889 /* Check register-only source operand when two source
6890 operands are swapped. */
6891 if (!i.tm.operand_types[source].bitfield.baseindex
6892 && i.tm.operand_types[dest].bitfield.baseindex)
6893 {
6894 vvvv = source;
6895 source = dest;
6896 }
6897 else
6898 vvvv = dest;
6899
6900 op = i.tm.operand_types[vvvv];
6901 op.bitfield.regmem = 0;
6902 if ((dest + 1) >= i.operands
6903 || ((!op.bitfield.reg
6904 || (!op.bitfield.dword && !op.bitfield.qword))
6905 && !op.bitfield.regsimd
6906 && !operand_type_equal (&op, &regmask)))
6907 abort ();
6908 i.vex.register_specifier = i.op[vvvv].regs;
6909 dest++;
6910 }
6911 }
6912
6913 i.rm.mode = 3;
6914 /* One of the register operands will be encoded in the i.tm.reg
6915 field, the other in the combined i.tm.mode and i.tm.regmem
6916 fields. If no form of this instruction supports a memory
6917 destination operand, then we assume the source operand may
6918 sometimes be a memory operand and so we need to store the
6919 destination in the i.rm.reg field. */
6920 if (!i.tm.operand_types[dest].bitfield.regmem
6921 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
6922 {
6923 i.rm.reg = i.op[dest].regs->reg_num;
6924 i.rm.regmem = i.op[source].regs->reg_num;
6925 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6926 i.rex |= REX_R;
6927 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6928 i.vrex |= REX_R;
6929 if ((i.op[source].regs->reg_flags & RegRex) != 0)
6930 i.rex |= REX_B;
6931 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6932 i.vrex |= REX_B;
6933 }
6934 else
6935 {
6936 i.rm.reg = i.op[source].regs->reg_num;
6937 i.rm.regmem = i.op[dest].regs->reg_num;
6938 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6939 i.rex |= REX_B;
6940 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6941 i.vrex |= REX_B;
6942 if ((i.op[source].regs->reg_flags & RegRex) != 0)
6943 i.rex |= REX_R;
6944 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6945 i.vrex |= REX_R;
6946 }
6947 if (flag_code != CODE_64BIT && (i.rex & REX_R))
6948 {
6949 if (!i.types[i.tm.operand_types[0].bitfield.regmem].bitfield.control)
6950 abort ();
6951 i.rex &= ~REX_R;
6952 add_prefix (LOCK_PREFIX_OPCODE);
6953 }
6954 }
6955 else
6956 { /* If it's not 2 reg operands... */
6957 unsigned int mem;
6958
6959 if (i.mem_operands)
6960 {
6961 unsigned int fake_zero_displacement = 0;
6962 unsigned int op;
6963
6964 for (op = 0; op < i.operands; op++)
6965 if (operand_type_check (i.types[op], anymem))
6966 break;
6967 gas_assert (op < i.operands);
6968
6969 if (i.tm.opcode_modifier.vecsib)
6970 {
6971 if (i.index_reg->reg_num == RegEiz
6972 || i.index_reg->reg_num == RegRiz)
6973 abort ();
6974
6975 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6976 if (!i.base_reg)
6977 {
6978 i.sib.base = NO_BASE_REGISTER;
6979 i.sib.scale = i.log2_scale_factor;
6980 i.types[op].bitfield.disp8 = 0;
6981 i.types[op].bitfield.disp16 = 0;
6982 i.types[op].bitfield.disp64 = 0;
6983 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
6984 {
6985 /* Must be 32 bit */
6986 i.types[op].bitfield.disp32 = 1;
6987 i.types[op].bitfield.disp32s = 0;
6988 }
6989 else
6990 {
6991 i.types[op].bitfield.disp32 = 0;
6992 i.types[op].bitfield.disp32s = 1;
6993 }
6994 }
6995 i.sib.index = i.index_reg->reg_num;
6996 if ((i.index_reg->reg_flags & RegRex) != 0)
6997 i.rex |= REX_X;
6998 if ((i.index_reg->reg_flags & RegVRex) != 0)
6999 i.vrex |= REX_X;
7000 }
7001
7002 default_seg = &ds;
7003
7004 if (i.base_reg == 0)
7005 {
7006 i.rm.mode = 0;
7007 if (!i.disp_operands)
7008 fake_zero_displacement = 1;
7009 if (i.index_reg == 0)
7010 {
7011 i386_operand_type newdisp;
7012
7013 gas_assert (!i.tm.opcode_modifier.vecsib);
7014 /* Operand is just <disp> */
7015 if (flag_code == CODE_64BIT)
7016 {
7017 /* 64bit mode overwrites the 32bit absolute
7018 addressing by RIP relative addressing and
7019 absolute addressing is encoded by one of the
7020 redundant SIB forms. */
7021 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7022 i.sib.base = NO_BASE_REGISTER;
7023 i.sib.index = NO_INDEX_REGISTER;
7024 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7025 }
7026 else if ((flag_code == CODE_16BIT)
7027 ^ (i.prefix[ADDR_PREFIX] != 0))
7028 {
7029 i.rm.regmem = NO_BASE_REGISTER_16;
7030 newdisp = disp16;
7031 }
7032 else
7033 {
7034 i.rm.regmem = NO_BASE_REGISTER;
7035 newdisp = disp32;
7036 }
7037 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7038 i.types[op] = operand_type_or (i.types[op], newdisp);
7039 }
7040 else if (!i.tm.opcode_modifier.vecsib)
7041 {
7042 /* !i.base_reg && i.index_reg */
7043 if (i.index_reg->reg_num == RegEiz
7044 || i.index_reg->reg_num == RegRiz)
7045 i.sib.index = NO_INDEX_REGISTER;
7046 else
7047 i.sib.index = i.index_reg->reg_num;
7048 i.sib.base = NO_BASE_REGISTER;
7049 i.sib.scale = i.log2_scale_factor;
7050 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7051 i.types[op].bitfield.disp8 = 0;
7052 i.types[op].bitfield.disp16 = 0;
7053 i.types[op].bitfield.disp64 = 0;
7054 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7055 {
7056 /* Must be 32 bit */
7057 i.types[op].bitfield.disp32 = 1;
7058 i.types[op].bitfield.disp32s = 0;
7059 }
7060 else
7061 {
7062 i.types[op].bitfield.disp32 = 0;
7063 i.types[op].bitfield.disp32s = 1;
7064 }
7065 if ((i.index_reg->reg_flags & RegRex) != 0)
7066 i.rex |= REX_X;
7067 }
7068 }
7069 /* RIP addressing for 64bit mode. */
7070 else if (i.base_reg->reg_num == RegRip ||
7071 i.base_reg->reg_num == RegEip)
7072 {
7073 gas_assert (!i.tm.opcode_modifier.vecsib);
7074 i.rm.regmem = NO_BASE_REGISTER;
7075 i.types[op].bitfield.disp8 = 0;
7076 i.types[op].bitfield.disp16 = 0;
7077 i.types[op].bitfield.disp32 = 0;
7078 i.types[op].bitfield.disp32s = 1;
7079 i.types[op].bitfield.disp64 = 0;
7080 i.flags[op] |= Operand_PCrel;
7081 if (! i.disp_operands)
7082 fake_zero_displacement = 1;
7083 }
7084 else if (i.base_reg->reg_type.bitfield.word)
7085 {
7086 gas_assert (!i.tm.opcode_modifier.vecsib);
7087 switch (i.base_reg->reg_num)
7088 {
7089 case 3: /* (%bx) */
7090 if (i.index_reg == 0)
7091 i.rm.regmem = 7;
7092 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7093 i.rm.regmem = i.index_reg->reg_num - 6;
7094 break;
7095 case 5: /* (%bp) */
7096 default_seg = &ss;
7097 if (i.index_reg == 0)
7098 {
7099 i.rm.regmem = 6;
7100 if (operand_type_check (i.types[op], disp) == 0)
7101 {
7102 /* fake (%bp) into 0(%bp) */
7103 i.types[op].bitfield.disp8 = 1;
7104 fake_zero_displacement = 1;
7105 }
7106 }
7107 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7108 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7109 break;
7110 default: /* (%si) -> 4 or (%di) -> 5 */
7111 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7112 }
7113 i.rm.mode = mode_from_disp_size (i.types[op]);
7114 }
7115 else /* i.base_reg and 32/64 bit mode */
7116 {
7117 if (flag_code == CODE_64BIT
7118 && operand_type_check (i.types[op], disp))
7119 {
7120 i.types[op].bitfield.disp16 = 0;
7121 i.types[op].bitfield.disp64 = 0;
7122 if (i.prefix[ADDR_PREFIX] == 0)
7123 {
7124 i.types[op].bitfield.disp32 = 0;
7125 i.types[op].bitfield.disp32s = 1;
7126 }
7127 else
7128 {
7129 i.types[op].bitfield.disp32 = 1;
7130 i.types[op].bitfield.disp32s = 0;
7131 }
7132 }
7133
7134 if (!i.tm.opcode_modifier.vecsib)
7135 i.rm.regmem = i.base_reg->reg_num;
7136 if ((i.base_reg->reg_flags & RegRex) != 0)
7137 i.rex |= REX_B;
7138 i.sib.base = i.base_reg->reg_num;
7139 /* x86-64 ignores REX prefix bit here to avoid decoder
7140 complications. */
7141 if (!(i.base_reg->reg_flags & RegRex)
7142 && (i.base_reg->reg_num == EBP_REG_NUM
7143 || i.base_reg->reg_num == ESP_REG_NUM))
7144 default_seg = &ss;
7145 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7146 {
7147 fake_zero_displacement = 1;
7148 i.types[op].bitfield.disp8 = 1;
7149 }
7150 i.sib.scale = i.log2_scale_factor;
7151 if (i.index_reg == 0)
7152 {
7153 gas_assert (!i.tm.opcode_modifier.vecsib);
7154 /* <disp>(%esp) becomes two byte modrm with no index
7155 register. We've already stored the code for esp
7156 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7157 Any base register besides %esp will not use the
7158 extra modrm byte. */
7159 i.sib.index = NO_INDEX_REGISTER;
7160 }
7161 else if (!i.tm.opcode_modifier.vecsib)
7162 {
7163 if (i.index_reg->reg_num == RegEiz
7164 || i.index_reg->reg_num == RegRiz)
7165 i.sib.index = NO_INDEX_REGISTER;
7166 else
7167 i.sib.index = i.index_reg->reg_num;
7168 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7169 if ((i.index_reg->reg_flags & RegRex) != 0)
7170 i.rex |= REX_X;
7171 }
7172
7173 if (i.disp_operands
7174 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7175 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7176 i.rm.mode = 0;
7177 else
7178 {
7179 if (!fake_zero_displacement
7180 && !i.disp_operands
7181 && i.disp_encoding)
7182 {
7183 fake_zero_displacement = 1;
7184 if (i.disp_encoding == disp_encoding_8bit)
7185 i.types[op].bitfield.disp8 = 1;
7186 else
7187 i.types[op].bitfield.disp32 = 1;
7188 }
7189 i.rm.mode = mode_from_disp_size (i.types[op]);
7190 }
7191 }
7192
7193 if (fake_zero_displacement)
7194 {
7195 /* Fakes a zero displacement assuming that i.types[op]
7196 holds the correct displacement size. */
7197 expressionS *exp;
7198
7199 gas_assert (i.op[op].disps == 0);
7200 exp = &disp_expressions[i.disp_operands++];
7201 i.op[op].disps = exp;
7202 exp->X_op = O_constant;
7203 exp->X_add_number = 0;
7204 exp->X_add_symbol = (symbolS *) 0;
7205 exp->X_op_symbol = (symbolS *) 0;
7206 }
7207
7208 mem = op;
7209 }
7210 else
7211 mem = ~0;
7212
7213 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7214 {
7215 if (operand_type_check (i.types[0], imm))
7216 i.vex.register_specifier = NULL;
7217 else
7218 {
7219 /* VEX.vvvv encodes one of the sources when the first
7220 operand is not an immediate. */
7221 if (i.tm.opcode_modifier.vexw == VEXW0)
7222 i.vex.register_specifier = i.op[0].regs;
7223 else
7224 i.vex.register_specifier = i.op[1].regs;
7225 }
7226
7227 /* Destination is a XMM register encoded in the ModRM.reg
7228 and VEX.R bit. */
7229 i.rm.reg = i.op[2].regs->reg_num;
7230 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7231 i.rex |= REX_R;
7232
7233 /* ModRM.rm and VEX.B encodes the other source. */
7234 if (!i.mem_operands)
7235 {
7236 i.rm.mode = 3;
7237
7238 if (i.tm.opcode_modifier.vexw == VEXW0)
7239 i.rm.regmem = i.op[1].regs->reg_num;
7240 else
7241 i.rm.regmem = i.op[0].regs->reg_num;
7242
7243 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7244 i.rex |= REX_B;
7245 }
7246 }
7247 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7248 {
7249 i.vex.register_specifier = i.op[2].regs;
7250 if (!i.mem_operands)
7251 {
7252 i.rm.mode = 3;
7253 i.rm.regmem = i.op[1].regs->reg_num;
7254 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7255 i.rex |= REX_B;
7256 }
7257 }
7258 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7259 (if any) based on i.tm.extension_opcode. Again, we must be
7260 careful to make sure that segment/control/debug/test/MMX
7261 registers are coded into the i.rm.reg field. */
7262 else if (i.reg_operands)
7263 {
7264 unsigned int op;
7265 unsigned int vex_reg = ~0;
7266
7267 for (op = 0; op < i.operands; op++)
7268 if (i.types[op].bitfield.reg
7269 || i.types[op].bitfield.regmmx
7270 || i.types[op].bitfield.regsimd
7271 || i.types[op].bitfield.regbnd
7272 || i.types[op].bitfield.regmask
7273 || i.types[op].bitfield.sreg2
7274 || i.types[op].bitfield.sreg3
7275 || i.types[op].bitfield.control
7276 || i.types[op].bitfield.debug
7277 || i.types[op].bitfield.test)
7278 break;
7279
7280 if (vex_3_sources)
7281 op = dest;
7282 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7283 {
7284 /* For instructions with VexNDS, the register-only
7285 source operand is encoded in VEX prefix. */
7286 gas_assert (mem != (unsigned int) ~0);
7287
7288 if (op > mem)
7289 {
7290 vex_reg = op++;
7291 gas_assert (op < i.operands);
7292 }
7293 else
7294 {
7295 /* Check register-only source operand when two source
7296 operands are swapped. */
7297 if (!i.tm.operand_types[op].bitfield.baseindex
7298 && i.tm.operand_types[op + 1].bitfield.baseindex)
7299 {
7300 vex_reg = op;
7301 op += 2;
7302 gas_assert (mem == (vex_reg + 1)
7303 && op < i.operands);
7304 }
7305 else
7306 {
7307 vex_reg = op + 1;
7308 gas_assert (vex_reg < i.operands);
7309 }
7310 }
7311 }
7312 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7313 {
7314 /* For instructions with VexNDD, the register destination
7315 is encoded in VEX prefix. */
7316 if (i.mem_operands == 0)
7317 {
7318 /* There is no memory operand. */
7319 gas_assert ((op + 2) == i.operands);
7320 vex_reg = op + 1;
7321 }
7322 else
7323 {
7324 /* There are only 2 non-immediate operands. */
7325 gas_assert (op < i.imm_operands + 2
7326 && i.operands == i.imm_operands + 2);
7327 vex_reg = i.imm_operands + 1;
7328 }
7329 }
7330 else
7331 gas_assert (op < i.operands);
7332
7333 if (vex_reg != (unsigned int) ~0)
7334 {
7335 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7336
7337 if ((!type->bitfield.reg
7338 || (!type->bitfield.dword && !type->bitfield.qword))
7339 && !type->bitfield.regsimd
7340 && !operand_type_equal (type, &regmask))
7341 abort ();
7342
7343 i.vex.register_specifier = i.op[vex_reg].regs;
7344 }
7345
7346 /* Don't set OP operand twice. */
7347 if (vex_reg != op)
7348 {
7349 /* If there is an extension opcode to put here, the
7350 register number must be put into the regmem field. */
7351 if (i.tm.extension_opcode != None)
7352 {
7353 i.rm.regmem = i.op[op].regs->reg_num;
7354 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7355 i.rex |= REX_B;
7356 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7357 i.vrex |= REX_B;
7358 }
7359 else
7360 {
7361 i.rm.reg = i.op[op].regs->reg_num;
7362 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7363 i.rex |= REX_R;
7364 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7365 i.vrex |= REX_R;
7366 }
7367 }
7368
7369 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7370 must set it to 3 to indicate this is a register operand
7371 in the regmem field. */
7372 if (!i.mem_operands)
7373 i.rm.mode = 3;
7374 }
7375
7376 /* Fill in i.rm.reg field with extension opcode (if any). */
7377 if (i.tm.extension_opcode != None)
7378 i.rm.reg = i.tm.extension_opcode;
7379 }
7380 return default_seg;
7381 }
7382
7383 static void
7384 output_branch (void)
7385 {
7386 char *p;
7387 int size;
7388 int code16;
7389 int prefix;
7390 relax_substateT subtype;
7391 symbolS *sym;
7392 offsetT off;
7393
7394 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7395 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7396
7397 prefix = 0;
7398 if (i.prefix[DATA_PREFIX] != 0)
7399 {
7400 prefix = 1;
7401 i.prefixes -= 1;
7402 code16 ^= CODE16;
7403 }
7404 /* Pentium4 branch hints. */
7405 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7406 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7407 {
7408 prefix++;
7409 i.prefixes--;
7410 }
7411 if (i.prefix[REX_PREFIX] != 0)
7412 {
7413 prefix++;
7414 i.prefixes--;
7415 }
7416
7417 /* BND prefixed jump. */
7418 if (i.prefix[BND_PREFIX] != 0)
7419 {
7420 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7421 i.prefixes -= 1;
7422 }
7423
7424 if (i.prefixes != 0 && !intel_syntax)
7425 as_warn (_("skipping prefixes on this instruction"));
7426
7427 /* It's always a symbol; End frag & setup for relax.
7428 Make sure there is enough room in this frag for the largest
7429 instruction we may generate in md_convert_frag. This is 2
7430 bytes for the opcode and room for the prefix and largest
7431 displacement. */
7432 frag_grow (prefix + 2 + 4);
7433 /* Prefix and 1 opcode byte go in fr_fix. */
7434 p = frag_more (prefix + 1);
7435 if (i.prefix[DATA_PREFIX] != 0)
7436 *p++ = DATA_PREFIX_OPCODE;
7437 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7438 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7439 *p++ = i.prefix[SEG_PREFIX];
7440 if (i.prefix[REX_PREFIX] != 0)
7441 *p++ = i.prefix[REX_PREFIX];
7442 *p = i.tm.base_opcode;
7443
7444 if ((unsigned char) *p == JUMP_PC_RELATIVE)
7445 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7446 else if (cpu_arch_flags.bitfield.cpui386)
7447 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7448 else
7449 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7450 subtype |= code16;
7451
7452 sym = i.op[0].disps->X_add_symbol;
7453 off = i.op[0].disps->X_add_number;
7454
7455 if (i.op[0].disps->X_op != O_constant
7456 && i.op[0].disps->X_op != O_symbol)
7457 {
7458 /* Handle complex expressions. */
7459 sym = make_expr_symbol (i.op[0].disps);
7460 off = 0;
7461 }
7462
7463 /* 1 possible extra opcode + 4 byte displacement go in var part.
7464 Pass reloc in fr_var. */
7465 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7466 }
7467
7468 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7469 /* Return TRUE iff PLT32 relocation should be used for branching to
7470 symbol S. */
7471
7472 static bfd_boolean
7473 need_plt32_p (symbolS *s)
7474 {
7475 /* PLT32 relocation is ELF only. */
7476 if (!IS_ELF)
7477 return FALSE;
7478
7479 /* Since there is no need to prepare for PLT branch on x86-64, we
7480 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7481 be used as a marker for 32-bit PC-relative branches. */
7482 if (!object_64bit)
7483 return FALSE;
7484
7485 /* Weak or undefined symbol need PLT32 relocation. */
7486 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7487 return TRUE;
7488
7489 /* Non-global symbol doesn't need PLT32 relocation. */
7490 if (! S_IS_EXTERNAL (s))
7491 return FALSE;
7492
7493 /* Other global symbols need PLT32 relocation. NB: Symbol with
7494 non-default visibilities are treated as normal global symbol
7495 so that PLT32 relocation can be used as a marker for 32-bit
7496 PC-relative branches. It is useful for linker relaxation. */
7497 return TRUE;
7498 }
7499 #endif
7500
7501 static void
7502 output_jump (void)
7503 {
7504 char *p;
7505 int size;
7506 fixS *fixP;
7507 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
7508
7509 if (i.tm.opcode_modifier.jumpbyte)
7510 {
7511 /* This is a loop or jecxz type instruction. */
7512 size = 1;
7513 if (i.prefix[ADDR_PREFIX] != 0)
7514 {
7515 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
7516 i.prefixes -= 1;
7517 }
7518 /* Pentium4 branch hints. */
7519 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7520 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7521 {
7522 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
7523 i.prefixes--;
7524 }
7525 }
7526 else
7527 {
7528 int code16;
7529
7530 code16 = 0;
7531 if (flag_code == CODE_16BIT)
7532 code16 = CODE16;
7533
7534 if (i.prefix[DATA_PREFIX] != 0)
7535 {
7536 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
7537 i.prefixes -= 1;
7538 code16 ^= CODE16;
7539 }
7540
7541 size = 4;
7542 if (code16)
7543 size = 2;
7544 }
7545
7546 if (i.prefix[REX_PREFIX] != 0)
7547 {
7548 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7549 i.prefixes -= 1;
7550 }
7551
7552 /* BND prefixed jump. */
7553 if (i.prefix[BND_PREFIX] != 0)
7554 {
7555 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7556 i.prefixes -= 1;
7557 }
7558
7559 if (i.prefixes != 0 && !intel_syntax)
7560 as_warn (_("skipping prefixes on this instruction"));
7561
7562 p = frag_more (i.tm.opcode_length + size);
7563 switch (i.tm.opcode_length)
7564 {
7565 case 2:
7566 *p++ = i.tm.base_opcode >> 8;
7567 /* Fall through. */
7568 case 1:
7569 *p++ = i.tm.base_opcode;
7570 break;
7571 default:
7572 abort ();
7573 }
7574
7575 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7576 if (size == 4
7577 && jump_reloc == NO_RELOC
7578 && need_plt32_p (i.op[0].disps->X_add_symbol))
7579 jump_reloc = BFD_RELOC_X86_64_PLT32;
7580 #endif
7581
7582 jump_reloc = reloc (size, 1, 1, jump_reloc);
7583
7584 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7585 i.op[0].disps, 1, jump_reloc);
7586
7587 /* All jumps handled here are signed, but don't use a signed limit
7588 check for 32 and 16 bit jumps as we want to allow wrap around at
7589 4G and 64k respectively. */
7590 if (size == 1)
7591 fixP->fx_signed = 1;
7592 }
7593
7594 static void
7595 output_interseg_jump (void)
7596 {
7597 char *p;
7598 int size;
7599 int prefix;
7600 int code16;
7601
7602 code16 = 0;
7603 if (flag_code == CODE_16BIT)
7604 code16 = CODE16;
7605
7606 prefix = 0;
7607 if (i.prefix[DATA_PREFIX] != 0)
7608 {
7609 prefix = 1;
7610 i.prefixes -= 1;
7611 code16 ^= CODE16;
7612 }
7613 if (i.prefix[REX_PREFIX] != 0)
7614 {
7615 prefix++;
7616 i.prefixes -= 1;
7617 }
7618
7619 size = 4;
7620 if (code16)
7621 size = 2;
7622
7623 if (i.prefixes != 0 && !intel_syntax)
7624 as_warn (_("skipping prefixes on this instruction"));
7625
7626 /* 1 opcode; 2 segment; offset */
7627 p = frag_more (prefix + 1 + 2 + size);
7628
7629 if (i.prefix[DATA_PREFIX] != 0)
7630 *p++ = DATA_PREFIX_OPCODE;
7631
7632 if (i.prefix[REX_PREFIX] != 0)
7633 *p++ = i.prefix[REX_PREFIX];
7634
7635 *p++ = i.tm.base_opcode;
7636 if (i.op[1].imms->X_op == O_constant)
7637 {
7638 offsetT n = i.op[1].imms->X_add_number;
7639
7640 if (size == 2
7641 && !fits_in_unsigned_word (n)
7642 && !fits_in_signed_word (n))
7643 {
7644 as_bad (_("16-bit jump out of range"));
7645 return;
7646 }
7647 md_number_to_chars (p, n, size);
7648 }
7649 else
7650 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7651 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
7652 if (i.op[0].imms->X_op != O_constant)
7653 as_bad (_("can't handle non absolute segment in `%s'"),
7654 i.tm.name);
7655 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
7656 }
7657
7658 static void
7659 output_insn (void)
7660 {
7661 fragS *insn_start_frag;
7662 offsetT insn_start_off;
7663
7664 /* Tie dwarf2 debug info to the address at the start of the insn.
7665 We can't do this after the insn has been output as the current
7666 frag may have been closed off. eg. by frag_var. */
7667 dwarf2_emit_insn (0);
7668
7669 insn_start_frag = frag_now;
7670 insn_start_off = frag_now_fix ();
7671
7672 /* Output jumps. */
7673 if (i.tm.opcode_modifier.jump)
7674 output_branch ();
7675 else if (i.tm.opcode_modifier.jumpbyte
7676 || i.tm.opcode_modifier.jumpdword)
7677 output_jump ();
7678 else if (i.tm.opcode_modifier.jumpintersegment)
7679 output_interseg_jump ();
7680 else
7681 {
7682 /* Output normal instructions here. */
7683 char *p;
7684 unsigned char *q;
7685 unsigned int j;
7686 unsigned int prefix;
7687
7688 if (avoid_fence
7689 && i.tm.base_opcode == 0xfae
7690 && i.operands == 1
7691 && i.imm_operands == 1
7692 && (i.op[0].imms->X_add_number == 0xe8
7693 || i.op[0].imms->X_add_number == 0xf0
7694 || i.op[0].imms->X_add_number == 0xf8))
7695 {
7696 /* Encode lfence, mfence, and sfence as
7697 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
7698 offsetT val = 0x240483f0ULL;
7699 p = frag_more (5);
7700 md_number_to_chars (p, val, 5);
7701 return;
7702 }
7703
7704 /* Some processors fail on LOCK prefix. This options makes
7705 assembler ignore LOCK prefix and serves as a workaround. */
7706 if (omit_lock_prefix)
7707 {
7708 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
7709 return;
7710 i.prefix[LOCK_PREFIX] = 0;
7711 }
7712
7713 /* Since the VEX/EVEX prefix contains the implicit prefix, we
7714 don't need the explicit prefix. */
7715 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
7716 {
7717 switch (i.tm.opcode_length)
7718 {
7719 case 3:
7720 if (i.tm.base_opcode & 0xff000000)
7721 {
7722 prefix = (i.tm.base_opcode >> 24) & 0xff;
7723 add_prefix (prefix);
7724 }
7725 break;
7726 case 2:
7727 if ((i.tm.base_opcode & 0xff0000) != 0)
7728 {
7729 prefix = (i.tm.base_opcode >> 16) & 0xff;
7730 if (!i.tm.cpu_flags.bitfield.cpupadlock
7731 || prefix != REPE_PREFIX_OPCODE
7732 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
7733 add_prefix (prefix);
7734 }
7735 break;
7736 case 1:
7737 break;
7738 case 0:
7739 /* Check for pseudo prefixes. */
7740 as_bad_where (insn_start_frag->fr_file,
7741 insn_start_frag->fr_line,
7742 _("pseudo prefix without instruction"));
7743 return;
7744 default:
7745 abort ();
7746 }
7747
7748 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
7749 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
7750 R_X86_64_GOTTPOFF relocation so that linker can safely
7751 perform IE->LE optimization. */
7752 if (x86_elf_abi == X86_64_X32_ABI
7753 && i.operands == 2
7754 && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
7755 && i.prefix[REX_PREFIX] == 0)
7756 add_prefix (REX_OPCODE);
7757 #endif
7758
7759 /* The prefix bytes. */
7760 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
7761 if (*q)
7762 FRAG_APPEND_1_CHAR (*q);
7763 }
7764 else
7765 {
7766 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
7767 if (*q)
7768 switch (j)
7769 {
7770 case REX_PREFIX:
7771 /* REX byte is encoded in VEX prefix. */
7772 break;
7773 case SEG_PREFIX:
7774 case ADDR_PREFIX:
7775 FRAG_APPEND_1_CHAR (*q);
7776 break;
7777 default:
7778 /* There should be no other prefixes for instructions
7779 with VEX prefix. */
7780 abort ();
7781 }
7782
7783 /* For EVEX instructions i.vrex should become 0 after
7784 build_evex_prefix. For VEX instructions upper 16 registers
7785 aren't available, so VREX should be 0. */
7786 if (i.vrex)
7787 abort ();
7788 /* Now the VEX prefix. */
7789 p = frag_more (i.vex.length);
7790 for (j = 0; j < i.vex.length; j++)
7791 p[j] = i.vex.bytes[j];
7792 }
7793
7794 /* Now the opcode; be careful about word order here! */
7795 if (i.tm.opcode_length == 1)
7796 {
7797 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
7798 }
7799 else
7800 {
7801 switch (i.tm.opcode_length)
7802 {
7803 case 4:
7804 p = frag_more (4);
7805 *p++ = (i.tm.base_opcode >> 24) & 0xff;
7806 *p++ = (i.tm.base_opcode >> 16) & 0xff;
7807 break;
7808 case 3:
7809 p = frag_more (3);
7810 *p++ = (i.tm.base_opcode >> 16) & 0xff;
7811 break;
7812 case 2:
7813 p = frag_more (2);
7814 break;
7815 default:
7816 abort ();
7817 break;
7818 }
7819
7820 /* Put out high byte first: can't use md_number_to_chars! */
7821 *p++ = (i.tm.base_opcode >> 8) & 0xff;
7822 *p = i.tm.base_opcode & 0xff;
7823 }
7824
7825 /* Now the modrm byte and sib byte (if present). */
7826 if (i.tm.opcode_modifier.modrm)
7827 {
7828 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
7829 | i.rm.reg << 3
7830 | i.rm.mode << 6));
7831 /* If i.rm.regmem == ESP (4)
7832 && i.rm.mode != (Register mode)
7833 && not 16 bit
7834 ==> need second modrm byte. */
7835 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
7836 && i.rm.mode != 3
7837 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
7838 FRAG_APPEND_1_CHAR ((i.sib.base << 0
7839 | i.sib.index << 3
7840 | i.sib.scale << 6));
7841 }
7842
7843 if (i.disp_operands)
7844 output_disp (insn_start_frag, insn_start_off);
7845
7846 if (i.imm_operands)
7847 output_imm (insn_start_frag, insn_start_off);
7848 }
7849
7850 #ifdef DEBUG386
7851 if (flag_debug)
7852 {
7853 pi ("" /*line*/, &i);
7854 }
7855 #endif /* DEBUG386 */
7856 }
7857
7858 /* Return the size of the displacement operand N. */
7859
7860 static int
7861 disp_size (unsigned int n)
7862 {
7863 int size = 4;
7864
7865 if (i.types[n].bitfield.disp64)
7866 size = 8;
7867 else if (i.types[n].bitfield.disp8)
7868 size = 1;
7869 else if (i.types[n].bitfield.disp16)
7870 size = 2;
7871 return size;
7872 }
7873
7874 /* Return the size of the immediate operand N. */
7875
7876 static int
7877 imm_size (unsigned int n)
7878 {
7879 int size = 4;
7880 if (i.types[n].bitfield.imm64)
7881 size = 8;
7882 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
7883 size = 1;
7884 else if (i.types[n].bitfield.imm16)
7885 size = 2;
7886 return size;
7887 }
7888
7889 static void
7890 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
7891 {
7892 char *p;
7893 unsigned int n;
7894
7895 for (n = 0; n < i.operands; n++)
7896 {
7897 if (operand_type_check (i.types[n], disp))
7898 {
7899 if (i.op[n].disps->X_op == O_constant)
7900 {
7901 int size = disp_size (n);
7902 offsetT val = i.op[n].disps->X_add_number;
7903
7904 val = offset_in_range (val >> i.memshift, size);
7905 p = frag_more (size);
7906 md_number_to_chars (p, val, size);
7907 }
7908 else
7909 {
7910 enum bfd_reloc_code_real reloc_type;
7911 int size = disp_size (n);
7912 int sign = i.types[n].bitfield.disp32s;
7913 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
7914 fixS *fixP;
7915
7916 /* We can't have 8 bit displacement here. */
7917 gas_assert (!i.types[n].bitfield.disp8);
7918
7919 /* The PC relative address is computed relative
7920 to the instruction boundary, so in case immediate
7921 fields follows, we need to adjust the value. */
7922 if (pcrel && i.imm_operands)
7923 {
7924 unsigned int n1;
7925 int sz = 0;
7926
7927 for (n1 = 0; n1 < i.operands; n1++)
7928 if (operand_type_check (i.types[n1], imm))
7929 {
7930 /* Only one immediate is allowed for PC
7931 relative address. */
7932 gas_assert (sz == 0);
7933 sz = imm_size (n1);
7934 i.op[n].disps->X_add_number -= sz;
7935 }
7936 /* We should find the immediate. */
7937 gas_assert (sz != 0);
7938 }
7939
7940 p = frag_more (size);
7941 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
7942 if (GOT_symbol
7943 && GOT_symbol == i.op[n].disps->X_add_symbol
7944 && (((reloc_type == BFD_RELOC_32
7945 || reloc_type == BFD_RELOC_X86_64_32S
7946 || (reloc_type == BFD_RELOC_64
7947 && object_64bit))
7948 && (i.op[n].disps->X_op == O_symbol
7949 || (i.op[n].disps->X_op == O_add
7950 && ((symbol_get_value_expression
7951 (i.op[n].disps->X_op_symbol)->X_op)
7952 == O_subtract))))
7953 || reloc_type == BFD_RELOC_32_PCREL))
7954 {
7955 offsetT add;
7956
7957 if (insn_start_frag == frag_now)
7958 add = (p - frag_now->fr_literal) - insn_start_off;
7959 else
7960 {
7961 fragS *fr;
7962
7963 add = insn_start_frag->fr_fix - insn_start_off;
7964 for (fr = insn_start_frag->fr_next;
7965 fr && fr != frag_now; fr = fr->fr_next)
7966 add += fr->fr_fix;
7967 add += p - frag_now->fr_literal;
7968 }
7969
7970 if (!object_64bit)
7971 {
7972 reloc_type = BFD_RELOC_386_GOTPC;
7973 i.op[n].imms->X_add_number += add;
7974 }
7975 else if (reloc_type == BFD_RELOC_64)
7976 reloc_type = BFD_RELOC_X86_64_GOTPC64;
7977 else
7978 /* Don't do the adjustment for x86-64, as there
7979 the pcrel addressing is relative to the _next_
7980 insn, and that is taken care of in other code. */
7981 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7982 }
7983 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
7984 size, i.op[n].disps, pcrel,
7985 reloc_type);
7986 /* Check for "call/jmp *mem", "mov mem, %reg",
7987 "test %reg, mem" and "binop mem, %reg" where binop
7988 is one of adc, add, and, cmp, or, sbb, sub, xor
7989 instructions. Always generate R_386_GOT32X for
7990 "sym*GOT" operand in 32-bit mode. */
7991 if ((generate_relax_relocations
7992 || (!object_64bit
7993 && i.rm.mode == 0
7994 && i.rm.regmem == 5))
7995 && (i.rm.mode == 2
7996 || (i.rm.mode == 0 && i.rm.regmem == 5))
7997 && ((i.operands == 1
7998 && i.tm.base_opcode == 0xff
7999 && (i.rm.reg == 2 || i.rm.reg == 4))
8000 || (i.operands == 2
8001 && (i.tm.base_opcode == 0x8b
8002 || i.tm.base_opcode == 0x85
8003 || (i.tm.base_opcode & 0xc7) == 0x03))))
8004 {
8005 if (object_64bit)
8006 {
8007 fixP->fx_tcbit = i.rex != 0;
8008 if (i.base_reg
8009 && (i.base_reg->reg_num == RegRip
8010 || i.base_reg->reg_num == RegEip))
8011 fixP->fx_tcbit2 = 1;
8012 }
8013 else
8014 fixP->fx_tcbit2 = 1;
8015 }
8016 }
8017 }
8018 }
8019 }
8020
8021 static void
8022 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
8023 {
8024 char *p;
8025 unsigned int n;
8026
8027 for (n = 0; n < i.operands; n++)
8028 {
8029 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
8030 if (i.rounding && (int) n == i.rounding->operand)
8031 continue;
8032
8033 if (operand_type_check (i.types[n], imm))
8034 {
8035 if (i.op[n].imms->X_op == O_constant)
8036 {
8037 int size = imm_size (n);
8038 offsetT val;
8039
8040 val = offset_in_range (i.op[n].imms->X_add_number,
8041 size);
8042 p = frag_more (size);
8043 md_number_to_chars (p, val, size);
8044 }
8045 else
8046 {
8047 /* Not absolute_section.
8048 Need a 32-bit fixup (don't support 8bit
8049 non-absolute imms). Try to support other
8050 sizes ... */
8051 enum bfd_reloc_code_real reloc_type;
8052 int size = imm_size (n);
8053 int sign;
8054
8055 if (i.types[n].bitfield.imm32s
8056 && (i.suffix == QWORD_MNEM_SUFFIX
8057 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
8058 sign = 1;
8059 else
8060 sign = 0;
8061
8062 p = frag_more (size);
8063 reloc_type = reloc (size, 0, sign, i.reloc[n]);
8064
8065 /* This is tough to explain. We end up with this one if we
8066 * have operands that look like
8067 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
8068 * obtain the absolute address of the GOT, and it is strongly
8069 * preferable from a performance point of view to avoid using
8070 * a runtime relocation for this. The actual sequence of
8071 * instructions often look something like:
8072 *
8073 * call .L66
8074 * .L66:
8075 * popl %ebx
8076 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
8077 *
8078 * The call and pop essentially return the absolute address
8079 * of the label .L66 and store it in %ebx. The linker itself
8080 * will ultimately change the first operand of the addl so
8081 * that %ebx points to the GOT, but to keep things simple, the
8082 * .o file must have this operand set so that it generates not
8083 * the absolute address of .L66, but the absolute address of
8084 * itself. This allows the linker itself simply treat a GOTPC
8085 * relocation as asking for a pcrel offset to the GOT to be
8086 * added in, and the addend of the relocation is stored in the
8087 * operand field for the instruction itself.
8088 *
8089 * Our job here is to fix the operand so that it would add
8090 * the correct offset so that %ebx would point to itself. The
8091 * thing that is tricky is that .-.L66 will point to the
8092 * beginning of the instruction, so we need to further modify
8093 * the operand so that it will point to itself. There are
8094 * other cases where you have something like:
8095 *
8096 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
8097 *
8098 * and here no correction would be required. Internally in
8099 * the assembler we treat operands of this form as not being
8100 * pcrel since the '.' is explicitly mentioned, and I wonder
8101 * whether it would simplify matters to do it this way. Who
8102 * knows. In earlier versions of the PIC patches, the
8103 * pcrel_adjust field was used to store the correction, but
8104 * since the expression is not pcrel, I felt it would be
8105 * confusing to do it this way. */
8106
8107 if ((reloc_type == BFD_RELOC_32
8108 || reloc_type == BFD_RELOC_X86_64_32S
8109 || reloc_type == BFD_RELOC_64)
8110 && GOT_symbol
8111 && GOT_symbol == i.op[n].imms->X_add_symbol
8112 && (i.op[n].imms->X_op == O_symbol
8113 || (i.op[n].imms->X_op == O_add
8114 && ((symbol_get_value_expression
8115 (i.op[n].imms->X_op_symbol)->X_op)
8116 == O_subtract))))
8117 {
8118 offsetT add;
8119
8120 if (insn_start_frag == frag_now)
8121 add = (p - frag_now->fr_literal) - insn_start_off;
8122 else
8123 {
8124 fragS *fr;
8125
8126 add = insn_start_frag->fr_fix - insn_start_off;
8127 for (fr = insn_start_frag->fr_next;
8128 fr && fr != frag_now; fr = fr->fr_next)
8129 add += fr->fr_fix;
8130 add += p - frag_now->fr_literal;
8131 }
8132
8133 if (!object_64bit)
8134 reloc_type = BFD_RELOC_386_GOTPC;
8135 else if (size == 4)
8136 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8137 else if (size == 8)
8138 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8139 i.op[n].imms->X_add_number += add;
8140 }
8141 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8142 i.op[n].imms, 0, reloc_type);
8143 }
8144 }
8145 }
8146 }
8147 \f
8148 /* x86_cons_fix_new is called via the expression parsing code when a
8149 reloc is needed. We use this hook to get the correct .got reloc. */
8150 static int cons_sign = -1;
8151
8152 void
8153 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
8154 expressionS *exp, bfd_reloc_code_real_type r)
8155 {
8156 r = reloc (len, 0, cons_sign, r);
8157
8158 #ifdef TE_PE
8159 if (exp->X_op == O_secrel)
8160 {
8161 exp->X_op = O_symbol;
8162 r = BFD_RELOC_32_SECREL;
8163 }
8164 #endif
8165
8166 fix_new_exp (frag, off, len, exp, 0, r);
8167 }
8168
8169 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
8170 purpose of the `.dc.a' internal pseudo-op. */
8171
8172 int
8173 x86_address_bytes (void)
8174 {
8175 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
8176 return 4;
8177 return stdoutput->arch_info->bits_per_address / 8;
8178 }
8179
8180 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
8181 || defined (LEX_AT)
8182 # define lex_got(reloc, adjust, types) NULL
8183 #else
8184 /* Parse operands of the form
8185 <symbol>@GOTOFF+<nnn>
8186 and similar .plt or .got references.
8187
8188 If we find one, set up the correct relocation in RELOC and copy the
8189 input string, minus the `@GOTOFF' into a malloc'd buffer for
8190 parsing by the calling routine. Return this buffer, and if ADJUST
8191 is non-null set it to the length of the string we removed from the
8192 input line. Otherwise return NULL. */
8193 static char *
8194 lex_got (enum bfd_reloc_code_real *rel,
8195 int *adjust,
8196 i386_operand_type *types)
8197 {
8198 /* Some of the relocations depend on the size of what field is to
8199 be relocated. But in our callers i386_immediate and i386_displacement
8200 we don't yet know the operand size (this will be set by insn
8201 matching). Hence we record the word32 relocation here,
8202 and adjust the reloc according to the real size in reloc(). */
8203 static const struct {
8204 const char *str;
8205 int len;
8206 const enum bfd_reloc_code_real rel[2];
8207 const i386_operand_type types64;
8208 } gotrel[] = {
8209 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8210 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
8211 BFD_RELOC_SIZE32 },
8212 OPERAND_TYPE_IMM32_64 },
8213 #endif
8214 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
8215 BFD_RELOC_X86_64_PLTOFF64 },
8216 OPERAND_TYPE_IMM64 },
8217 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
8218 BFD_RELOC_X86_64_PLT32 },
8219 OPERAND_TYPE_IMM32_32S_DISP32 },
8220 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
8221 BFD_RELOC_X86_64_GOTPLT64 },
8222 OPERAND_TYPE_IMM64_DISP64 },
8223 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
8224 BFD_RELOC_X86_64_GOTOFF64 },
8225 OPERAND_TYPE_IMM64_DISP64 },
8226 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
8227 BFD_RELOC_X86_64_GOTPCREL },
8228 OPERAND_TYPE_IMM32_32S_DISP32 },
8229 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
8230 BFD_RELOC_X86_64_TLSGD },
8231 OPERAND_TYPE_IMM32_32S_DISP32 },
8232 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
8233 _dummy_first_bfd_reloc_code_real },
8234 OPERAND_TYPE_NONE },
8235 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
8236 BFD_RELOC_X86_64_TLSLD },
8237 OPERAND_TYPE_IMM32_32S_DISP32 },
8238 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
8239 BFD_RELOC_X86_64_GOTTPOFF },
8240 OPERAND_TYPE_IMM32_32S_DISP32 },
8241 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
8242 BFD_RELOC_X86_64_TPOFF32 },
8243 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8244 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
8245 _dummy_first_bfd_reloc_code_real },
8246 OPERAND_TYPE_NONE },
8247 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
8248 BFD_RELOC_X86_64_DTPOFF32 },
8249 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8250 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
8251 _dummy_first_bfd_reloc_code_real },
8252 OPERAND_TYPE_NONE },
8253 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
8254 _dummy_first_bfd_reloc_code_real },
8255 OPERAND_TYPE_NONE },
8256 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
8257 BFD_RELOC_X86_64_GOT32 },
8258 OPERAND_TYPE_IMM32_32S_64_DISP32 },
8259 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
8260 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
8261 OPERAND_TYPE_IMM32_32S_DISP32 },
8262 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
8263 BFD_RELOC_X86_64_TLSDESC_CALL },
8264 OPERAND_TYPE_IMM32_32S_DISP32 },
8265 };
8266 char *cp;
8267 unsigned int j;
8268
8269 #if defined (OBJ_MAYBE_ELF)
8270 if (!IS_ELF)
8271 return NULL;
8272 #endif
8273
8274 for (cp = input_line_pointer; *cp != '@'; cp++)
8275 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
8276 return NULL;
8277
8278 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
8279 {
8280 int len = gotrel[j].len;
8281 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
8282 {
8283 if (gotrel[j].rel[object_64bit] != 0)
8284 {
8285 int first, second;
8286 char *tmpbuf, *past_reloc;
8287
8288 *rel = gotrel[j].rel[object_64bit];
8289
8290 if (types)
8291 {
8292 if (flag_code != CODE_64BIT)
8293 {
8294 types->bitfield.imm32 = 1;
8295 types->bitfield.disp32 = 1;
8296 }
8297 else
8298 *types = gotrel[j].types64;
8299 }
8300
8301 if (j != 0 && GOT_symbol == NULL)
8302 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
8303
8304 /* The length of the first part of our input line. */
8305 first = cp - input_line_pointer;
8306
8307 /* The second part goes from after the reloc token until
8308 (and including) an end_of_line char or comma. */
8309 past_reloc = cp + 1 + len;
8310 cp = past_reloc;
8311 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
8312 ++cp;
8313 second = cp + 1 - past_reloc;
8314
8315 /* Allocate and copy string. The trailing NUL shouldn't
8316 be necessary, but be safe. */
8317 tmpbuf = XNEWVEC (char, first + second + 2);
8318 memcpy (tmpbuf, input_line_pointer, first);
8319 if (second != 0 && *past_reloc != ' ')
8320 /* Replace the relocation token with ' ', so that
8321 errors like foo@GOTOFF1 will be detected. */
8322 tmpbuf[first++] = ' ';
8323 else
8324 /* Increment length by 1 if the relocation token is
8325 removed. */
8326 len++;
8327 if (adjust)
8328 *adjust = len;
8329 memcpy (tmpbuf + first, past_reloc, second);
8330 tmpbuf[first + second] = '\0';
8331 return tmpbuf;
8332 }
8333
8334 as_bad (_("@%s reloc is not supported with %d-bit output format"),
8335 gotrel[j].str, 1 << (5 + object_64bit));
8336 return NULL;
8337 }
8338 }
8339
8340 /* Might be a symbol version string. Don't as_bad here. */
8341 return NULL;
8342 }
8343 #endif
8344
8345 #ifdef TE_PE
8346 #ifdef lex_got
8347 #undef lex_got
8348 #endif
8349 /* Parse operands of the form
8350 <symbol>@SECREL32+<nnn>
8351
8352 If we find one, set up the correct relocation in RELOC and copy the
8353 input string, minus the `@SECREL32' into a malloc'd buffer for
8354 parsing by the calling routine. Return this buffer, and if ADJUST
8355 is non-null set it to the length of the string we removed from the
8356 input line. Otherwise return NULL.
8357
8358 This function is copied from the ELF version above adjusted for PE targets. */
8359
8360 static char *
8361 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
8362 int *adjust ATTRIBUTE_UNUSED,
8363 i386_operand_type *types)
8364 {
8365 static const struct
8366 {
8367 const char *str;
8368 int len;
8369 const enum bfd_reloc_code_real rel[2];
8370 const i386_operand_type types64;
8371 }
8372 gotrel[] =
8373 {
8374 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
8375 BFD_RELOC_32_SECREL },
8376 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8377 };
8378
8379 char *cp;
8380 unsigned j;
8381
8382 for (cp = input_line_pointer; *cp != '@'; cp++)
8383 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
8384 return NULL;
8385
8386 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
8387 {
8388 int len = gotrel[j].len;
8389
8390 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
8391 {
8392 if (gotrel[j].rel[object_64bit] != 0)
8393 {
8394 int first, second;
8395 char *tmpbuf, *past_reloc;
8396
8397 *rel = gotrel[j].rel[object_64bit];
8398 if (adjust)
8399 *adjust = len;
8400
8401 if (types)
8402 {
8403 if (flag_code != CODE_64BIT)
8404 {
8405 types->bitfield.imm32 = 1;
8406 types->bitfield.disp32 = 1;
8407 }
8408 else
8409 *types = gotrel[j].types64;
8410 }
8411
8412 /* The length of the first part of our input line. */
8413 first = cp - input_line_pointer;
8414
8415 /* The second part goes from after the reloc token until
8416 (and including) an end_of_line char or comma. */
8417 past_reloc = cp + 1 + len;
8418 cp = past_reloc;
8419 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
8420 ++cp;
8421 second = cp + 1 - past_reloc;
8422
8423 /* Allocate and copy string. The trailing NUL shouldn't
8424 be necessary, but be safe. */
8425 tmpbuf = XNEWVEC (char, first + second + 2);
8426 memcpy (tmpbuf, input_line_pointer, first);
8427 if (second != 0 && *past_reloc != ' ')
8428 /* Replace the relocation token with ' ', so that
8429 errors like foo@SECLREL321 will be detected. */
8430 tmpbuf[first++] = ' ';
8431 memcpy (tmpbuf + first, past_reloc, second);
8432 tmpbuf[first + second] = '\0';
8433 return tmpbuf;
8434 }
8435
8436 as_bad (_("@%s reloc is not supported with %d-bit output format"),
8437 gotrel[j].str, 1 << (5 + object_64bit));
8438 return NULL;
8439 }
8440 }
8441
8442 /* Might be a symbol version string. Don't as_bad here. */
8443 return NULL;
8444 }
8445
8446 #endif /* TE_PE */
8447
8448 bfd_reloc_code_real_type
8449 x86_cons (expressionS *exp, int size)
8450 {
8451 bfd_reloc_code_real_type got_reloc = NO_RELOC;
8452
8453 intel_syntax = -intel_syntax;
8454
8455 exp->X_md = 0;
8456 if (size == 4 || (object_64bit && size == 8))
8457 {
8458 /* Handle @GOTOFF and the like in an expression. */
8459 char *save;
8460 char *gotfree_input_line;
8461 int adjust = 0;
8462
8463 save = input_line_pointer;
8464 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
8465 if (gotfree_input_line)
8466 input_line_pointer = gotfree_input_line;
8467
8468 expression (exp);
8469
8470 if (gotfree_input_line)
8471 {
8472 /* expression () has merrily parsed up to the end of line,
8473 or a comma - in the wrong buffer. Transfer how far
8474 input_line_pointer has moved to the right buffer. */
8475 input_line_pointer = (save
8476 + (input_line_pointer - gotfree_input_line)
8477 + adjust);
8478 free (gotfree_input_line);
8479 if (exp->X_op == O_constant
8480 || exp->X_op == O_absent
8481 || exp->X_op == O_illegal
8482 || exp->X_op == O_register
8483 || exp->X_op == O_big)
8484 {
8485 char c = *input_line_pointer;
8486 *input_line_pointer = 0;
8487 as_bad (_("missing or invalid expression `%s'"), save);
8488 *input_line_pointer = c;
8489 }
8490 }
8491 }
8492 else
8493 expression (exp);
8494
8495 intel_syntax = -intel_syntax;
8496
8497 if (intel_syntax)
8498 i386_intel_simplify (exp);
8499
8500 return got_reloc;
8501 }
8502
8503 static void
8504 signed_cons (int size)
8505 {
8506 if (flag_code == CODE_64BIT)
8507 cons_sign = 1;
8508 cons (size);
8509 cons_sign = -1;
8510 }
8511
8512 #ifdef TE_PE
8513 static void
8514 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
8515 {
8516 expressionS exp;
8517
8518 do
8519 {
8520 expression (&exp);
8521 if (exp.X_op == O_symbol)
8522 exp.X_op = O_secrel;
8523
8524 emit_expr (&exp, 4);
8525 }
8526 while (*input_line_pointer++ == ',');
8527
8528 input_line_pointer--;
8529 demand_empty_rest_of_line ();
8530 }
8531 #endif
8532
8533 /* Handle Vector operations. */
8534
8535 static char *
8536 check_VecOperations (char *op_string, char *op_end)
8537 {
8538 const reg_entry *mask;
8539 const char *saved;
8540 char *end_op;
8541
8542 while (*op_string
8543 && (op_end == NULL || op_string < op_end))
8544 {
8545 saved = op_string;
8546 if (*op_string == '{')
8547 {
8548 op_string++;
8549
8550 /* Check broadcasts. */
8551 if (strncmp (op_string, "1to", 3) == 0)
8552 {
8553 int bcst_type;
8554
8555 if (i.broadcast)
8556 goto duplicated_vec_op;
8557
8558 op_string += 3;
8559 if (*op_string == '8')
8560 bcst_type = 8;
8561 else if (*op_string == '4')
8562 bcst_type = 4;
8563 else if (*op_string == '2')
8564 bcst_type = 2;
8565 else if (*op_string == '1'
8566 && *(op_string+1) == '6')
8567 {
8568 bcst_type = 16;
8569 op_string++;
8570 }
8571 else
8572 {
8573 as_bad (_("Unsupported broadcast: `%s'"), saved);
8574 return NULL;
8575 }
8576 op_string++;
8577
8578 broadcast_op.type = bcst_type;
8579 broadcast_op.operand = this_operand;
8580 i.broadcast = &broadcast_op;
8581 }
8582 /* Check masking operation. */
8583 else if ((mask = parse_register (op_string, &end_op)) != NULL)
8584 {
8585 /* k0 can't be used for write mask. */
8586 if (!mask->reg_type.bitfield.regmask || mask->reg_num == 0)
8587 {
8588 as_bad (_("`%s%s' can't be used for write mask"),
8589 register_prefix, mask->reg_name);
8590 return NULL;
8591 }
8592
8593 if (!i.mask)
8594 {
8595 mask_op.mask = mask;
8596 mask_op.zeroing = 0;
8597 mask_op.operand = this_operand;
8598 i.mask = &mask_op;
8599 }
8600 else
8601 {
8602 if (i.mask->mask)
8603 goto duplicated_vec_op;
8604
8605 i.mask->mask = mask;
8606
8607 /* Only "{z}" is allowed here. No need to check
8608 zeroing mask explicitly. */
8609 if (i.mask->operand != this_operand)
8610 {
8611 as_bad (_("invalid write mask `%s'"), saved);
8612 return NULL;
8613 }
8614 }
8615
8616 op_string = end_op;
8617 }
8618 /* Check zeroing-flag for masking operation. */
8619 else if (*op_string == 'z')
8620 {
8621 if (!i.mask)
8622 {
8623 mask_op.mask = NULL;
8624 mask_op.zeroing = 1;
8625 mask_op.operand = this_operand;
8626 i.mask = &mask_op;
8627 }
8628 else
8629 {
8630 if (i.mask->zeroing)
8631 {
8632 duplicated_vec_op:
8633 as_bad (_("duplicated `%s'"), saved);
8634 return NULL;
8635 }
8636
8637 i.mask->zeroing = 1;
8638
8639 /* Only "{%k}" is allowed here. No need to check mask
8640 register explicitly. */
8641 if (i.mask->operand != this_operand)
8642 {
8643 as_bad (_("invalid zeroing-masking `%s'"),
8644 saved);
8645 return NULL;
8646 }
8647 }
8648
8649 op_string++;
8650 }
8651 else
8652 goto unknown_vec_op;
8653
8654 if (*op_string != '}')
8655 {
8656 as_bad (_("missing `}' in `%s'"), saved);
8657 return NULL;
8658 }
8659 op_string++;
8660
8661 /* Strip whitespace since the addition of pseudo prefixes
8662 changed how the scrubber treats '{'. */
8663 if (is_space_char (*op_string))
8664 ++op_string;
8665
8666 continue;
8667 }
8668 unknown_vec_op:
8669 /* We don't know this one. */
8670 as_bad (_("unknown vector operation: `%s'"), saved);
8671 return NULL;
8672 }
8673
8674 if (i.mask && i.mask->zeroing && !i.mask->mask)
8675 {
8676 as_bad (_("zeroing-masking only allowed with write mask"));
8677 return NULL;
8678 }
8679
8680 return op_string;
8681 }
8682
8683 static int
8684 i386_immediate (char *imm_start)
8685 {
8686 char *save_input_line_pointer;
8687 char *gotfree_input_line;
8688 segT exp_seg = 0;
8689 expressionS *exp;
8690 i386_operand_type types;
8691
8692 operand_type_set (&types, ~0);
8693
8694 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
8695 {
8696 as_bad (_("at most %d immediate operands are allowed"),
8697 MAX_IMMEDIATE_OPERANDS);
8698 return 0;
8699 }
8700
8701 exp = &im_expressions[i.imm_operands++];
8702 i.op[this_operand].imms = exp;
8703
8704 if (is_space_char (*imm_start))
8705 ++imm_start;
8706
8707 save_input_line_pointer = input_line_pointer;
8708 input_line_pointer = imm_start;
8709
8710 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
8711 if (gotfree_input_line)
8712 input_line_pointer = gotfree_input_line;
8713
8714 exp_seg = expression (exp);
8715
8716 SKIP_WHITESPACE ();
8717
8718 /* Handle vector operations. */
8719 if (*input_line_pointer == '{')
8720 {
8721 input_line_pointer = check_VecOperations (input_line_pointer,
8722 NULL);
8723 if (input_line_pointer == NULL)
8724 return 0;
8725 }
8726
8727 if (*input_line_pointer)
8728 as_bad (_("junk `%s' after expression"), input_line_pointer);
8729
8730 input_line_pointer = save_input_line_pointer;
8731 if (gotfree_input_line)
8732 {
8733 free (gotfree_input_line);
8734
8735 if (exp->X_op == O_constant || exp->X_op == O_register)
8736 exp->X_op = O_illegal;
8737 }
8738
8739 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
8740 }
8741
8742 static int
8743 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8744 i386_operand_type types, const char *imm_start)
8745 {
8746 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
8747 {
8748 if (imm_start)
8749 as_bad (_("missing or invalid immediate expression `%s'"),
8750 imm_start);
8751 return 0;
8752 }
8753 else if (exp->X_op == O_constant)
8754 {
8755 /* Size it properly later. */
8756 i.types[this_operand].bitfield.imm64 = 1;
8757 /* If not 64bit, sign extend val. */
8758 if (flag_code != CODE_64BIT
8759 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
8760 exp->X_add_number
8761 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
8762 }
8763 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
8764 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
8765 && exp_seg != absolute_section
8766 && exp_seg != text_section
8767 && exp_seg != data_section
8768 && exp_seg != bss_section
8769 && exp_seg != undefined_section
8770 && !bfd_is_com_section (exp_seg))
8771 {
8772 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
8773 return 0;
8774 }
8775 #endif
8776 else if (!intel_syntax && exp_seg == reg_section)
8777 {
8778 if (imm_start)
8779 as_bad (_("illegal immediate register operand %s"), imm_start);
8780 return 0;
8781 }
8782 else
8783 {
8784 /* This is an address. The size of the address will be
8785 determined later, depending on destination register,
8786 suffix, or the default for the section. */
8787 i.types[this_operand].bitfield.imm8 = 1;
8788 i.types[this_operand].bitfield.imm16 = 1;
8789 i.types[this_operand].bitfield.imm32 = 1;
8790 i.types[this_operand].bitfield.imm32s = 1;
8791 i.types[this_operand].bitfield.imm64 = 1;
8792 i.types[this_operand] = operand_type_and (i.types[this_operand],
8793 types);
8794 }
8795
8796 return 1;
8797 }
8798
8799 static char *
8800 i386_scale (char *scale)
8801 {
8802 offsetT val;
8803 char *save = input_line_pointer;
8804
8805 input_line_pointer = scale;
8806 val = get_absolute_expression ();
8807
8808 switch (val)
8809 {
8810 case 1:
8811 i.log2_scale_factor = 0;
8812 break;
8813 case 2:
8814 i.log2_scale_factor = 1;
8815 break;
8816 case 4:
8817 i.log2_scale_factor = 2;
8818 break;
8819 case 8:
8820 i.log2_scale_factor = 3;
8821 break;
8822 default:
8823 {
8824 char sep = *input_line_pointer;
8825
8826 *input_line_pointer = '\0';
8827 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
8828 scale);
8829 *input_line_pointer = sep;
8830 input_line_pointer = save;
8831 return NULL;
8832 }
8833 }
8834 if (i.log2_scale_factor != 0 && i.index_reg == 0)
8835 {
8836 as_warn (_("scale factor of %d without an index register"),
8837 1 << i.log2_scale_factor);
8838 i.log2_scale_factor = 0;
8839 }
8840 scale = input_line_pointer;
8841 input_line_pointer = save;
8842 return scale;
8843 }
8844
8845 static int
8846 i386_displacement (char *disp_start, char *disp_end)
8847 {
8848 expressionS *exp;
8849 segT exp_seg = 0;
8850 char *save_input_line_pointer;
8851 char *gotfree_input_line;
8852 int override;
8853 i386_operand_type bigdisp, types = anydisp;
8854 int ret;
8855
8856 if (i.disp_operands == MAX_MEMORY_OPERANDS)
8857 {
8858 as_bad (_("at most %d displacement operands are allowed"),
8859 MAX_MEMORY_OPERANDS);
8860 return 0;
8861 }
8862
8863 operand_type_set (&bigdisp, 0);
8864 if ((i.types[this_operand].bitfield.jumpabsolute)
8865 || (!current_templates->start->opcode_modifier.jump
8866 && !current_templates->start->opcode_modifier.jumpdword))
8867 {
8868 bigdisp.bitfield.disp32 = 1;
8869 override = (i.prefix[ADDR_PREFIX] != 0);
8870 if (flag_code == CODE_64BIT)
8871 {
8872 if (!override)
8873 {
8874 bigdisp.bitfield.disp32s = 1;
8875 bigdisp.bitfield.disp64 = 1;
8876 }
8877 }
8878 else if ((flag_code == CODE_16BIT) ^ override)
8879 {
8880 bigdisp.bitfield.disp32 = 0;
8881 bigdisp.bitfield.disp16 = 1;
8882 }
8883 }
8884 else
8885 {
8886 /* For PC-relative branches, the width of the displacement
8887 is dependent upon data size, not address size. */
8888 override = (i.prefix[DATA_PREFIX] != 0);
8889 if (flag_code == CODE_64BIT)
8890 {
8891 if (override || i.suffix == WORD_MNEM_SUFFIX)
8892 bigdisp.bitfield.disp16 = 1;
8893 else
8894 {
8895 bigdisp.bitfield.disp32 = 1;
8896 bigdisp.bitfield.disp32s = 1;
8897 }
8898 }
8899 else
8900 {
8901 if (!override)
8902 override = (i.suffix == (flag_code != CODE_16BIT
8903 ? WORD_MNEM_SUFFIX
8904 : LONG_MNEM_SUFFIX));
8905 bigdisp.bitfield.disp32 = 1;
8906 if ((flag_code == CODE_16BIT) ^ override)
8907 {
8908 bigdisp.bitfield.disp32 = 0;
8909 bigdisp.bitfield.disp16 = 1;
8910 }
8911 }
8912 }
8913 i.types[this_operand] = operand_type_or (i.types[this_operand],
8914 bigdisp);
8915
8916 exp = &disp_expressions[i.disp_operands];
8917 i.op[this_operand].disps = exp;
8918 i.disp_operands++;
8919 save_input_line_pointer = input_line_pointer;
8920 input_line_pointer = disp_start;
8921 END_STRING_AND_SAVE (disp_end);
8922
8923 #ifndef GCC_ASM_O_HACK
8924 #define GCC_ASM_O_HACK 0
8925 #endif
8926 #if GCC_ASM_O_HACK
8927 END_STRING_AND_SAVE (disp_end + 1);
8928 if (i.types[this_operand].bitfield.baseIndex
8929 && displacement_string_end[-1] == '+')
8930 {
8931 /* This hack is to avoid a warning when using the "o"
8932 constraint within gcc asm statements.
8933 For instance:
8934
8935 #define _set_tssldt_desc(n,addr,limit,type) \
8936 __asm__ __volatile__ ( \
8937 "movw %w2,%0\n\t" \
8938 "movw %w1,2+%0\n\t" \
8939 "rorl $16,%1\n\t" \
8940 "movb %b1,4+%0\n\t" \
8941 "movb %4,5+%0\n\t" \
8942 "movb $0,6+%0\n\t" \
8943 "movb %h1,7+%0\n\t" \
8944 "rorl $16,%1" \
8945 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
8946
8947 This works great except that the output assembler ends
8948 up looking a bit weird if it turns out that there is
8949 no offset. You end up producing code that looks like:
8950
8951 #APP
8952 movw $235,(%eax)
8953 movw %dx,2+(%eax)
8954 rorl $16,%edx
8955 movb %dl,4+(%eax)
8956 movb $137,5+(%eax)
8957 movb $0,6+(%eax)
8958 movb %dh,7+(%eax)
8959 rorl $16,%edx
8960 #NO_APP
8961
8962 So here we provide the missing zero. */
8963
8964 *displacement_string_end = '0';
8965 }
8966 #endif
8967 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
8968 if (gotfree_input_line)
8969 input_line_pointer = gotfree_input_line;
8970
8971 exp_seg = expression (exp);
8972
8973 SKIP_WHITESPACE ();
8974 if (*input_line_pointer)
8975 as_bad (_("junk `%s' after expression"), input_line_pointer);
8976 #if GCC_ASM_O_HACK
8977 RESTORE_END_STRING (disp_end + 1);
8978 #endif
8979 input_line_pointer = save_input_line_pointer;
8980 if (gotfree_input_line)
8981 {
8982 free (gotfree_input_line);
8983
8984 if (exp->X_op == O_constant || exp->X_op == O_register)
8985 exp->X_op = O_illegal;
8986 }
8987
8988 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
8989
8990 RESTORE_END_STRING (disp_end);
8991
8992 return ret;
8993 }
8994
8995 static int
8996 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8997 i386_operand_type types, const char *disp_start)
8998 {
8999 i386_operand_type bigdisp;
9000 int ret = 1;
9001
9002 /* We do this to make sure that the section symbol is in
9003 the symbol table. We will ultimately change the relocation
9004 to be relative to the beginning of the section. */
9005 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
9006 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
9007 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9008 {
9009 if (exp->X_op != O_symbol)
9010 goto inv_disp;
9011
9012 if (S_IS_LOCAL (exp->X_add_symbol)
9013 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
9014 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
9015 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
9016 exp->X_op = O_subtract;
9017 exp->X_op_symbol = GOT_symbol;
9018 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
9019 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
9020 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9021 i.reloc[this_operand] = BFD_RELOC_64;
9022 else
9023 i.reloc[this_operand] = BFD_RELOC_32;
9024 }
9025
9026 else if (exp->X_op == O_absent
9027 || exp->X_op == O_illegal
9028 || exp->X_op == O_big)
9029 {
9030 inv_disp:
9031 as_bad (_("missing or invalid displacement expression `%s'"),
9032 disp_start);
9033 ret = 0;
9034 }
9035
9036 else if (flag_code == CODE_64BIT
9037 && !i.prefix[ADDR_PREFIX]
9038 && exp->X_op == O_constant)
9039 {
9040 /* Since displacement is signed extended to 64bit, don't allow
9041 disp32 and turn off disp32s if they are out of range. */
9042 i.types[this_operand].bitfield.disp32 = 0;
9043 if (!fits_in_signed_long (exp->X_add_number))
9044 {
9045 i.types[this_operand].bitfield.disp32s = 0;
9046 if (i.types[this_operand].bitfield.baseindex)
9047 {
9048 as_bad (_("0x%lx out range of signed 32bit displacement"),
9049 (long) exp->X_add_number);
9050 ret = 0;
9051 }
9052 }
9053 }
9054
9055 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9056 else if (exp->X_op != O_constant
9057 && OUTPUT_FLAVOR == bfd_target_aout_flavour
9058 && exp_seg != absolute_section
9059 && exp_seg != text_section
9060 && exp_seg != data_section
9061 && exp_seg != bss_section
9062 && exp_seg != undefined_section
9063 && !bfd_is_com_section (exp_seg))
9064 {
9065 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9066 ret = 0;
9067 }
9068 #endif
9069
9070 /* Check if this is a displacement only operand. */
9071 bigdisp = i.types[this_operand];
9072 bigdisp.bitfield.disp8 = 0;
9073 bigdisp.bitfield.disp16 = 0;
9074 bigdisp.bitfield.disp32 = 0;
9075 bigdisp.bitfield.disp32s = 0;
9076 bigdisp.bitfield.disp64 = 0;
9077 if (operand_type_all_zero (&bigdisp))
9078 i.types[this_operand] = operand_type_and (i.types[this_operand],
9079 types);
9080
9081 return ret;
9082 }
9083
9084 /* Return the active addressing mode, taking address override and
9085 registers forming the address into consideration. Update the
9086 address override prefix if necessary. */
9087
9088 static enum flag_code
9089 i386_addressing_mode (void)
9090 {
9091 enum flag_code addr_mode;
9092
9093 if (i.prefix[ADDR_PREFIX])
9094 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
9095 else
9096 {
9097 addr_mode = flag_code;
9098
9099 #if INFER_ADDR_PREFIX
9100 if (i.mem_operands == 0)
9101 {
9102 /* Infer address prefix from the first memory operand. */
9103 const reg_entry *addr_reg = i.base_reg;
9104
9105 if (addr_reg == NULL)
9106 addr_reg = i.index_reg;
9107
9108 if (addr_reg)
9109 {
9110 if (addr_reg->reg_num == RegEip
9111 || addr_reg->reg_num == RegEiz
9112 || addr_reg->reg_type.bitfield.dword)
9113 addr_mode = CODE_32BIT;
9114 else if (flag_code != CODE_64BIT
9115 && addr_reg->reg_type.bitfield.word)
9116 addr_mode = CODE_16BIT;
9117
9118 if (addr_mode != flag_code)
9119 {
9120 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
9121 i.prefixes += 1;
9122 /* Change the size of any displacement too. At most one
9123 of Disp16 or Disp32 is set.
9124 FIXME. There doesn't seem to be any real need for
9125 separate Disp16 and Disp32 flags. The same goes for
9126 Imm16 and Imm32. Removing them would probably clean
9127 up the code quite a lot. */
9128 if (flag_code != CODE_64BIT
9129 && (i.types[this_operand].bitfield.disp16
9130 || i.types[this_operand].bitfield.disp32))
9131 i.types[this_operand]
9132 = operand_type_xor (i.types[this_operand], disp16_32);
9133 }
9134 }
9135 }
9136 #endif
9137 }
9138
9139 return addr_mode;
9140 }
9141
9142 /* Make sure the memory operand we've been dealt is valid.
9143 Return 1 on success, 0 on a failure. */
9144
9145 static int
9146 i386_index_check (const char *operand_string)
9147 {
9148 const char *kind = "base/index";
9149 enum flag_code addr_mode = i386_addressing_mode ();
9150
9151 if (current_templates->start->opcode_modifier.isstring
9152 && !current_templates->start->opcode_modifier.immext
9153 && (current_templates->end[-1].opcode_modifier.isstring
9154 || i.mem_operands))
9155 {
9156 /* Memory operands of string insns are special in that they only allow
9157 a single register (rDI, rSI, or rBX) as their memory address. */
9158 const reg_entry *expected_reg;
9159 static const char *di_si[][2] =
9160 {
9161 { "esi", "edi" },
9162 { "si", "di" },
9163 { "rsi", "rdi" }
9164 };
9165 static const char *bx[] = { "ebx", "bx", "rbx" };
9166
9167 kind = "string address";
9168
9169 if (current_templates->start->opcode_modifier.repprefixok)
9170 {
9171 i386_operand_type type = current_templates->end[-1].operand_types[0];
9172
9173 if (!type.bitfield.baseindex
9174 || ((!i.mem_operands != !intel_syntax)
9175 && current_templates->end[-1].operand_types[1]
9176 .bitfield.baseindex))
9177 type = current_templates->end[-1].operand_types[1];
9178 expected_reg = hash_find (reg_hash,
9179 di_si[addr_mode][type.bitfield.esseg]);
9180
9181 }
9182 else
9183 expected_reg = hash_find (reg_hash, bx[addr_mode]);
9184
9185 if (i.base_reg != expected_reg
9186 || i.index_reg
9187 || operand_type_check (i.types[this_operand], disp))
9188 {
9189 /* The second memory operand must have the same size as
9190 the first one. */
9191 if (i.mem_operands
9192 && i.base_reg
9193 && !((addr_mode == CODE_64BIT
9194 && i.base_reg->reg_type.bitfield.qword)
9195 || (addr_mode == CODE_32BIT
9196 ? i.base_reg->reg_type.bitfield.dword
9197 : i.base_reg->reg_type.bitfield.word)))
9198 goto bad_address;
9199
9200 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
9201 operand_string,
9202 intel_syntax ? '[' : '(',
9203 register_prefix,
9204 expected_reg->reg_name,
9205 intel_syntax ? ']' : ')');
9206 return 1;
9207 }
9208 else
9209 return 1;
9210
9211 bad_address:
9212 as_bad (_("`%s' is not a valid %s expression"),
9213 operand_string, kind);
9214 return 0;
9215 }
9216 else
9217 {
9218 if (addr_mode != CODE_16BIT)
9219 {
9220 /* 32-bit/64-bit checks. */
9221 if ((i.base_reg
9222 && (addr_mode == CODE_64BIT
9223 ? !i.base_reg->reg_type.bitfield.qword
9224 : !i.base_reg->reg_type.bitfield.dword)
9225 && (i.index_reg
9226 || (i.base_reg->reg_num
9227 != (addr_mode == CODE_64BIT ? RegRip : RegEip))))
9228 || (i.index_reg
9229 && !i.index_reg->reg_type.bitfield.xmmword
9230 && !i.index_reg->reg_type.bitfield.ymmword
9231 && !i.index_reg->reg_type.bitfield.zmmword
9232 && ((addr_mode == CODE_64BIT
9233 ? !(i.index_reg->reg_type.bitfield.qword
9234 || i.index_reg->reg_num == RegRiz)
9235 : !(i.index_reg->reg_type.bitfield.dword
9236 || i.index_reg->reg_num == RegEiz))
9237 || !i.index_reg->reg_type.bitfield.baseindex)))
9238 goto bad_address;
9239
9240 /* bndmk, bndldx, and bndstx have special restrictions. */
9241 if (current_templates->start->base_opcode == 0xf30f1b
9242 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
9243 {
9244 /* They cannot use RIP-relative addressing. */
9245 if (i.base_reg && i.base_reg->reg_num == RegRip)
9246 {
9247 as_bad (_("`%s' cannot be used here"), operand_string);
9248 return 0;
9249 }
9250
9251 /* bndldx and bndstx ignore their scale factor. */
9252 if (current_templates->start->base_opcode != 0xf30f1b
9253 && i.log2_scale_factor)
9254 as_warn (_("register scaling is being ignored here"));
9255 }
9256 }
9257 else
9258 {
9259 /* 16-bit checks. */
9260 if ((i.base_reg
9261 && (!i.base_reg->reg_type.bitfield.word
9262 || !i.base_reg->reg_type.bitfield.baseindex))
9263 || (i.index_reg
9264 && (!i.index_reg->reg_type.bitfield.word
9265 || !i.index_reg->reg_type.bitfield.baseindex
9266 || !(i.base_reg
9267 && i.base_reg->reg_num < 6
9268 && i.index_reg->reg_num >= 6
9269 && i.log2_scale_factor == 0))))
9270 goto bad_address;
9271 }
9272 }
9273 return 1;
9274 }
9275
9276 /* Handle vector immediates. */
9277
9278 static int
9279 RC_SAE_immediate (const char *imm_start)
9280 {
9281 unsigned int match_found, j;
9282 const char *pstr = imm_start;
9283 expressionS *exp;
9284
9285 if (*pstr != '{')
9286 return 0;
9287
9288 pstr++;
9289 match_found = 0;
9290 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
9291 {
9292 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
9293 {
9294 if (!i.rounding)
9295 {
9296 rc_op.type = RC_NamesTable[j].type;
9297 rc_op.operand = this_operand;
9298 i.rounding = &rc_op;
9299 }
9300 else
9301 {
9302 as_bad (_("duplicated `%s'"), imm_start);
9303 return 0;
9304 }
9305 pstr += RC_NamesTable[j].len;
9306 match_found = 1;
9307 break;
9308 }
9309 }
9310 if (!match_found)
9311 return 0;
9312
9313 if (*pstr++ != '}')
9314 {
9315 as_bad (_("Missing '}': '%s'"), imm_start);
9316 return 0;
9317 }
9318 /* RC/SAE immediate string should contain nothing more. */;
9319 if (*pstr != 0)
9320 {
9321 as_bad (_("Junk after '}': '%s'"), imm_start);
9322 return 0;
9323 }
9324
9325 exp = &im_expressions[i.imm_operands++];
9326 i.op[this_operand].imms = exp;
9327
9328 exp->X_op = O_constant;
9329 exp->X_add_number = 0;
9330 exp->X_add_symbol = (symbolS *) 0;
9331 exp->X_op_symbol = (symbolS *) 0;
9332
9333 i.types[this_operand].bitfield.imm8 = 1;
9334 return 1;
9335 }
9336
9337 /* Only string instructions can have a second memory operand, so
9338 reduce current_templates to just those if it contains any. */
9339 static int
9340 maybe_adjust_templates (void)
9341 {
9342 const insn_template *t;
9343
9344 gas_assert (i.mem_operands == 1);
9345
9346 for (t = current_templates->start; t < current_templates->end; ++t)
9347 if (t->opcode_modifier.isstring)
9348 break;
9349
9350 if (t < current_templates->end)
9351 {
9352 static templates aux_templates;
9353 bfd_boolean recheck;
9354
9355 aux_templates.start = t;
9356 for (; t < current_templates->end; ++t)
9357 if (!t->opcode_modifier.isstring)
9358 break;
9359 aux_templates.end = t;
9360
9361 /* Determine whether to re-check the first memory operand. */
9362 recheck = (aux_templates.start != current_templates->start
9363 || t != current_templates->end);
9364
9365 current_templates = &aux_templates;
9366
9367 if (recheck)
9368 {
9369 i.mem_operands = 0;
9370 if (i.memop1_string != NULL
9371 && i386_index_check (i.memop1_string) == 0)
9372 return 0;
9373 i.mem_operands = 1;
9374 }
9375 }
9376
9377 return 1;
9378 }
9379
9380 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
9381 on error. */
9382
9383 static int
9384 i386_att_operand (char *operand_string)
9385 {
9386 const reg_entry *r;
9387 char *end_op;
9388 char *op_string = operand_string;
9389
9390 if (is_space_char (*op_string))
9391 ++op_string;
9392
9393 /* We check for an absolute prefix (differentiating,
9394 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
9395 if (*op_string == ABSOLUTE_PREFIX)
9396 {
9397 ++op_string;
9398 if (is_space_char (*op_string))
9399 ++op_string;
9400 i.types[this_operand].bitfield.jumpabsolute = 1;
9401 }
9402
9403 /* Check if operand is a register. */
9404 if ((r = parse_register (op_string, &end_op)) != NULL)
9405 {
9406 i386_operand_type temp;
9407
9408 /* Check for a segment override by searching for ':' after a
9409 segment register. */
9410 op_string = end_op;
9411 if (is_space_char (*op_string))
9412 ++op_string;
9413 if (*op_string == ':'
9414 && (r->reg_type.bitfield.sreg2
9415 || r->reg_type.bitfield.sreg3))
9416 {
9417 switch (r->reg_num)
9418 {
9419 case 0:
9420 i.seg[i.mem_operands] = &es;
9421 break;
9422 case 1:
9423 i.seg[i.mem_operands] = &cs;
9424 break;
9425 case 2:
9426 i.seg[i.mem_operands] = &ss;
9427 break;
9428 case 3:
9429 i.seg[i.mem_operands] = &ds;
9430 break;
9431 case 4:
9432 i.seg[i.mem_operands] = &fs;
9433 break;
9434 case 5:
9435 i.seg[i.mem_operands] = &gs;
9436 break;
9437 }
9438
9439 /* Skip the ':' and whitespace. */
9440 ++op_string;
9441 if (is_space_char (*op_string))
9442 ++op_string;
9443
9444 if (!is_digit_char (*op_string)
9445 && !is_identifier_char (*op_string)
9446 && *op_string != '('
9447 && *op_string != ABSOLUTE_PREFIX)
9448 {
9449 as_bad (_("bad memory operand `%s'"), op_string);
9450 return 0;
9451 }
9452 /* Handle case of %es:*foo. */
9453 if (*op_string == ABSOLUTE_PREFIX)
9454 {
9455 ++op_string;
9456 if (is_space_char (*op_string))
9457 ++op_string;
9458 i.types[this_operand].bitfield.jumpabsolute = 1;
9459 }
9460 goto do_memory_reference;
9461 }
9462
9463 /* Handle vector operations. */
9464 if (*op_string == '{')
9465 {
9466 op_string = check_VecOperations (op_string, NULL);
9467 if (op_string == NULL)
9468 return 0;
9469 }
9470
9471 if (*op_string)
9472 {
9473 as_bad (_("junk `%s' after register"), op_string);
9474 return 0;
9475 }
9476 temp = r->reg_type;
9477 temp.bitfield.baseindex = 0;
9478 i.types[this_operand] = operand_type_or (i.types[this_operand],
9479 temp);
9480 i.types[this_operand].bitfield.unspecified = 0;
9481 i.op[this_operand].regs = r;
9482 i.reg_operands++;
9483 }
9484 else if (*op_string == REGISTER_PREFIX)
9485 {
9486 as_bad (_("bad register name `%s'"), op_string);
9487 return 0;
9488 }
9489 else if (*op_string == IMMEDIATE_PREFIX)
9490 {
9491 ++op_string;
9492 if (i.types[this_operand].bitfield.jumpabsolute)
9493 {
9494 as_bad (_("immediate operand illegal with absolute jump"));
9495 return 0;
9496 }
9497 if (!i386_immediate (op_string))
9498 return 0;
9499 }
9500 else if (RC_SAE_immediate (operand_string))
9501 {
9502 /* If it is a RC or SAE immediate, do nothing. */
9503 ;
9504 }
9505 else if (is_digit_char (*op_string)
9506 || is_identifier_char (*op_string)
9507 || *op_string == '"'
9508 || *op_string == '(')
9509 {
9510 /* This is a memory reference of some sort. */
9511 char *base_string;
9512
9513 /* Start and end of displacement string expression (if found). */
9514 char *displacement_string_start;
9515 char *displacement_string_end;
9516 char *vop_start;
9517
9518 do_memory_reference:
9519 if (i.mem_operands == 1 && !maybe_adjust_templates ())
9520 return 0;
9521 if ((i.mem_operands == 1
9522 && !current_templates->start->opcode_modifier.isstring)
9523 || i.mem_operands == 2)
9524 {
9525 as_bad (_("too many memory references for `%s'"),
9526 current_templates->start->name);
9527 return 0;
9528 }
9529
9530 /* Check for base index form. We detect the base index form by
9531 looking for an ')' at the end of the operand, searching
9532 for the '(' matching it, and finding a REGISTER_PREFIX or ','
9533 after the '('. */
9534 base_string = op_string + strlen (op_string);
9535
9536 /* Handle vector operations. */
9537 vop_start = strchr (op_string, '{');
9538 if (vop_start && vop_start < base_string)
9539 {
9540 if (check_VecOperations (vop_start, base_string) == NULL)
9541 return 0;
9542 base_string = vop_start;
9543 }
9544
9545 --base_string;
9546 if (is_space_char (*base_string))
9547 --base_string;
9548
9549 /* If we only have a displacement, set-up for it to be parsed later. */
9550 displacement_string_start = op_string;
9551 displacement_string_end = base_string + 1;
9552
9553 if (*base_string == ')')
9554 {
9555 char *temp_string;
9556 unsigned int parens_balanced = 1;
9557 /* We've already checked that the number of left & right ()'s are
9558 equal, so this loop will not be infinite. */
9559 do
9560 {
9561 base_string--;
9562 if (*base_string == ')')
9563 parens_balanced++;
9564 if (*base_string == '(')
9565 parens_balanced--;
9566 }
9567 while (parens_balanced);
9568
9569 temp_string = base_string;
9570
9571 /* Skip past '(' and whitespace. */
9572 ++base_string;
9573 if (is_space_char (*base_string))
9574 ++base_string;
9575
9576 if (*base_string == ','
9577 || ((i.base_reg = parse_register (base_string, &end_op))
9578 != NULL))
9579 {
9580 displacement_string_end = temp_string;
9581
9582 i.types[this_operand].bitfield.baseindex = 1;
9583
9584 if (i.base_reg)
9585 {
9586 base_string = end_op;
9587 if (is_space_char (*base_string))
9588 ++base_string;
9589 }
9590
9591 /* There may be an index reg or scale factor here. */
9592 if (*base_string == ',')
9593 {
9594 ++base_string;
9595 if (is_space_char (*base_string))
9596 ++base_string;
9597
9598 if ((i.index_reg = parse_register (base_string, &end_op))
9599 != NULL)
9600 {
9601 base_string = end_op;
9602 if (is_space_char (*base_string))
9603 ++base_string;
9604 if (*base_string == ',')
9605 {
9606 ++base_string;
9607 if (is_space_char (*base_string))
9608 ++base_string;
9609 }
9610 else if (*base_string != ')')
9611 {
9612 as_bad (_("expecting `,' or `)' "
9613 "after index register in `%s'"),
9614 operand_string);
9615 return 0;
9616 }
9617 }
9618 else if (*base_string == REGISTER_PREFIX)
9619 {
9620 end_op = strchr (base_string, ',');
9621 if (end_op)
9622 *end_op = '\0';
9623 as_bad (_("bad register name `%s'"), base_string);
9624 return 0;
9625 }
9626
9627 /* Check for scale factor. */
9628 if (*base_string != ')')
9629 {
9630 char *end_scale = i386_scale (base_string);
9631
9632 if (!end_scale)
9633 return 0;
9634
9635 base_string = end_scale;
9636 if (is_space_char (*base_string))
9637 ++base_string;
9638 if (*base_string != ')')
9639 {
9640 as_bad (_("expecting `)' "
9641 "after scale factor in `%s'"),
9642 operand_string);
9643 return 0;
9644 }
9645 }
9646 else if (!i.index_reg)
9647 {
9648 as_bad (_("expecting index register or scale factor "
9649 "after `,'; got '%c'"),
9650 *base_string);
9651 return 0;
9652 }
9653 }
9654 else if (*base_string != ')')
9655 {
9656 as_bad (_("expecting `,' or `)' "
9657 "after base register in `%s'"),
9658 operand_string);
9659 return 0;
9660 }
9661 }
9662 else if (*base_string == REGISTER_PREFIX)
9663 {
9664 end_op = strchr (base_string, ',');
9665 if (end_op)
9666 *end_op = '\0';
9667 as_bad (_("bad register name `%s'"), base_string);
9668 return 0;
9669 }
9670 }
9671
9672 /* If there's an expression beginning the operand, parse it,
9673 assuming displacement_string_start and
9674 displacement_string_end are meaningful. */
9675 if (displacement_string_start != displacement_string_end)
9676 {
9677 if (!i386_displacement (displacement_string_start,
9678 displacement_string_end))
9679 return 0;
9680 }
9681
9682 /* Special case for (%dx) while doing input/output op. */
9683 if (i.base_reg
9684 && i.base_reg->reg_type.bitfield.inoutportreg
9685 && i.index_reg == 0
9686 && i.log2_scale_factor == 0
9687 && i.seg[i.mem_operands] == 0
9688 && !operand_type_check (i.types[this_operand], disp))
9689 {
9690 i.types[this_operand] = i.base_reg->reg_type;
9691 return 1;
9692 }
9693
9694 if (i386_index_check (operand_string) == 0)
9695 return 0;
9696 i.types[this_operand].bitfield.mem = 1;
9697 if (i.mem_operands == 0)
9698 i.memop1_string = xstrdup (operand_string);
9699 i.mem_operands++;
9700 }
9701 else
9702 {
9703 /* It's not a memory operand; argh! */
9704 as_bad (_("invalid char %s beginning operand %d `%s'"),
9705 output_invalid (*op_string),
9706 this_operand + 1,
9707 op_string);
9708 return 0;
9709 }
9710 return 1; /* Normal return. */
9711 }
9712 \f
9713 /* Calculate the maximum variable size (i.e., excluding fr_fix)
9714 that an rs_machine_dependent frag may reach. */
9715
9716 unsigned int
9717 i386_frag_max_var (fragS *frag)
9718 {
9719 /* The only relaxable frags are for jumps.
9720 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
9721 gas_assert (frag->fr_type == rs_machine_dependent);
9722 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
9723 }
9724
9725 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9726 static int
9727 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
9728 {
9729 /* STT_GNU_IFUNC symbol must go through PLT. */
9730 if ((symbol_get_bfdsym (fr_symbol)->flags
9731 & BSF_GNU_INDIRECT_FUNCTION) != 0)
9732 return 0;
9733
9734 if (!S_IS_EXTERNAL (fr_symbol))
9735 /* Symbol may be weak or local. */
9736 return !S_IS_WEAK (fr_symbol);
9737
9738 /* Global symbols with non-default visibility can't be preempted. */
9739 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
9740 return 1;
9741
9742 if (fr_var != NO_RELOC)
9743 switch ((enum bfd_reloc_code_real) fr_var)
9744 {
9745 case BFD_RELOC_386_PLT32:
9746 case BFD_RELOC_X86_64_PLT32:
9747 /* Symbol with PLT relocation may be preempted. */
9748 return 0;
9749 default:
9750 abort ();
9751 }
9752
9753 /* Global symbols with default visibility in a shared library may be
9754 preempted by another definition. */
9755 return !shared;
9756 }
9757 #endif
9758
9759 /* md_estimate_size_before_relax()
9760
9761 Called just before relax() for rs_machine_dependent frags. The x86
9762 assembler uses these frags to handle variable size jump
9763 instructions.
9764
9765 Any symbol that is now undefined will not become defined.
9766 Return the correct fr_subtype in the frag.
9767 Return the initial "guess for variable size of frag" to caller.
9768 The guess is actually the growth beyond the fixed part. Whatever
9769 we do to grow the fixed or variable part contributes to our
9770 returned value. */
9771
9772 int
9773 md_estimate_size_before_relax (fragS *fragP, segT segment)
9774 {
9775 /* We've already got fragP->fr_subtype right; all we have to do is
9776 check for un-relaxable symbols. On an ELF system, we can't relax
9777 an externally visible symbol, because it may be overridden by a
9778 shared library. */
9779 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
9780 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9781 || (IS_ELF
9782 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
9783 fragP->fr_var))
9784 #endif
9785 #if defined (OBJ_COFF) && defined (TE_PE)
9786 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
9787 && S_IS_WEAK (fragP->fr_symbol))
9788 #endif
9789 )
9790 {
9791 /* Symbol is undefined in this segment, or we need to keep a
9792 reloc so that weak symbols can be overridden. */
9793 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
9794 enum bfd_reloc_code_real reloc_type;
9795 unsigned char *opcode;
9796 int old_fr_fix;
9797
9798 if (fragP->fr_var != NO_RELOC)
9799 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
9800 else if (size == 2)
9801 reloc_type = BFD_RELOC_16_PCREL;
9802 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9803 else if (need_plt32_p (fragP->fr_symbol))
9804 reloc_type = BFD_RELOC_X86_64_PLT32;
9805 #endif
9806 else
9807 reloc_type = BFD_RELOC_32_PCREL;
9808
9809 old_fr_fix = fragP->fr_fix;
9810 opcode = (unsigned char *) fragP->fr_opcode;
9811
9812 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
9813 {
9814 case UNCOND_JUMP:
9815 /* Make jmp (0xeb) a (d)word displacement jump. */
9816 opcode[0] = 0xe9;
9817 fragP->fr_fix += size;
9818 fix_new (fragP, old_fr_fix, size,
9819 fragP->fr_symbol,
9820 fragP->fr_offset, 1,
9821 reloc_type);
9822 break;
9823
9824 case COND_JUMP86:
9825 if (size == 2
9826 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
9827 {
9828 /* Negate the condition, and branch past an
9829 unconditional jump. */
9830 opcode[0] ^= 1;
9831 opcode[1] = 3;
9832 /* Insert an unconditional jump. */
9833 opcode[2] = 0xe9;
9834 /* We added two extra opcode bytes, and have a two byte
9835 offset. */
9836 fragP->fr_fix += 2 + 2;
9837 fix_new (fragP, old_fr_fix + 2, 2,
9838 fragP->fr_symbol,
9839 fragP->fr_offset, 1,
9840 reloc_type);
9841 break;
9842 }
9843 /* Fall through. */
9844
9845 case COND_JUMP:
9846 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
9847 {
9848 fixS *fixP;
9849
9850 fragP->fr_fix += 1;
9851 fixP = fix_new (fragP, old_fr_fix, 1,
9852 fragP->fr_symbol,
9853 fragP->fr_offset, 1,
9854 BFD_RELOC_8_PCREL);
9855 fixP->fx_signed = 1;
9856 break;
9857 }
9858
9859 /* This changes the byte-displacement jump 0x7N
9860 to the (d)word-displacement jump 0x0f,0x8N. */
9861 opcode[1] = opcode[0] + 0x10;
9862 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9863 /* We've added an opcode byte. */
9864 fragP->fr_fix += 1 + size;
9865 fix_new (fragP, old_fr_fix + 1, size,
9866 fragP->fr_symbol,
9867 fragP->fr_offset, 1,
9868 reloc_type);
9869 break;
9870
9871 default:
9872 BAD_CASE (fragP->fr_subtype);
9873 break;
9874 }
9875 frag_wane (fragP);
9876 return fragP->fr_fix - old_fr_fix;
9877 }
9878
9879 /* Guess size depending on current relax state. Initially the relax
9880 state will correspond to a short jump and we return 1, because
9881 the variable part of the frag (the branch offset) is one byte
9882 long. However, we can relax a section more than once and in that
9883 case we must either set fr_subtype back to the unrelaxed state,
9884 or return the value for the appropriate branch. */
9885 return md_relax_table[fragP->fr_subtype].rlx_length;
9886 }
9887
9888 /* Called after relax() is finished.
9889
9890 In: Address of frag.
9891 fr_type == rs_machine_dependent.
9892 fr_subtype is what the address relaxed to.
9893
9894 Out: Any fixSs and constants are set up.
9895 Caller will turn frag into a ".space 0". */
9896
9897 void
9898 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
9899 fragS *fragP)
9900 {
9901 unsigned char *opcode;
9902 unsigned char *where_to_put_displacement = NULL;
9903 offsetT target_address;
9904 offsetT opcode_address;
9905 unsigned int extension = 0;
9906 offsetT displacement_from_opcode_start;
9907
9908 opcode = (unsigned char *) fragP->fr_opcode;
9909
9910 /* Address we want to reach in file space. */
9911 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
9912
9913 /* Address opcode resides at in file space. */
9914 opcode_address = fragP->fr_address + fragP->fr_fix;
9915
9916 /* Displacement from opcode start to fill into instruction. */
9917 displacement_from_opcode_start = target_address - opcode_address;
9918
9919 if ((fragP->fr_subtype & BIG) == 0)
9920 {
9921 /* Don't have to change opcode. */
9922 extension = 1; /* 1 opcode + 1 displacement */
9923 where_to_put_displacement = &opcode[1];
9924 }
9925 else
9926 {
9927 if (no_cond_jump_promotion
9928 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
9929 as_warn_where (fragP->fr_file, fragP->fr_line,
9930 _("long jump required"));
9931
9932 switch (fragP->fr_subtype)
9933 {
9934 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
9935 extension = 4; /* 1 opcode + 4 displacement */
9936 opcode[0] = 0xe9;
9937 where_to_put_displacement = &opcode[1];
9938 break;
9939
9940 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
9941 extension = 2; /* 1 opcode + 2 displacement */
9942 opcode[0] = 0xe9;
9943 where_to_put_displacement = &opcode[1];
9944 break;
9945
9946 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
9947 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
9948 extension = 5; /* 2 opcode + 4 displacement */
9949 opcode[1] = opcode[0] + 0x10;
9950 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9951 where_to_put_displacement = &opcode[2];
9952 break;
9953
9954 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
9955 extension = 3; /* 2 opcode + 2 displacement */
9956 opcode[1] = opcode[0] + 0x10;
9957 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9958 where_to_put_displacement = &opcode[2];
9959 break;
9960
9961 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
9962 extension = 4;
9963 opcode[0] ^= 1;
9964 opcode[1] = 3;
9965 opcode[2] = 0xe9;
9966 where_to_put_displacement = &opcode[3];
9967 break;
9968
9969 default:
9970 BAD_CASE (fragP->fr_subtype);
9971 break;
9972 }
9973 }
9974
9975 /* If size if less then four we are sure that the operand fits,
9976 but if it's 4, then it could be that the displacement is larger
9977 then -/+ 2GB. */
9978 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
9979 && object_64bit
9980 && ((addressT) (displacement_from_opcode_start - extension
9981 + ((addressT) 1 << 31))
9982 > (((addressT) 2 << 31) - 1)))
9983 {
9984 as_bad_where (fragP->fr_file, fragP->fr_line,
9985 _("jump target out of range"));
9986 /* Make us emit 0. */
9987 displacement_from_opcode_start = extension;
9988 }
9989 /* Now put displacement after opcode. */
9990 md_number_to_chars ((char *) where_to_put_displacement,
9991 (valueT) (displacement_from_opcode_start - extension),
9992 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
9993 fragP->fr_fix += extension;
9994 }
9995 \f
9996 /* Apply a fixup (fixP) to segment data, once it has been determined
9997 by our caller that we have all the info we need to fix it up.
9998
9999 Parameter valP is the pointer to the value of the bits.
10000
10001 On the 386, immediates, displacements, and data pointers are all in
10002 the same (little-endian) format, so we don't need to care about which
10003 we are handling. */
10004
10005 void
10006 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
10007 {
10008 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
10009 valueT value = *valP;
10010
10011 #if !defined (TE_Mach)
10012 if (fixP->fx_pcrel)
10013 {
10014 switch (fixP->fx_r_type)
10015 {
10016 default:
10017 break;
10018
10019 case BFD_RELOC_64:
10020 fixP->fx_r_type = BFD_RELOC_64_PCREL;
10021 break;
10022 case BFD_RELOC_32:
10023 case BFD_RELOC_X86_64_32S:
10024 fixP->fx_r_type = BFD_RELOC_32_PCREL;
10025 break;
10026 case BFD_RELOC_16:
10027 fixP->fx_r_type = BFD_RELOC_16_PCREL;
10028 break;
10029 case BFD_RELOC_8:
10030 fixP->fx_r_type = BFD_RELOC_8_PCREL;
10031 break;
10032 }
10033 }
10034
10035 if (fixP->fx_addsy != NULL
10036 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
10037 || fixP->fx_r_type == BFD_RELOC_64_PCREL
10038 || fixP->fx_r_type == BFD_RELOC_16_PCREL
10039 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
10040 && !use_rela_relocations)
10041 {
10042 /* This is a hack. There should be a better way to handle this.
10043 This covers for the fact that bfd_install_relocation will
10044 subtract the current location (for partial_inplace, PC relative
10045 relocations); see more below. */
10046 #ifndef OBJ_AOUT
10047 if (IS_ELF
10048 #ifdef TE_PE
10049 || OUTPUT_FLAVOR == bfd_target_coff_flavour
10050 #endif
10051 )
10052 value += fixP->fx_where + fixP->fx_frag->fr_address;
10053 #endif
10054 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10055 if (IS_ELF)
10056 {
10057 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
10058
10059 if ((sym_seg == seg
10060 || (symbol_section_p (fixP->fx_addsy)
10061 && sym_seg != absolute_section))
10062 && !generic_force_reloc (fixP))
10063 {
10064 /* Yes, we add the values in twice. This is because
10065 bfd_install_relocation subtracts them out again. I think
10066 bfd_install_relocation is broken, but I don't dare change
10067 it. FIXME. */
10068 value += fixP->fx_where + fixP->fx_frag->fr_address;
10069 }
10070 }
10071 #endif
10072 #if defined (OBJ_COFF) && defined (TE_PE)
10073 /* For some reason, the PE format does not store a
10074 section address offset for a PC relative symbol. */
10075 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
10076 || S_IS_WEAK (fixP->fx_addsy))
10077 value += md_pcrel_from (fixP);
10078 #endif
10079 }
10080 #if defined (OBJ_COFF) && defined (TE_PE)
10081 if (fixP->fx_addsy != NULL
10082 && S_IS_WEAK (fixP->fx_addsy)
10083 /* PR 16858: Do not modify weak function references. */
10084 && ! fixP->fx_pcrel)
10085 {
10086 #if !defined (TE_PEP)
10087 /* For x86 PE weak function symbols are neither PC-relative
10088 nor do they set S_IS_FUNCTION. So the only reliable way
10089 to detect them is to check the flags of their containing
10090 section. */
10091 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
10092 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
10093 ;
10094 else
10095 #endif
10096 value -= S_GET_VALUE (fixP->fx_addsy);
10097 }
10098 #endif
10099
10100 /* Fix a few things - the dynamic linker expects certain values here,
10101 and we must not disappoint it. */
10102 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10103 if (IS_ELF && fixP->fx_addsy)
10104 switch (fixP->fx_r_type)
10105 {
10106 case BFD_RELOC_386_PLT32:
10107 case BFD_RELOC_X86_64_PLT32:
10108 /* Make the jump instruction point to the address of the operand. At
10109 runtime we merely add the offset to the actual PLT entry. */
10110 value = -4;
10111 break;
10112
10113 case BFD_RELOC_386_TLS_GD:
10114 case BFD_RELOC_386_TLS_LDM:
10115 case BFD_RELOC_386_TLS_IE_32:
10116 case BFD_RELOC_386_TLS_IE:
10117 case BFD_RELOC_386_TLS_GOTIE:
10118 case BFD_RELOC_386_TLS_GOTDESC:
10119 case BFD_RELOC_X86_64_TLSGD:
10120 case BFD_RELOC_X86_64_TLSLD:
10121 case BFD_RELOC_X86_64_GOTTPOFF:
10122 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10123 value = 0; /* Fully resolved at runtime. No addend. */
10124 /* Fallthrough */
10125 case BFD_RELOC_386_TLS_LE:
10126 case BFD_RELOC_386_TLS_LDO_32:
10127 case BFD_RELOC_386_TLS_LE_32:
10128 case BFD_RELOC_X86_64_DTPOFF32:
10129 case BFD_RELOC_X86_64_DTPOFF64:
10130 case BFD_RELOC_X86_64_TPOFF32:
10131 case BFD_RELOC_X86_64_TPOFF64:
10132 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10133 break;
10134
10135 case BFD_RELOC_386_TLS_DESC_CALL:
10136 case BFD_RELOC_X86_64_TLSDESC_CALL:
10137 value = 0; /* Fully resolved at runtime. No addend. */
10138 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10139 fixP->fx_done = 0;
10140 return;
10141
10142 case BFD_RELOC_VTABLE_INHERIT:
10143 case BFD_RELOC_VTABLE_ENTRY:
10144 fixP->fx_done = 0;
10145 return;
10146
10147 default:
10148 break;
10149 }
10150 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
10151 *valP = value;
10152 #endif /* !defined (TE_Mach) */
10153
10154 /* Are we finished with this relocation now? */
10155 if (fixP->fx_addsy == NULL)
10156 fixP->fx_done = 1;
10157 #if defined (OBJ_COFF) && defined (TE_PE)
10158 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
10159 {
10160 fixP->fx_done = 0;
10161 /* Remember value for tc_gen_reloc. */
10162 fixP->fx_addnumber = value;
10163 /* Clear out the frag for now. */
10164 value = 0;
10165 }
10166 #endif
10167 else if (use_rela_relocations)
10168 {
10169 fixP->fx_no_overflow = 1;
10170 /* Remember value for tc_gen_reloc. */
10171 fixP->fx_addnumber = value;
10172 value = 0;
10173 }
10174
10175 md_number_to_chars (p, value, fixP->fx_size);
10176 }
10177 \f
10178 const char *
10179 md_atof (int type, char *litP, int *sizeP)
10180 {
10181 /* This outputs the LITTLENUMs in REVERSE order;
10182 in accord with the bigendian 386. */
10183 return ieee_md_atof (type, litP, sizeP, FALSE);
10184 }
10185 \f
10186 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
10187
10188 static char *
10189 output_invalid (int c)
10190 {
10191 if (ISPRINT (c))
10192 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
10193 "'%c'", c);
10194 else
10195 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
10196 "(0x%x)", (unsigned char) c);
10197 return output_invalid_buf;
10198 }
10199
10200 /* REG_STRING starts *before* REGISTER_PREFIX. */
10201
10202 static const reg_entry *
10203 parse_real_register (char *reg_string, char **end_op)
10204 {
10205 char *s = reg_string;
10206 char *p;
10207 char reg_name_given[MAX_REG_NAME_SIZE + 1];
10208 const reg_entry *r;
10209
10210 /* Skip possible REGISTER_PREFIX and possible whitespace. */
10211 if (*s == REGISTER_PREFIX)
10212 ++s;
10213
10214 if (is_space_char (*s))
10215 ++s;
10216
10217 p = reg_name_given;
10218 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
10219 {
10220 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
10221 return (const reg_entry *) NULL;
10222 s++;
10223 }
10224
10225 /* For naked regs, make sure that we are not dealing with an identifier.
10226 This prevents confusing an identifier like `eax_var' with register
10227 `eax'. */
10228 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
10229 return (const reg_entry *) NULL;
10230
10231 *end_op = s;
10232
10233 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
10234
10235 /* Handle floating point regs, allowing spaces in the (i) part. */
10236 if (r == i386_regtab /* %st is first entry of table */)
10237 {
10238 if (!cpu_arch_flags.bitfield.cpu8087
10239 && !cpu_arch_flags.bitfield.cpu287
10240 && !cpu_arch_flags.bitfield.cpu387)
10241 return (const reg_entry *) NULL;
10242
10243 if (is_space_char (*s))
10244 ++s;
10245 if (*s == '(')
10246 {
10247 ++s;
10248 if (is_space_char (*s))
10249 ++s;
10250 if (*s >= '0' && *s <= '7')
10251 {
10252 int fpr = *s - '0';
10253 ++s;
10254 if (is_space_char (*s))
10255 ++s;
10256 if (*s == ')')
10257 {
10258 *end_op = s + 1;
10259 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
10260 know (r);
10261 return r + fpr;
10262 }
10263 }
10264 /* We have "%st(" then garbage. */
10265 return (const reg_entry *) NULL;
10266 }
10267 }
10268
10269 if (r == NULL || allow_pseudo_reg)
10270 return r;
10271
10272 if (operand_type_all_zero (&r->reg_type))
10273 return (const reg_entry *) NULL;
10274
10275 if ((r->reg_type.bitfield.dword
10276 || r->reg_type.bitfield.sreg3
10277 || r->reg_type.bitfield.control
10278 || r->reg_type.bitfield.debug
10279 || r->reg_type.bitfield.test)
10280 && !cpu_arch_flags.bitfield.cpui386)
10281 return (const reg_entry *) NULL;
10282
10283 if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
10284 return (const reg_entry *) NULL;
10285
10286 if (!cpu_arch_flags.bitfield.cpuavx512f)
10287 {
10288 if (r->reg_type.bitfield.zmmword || r->reg_type.bitfield.regmask)
10289 return (const reg_entry *) NULL;
10290
10291 if (!cpu_arch_flags.bitfield.cpuavx)
10292 {
10293 if (r->reg_type.bitfield.ymmword)
10294 return (const reg_entry *) NULL;
10295
10296 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
10297 return (const reg_entry *) NULL;
10298 }
10299 }
10300
10301 if (r->reg_type.bitfield.regbnd && !cpu_arch_flags.bitfield.cpumpx)
10302 return (const reg_entry *) NULL;
10303
10304 /* Don't allow fake index register unless allow_index_reg isn't 0. */
10305 if (!allow_index_reg
10306 && (r->reg_num == RegEiz || r->reg_num == RegRiz))
10307 return (const reg_entry *) NULL;
10308
10309 /* Upper 16 vector registers are only available with VREX in 64bit
10310 mode, and require EVEX encoding. */
10311 if (r->reg_flags & RegVRex)
10312 {
10313 if (!cpu_arch_flags.bitfield.cpuvrex
10314 || flag_code != CODE_64BIT)
10315 return (const reg_entry *) NULL;
10316
10317 i.vec_encoding = vex_encoding_evex;
10318 }
10319
10320 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
10321 && (!cpu_arch_flags.bitfield.cpulm || !r->reg_type.bitfield.control)
10322 && flag_code != CODE_64BIT)
10323 return (const reg_entry *) NULL;
10324
10325 if (r->reg_type.bitfield.sreg3 && r->reg_num == RegFlat && !intel_syntax)
10326 return (const reg_entry *) NULL;
10327
10328 return r;
10329 }
10330
10331 /* REG_STRING starts *before* REGISTER_PREFIX. */
10332
10333 static const reg_entry *
10334 parse_register (char *reg_string, char **end_op)
10335 {
10336 const reg_entry *r;
10337
10338 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
10339 r = parse_real_register (reg_string, end_op);
10340 else
10341 r = NULL;
10342 if (!r)
10343 {
10344 char *save = input_line_pointer;
10345 char c;
10346 symbolS *symbolP;
10347
10348 input_line_pointer = reg_string;
10349 c = get_symbol_name (&reg_string);
10350 symbolP = symbol_find (reg_string);
10351 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
10352 {
10353 const expressionS *e = symbol_get_value_expression (symbolP);
10354
10355 know (e->X_op == O_register);
10356 know (e->X_add_number >= 0
10357 && (valueT) e->X_add_number < i386_regtab_size);
10358 r = i386_regtab + e->X_add_number;
10359 if ((r->reg_flags & RegVRex))
10360 i.vec_encoding = vex_encoding_evex;
10361 *end_op = input_line_pointer;
10362 }
10363 *input_line_pointer = c;
10364 input_line_pointer = save;
10365 }
10366 return r;
10367 }
10368
10369 int
10370 i386_parse_name (char *name, expressionS *e, char *nextcharP)
10371 {
10372 const reg_entry *r;
10373 char *end = input_line_pointer;
10374
10375 *end = *nextcharP;
10376 r = parse_register (name, &input_line_pointer);
10377 if (r && end <= input_line_pointer)
10378 {
10379 *nextcharP = *input_line_pointer;
10380 *input_line_pointer = 0;
10381 e->X_op = O_register;
10382 e->X_add_number = r - i386_regtab;
10383 return 1;
10384 }
10385 input_line_pointer = end;
10386 *end = 0;
10387 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
10388 }
10389
10390 void
10391 md_operand (expressionS *e)
10392 {
10393 char *end;
10394 const reg_entry *r;
10395
10396 switch (*input_line_pointer)
10397 {
10398 case REGISTER_PREFIX:
10399 r = parse_real_register (input_line_pointer, &end);
10400 if (r)
10401 {
10402 e->X_op = O_register;
10403 e->X_add_number = r - i386_regtab;
10404 input_line_pointer = end;
10405 }
10406 break;
10407
10408 case '[':
10409 gas_assert (intel_syntax);
10410 end = input_line_pointer++;
10411 expression (e);
10412 if (*input_line_pointer == ']')
10413 {
10414 ++input_line_pointer;
10415 e->X_op_symbol = make_expr_symbol (e);
10416 e->X_add_symbol = NULL;
10417 e->X_add_number = 0;
10418 e->X_op = O_index;
10419 }
10420 else
10421 {
10422 e->X_op = O_absent;
10423 input_line_pointer = end;
10424 }
10425 break;
10426 }
10427 }
10428
10429 \f
10430 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10431 const char *md_shortopts = "kVQ:sqnO::";
10432 #else
10433 const char *md_shortopts = "qnO::";
10434 #endif
10435
10436 #define OPTION_32 (OPTION_MD_BASE + 0)
10437 #define OPTION_64 (OPTION_MD_BASE + 1)
10438 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
10439 #define OPTION_MARCH (OPTION_MD_BASE + 3)
10440 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
10441 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
10442 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
10443 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
10444 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
10445 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
10446 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
10447 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
10448 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
10449 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
10450 #define OPTION_X32 (OPTION_MD_BASE + 14)
10451 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
10452 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
10453 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
10454 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
10455 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
10456 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
10457 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
10458 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
10459 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
10460 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
10461
10462 struct option md_longopts[] =
10463 {
10464 {"32", no_argument, NULL, OPTION_32},
10465 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10466 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
10467 {"64", no_argument, NULL, OPTION_64},
10468 #endif
10469 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10470 {"x32", no_argument, NULL, OPTION_X32},
10471 {"mshared", no_argument, NULL, OPTION_MSHARED},
10472 #endif
10473 {"divide", no_argument, NULL, OPTION_DIVIDE},
10474 {"march", required_argument, NULL, OPTION_MARCH},
10475 {"mtune", required_argument, NULL, OPTION_MTUNE},
10476 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
10477 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
10478 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
10479 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
10480 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
10481 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
10482 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
10483 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
10484 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
10485 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
10486 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
10487 # if defined (TE_PE) || defined (TE_PEP)
10488 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
10489 #endif
10490 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
10491 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
10492 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
10493 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
10494 {"mamd64", no_argument, NULL, OPTION_MAMD64},
10495 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
10496 {NULL, no_argument, NULL, 0}
10497 };
10498 size_t md_longopts_size = sizeof (md_longopts);
10499
10500 int
10501 md_parse_option (int c, const char *arg)
10502 {
10503 unsigned int j;
10504 char *arch, *next, *saved;
10505
10506 switch (c)
10507 {
10508 case 'n':
10509 optimize_align_code = 0;
10510 break;
10511
10512 case 'q':
10513 quiet_warnings = 1;
10514 break;
10515
10516 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10517 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
10518 should be emitted or not. FIXME: Not implemented. */
10519 case 'Q':
10520 break;
10521
10522 /* -V: SVR4 argument to print version ID. */
10523 case 'V':
10524 print_version_id ();
10525 break;
10526
10527 /* -k: Ignore for FreeBSD compatibility. */
10528 case 'k':
10529 break;
10530
10531 case 's':
10532 /* -s: On i386 Solaris, this tells the native assembler to use
10533 .stab instead of .stab.excl. We always use .stab anyhow. */
10534 break;
10535
10536 case OPTION_MSHARED:
10537 shared = 1;
10538 break;
10539 #endif
10540 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10541 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
10542 case OPTION_64:
10543 {
10544 const char **list, **l;
10545
10546 list = bfd_target_list ();
10547 for (l = list; *l != NULL; l++)
10548 if (CONST_STRNEQ (*l, "elf64-x86-64")
10549 || strcmp (*l, "coff-x86-64") == 0
10550 || strcmp (*l, "pe-x86-64") == 0
10551 || strcmp (*l, "pei-x86-64") == 0
10552 || strcmp (*l, "mach-o-x86-64") == 0)
10553 {
10554 default_arch = "x86_64";
10555 break;
10556 }
10557 if (*l == NULL)
10558 as_fatal (_("no compiled in support for x86_64"));
10559 free (list);
10560 }
10561 break;
10562 #endif
10563
10564 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10565 case OPTION_X32:
10566 if (IS_ELF)
10567 {
10568 const char **list, **l;
10569
10570 list = bfd_target_list ();
10571 for (l = list; *l != NULL; l++)
10572 if (CONST_STRNEQ (*l, "elf32-x86-64"))
10573 {
10574 default_arch = "x86_64:32";
10575 break;
10576 }
10577 if (*l == NULL)
10578 as_fatal (_("no compiled in support for 32bit x86_64"));
10579 free (list);
10580 }
10581 else
10582 as_fatal (_("32bit x86_64 is only supported for ELF"));
10583 break;
10584 #endif
10585
10586 case OPTION_32:
10587 default_arch = "i386";
10588 break;
10589
10590 case OPTION_DIVIDE:
10591 #ifdef SVR4_COMMENT_CHARS
10592 {
10593 char *n, *t;
10594 const char *s;
10595
10596 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
10597 t = n;
10598 for (s = i386_comment_chars; *s != '\0'; s++)
10599 if (*s != '/')
10600 *t++ = *s;
10601 *t = '\0';
10602 i386_comment_chars = n;
10603 }
10604 #endif
10605 break;
10606
10607 case OPTION_MARCH:
10608 saved = xstrdup (arg);
10609 arch = saved;
10610 /* Allow -march=+nosse. */
10611 if (*arch == '+')
10612 arch++;
10613 do
10614 {
10615 if (*arch == '.')
10616 as_fatal (_("invalid -march= option: `%s'"), arg);
10617 next = strchr (arch, '+');
10618 if (next)
10619 *next++ = '\0';
10620 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
10621 {
10622 if (strcmp (arch, cpu_arch [j].name) == 0)
10623 {
10624 /* Processor. */
10625 if (! cpu_arch[j].flags.bitfield.cpui386)
10626 continue;
10627
10628 cpu_arch_name = cpu_arch[j].name;
10629 cpu_sub_arch_name = NULL;
10630 cpu_arch_flags = cpu_arch[j].flags;
10631 cpu_arch_isa = cpu_arch[j].type;
10632 cpu_arch_isa_flags = cpu_arch[j].flags;
10633 if (!cpu_arch_tune_set)
10634 {
10635 cpu_arch_tune = cpu_arch_isa;
10636 cpu_arch_tune_flags = cpu_arch_isa_flags;
10637 }
10638 break;
10639 }
10640 else if (*cpu_arch [j].name == '.'
10641 && strcmp (arch, cpu_arch [j].name + 1) == 0)
10642 {
10643 /* ISA extension. */
10644 i386_cpu_flags flags;
10645
10646 flags = cpu_flags_or (cpu_arch_flags,
10647 cpu_arch[j].flags);
10648
10649 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
10650 {
10651 if (cpu_sub_arch_name)
10652 {
10653 char *name = cpu_sub_arch_name;
10654 cpu_sub_arch_name = concat (name,
10655 cpu_arch[j].name,
10656 (const char *) NULL);
10657 free (name);
10658 }
10659 else
10660 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
10661 cpu_arch_flags = flags;
10662 cpu_arch_isa_flags = flags;
10663 }
10664 else
10665 cpu_arch_isa_flags
10666 = cpu_flags_or (cpu_arch_isa_flags,
10667 cpu_arch[j].flags);
10668 break;
10669 }
10670 }
10671
10672 if (j >= ARRAY_SIZE (cpu_arch))
10673 {
10674 /* Disable an ISA extension. */
10675 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
10676 if (strcmp (arch, cpu_noarch [j].name) == 0)
10677 {
10678 i386_cpu_flags flags;
10679
10680 flags = cpu_flags_and_not (cpu_arch_flags,
10681 cpu_noarch[j].flags);
10682 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
10683 {
10684 if (cpu_sub_arch_name)
10685 {
10686 char *name = cpu_sub_arch_name;
10687 cpu_sub_arch_name = concat (arch,
10688 (const char *) NULL);
10689 free (name);
10690 }
10691 else
10692 cpu_sub_arch_name = xstrdup (arch);
10693 cpu_arch_flags = flags;
10694 cpu_arch_isa_flags = flags;
10695 }
10696 break;
10697 }
10698
10699 if (j >= ARRAY_SIZE (cpu_noarch))
10700 j = ARRAY_SIZE (cpu_arch);
10701 }
10702
10703 if (j >= ARRAY_SIZE (cpu_arch))
10704 as_fatal (_("invalid -march= option: `%s'"), arg);
10705
10706 arch = next;
10707 }
10708 while (next != NULL);
10709 free (saved);
10710 break;
10711
10712 case OPTION_MTUNE:
10713 if (*arg == '.')
10714 as_fatal (_("invalid -mtune= option: `%s'"), arg);
10715 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
10716 {
10717 if (strcmp (arg, cpu_arch [j].name) == 0)
10718 {
10719 cpu_arch_tune_set = 1;
10720 cpu_arch_tune = cpu_arch [j].type;
10721 cpu_arch_tune_flags = cpu_arch[j].flags;
10722 break;
10723 }
10724 }
10725 if (j >= ARRAY_SIZE (cpu_arch))
10726 as_fatal (_("invalid -mtune= option: `%s'"), arg);
10727 break;
10728
10729 case OPTION_MMNEMONIC:
10730 if (strcasecmp (arg, "att") == 0)
10731 intel_mnemonic = 0;
10732 else if (strcasecmp (arg, "intel") == 0)
10733 intel_mnemonic = 1;
10734 else
10735 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
10736 break;
10737
10738 case OPTION_MSYNTAX:
10739 if (strcasecmp (arg, "att") == 0)
10740 intel_syntax = 0;
10741 else if (strcasecmp (arg, "intel") == 0)
10742 intel_syntax = 1;
10743 else
10744 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
10745 break;
10746
10747 case OPTION_MINDEX_REG:
10748 allow_index_reg = 1;
10749 break;
10750
10751 case OPTION_MNAKED_REG:
10752 allow_naked_reg = 1;
10753 break;
10754
10755 case OPTION_MSSE2AVX:
10756 sse2avx = 1;
10757 break;
10758
10759 case OPTION_MSSE_CHECK:
10760 if (strcasecmp (arg, "error") == 0)
10761 sse_check = check_error;
10762 else if (strcasecmp (arg, "warning") == 0)
10763 sse_check = check_warning;
10764 else if (strcasecmp (arg, "none") == 0)
10765 sse_check = check_none;
10766 else
10767 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
10768 break;
10769
10770 case OPTION_MOPERAND_CHECK:
10771 if (strcasecmp (arg, "error") == 0)
10772 operand_check = check_error;
10773 else if (strcasecmp (arg, "warning") == 0)
10774 operand_check = check_warning;
10775 else if (strcasecmp (arg, "none") == 0)
10776 operand_check = check_none;
10777 else
10778 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
10779 break;
10780
10781 case OPTION_MAVXSCALAR:
10782 if (strcasecmp (arg, "128") == 0)
10783 avxscalar = vex128;
10784 else if (strcasecmp (arg, "256") == 0)
10785 avxscalar = vex256;
10786 else
10787 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
10788 break;
10789
10790 case OPTION_MADD_BND_PREFIX:
10791 add_bnd_prefix = 1;
10792 break;
10793
10794 case OPTION_MEVEXLIG:
10795 if (strcmp (arg, "128") == 0)
10796 evexlig = evexl128;
10797 else if (strcmp (arg, "256") == 0)
10798 evexlig = evexl256;
10799 else if (strcmp (arg, "512") == 0)
10800 evexlig = evexl512;
10801 else
10802 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
10803 break;
10804
10805 case OPTION_MEVEXRCIG:
10806 if (strcmp (arg, "rne") == 0)
10807 evexrcig = rne;
10808 else if (strcmp (arg, "rd") == 0)
10809 evexrcig = rd;
10810 else if (strcmp (arg, "ru") == 0)
10811 evexrcig = ru;
10812 else if (strcmp (arg, "rz") == 0)
10813 evexrcig = rz;
10814 else
10815 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
10816 break;
10817
10818 case OPTION_MEVEXWIG:
10819 if (strcmp (arg, "0") == 0)
10820 evexwig = evexw0;
10821 else if (strcmp (arg, "1") == 0)
10822 evexwig = evexw1;
10823 else
10824 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
10825 break;
10826
10827 # if defined (TE_PE) || defined (TE_PEP)
10828 case OPTION_MBIG_OBJ:
10829 use_big_obj = 1;
10830 break;
10831 #endif
10832
10833 case OPTION_MOMIT_LOCK_PREFIX:
10834 if (strcasecmp (arg, "yes") == 0)
10835 omit_lock_prefix = 1;
10836 else if (strcasecmp (arg, "no") == 0)
10837 omit_lock_prefix = 0;
10838 else
10839 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
10840 break;
10841
10842 case OPTION_MFENCE_AS_LOCK_ADD:
10843 if (strcasecmp (arg, "yes") == 0)
10844 avoid_fence = 1;
10845 else if (strcasecmp (arg, "no") == 0)
10846 avoid_fence = 0;
10847 else
10848 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
10849 break;
10850
10851 case OPTION_MRELAX_RELOCATIONS:
10852 if (strcasecmp (arg, "yes") == 0)
10853 generate_relax_relocations = 1;
10854 else if (strcasecmp (arg, "no") == 0)
10855 generate_relax_relocations = 0;
10856 else
10857 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
10858 break;
10859
10860 case OPTION_MAMD64:
10861 intel64 = 0;
10862 break;
10863
10864 case OPTION_MINTEL64:
10865 intel64 = 1;
10866 break;
10867
10868 case 'O':
10869 if (arg == NULL)
10870 {
10871 optimize = 1;
10872 /* Turn off -Os. */
10873 optimize_for_space = 0;
10874 }
10875 else if (*arg == 's')
10876 {
10877 optimize_for_space = 1;
10878 /* Turn on all encoding optimizations. */
10879 optimize = -1;
10880 }
10881 else
10882 {
10883 optimize = atoi (arg);
10884 /* Turn off -Os. */
10885 optimize_for_space = 0;
10886 }
10887 break;
10888
10889 default:
10890 return 0;
10891 }
10892 return 1;
10893 }
10894
10895 #define MESSAGE_TEMPLATE \
10896 " "
10897
10898 static char *
10899 output_message (FILE *stream, char *p, char *message, char *start,
10900 int *left_p, const char *name, int len)
10901 {
10902 int size = sizeof (MESSAGE_TEMPLATE);
10903 int left = *left_p;
10904
10905 /* Reserve 2 spaces for ", " or ",\0" */
10906 left -= len + 2;
10907
10908 /* Check if there is any room. */
10909 if (left >= 0)
10910 {
10911 if (p != start)
10912 {
10913 *p++ = ',';
10914 *p++ = ' ';
10915 }
10916 p = mempcpy (p, name, len);
10917 }
10918 else
10919 {
10920 /* Output the current message now and start a new one. */
10921 *p++ = ',';
10922 *p = '\0';
10923 fprintf (stream, "%s\n", message);
10924 p = start;
10925 left = size - (start - message) - len - 2;
10926
10927 gas_assert (left >= 0);
10928
10929 p = mempcpy (p, name, len);
10930 }
10931
10932 *left_p = left;
10933 return p;
10934 }
10935
10936 static void
10937 show_arch (FILE *stream, int ext, int check)
10938 {
10939 static char message[] = MESSAGE_TEMPLATE;
10940 char *start = message + 27;
10941 char *p;
10942 int size = sizeof (MESSAGE_TEMPLATE);
10943 int left;
10944 const char *name;
10945 int len;
10946 unsigned int j;
10947
10948 p = start;
10949 left = size - (start - message);
10950 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
10951 {
10952 /* Should it be skipped? */
10953 if (cpu_arch [j].skip)
10954 continue;
10955
10956 name = cpu_arch [j].name;
10957 len = cpu_arch [j].len;
10958 if (*name == '.')
10959 {
10960 /* It is an extension. Skip if we aren't asked to show it. */
10961 if (ext)
10962 {
10963 name++;
10964 len--;
10965 }
10966 else
10967 continue;
10968 }
10969 else if (ext)
10970 {
10971 /* It is an processor. Skip if we show only extension. */
10972 continue;
10973 }
10974 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
10975 {
10976 /* It is an impossible processor - skip. */
10977 continue;
10978 }
10979
10980 p = output_message (stream, p, message, start, &left, name, len);
10981 }
10982
10983 /* Display disabled extensions. */
10984 if (ext)
10985 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
10986 {
10987 name = cpu_noarch [j].name;
10988 len = cpu_noarch [j].len;
10989 p = output_message (stream, p, message, start, &left, name,
10990 len);
10991 }
10992
10993 *p = '\0';
10994 fprintf (stream, "%s\n", message);
10995 }
10996
10997 void
10998 md_show_usage (FILE *stream)
10999 {
11000 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11001 fprintf (stream, _("\
11002 -Q ignored\n\
11003 -V print assembler version number\n\
11004 -k ignored\n"));
11005 #endif
11006 fprintf (stream, _("\
11007 -n Do not optimize code alignment\n\
11008 -q quieten some warnings\n"));
11009 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11010 fprintf (stream, _("\
11011 -s ignored\n"));
11012 #endif
11013 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11014 || defined (TE_PE) || defined (TE_PEP))
11015 fprintf (stream, _("\
11016 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
11017 #endif
11018 #ifdef SVR4_COMMENT_CHARS
11019 fprintf (stream, _("\
11020 --divide do not treat `/' as a comment character\n"));
11021 #else
11022 fprintf (stream, _("\
11023 --divide ignored\n"));
11024 #endif
11025 fprintf (stream, _("\
11026 -march=CPU[,+EXTENSION...]\n\
11027 generate code for CPU and EXTENSION, CPU is one of:\n"));
11028 show_arch (stream, 0, 1);
11029 fprintf (stream, _("\
11030 EXTENSION is combination of:\n"));
11031 show_arch (stream, 1, 0);
11032 fprintf (stream, _("\
11033 -mtune=CPU optimize for CPU, CPU is one of:\n"));
11034 show_arch (stream, 0, 0);
11035 fprintf (stream, _("\
11036 -msse2avx encode SSE instructions with VEX prefix\n"));
11037 fprintf (stream, _("\
11038 -msse-check=[none|error|warning]\n\
11039 check SSE instructions\n"));
11040 fprintf (stream, _("\
11041 -moperand-check=[none|error|warning]\n\
11042 check operand combinations for validity\n"));
11043 fprintf (stream, _("\
11044 -mavxscalar=[128|256] encode scalar AVX instructions with specific vector\n\
11045 length\n"));
11046 fprintf (stream, _("\
11047 -mevexlig=[128|256|512] encode scalar EVEX instructions with specific vector\n\
11048 length\n"));
11049 fprintf (stream, _("\
11050 -mevexwig=[0|1] encode EVEX instructions with specific EVEX.W value\n\
11051 for EVEX.W bit ignored instructions\n"));
11052 fprintf (stream, _("\
11053 -mevexrcig=[rne|rd|ru|rz]\n\
11054 encode EVEX instructions with specific EVEX.RC value\n\
11055 for SAE-only ignored instructions\n"));
11056 fprintf (stream, _("\
11057 -mmnemonic=[att|intel] use AT&T/Intel mnemonic\n"));
11058 fprintf (stream, _("\
11059 -msyntax=[att|intel] use AT&T/Intel syntax\n"));
11060 fprintf (stream, _("\
11061 -mindex-reg support pseudo index registers\n"));
11062 fprintf (stream, _("\
11063 -mnaked-reg don't require `%%' prefix for registers\n"));
11064 fprintf (stream, _("\
11065 -madd-bnd-prefix add BND prefix for all valid branches\n"));
11066 fprintf (stream, _("\
11067 -mshared disable branch optimization for shared code\n"));
11068 # if defined (TE_PE) || defined (TE_PEP)
11069 fprintf (stream, _("\
11070 -mbig-obj generate big object files\n"));
11071 #endif
11072 fprintf (stream, _("\
11073 -momit-lock-prefix=[no|yes]\n\
11074 strip all lock prefixes\n"));
11075 fprintf (stream, _("\
11076 -mfence-as-lock-add=[no|yes]\n\
11077 encode lfence, mfence and sfence as\n\
11078 lock addl $0x0, (%%{re}sp)\n"));
11079 fprintf (stream, _("\
11080 -mrelax-relocations=[no|yes]\n\
11081 generate relax relocations\n"));
11082 fprintf (stream, _("\
11083 -mamd64 accept only AMD64 ISA\n"));
11084 fprintf (stream, _("\
11085 -mintel64 accept only Intel64 ISA\n"));
11086 }
11087
11088 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
11089 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11090 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11091
11092 /* Pick the target format to use. */
11093
11094 const char *
11095 i386_target_format (void)
11096 {
11097 if (!strncmp (default_arch, "x86_64", 6))
11098 {
11099 update_code_flag (CODE_64BIT, 1);
11100 if (default_arch[6] == '\0')
11101 x86_elf_abi = X86_64_ABI;
11102 else
11103 x86_elf_abi = X86_64_X32_ABI;
11104 }
11105 else if (!strcmp (default_arch, "i386"))
11106 update_code_flag (CODE_32BIT, 1);
11107 else if (!strcmp (default_arch, "iamcu"))
11108 {
11109 update_code_flag (CODE_32BIT, 1);
11110 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
11111 {
11112 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
11113 cpu_arch_name = "iamcu";
11114 cpu_sub_arch_name = NULL;
11115 cpu_arch_flags = iamcu_flags;
11116 cpu_arch_isa = PROCESSOR_IAMCU;
11117 cpu_arch_isa_flags = iamcu_flags;
11118 if (!cpu_arch_tune_set)
11119 {
11120 cpu_arch_tune = cpu_arch_isa;
11121 cpu_arch_tune_flags = cpu_arch_isa_flags;
11122 }
11123 }
11124 else if (cpu_arch_isa != PROCESSOR_IAMCU)
11125 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
11126 cpu_arch_name);
11127 }
11128 else
11129 as_fatal (_("unknown architecture"));
11130
11131 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
11132 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11133 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
11134 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11135
11136 switch (OUTPUT_FLAVOR)
11137 {
11138 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
11139 case bfd_target_aout_flavour:
11140 return AOUT_TARGET_FORMAT;
11141 #endif
11142 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
11143 # if defined (TE_PE) || defined (TE_PEP)
11144 case bfd_target_coff_flavour:
11145 if (flag_code == CODE_64BIT)
11146 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
11147 else
11148 return "pe-i386";
11149 # elif defined (TE_GO32)
11150 case bfd_target_coff_flavour:
11151 return "coff-go32";
11152 # else
11153 case bfd_target_coff_flavour:
11154 return "coff-i386";
11155 # endif
11156 #endif
11157 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
11158 case bfd_target_elf_flavour:
11159 {
11160 const char *format;
11161
11162 switch (x86_elf_abi)
11163 {
11164 default:
11165 format = ELF_TARGET_FORMAT;
11166 break;
11167 case X86_64_ABI:
11168 use_rela_relocations = 1;
11169 object_64bit = 1;
11170 format = ELF_TARGET_FORMAT64;
11171 break;
11172 case X86_64_X32_ABI:
11173 use_rela_relocations = 1;
11174 object_64bit = 1;
11175 disallow_64bit_reloc = 1;
11176 format = ELF_TARGET_FORMAT32;
11177 break;
11178 }
11179 if (cpu_arch_isa == PROCESSOR_L1OM)
11180 {
11181 if (x86_elf_abi != X86_64_ABI)
11182 as_fatal (_("Intel L1OM is 64bit only"));
11183 return ELF_TARGET_L1OM_FORMAT;
11184 }
11185 else if (cpu_arch_isa == PROCESSOR_K1OM)
11186 {
11187 if (x86_elf_abi != X86_64_ABI)
11188 as_fatal (_("Intel K1OM is 64bit only"));
11189 return ELF_TARGET_K1OM_FORMAT;
11190 }
11191 else if (cpu_arch_isa == PROCESSOR_IAMCU)
11192 {
11193 if (x86_elf_abi != I386_ABI)
11194 as_fatal (_("Intel MCU is 32bit only"));
11195 return ELF_TARGET_IAMCU_FORMAT;
11196 }
11197 else
11198 return format;
11199 }
11200 #endif
11201 #if defined (OBJ_MACH_O)
11202 case bfd_target_mach_o_flavour:
11203 if (flag_code == CODE_64BIT)
11204 {
11205 use_rela_relocations = 1;
11206 object_64bit = 1;
11207 return "mach-o-x86-64";
11208 }
11209 else
11210 return "mach-o-i386";
11211 #endif
11212 default:
11213 abort ();
11214 return NULL;
11215 }
11216 }
11217
11218 #endif /* OBJ_MAYBE_ more than one */
11219 \f
11220 symbolS *
11221 md_undefined_symbol (char *name)
11222 {
11223 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
11224 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
11225 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
11226 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
11227 {
11228 if (!GOT_symbol)
11229 {
11230 if (symbol_find (name))
11231 as_bad (_("GOT already in symbol table"));
11232 GOT_symbol = symbol_new (name, undefined_section,
11233 (valueT) 0, &zero_address_frag);
11234 };
11235 return GOT_symbol;
11236 }
11237 return 0;
11238 }
11239
11240 /* Round up a section size to the appropriate boundary. */
11241
11242 valueT
11243 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
11244 {
11245 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
11246 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
11247 {
11248 /* For a.out, force the section size to be aligned. If we don't do
11249 this, BFD will align it for us, but it will not write out the
11250 final bytes of the section. This may be a bug in BFD, but it is
11251 easier to fix it here since that is how the other a.out targets
11252 work. */
11253 int align;
11254
11255 align = bfd_get_section_alignment (stdoutput, segment);
11256 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
11257 }
11258 #endif
11259
11260 return size;
11261 }
11262
11263 /* On the i386, PC-relative offsets are relative to the start of the
11264 next instruction. That is, the address of the offset, plus its
11265 size, since the offset is always the last part of the insn. */
11266
11267 long
11268 md_pcrel_from (fixS *fixP)
11269 {
11270 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
11271 }
11272
11273 #ifndef I386COFF
11274
11275 static void
11276 s_bss (int ignore ATTRIBUTE_UNUSED)
11277 {
11278 int temp;
11279
11280 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11281 if (IS_ELF)
11282 obj_elf_section_change_hook ();
11283 #endif
11284 temp = get_absolute_expression ();
11285 subseg_set (bss_section, (subsegT) temp);
11286 demand_empty_rest_of_line ();
11287 }
11288
11289 #endif
11290
11291 void
11292 i386_validate_fix (fixS *fixp)
11293 {
11294 if (fixp->fx_subsy)
11295 {
11296 if (fixp->fx_subsy == GOT_symbol)
11297 {
11298 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
11299 {
11300 if (!object_64bit)
11301 abort ();
11302 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11303 if (fixp->fx_tcbit2)
11304 fixp->fx_r_type = (fixp->fx_tcbit
11305 ? BFD_RELOC_X86_64_REX_GOTPCRELX
11306 : BFD_RELOC_X86_64_GOTPCRELX);
11307 else
11308 #endif
11309 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
11310 }
11311 else
11312 {
11313 if (!object_64bit)
11314 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
11315 else
11316 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
11317 }
11318 fixp->fx_subsy = 0;
11319 }
11320 }
11321 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11322 else if (!object_64bit)
11323 {
11324 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
11325 && fixp->fx_tcbit2)
11326 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
11327 }
11328 #endif
11329 }
11330
11331 arelent *
11332 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
11333 {
11334 arelent *rel;
11335 bfd_reloc_code_real_type code;
11336
11337 switch (fixp->fx_r_type)
11338 {
11339 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11340 case BFD_RELOC_SIZE32:
11341 case BFD_RELOC_SIZE64:
11342 if (S_IS_DEFINED (fixp->fx_addsy)
11343 && !S_IS_EXTERNAL (fixp->fx_addsy))
11344 {
11345 /* Resolve size relocation against local symbol to size of
11346 the symbol plus addend. */
11347 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
11348 if (fixp->fx_r_type == BFD_RELOC_SIZE32
11349 && !fits_in_unsigned_long (value))
11350 as_bad_where (fixp->fx_file, fixp->fx_line,
11351 _("symbol size computation overflow"));
11352 fixp->fx_addsy = NULL;
11353 fixp->fx_subsy = NULL;
11354 md_apply_fix (fixp, (valueT *) &value, NULL);
11355 return NULL;
11356 }
11357 #endif
11358 /* Fall through. */
11359
11360 case BFD_RELOC_X86_64_PLT32:
11361 case BFD_RELOC_X86_64_GOT32:
11362 case BFD_RELOC_X86_64_GOTPCREL:
11363 case BFD_RELOC_X86_64_GOTPCRELX:
11364 case BFD_RELOC_X86_64_REX_GOTPCRELX:
11365 case BFD_RELOC_386_PLT32:
11366 case BFD_RELOC_386_GOT32:
11367 case BFD_RELOC_386_GOT32X:
11368 case BFD_RELOC_386_GOTOFF:
11369 case BFD_RELOC_386_GOTPC:
11370 case BFD_RELOC_386_TLS_GD:
11371 case BFD_RELOC_386_TLS_LDM:
11372 case BFD_RELOC_386_TLS_LDO_32:
11373 case BFD_RELOC_386_TLS_IE_32:
11374 case BFD_RELOC_386_TLS_IE:
11375 case BFD_RELOC_386_TLS_GOTIE:
11376 case BFD_RELOC_386_TLS_LE_32:
11377 case BFD_RELOC_386_TLS_LE:
11378 case BFD_RELOC_386_TLS_GOTDESC:
11379 case BFD_RELOC_386_TLS_DESC_CALL:
11380 case BFD_RELOC_X86_64_TLSGD:
11381 case BFD_RELOC_X86_64_TLSLD:
11382 case BFD_RELOC_X86_64_DTPOFF32:
11383 case BFD_RELOC_X86_64_DTPOFF64:
11384 case BFD_RELOC_X86_64_GOTTPOFF:
11385 case BFD_RELOC_X86_64_TPOFF32:
11386 case BFD_RELOC_X86_64_TPOFF64:
11387 case BFD_RELOC_X86_64_GOTOFF64:
11388 case BFD_RELOC_X86_64_GOTPC32:
11389 case BFD_RELOC_X86_64_GOT64:
11390 case BFD_RELOC_X86_64_GOTPCREL64:
11391 case BFD_RELOC_X86_64_GOTPC64:
11392 case BFD_RELOC_X86_64_GOTPLT64:
11393 case BFD_RELOC_X86_64_PLTOFF64:
11394 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11395 case BFD_RELOC_X86_64_TLSDESC_CALL:
11396 case BFD_RELOC_RVA:
11397 case BFD_RELOC_VTABLE_ENTRY:
11398 case BFD_RELOC_VTABLE_INHERIT:
11399 #ifdef TE_PE
11400 case BFD_RELOC_32_SECREL:
11401 #endif
11402 code = fixp->fx_r_type;
11403 break;
11404 case BFD_RELOC_X86_64_32S:
11405 if (!fixp->fx_pcrel)
11406 {
11407 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
11408 code = fixp->fx_r_type;
11409 break;
11410 }
11411 /* Fall through. */
11412 default:
11413 if (fixp->fx_pcrel)
11414 {
11415 switch (fixp->fx_size)
11416 {
11417 default:
11418 as_bad_where (fixp->fx_file, fixp->fx_line,
11419 _("can not do %d byte pc-relative relocation"),
11420 fixp->fx_size);
11421 code = BFD_RELOC_32_PCREL;
11422 break;
11423 case 1: code = BFD_RELOC_8_PCREL; break;
11424 case 2: code = BFD_RELOC_16_PCREL; break;
11425 case 4: code = BFD_RELOC_32_PCREL; break;
11426 #ifdef BFD64
11427 case 8: code = BFD_RELOC_64_PCREL; break;
11428 #endif
11429 }
11430 }
11431 else
11432 {
11433 switch (fixp->fx_size)
11434 {
11435 default:
11436 as_bad_where (fixp->fx_file, fixp->fx_line,
11437 _("can not do %d byte relocation"),
11438 fixp->fx_size);
11439 code = BFD_RELOC_32;
11440 break;
11441 case 1: code = BFD_RELOC_8; break;
11442 case 2: code = BFD_RELOC_16; break;
11443 case 4: code = BFD_RELOC_32; break;
11444 #ifdef BFD64
11445 case 8: code = BFD_RELOC_64; break;
11446 #endif
11447 }
11448 }
11449 break;
11450 }
11451
11452 if ((code == BFD_RELOC_32
11453 || code == BFD_RELOC_32_PCREL
11454 || code == BFD_RELOC_X86_64_32S)
11455 && GOT_symbol
11456 && fixp->fx_addsy == GOT_symbol)
11457 {
11458 if (!object_64bit)
11459 code = BFD_RELOC_386_GOTPC;
11460 else
11461 code = BFD_RELOC_X86_64_GOTPC32;
11462 }
11463 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
11464 && GOT_symbol
11465 && fixp->fx_addsy == GOT_symbol)
11466 {
11467 code = BFD_RELOC_X86_64_GOTPC64;
11468 }
11469
11470 rel = XNEW (arelent);
11471 rel->sym_ptr_ptr = XNEW (asymbol *);
11472 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
11473
11474 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
11475
11476 if (!use_rela_relocations)
11477 {
11478 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
11479 vtable entry to be used in the relocation's section offset. */
11480 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
11481 rel->address = fixp->fx_offset;
11482 #if defined (OBJ_COFF) && defined (TE_PE)
11483 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
11484 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
11485 else
11486 #endif
11487 rel->addend = 0;
11488 }
11489 /* Use the rela in 64bit mode. */
11490 else
11491 {
11492 if (disallow_64bit_reloc)
11493 switch (code)
11494 {
11495 case BFD_RELOC_X86_64_DTPOFF64:
11496 case BFD_RELOC_X86_64_TPOFF64:
11497 case BFD_RELOC_64_PCREL:
11498 case BFD_RELOC_X86_64_GOTOFF64:
11499 case BFD_RELOC_X86_64_GOT64:
11500 case BFD_RELOC_X86_64_GOTPCREL64:
11501 case BFD_RELOC_X86_64_GOTPC64:
11502 case BFD_RELOC_X86_64_GOTPLT64:
11503 case BFD_RELOC_X86_64_PLTOFF64:
11504 as_bad_where (fixp->fx_file, fixp->fx_line,
11505 _("cannot represent relocation type %s in x32 mode"),
11506 bfd_get_reloc_code_name (code));
11507 break;
11508 default:
11509 break;
11510 }
11511
11512 if (!fixp->fx_pcrel)
11513 rel->addend = fixp->fx_offset;
11514 else
11515 switch (code)
11516 {
11517 case BFD_RELOC_X86_64_PLT32:
11518 case BFD_RELOC_X86_64_GOT32:
11519 case BFD_RELOC_X86_64_GOTPCREL:
11520 case BFD_RELOC_X86_64_GOTPCRELX:
11521 case BFD_RELOC_X86_64_REX_GOTPCRELX:
11522 case BFD_RELOC_X86_64_TLSGD:
11523 case BFD_RELOC_X86_64_TLSLD:
11524 case BFD_RELOC_X86_64_GOTTPOFF:
11525 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11526 case BFD_RELOC_X86_64_TLSDESC_CALL:
11527 rel->addend = fixp->fx_offset - fixp->fx_size;
11528 break;
11529 default:
11530 rel->addend = (section->vma
11531 - fixp->fx_size
11532 + fixp->fx_addnumber
11533 + md_pcrel_from (fixp));
11534 break;
11535 }
11536 }
11537
11538 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
11539 if (rel->howto == NULL)
11540 {
11541 as_bad_where (fixp->fx_file, fixp->fx_line,
11542 _("cannot represent relocation type %s"),
11543 bfd_get_reloc_code_name (code));
11544 /* Set howto to a garbage value so that we can keep going. */
11545 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
11546 gas_assert (rel->howto != NULL);
11547 }
11548
11549 return rel;
11550 }
11551
11552 #include "tc-i386-intel.c"
11553
11554 void
11555 tc_x86_parse_to_dw2regnum (expressionS *exp)
11556 {
11557 int saved_naked_reg;
11558 char saved_register_dot;
11559
11560 saved_naked_reg = allow_naked_reg;
11561 allow_naked_reg = 1;
11562 saved_register_dot = register_chars['.'];
11563 register_chars['.'] = '.';
11564 allow_pseudo_reg = 1;
11565 expression_and_evaluate (exp);
11566 allow_pseudo_reg = 0;
11567 register_chars['.'] = saved_register_dot;
11568 allow_naked_reg = saved_naked_reg;
11569
11570 if (exp->X_op == O_register && exp->X_add_number >= 0)
11571 {
11572 if ((addressT) exp->X_add_number < i386_regtab_size)
11573 {
11574 exp->X_op = O_constant;
11575 exp->X_add_number = i386_regtab[exp->X_add_number]
11576 .dw2_regnum[flag_code >> 1];
11577 }
11578 else
11579 exp->X_op = O_illegal;
11580 }
11581 }
11582
11583 void
11584 tc_x86_frame_initial_instructions (void)
11585 {
11586 static unsigned int sp_regno[2];
11587
11588 if (!sp_regno[flag_code >> 1])
11589 {
11590 char *saved_input = input_line_pointer;
11591 char sp[][4] = {"esp", "rsp"};
11592 expressionS exp;
11593
11594 input_line_pointer = sp[flag_code >> 1];
11595 tc_x86_parse_to_dw2regnum (&exp);
11596 gas_assert (exp.X_op == O_constant);
11597 sp_regno[flag_code >> 1] = exp.X_add_number;
11598 input_line_pointer = saved_input;
11599 }
11600
11601 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
11602 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
11603 }
11604
11605 int
11606 x86_dwarf2_addr_size (void)
11607 {
11608 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
11609 if (x86_elf_abi == X86_64_X32_ABI)
11610 return 4;
11611 #endif
11612 return bfd_arch_bits_per_address (stdoutput) / 8;
11613 }
11614
11615 int
11616 i386_elf_section_type (const char *str, size_t len)
11617 {
11618 if (flag_code == CODE_64BIT
11619 && len == sizeof ("unwind") - 1
11620 && strncmp (str, "unwind", 6) == 0)
11621 return SHT_X86_64_UNWIND;
11622
11623 return -1;
11624 }
11625
11626 #ifdef TE_SOLARIS
11627 void
11628 i386_solaris_fix_up_eh_frame (segT sec)
11629 {
11630 if (flag_code == CODE_64BIT)
11631 elf_section_type (sec) = SHT_X86_64_UNWIND;
11632 }
11633 #endif
11634
11635 #ifdef TE_PE
11636 void
11637 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
11638 {
11639 expressionS exp;
11640
11641 exp.X_op = O_secrel;
11642 exp.X_add_symbol = symbol;
11643 exp.X_add_number = 0;
11644 emit_expr (&exp, size);
11645 }
11646 #endif
11647
11648 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11649 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
11650
11651 bfd_vma
11652 x86_64_section_letter (int letter, const char **ptr_msg)
11653 {
11654 if (flag_code == CODE_64BIT)
11655 {
11656 if (letter == 'l')
11657 return SHF_X86_64_LARGE;
11658
11659 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
11660 }
11661 else
11662 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
11663 return -1;
11664 }
11665
11666 bfd_vma
11667 x86_64_section_word (char *str, size_t len)
11668 {
11669 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
11670 return SHF_X86_64_LARGE;
11671
11672 return -1;
11673 }
11674
11675 static void
11676 handle_large_common (int small ATTRIBUTE_UNUSED)
11677 {
11678 if (flag_code != CODE_64BIT)
11679 {
11680 s_comm_internal (0, elf_common_parse);
11681 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
11682 }
11683 else
11684 {
11685 static segT lbss_section;
11686 asection *saved_com_section_ptr = elf_com_section_ptr;
11687 asection *saved_bss_section = bss_section;
11688
11689 if (lbss_section == NULL)
11690 {
11691 flagword applicable;
11692 segT seg = now_seg;
11693 subsegT subseg = now_subseg;
11694
11695 /* The .lbss section is for local .largecomm symbols. */
11696 lbss_section = subseg_new (".lbss", 0);
11697 applicable = bfd_applicable_section_flags (stdoutput);
11698 bfd_set_section_flags (stdoutput, lbss_section,
11699 applicable & SEC_ALLOC);
11700 seg_info (lbss_section)->bss = 1;
11701
11702 subseg_set (seg, subseg);
11703 }
11704
11705 elf_com_section_ptr = &_bfd_elf_large_com_section;
11706 bss_section = lbss_section;
11707
11708 s_comm_internal (0, elf_common_parse);
11709
11710 elf_com_section_ptr = saved_com_section_ptr;
11711 bss_section = saved_bss_section;
11712 }
11713 }
11714 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 0.323455 seconds and 3 git commands to generate.