x86: restrict use of register aliases
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64    WAIT_PREFIX must be the first prefix since FWAIT really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
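/* For example (illustrative): in "lock addl %eax, %fs:(%ecx)" the
   segment override byte (0x64, slot SEG_PREFIX) is emitted before the
   LOCK byte (0xf0, slot LOCK_PREFIX), because prefixes are output in
   increasing slot order.  */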
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax.  Use a non-ascii letter since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
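/* Illustrative decoding: a ModRM byte of 0x44 has mode == 1 (disp8),
   reg == 0 and regmem == 4, the latter indicating that an SIB byte
   follows in 32-/64-bit addressing.  */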
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* parse_register() returns this when a register alias cannot be used. */
214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
217 /* This struct describes rounding control and SAE in the instruction. */
218 struct RC_Operation
219 {
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229 };
230
231 static struct RC_Operation rc_op;
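/* In AT&T syntax, rounding control is written as a pseudo-operand,
   e.g. "vaddps {rz-sae}, %zmm0, %zmm1, %zmm2" selects round-toward-zero
   (type rz above), while "{sae}" alone selects saeonly.  */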
232
233 /* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235    whether a merging or a zeroing mask is used. */
236 struct Mask_Operation
237 {
238 const reg_entry *mask;
239 unsigned int zeroing;
240   /* The operand this operation is applied to. */
241 int operand;
242 };
243
244 static struct Mask_Operation mask_op;
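/* E.g. "vmovaps %zmm0, %zmm1{%k2}" uses a merging mask (ZEROING == 0),
   whereas "vmovaps %zmm0, %zmm1{%k2}{z}" sets ZEROING.  */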
245
246 /* The struct describes broadcasting, applied to OPERAND.  TYPE is
247    the broadcast factor (e.g. {1to8}). */
248 struct Broadcast_Operation
249 {
250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
255
256 /* Number of bytes to broadcast. */
257 int bytes;
258 };
259
260 static struct Broadcast_Operation broadcast_op;
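/* Illustrative example: in "vaddps (%rax){1to16}, %zmm0, %zmm1", TYPE
   describes the {1to16} broadcast, OPERAND is the memory operand and
   BYTES is 4 (one dword element replicated).  */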
261
262 /* VEX prefix. */
263 typedef struct
264 {
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270 } vex_prefix;
271
272 /* 'md_assemble ()' gathers together information and puts it into an
273    i386_insn. */
274
275 union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
282 enum i386_error
283 {
284 operand_size_mismatch,
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
292 unsupported,
293 invalid_vsib_address,
294 invalid_vector_register_set,
295 unsupported_vector_index_register,
296 unsupported_broadcast,
297 broadcast_needed,
298 unsupported_masking,
299 mask_not_on_destination,
300 no_default_mask,
301 unsupported_rc_sae,
302 rc_sae_operand_not_last_imm,
303 invalid_register_operand,
304 };
305
306 struct _i386_insn
307 {
308   /* TM holds the template for the insn we're currently assembling. */
309 insn_template tm;
310
311 /* SUFFIX holds the instruction size suffix for byte, word, dword
312 or qword, if given. */
313 char suffix;
314
315 /* OPERANDS gives the number of given operands. */
316 unsigned int operands;
317
318 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
319 of given register, displacement, memory operands and immediate
320 operands. */
321 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
322
323 /* TYPES [i] is the type (see above #defines) which tells us how to
324 use OP[i] for the corresponding operand. */
325 i386_operand_type types[MAX_OPERANDS];
326
327 /* Displacement expression, immediate expression, or register for each
328 operand. */
329 union i386_op op[MAX_OPERANDS];
330
331 /* Flags for operands. */
332 unsigned int flags[MAX_OPERANDS];
333 #define Operand_PCrel 1
334 #define Operand_Mem 2
335
336 /* Relocation type for operand */
337 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
338
339 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
340 the base index byte below. */
341 const reg_entry *base_reg;
342 const reg_entry *index_reg;
343 unsigned int log2_scale_factor;
344
345 /* SEG gives the seg_entries of this insn. They are zero unless
346 explicit segment overrides are given. */
347 const seg_entry *seg[2];
348
349 /* Copied first memory operand string, for re-checking. */
350 char *memop1_string;
351
352 /* PREFIX holds all the given prefix opcodes (usually null).
353 PREFIXES is the number of prefix opcodes. */
354 unsigned int prefixes;
355 unsigned char prefix[MAX_PREFIXES];
356
357 /* Register is in low 3 bits of opcode. */
358 bfd_boolean short_form;
359
360 /* The operand to a branch insn indicates an absolute branch. */
361 bfd_boolean jumpabsolute;
362
363 /* Has MMX register operands. */
364 bfd_boolean has_regmmx;
365
366 /* Has XMM register operands. */
367 bfd_boolean has_regxmm;
368
369 /* Has YMM register operands. */
370 bfd_boolean has_regymm;
371
372 /* Has ZMM register operands. */
373 bfd_boolean has_regzmm;
374
375 /* Has GOTPC or TLS relocation. */
376 bfd_boolean has_gotpc_tls_reloc;
377
378 /* RM and SIB are the modrm byte and the sib byte where the
379 addressing modes of this insn are encoded. */
380 modrm_byte rm;
381 rex_byte rex;
382 rex_byte vrex;
383 sib_byte sib;
384 vex_prefix vex;
385
386 /* Masking attributes. */
387 struct Mask_Operation *mask;
388
389 /* Rounding control and SAE attributes. */
390 struct RC_Operation *rounding;
391
392 /* Broadcasting attributes. */
393 struct Broadcast_Operation *broadcast;
394
395 /* Compressed disp8*N attribute. */
396 unsigned int memshift;
397
398 /* Prefer load or store in encoding. */
399 enum
400 {
401 dir_encoding_default = 0,
402 dir_encoding_load,
403 dir_encoding_store,
404 dir_encoding_swap
405 } dir_encoding;
406
407 /* Prefer 8bit or 32bit displacement in encoding. */
408 enum
409 {
410 disp_encoding_default = 0,
411 disp_encoding_8bit,
412 disp_encoding_32bit
413 } disp_encoding;
414
415 /* Prefer the REX byte in encoding. */
416 bfd_boolean rex_encoding;
417
418 /* Disable instruction size optimization. */
419 bfd_boolean no_optimize;
420
421 /* How to encode vector instructions. */
422 enum
423 {
424 vex_encoding_default = 0,
425 vex_encoding_vex,
426 vex_encoding_vex3,
427 vex_encoding_evex
428 } vec_encoding;
429
430 /* REP prefix. */
431 const char *rep_prefix;
432
433 /* HLE prefix. */
434 const char *hle_prefix;
435
436 /* Have BND prefix. */
437 const char *bnd_prefix;
438
439 /* Have NOTRACK prefix. */
440 const char *notrack_prefix;
441
442 /* Error message. */
443 enum i386_error error;
444 };
445
446 typedef struct _i386_insn i386_insn;
447
448 /* Link each RC type with its corresponding string, which is looked
449    for in the asm source. */
450 struct RC_name
451 {
452 enum rc_type type;
453 const char *name;
454 unsigned int len;
455 };
456
457 static const struct RC_name RC_NamesTable[] =
458 {
459 { rne, STRING_COMMA_LEN ("rn-sae") },
460 { rd, STRING_COMMA_LEN ("rd-sae") },
461 { ru, STRING_COMMA_LEN ("ru-sae") },
462 { rz, STRING_COMMA_LEN ("rz-sae") },
463 { saeonly, STRING_COMMA_LEN ("sae") },
464 };
465
466 /* List of chars besides those in app.c:symbol_chars that can start an
467 operand. Used to prevent the scrubber eating vital white-space. */
468 const char extra_symbol_chars[] = "*%-([{}"
469 #ifdef LEX_AT
470 "@"
471 #endif
472 #ifdef LEX_QM
473 "?"
474 #endif
475 ;
476
477 #if (defined (TE_I386AIX) \
478 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
479 && !defined (TE_GNU) \
480 && !defined (TE_LINUX) \
481 && !defined (TE_NACL) \
482 && !defined (TE_FreeBSD) \
483 && !defined (TE_DragonFly) \
484 && !defined (TE_NetBSD)))
485 /* This array holds the chars that always start a comment. If the
486 pre-processor is disabled, these aren't very useful. The option
487 --divide will remove '/' from this list. */
488 const char *i386_comment_chars = "#/";
489 #define SVR4_COMMENT_CHARS 1
490 #define PREFIX_SEPARATOR '\\'
491
492 #else
493 const char *i386_comment_chars = "#";
494 #define PREFIX_SEPARATOR '/'
495 #endif
496
497 /* This array holds the chars that only start a comment at the beginning of
498 a line. If the line seems to have the form '# 123 filename'
499 .line and .file directives will appear in the pre-processed output.
500 Note that input_file.c hand checks for '#' at the beginning of the
501 first line of the input file. This is because the compiler outputs
502 #NO_APP at the beginning of its output.
503 Also note that comments started like this one will always work if
504 '/' isn't otherwise defined. */
505 const char line_comment_chars[] = "#/";
506
507 const char line_separator_chars[] = ";";
508
509 /* Chars that can be used to separate the mantissa from the exponent
510    in floating point nums. */
511 const char EXP_CHARS[] = "eE";
512
513 /* Chars that mean this number is a floating point constant
514 As in 0f12.456
515 or 0d1.2345e12. */
516 const char FLT_CHARS[] = "fFdDxX";
517
518 /* Tables for lexical analysis. */
519 static char mnemonic_chars[256];
520 static char register_chars[256];
521 static char operand_chars[256];
522 static char identifier_chars[256];
523 static char digit_chars[256];
524
525 /* Lexical macros. */
526 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
527 #define is_operand_char(x) (operand_chars[(unsigned char) x])
528 #define is_register_char(x) (register_chars[(unsigned char) x])
529 #define is_space_char(x) ((x) == ' ')
530 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
531 #define is_digit_char(x) (digit_chars[(unsigned char) x])
532
533 /* All non-digit non-letter characters that may occur in an operand. */
534 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
535
536 /* md_assemble() always leaves the strings it's passed unaltered. To
537 effect this we maintain a stack of saved characters that we've smashed
538 with '\0's (indicating end of strings for various sub-fields of the
539 assembler instruction). */
540 static char save_stack[32];
541 static char *save_stack_p;
542 #define END_STRING_AND_SAVE(s) \
543 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
544 #define RESTORE_END_STRING(s) \
545 do { *(s) = *--save_stack_p; } while (0)
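/* Typical use (sketch): NUL-terminate a sub-field in place, process it,
   then restore the original character:

     END_STRING_AND_SAVE (l);
     ...parse the now NUL-terminated string at the start of l...
     RESTORE_END_STRING (l);  */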
546
547 /* The instruction we're assembling. */
548 static i386_insn i;
549
550 /* Possible templates for current insn. */
551 static const templates *current_templates;
552
553 /* Per instruction expressionS buffers: max displacements & immediates. */
554 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
555 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
556
557 /* Current operand we are working on. */
558 static int this_operand = -1;
559
560 /* We support four different modes.  The FLAG_CODE variable is used to
561    distinguish these. */
562
563 enum flag_code {
564 CODE_32BIT,
565 CODE_16BIT,
566 CODE_64BIT };
567
568 static enum flag_code flag_code;
569 static unsigned int object_64bit;
570 static unsigned int disallow_64bit_reloc;
571 static int use_rela_relocations = 0;
572 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
573 static const char *tls_get_addr;
574
575 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
576 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
577 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
578
579 /* The ELF ABI to use. */
580 enum x86_elf_abi
581 {
582 I386_ABI,
583 X86_64_ABI,
584 X86_64_X32_ABI
585 };
586
587 static enum x86_elf_abi x86_elf_abi = I386_ABI;
588 #endif
589
590 #if defined (TE_PE) || defined (TE_PEP)
591 /* Use big object file format. */
592 static int use_big_obj = 0;
593 #endif
594
595 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
596 /* 1 if generating code for a shared library. */
597 static int shared = 0;
598 #endif
599
600 /* 1 for Intel syntax,
601    0 for AT&T syntax. */
602 static int intel_syntax = 0;
603
604 static enum x86_64_isa
605 {
606 amd64 = 1, /* AMD64 ISA. */
607 intel64 /* Intel64 ISA. */
608 } isa64;
609
610 /* 1 for Intel mnemonics,
611    0 for AT&T mnemonics. */
612 static int intel_mnemonic = !SYSV386_COMPAT;
613
614 /* 1 if pseudo registers are permitted. */
615 static int allow_pseudo_reg = 0;
616
617 /* 1 if register prefix % not required. */
618 static int allow_naked_reg = 0;
619
620 /* 1 if the assembler should add BND prefix for all control-transferring
621 instructions supporting it, even if this prefix wasn't specified
622 explicitly. */
623 static int add_bnd_prefix = 0;
624
625 /* 1 if pseudo index register, eiz/riz, is allowed. */
626 static int allow_index_reg = 0;
627
628 /* 1 if the assembler should ignore LOCK prefix, even if it was
629 specified explicitly. */
630 static int omit_lock_prefix = 0;
631
632 /* 1 if the assembler should encode lfence, mfence, and sfence as
633 "lock addl $0, (%{re}sp)". */
634 static int avoid_fence = 0;
635
636 /* 1 if lfence should be inserted after every load. */
637 static int lfence_after_load = 0;
638
639 /* Non-zero if lfence should be inserted before indirect branch. */
640 static enum lfence_before_indirect_branch_kind
641 {
642 lfence_branch_none = 0,
643 lfence_branch_register,
644 lfence_branch_memory,
645 lfence_branch_all
646 }
647 lfence_before_indirect_branch;
648
649 /* Non-zero if lfence should be inserted before ret. */
650 static enum lfence_before_ret_kind
651 {
652 lfence_before_ret_none = 0,
653 lfence_before_ret_not,
654 lfence_before_ret_or,
655 lfence_before_ret_shl
656 }
657 lfence_before_ret;
658
659 /* Records whether the previous instruction was a .byte-style directive or a prefix. */
660 static struct
661 {
662 segT seg;
663 const char *file;
664 const char *name;
665 unsigned int line;
666 enum last_insn_kind
667 {
668 last_insn_other = 0,
669 last_insn_directive,
670 last_insn_prefix
671 } kind;
672 } last_insn;
673
674 /* 1 if the assembler should generate relax relocations. */
675
676 static int generate_relax_relocations
677 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
678
679 static enum check_kind
680 {
681 check_none = 0,
682 check_warning,
683 check_error
684 }
685 sse_check, operand_check = check_warning;
686
687 /* Non-zero if branches should be aligned within a power-of-2 boundary. */
688 static int align_branch_power = 0;
689
690 /* Types of branches to align. */
691 enum align_branch_kind
692 {
693 align_branch_none = 0,
694 align_branch_jcc = 1,
695 align_branch_fused = 2,
696 align_branch_jmp = 3,
697 align_branch_call = 4,
698 align_branch_indirect = 5,
699 align_branch_ret = 6
700 };
701
702 /* Type bits of branches to align. */
703 enum align_branch_bit
704 {
705 align_branch_jcc_bit = 1 << align_branch_jcc,
706 align_branch_fused_bit = 1 << align_branch_fused,
707 align_branch_jmp_bit = 1 << align_branch_jmp,
708 align_branch_call_bit = 1 << align_branch_call,
709 align_branch_indirect_bit = 1 << align_branch_indirect,
710 align_branch_ret_bit = 1 << align_branch_ret
711 };
712
713 static unsigned int align_branch = (align_branch_jcc_bit
714 | align_branch_fused_bit
715 | align_branch_jmp_bit);
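/* I.e. the default is (1 << 1) | (1 << 2) | (1 << 3) == 0xe: align
   conditional jumps, fused compare-and-jump pairs and unconditional
   jumps.  */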
716
717 /* Types of condition jump used by macro-fusion. */
718 enum mf_jcc_kind
719 {
720 mf_jcc_jo = 0, /* base opcode 0x70 */
721 mf_jcc_jc, /* base opcode 0x72 */
722 mf_jcc_je, /* base opcode 0x74 */
723 mf_jcc_jna, /* base opcode 0x76 */
724 mf_jcc_js, /* base opcode 0x78 */
725 mf_jcc_jp, /* base opcode 0x7a */
726 mf_jcc_jl, /* base opcode 0x7c */
727 mf_jcc_jle, /* base opcode 0x7e */
728 };
729
730 /* Types of compare flag-modifying instructions used by macro-fusion. */
731 enum mf_cmp_kind
732 {
733 mf_cmp_test_and, /* test/cmp */
734 mf_cmp_alu_cmp, /* add/sub/cmp */
735 mf_cmp_incdec /* inc/dec */
736 };
737
738 /* The maximum padding size for a fused jcc.  A CMP-like instruction
739    can be 9 bytes and a jcc can be 6 bytes.  Leave room just in case
740    for prefixes. */
741 #define MAX_FUSED_JCC_PADDING_SIZE 20
742
743 /* The maximum number of prefixes added for an instruction. */
744 static unsigned int align_branch_prefix_size = 5;
745
746 /* Optimization:
747 1. Clear the REX_W bit with register operand if possible.
748 2. Above plus use 128bit vector instruction to clear the full vector
749 register.
750 */
751 static int optimize = 0;
752
753 /* Optimization:
754 1. Clear the REX_W bit with register operand if possible.
755 2. Above plus use 128bit vector instruction to clear the full vector
756 register.
757 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
758 "testb $imm7,%r8".
759 */
760 static int optimize_for_space = 0;
761
762 /* Register prefix used for error message. */
763 static const char *register_prefix = "%";
764
765 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
766 leave, push, and pop instructions so that gcc has the same stack
767 frame as in 32 bit mode. */
768 static char stackop_size = '\0';
769
770 /* Non-zero to optimize code alignment. */
771 int optimize_align_code = 1;
772
773 /* Non-zero to quieten some warnings. */
774 static int quiet_warnings = 0;
775
776 /* CPU name. */
777 static const char *cpu_arch_name = NULL;
778 static char *cpu_sub_arch_name = NULL;
779
780 /* CPU feature flags. */
781 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
782
783 /* If we have selected a cpu we are generating instructions for. */
784 static int cpu_arch_tune_set = 0;
785
786 /* Cpu we are generating instructions for. */
787 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
788
789 /* CPU feature flags of cpu we are generating instructions for. */
790 static i386_cpu_flags cpu_arch_tune_flags;
791
792 /* CPU instruction set architecture used. */
793 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
794
795 /* CPU feature flags of instruction set architecture used. */
796 i386_cpu_flags cpu_arch_isa_flags;
797
798 /* If set, conditional jumps are not automatically promoted to handle
799    offsets larger than a byte. */
800 static unsigned int no_cond_jump_promotion = 0;
801
802 /* Encode SSE instructions with VEX prefix. */
803 static unsigned int sse2avx;
804
805 /* Encode scalar AVX instructions with specific vector length. */
806 static enum
807 {
808 vex128 = 0,
809 vex256
810 } avxscalar;
811
812 /* Encode VEX WIG instructions with specific vex.w. */
813 static enum
814 {
815 vexw0 = 0,
816 vexw1
817 } vexwig;
818
819 /* Encode scalar EVEX LIG instructions with specific vector length. */
820 static enum
821 {
822 evexl128 = 0,
823 evexl256,
824 evexl512
825 } evexlig;
826
827 /* Encode EVEX WIG instructions with specific evex.w. */
828 static enum
829 {
830 evexw0 = 0,
831 evexw1
832 } evexwig;
833
834 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
835 static enum rc_type evexrcig = rne;
836
837 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
838 static symbolS *GOT_symbol;
839
840 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
841 unsigned int x86_dwarf2_return_column;
842
843 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
844 int x86_cie_data_alignment;
845
846 /* Interface to relax_segment.
847 There are 3 major relax states for 386 jump insns because the
848 different types of jumps add different sizes to frags when we're
849 figuring out what sort of jump to choose to reach a given label.
850
851 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
852 branches which are handled by md_estimate_size_before_relax() and
853 i386_generic_table_relax_frag(). */
854
855 /* Types. */
856 #define UNCOND_JUMP 0
857 #define COND_JUMP 1
858 #define COND_JUMP86 2
859 #define BRANCH_PADDING 3
860 #define BRANCH_PREFIX 4
861 #define FUSED_JCC_PADDING 5
862
863 /* Sizes. */
864 #define CODE16 1
865 #define SMALL 0
866 #define SMALL16 (SMALL | CODE16)
867 #define BIG 2
868 #define BIG16 (BIG | CODE16)
869
870 #ifndef INLINE
871 #ifdef __GNUC__
872 #define INLINE __inline__
873 #else
874 #define INLINE
875 #endif
876 #endif
877
878 #define ENCODE_RELAX_STATE(type, size) \
879 ((relax_substateT) (((type) << 2) | (size)))
880 #define TYPE_FROM_RELAX_STATE(s) \
881 ((s) >> 2)
882 #define DISP_SIZE_FROM_RELAX_STATE(s) \
883 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
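/* Worked example: ENCODE_RELAX_STATE (COND_JUMP, SMALL16) is
   (1 << 2) | 1 == 5; TYPE_FROM_RELAX_STATE (5) recovers COND_JUMP, and
   DISP_SIZE_FROM_RELAX_STATE (5) is 1, i.e. a one-byte displacement.  */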
884
885 /* This table is used by relax_frag to promote short jumps to long
886 ones where necessary. SMALL (short) jumps may be promoted to BIG
887 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
888 don't allow a short jump in a 32 bit code segment to be promoted to
889 a 16 bit offset jump because it's slower (requires data size
890    prefix) and doesn't work unless the destination is in the bottom
891    64k of the code segment (the top 16 bits of %eip are zeroed). */
892
893 const relax_typeS md_relax_table[] =
894 {
895 /* The fields are:
896 1) most positive reach of this state,
897 2) most negative reach of this state,
898 3) how many bytes this mode will have in the variable part of the frag
899 4) which index into the table to try if we can't fit into this one. */
900
901 /* UNCOND_JUMP states. */
902 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
903 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
904 /* dword jmp adds 4 bytes to frag:
905 0 extra opcode bytes, 4 displacement bytes. */
906 {0, 0, 4, 0},
907   /* word jmp adds 2 bytes to frag:
908 0 extra opcode bytes, 2 displacement bytes. */
909 {0, 0, 2, 0},
910
911 /* COND_JUMP states. */
912 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
913 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
914   /* dword conditionals add 5 bytes to frag:
915 1 extra opcode byte, 4 displacement bytes. */
916 {0, 0, 5, 0},
917 /* word conditionals add 3 bytes to frag:
918 1 extra opcode byte, 2 displacement bytes. */
919 {0, 0, 3, 0},
920
921 /* COND_JUMP86 states. */
922 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
923 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
924   /* dword conditionals add 5 bytes to frag:
925 1 extra opcode byte, 4 displacement bytes. */
926 {0, 0, 5, 0},
927 /* word conditionals add 4 bytes to frag:
928 1 displacement byte and a 3 byte long branch insn. */
929 {0, 0, 4, 0}
930 };
931
932 static const arch_entry cpu_arch[] =
933 {
934 /* Do not replace the first two entries - i386_target_format()
935 relies on them being there in this order. */
936 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
937 CPU_GENERIC32_FLAGS, 0 },
938 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
939 CPU_GENERIC64_FLAGS, 0 },
940 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
941 CPU_NONE_FLAGS, 0 },
942 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
943 CPU_I186_FLAGS, 0 },
944 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
945 CPU_I286_FLAGS, 0 },
946 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
947 CPU_I386_FLAGS, 0 },
948 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
949 CPU_I486_FLAGS, 0 },
950 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
951 CPU_I586_FLAGS, 0 },
952 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
953 CPU_I686_FLAGS, 0 },
954 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
955 CPU_I586_FLAGS, 0 },
956 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
957 CPU_PENTIUMPRO_FLAGS, 0 },
958 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
959 CPU_P2_FLAGS, 0 },
960 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
961 CPU_P3_FLAGS, 0 },
962 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
963 CPU_P4_FLAGS, 0 },
964 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
965 CPU_CORE_FLAGS, 0 },
966 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
967 CPU_NOCONA_FLAGS, 0 },
968 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
969 CPU_CORE_FLAGS, 1 },
970 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
971 CPU_CORE_FLAGS, 0 },
972 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
973 CPU_CORE2_FLAGS, 1 },
974 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
975 CPU_CORE2_FLAGS, 0 },
976 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
977 CPU_COREI7_FLAGS, 0 },
978 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
979 CPU_L1OM_FLAGS, 0 },
980 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
981 CPU_K1OM_FLAGS, 0 },
982 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
983 CPU_IAMCU_FLAGS, 0 },
984 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
985 CPU_K6_FLAGS, 0 },
986 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
987 CPU_K6_2_FLAGS, 0 },
988 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
989 CPU_ATHLON_FLAGS, 0 },
990 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
991 CPU_K8_FLAGS, 1 },
992 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
993 CPU_K8_FLAGS, 0 },
994 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
995 CPU_K8_FLAGS, 0 },
996 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
997 CPU_AMDFAM10_FLAGS, 0 },
998 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
999 CPU_BDVER1_FLAGS, 0 },
1000 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1001 CPU_BDVER2_FLAGS, 0 },
1002 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1003 CPU_BDVER3_FLAGS, 0 },
1004 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1005 CPU_BDVER4_FLAGS, 0 },
1006 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1007 CPU_ZNVER1_FLAGS, 0 },
1008 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1009 CPU_ZNVER2_FLAGS, 0 },
1010 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1011 CPU_BTVER1_FLAGS, 0 },
1012 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1013 CPU_BTVER2_FLAGS, 0 },
1014 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1015 CPU_8087_FLAGS, 0 },
1016 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1017 CPU_287_FLAGS, 0 },
1018 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1019 CPU_387_FLAGS, 0 },
1020 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1021 CPU_687_FLAGS, 0 },
1022 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1023 CPU_CMOV_FLAGS, 0 },
1024 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1025 CPU_FXSR_FLAGS, 0 },
1026 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1027 CPU_MMX_FLAGS, 0 },
1028 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1029 CPU_SSE_FLAGS, 0 },
1030 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1031 CPU_SSE2_FLAGS, 0 },
1032 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1033 CPU_SSE3_FLAGS, 0 },
1034 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1035 CPU_SSE4A_FLAGS, 0 },
1036 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1037 CPU_SSSE3_FLAGS, 0 },
1038 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1039 CPU_SSE4_1_FLAGS, 0 },
1040 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1041 CPU_SSE4_2_FLAGS, 0 },
1042 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1043 CPU_SSE4_2_FLAGS, 0 },
1044 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1045 CPU_AVX_FLAGS, 0 },
1046 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1047 CPU_AVX2_FLAGS, 0 },
1048 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1049 CPU_AVX512F_FLAGS, 0 },
1050 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1051 CPU_AVX512CD_FLAGS, 0 },
1052 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1053 CPU_AVX512ER_FLAGS, 0 },
1054 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1055 CPU_AVX512PF_FLAGS, 0 },
1056 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1057 CPU_AVX512DQ_FLAGS, 0 },
1058 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1059 CPU_AVX512BW_FLAGS, 0 },
1060 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1061 CPU_AVX512VL_FLAGS, 0 },
1062 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1063 CPU_VMX_FLAGS, 0 },
1064 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1065 CPU_VMFUNC_FLAGS, 0 },
1066 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1067 CPU_SMX_FLAGS, 0 },
1068 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1069 CPU_XSAVE_FLAGS, 0 },
1070 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1071 CPU_XSAVEOPT_FLAGS, 0 },
1072 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1073 CPU_XSAVEC_FLAGS, 0 },
1074 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1075 CPU_XSAVES_FLAGS, 0 },
1076 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1077 CPU_AES_FLAGS, 0 },
1078 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1079 CPU_PCLMUL_FLAGS, 0 },
1080 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1081 CPU_PCLMUL_FLAGS, 1 },
1082 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1083 CPU_FSGSBASE_FLAGS, 0 },
1084 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1085 CPU_RDRND_FLAGS, 0 },
1086 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1087 CPU_F16C_FLAGS, 0 },
1088 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1089 CPU_BMI2_FLAGS, 0 },
1090 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1091 CPU_FMA_FLAGS, 0 },
1092 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1093 CPU_FMA4_FLAGS, 0 },
1094 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1095 CPU_XOP_FLAGS, 0 },
1096 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1097 CPU_LWP_FLAGS, 0 },
1098 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1099 CPU_MOVBE_FLAGS, 0 },
1100 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1101 CPU_CX16_FLAGS, 0 },
1102 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1103 CPU_EPT_FLAGS, 0 },
1104 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1105 CPU_LZCNT_FLAGS, 0 },
1106 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1107 CPU_POPCNT_FLAGS, 0 },
1108 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1109 CPU_HLE_FLAGS, 0 },
1110 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1111 CPU_RTM_FLAGS, 0 },
1112 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1113 CPU_INVPCID_FLAGS, 0 },
1114 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1115 CPU_CLFLUSH_FLAGS, 0 },
1116 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1117 CPU_NOP_FLAGS, 0 },
1118 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1119 CPU_SYSCALL_FLAGS, 0 },
1120 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1121 CPU_RDTSCP_FLAGS, 0 },
1122 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1123 CPU_3DNOW_FLAGS, 0 },
1124 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1125 CPU_3DNOWA_FLAGS, 0 },
1126 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1127 CPU_PADLOCK_FLAGS, 0 },
1128 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1129 CPU_SVME_FLAGS, 1 },
1130 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1131 CPU_SVME_FLAGS, 0 },
1132 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1133 CPU_SSE4A_FLAGS, 0 },
1134 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1135 CPU_ABM_FLAGS, 0 },
1136 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1137 CPU_BMI_FLAGS, 0 },
1138 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1139 CPU_TBM_FLAGS, 0 },
1140 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1141 CPU_ADX_FLAGS, 0 },
1142 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1143 CPU_RDSEED_FLAGS, 0 },
1144 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1145 CPU_PRFCHW_FLAGS, 0 },
1146 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1147 CPU_SMAP_FLAGS, 0 },
1148 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1149 CPU_MPX_FLAGS, 0 },
1150 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1151 CPU_SHA_FLAGS, 0 },
1152 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1153 CPU_CLFLUSHOPT_FLAGS, 0 },
1154 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1155 CPU_PREFETCHWT1_FLAGS, 0 },
1156 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1157 CPU_SE1_FLAGS, 0 },
1158 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1159 CPU_CLWB_FLAGS, 0 },
1160 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1161 CPU_AVX512IFMA_FLAGS, 0 },
1162 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1163 CPU_AVX512VBMI_FLAGS, 0 },
1164 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1165 CPU_AVX512_4FMAPS_FLAGS, 0 },
1166 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1167 CPU_AVX512_4VNNIW_FLAGS, 0 },
1168 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1169 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1170 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1171 CPU_AVX512_VBMI2_FLAGS, 0 },
1172 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1173 CPU_AVX512_VNNI_FLAGS, 0 },
1174 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1175 CPU_AVX512_BITALG_FLAGS, 0 },
1176 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1177 CPU_CLZERO_FLAGS, 0 },
1178 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1179 CPU_MWAITX_FLAGS, 0 },
1180 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1181 CPU_OSPKE_FLAGS, 0 },
1182 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1183 CPU_RDPID_FLAGS, 0 },
1184 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1185 CPU_PTWRITE_FLAGS, 0 },
1186 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1187 CPU_IBT_FLAGS, 0 },
1188 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1189 CPU_SHSTK_FLAGS, 0 },
1190 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1191 CPU_GFNI_FLAGS, 0 },
1192 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1193 CPU_VAES_FLAGS, 0 },
1194 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1195 CPU_VPCLMULQDQ_FLAGS, 0 },
1196 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1197 CPU_WBNOINVD_FLAGS, 0 },
1198 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1199 CPU_PCONFIG_FLAGS, 0 },
1200 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1201 CPU_WAITPKG_FLAGS, 0 },
1202 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1203 CPU_CLDEMOTE_FLAGS, 0 },
1204 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1205 CPU_MOVDIRI_FLAGS, 0 },
1206 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1207 CPU_MOVDIR64B_FLAGS, 0 },
1208 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1209 CPU_AVX512_BF16_FLAGS, 0 },
1210 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1211 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1212 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1213 CPU_ENQCMD_FLAGS, 0 },
1214 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1215 CPU_SERIALIZE_FLAGS, 0 },
1216 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1217 CPU_RDPRU_FLAGS, 0 },
1218 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1219 CPU_MCOMMIT_FLAGS, 0 },
1220 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1221 CPU_SEV_ES_FLAGS, 0 },
1222 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1223 CPU_TSXLDTRK_FLAGS, 0 },
1224 };
1225
1226 static const noarch_entry cpu_noarch[] =
1227 {
1228 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1229 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1230 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1231 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1232 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1233 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1234 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1235 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1236 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1237 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1238 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1239 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1240 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1241 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1242 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1243 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1244 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1245 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1246 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1247 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1248 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1249 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1250 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1251 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1252 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1253 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1254 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1255 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1256 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1257 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1258 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1259 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1260 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1261 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1262 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1263 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1264 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1265 { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1266 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1267 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1268 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1269 };
1270
1271 #ifdef I386COFF
1272 /* Like s_lcomm_internal in gas/read.c but the alignment string
1273 is allowed to be optional. */
1274
1275 static symbolS *
1276 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1277 {
1278 addressT align = 0;
1279
1280 SKIP_WHITESPACE ();
1281
1282 if (needs_align
1283 && *input_line_pointer == ',')
1284 {
1285 align = parse_align (needs_align - 1);
1286
1287 if (align == (addressT) -1)
1288 return NULL;
1289 }
1290 else
1291 {
1292 if (size >= 8)
1293 align = 3;
1294 else if (size >= 4)
1295 align = 2;
1296 else if (size >= 2)
1297 align = 1;
1298 else
1299 align = 0;
1300 }
1301
1302 bss_alloc (symbolP, size, align);
1303 return symbolP;
1304 }
1305
1306 static void
1307 pe_lcomm (int needs_align)
1308 {
1309 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1310 }
1311 #endif
1312
1313 const pseudo_typeS md_pseudo_table[] =
1314 {
1315 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1316 {"align", s_align_bytes, 0},
1317 #else
1318 {"align", s_align_ptwo, 0},
1319 #endif
1320 {"arch", set_cpu_arch, 0},
1321 #ifndef I386COFF
1322 {"bss", s_bss, 0},
1323 #else
1324 {"lcomm", pe_lcomm, 1},
1325 #endif
1326 {"ffloat", float_cons, 'f'},
1327 {"dfloat", float_cons, 'd'},
1328 {"tfloat", float_cons, 'x'},
1329 {"value", cons, 2},
1330 {"slong", signed_cons, 4},
1331 {"noopt", s_ignore, 0},
1332 {"optim", s_ignore, 0},
1333 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1334 {"code16", set_code_flag, CODE_16BIT},
1335 {"code32", set_code_flag, CODE_32BIT},
1336 #ifdef BFD64
1337 {"code64", set_code_flag, CODE_64BIT},
1338 #endif
1339 {"intel_syntax", set_intel_syntax, 1},
1340 {"att_syntax", set_intel_syntax, 0},
1341 {"intel_mnemonic", set_intel_mnemonic, 1},
1342 {"att_mnemonic", set_intel_mnemonic, 0},
1343 {"allow_index_reg", set_allow_index_reg, 1},
1344 {"disallow_index_reg", set_allow_index_reg, 0},
1345 {"sse_check", set_check, 0},
1346 {"operand_check", set_check, 1},
1347 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1348 {"largecomm", handle_large_common, 0},
1349 #else
1350 {"file", dwarf2_directive_file, 0},
1351 {"loc", dwarf2_directive_loc, 0},
1352 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1353 #endif
1354 #ifdef TE_PE
1355 {"secrel32", pe_directive_secrel, 0},
1356 #endif
1357 {0, 0, 0}
1358 };
1359
1360 /* For interface with expression (). */
1361 extern char *input_line_pointer;
1362
1363 /* Hash table for instruction mnemonic lookup. */
1364 static struct hash_control *op_hash;
1365
1366 /* Hash table for register lookup. */
1367 static struct hash_control *reg_hash;
1368 \f
1369 /* Various efficient no-op patterns for aligning code labels.
1370 Note: Don't try to assemble the instructions in the comments.
1371 0L and 0w are not legal. */
1372 static const unsigned char f32_1[] =
1373 {0x90}; /* nop */
1374 static const unsigned char f32_2[] =
1375 {0x66,0x90}; /* xchg %ax,%ax */
1376 static const unsigned char f32_3[] =
1377 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1378 static const unsigned char f32_4[] =
1379 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1380 static const unsigned char f32_6[] =
1381 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1382 static const unsigned char f32_7[] =
1383 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1384 static const unsigned char f16_3[] =
1385 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1386 static const unsigned char f16_4[] =
1387 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1388 static const unsigned char jump_disp8[] =
1389 {0xeb}; /* jmp disp8 */
1390 static const unsigned char jump32_disp32[] =
1391 {0xe9}; /* jmp disp32 */
1392 static const unsigned char jump16_disp32[] =
1393 {0x66,0xe9}; /* jmp disp32 */
1394 /* 32-bit NOPs patterns. */
1395 static const unsigned char *const f32_patt[] = {
1396 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1397 };
1398 /* 16-bit NOPs patterns. */
1399 static const unsigned char *const f16_patt[] = {
1400 f32_1, f32_2, f16_3, f16_4
1401 };
1402 /* nopl (%[re]ax) */
1403 static const unsigned char alt_3[] =
1404 {0x0f,0x1f,0x00};
1405 /* nopl 0(%[re]ax) */
1406 static const unsigned char alt_4[] =
1407 {0x0f,0x1f,0x40,0x00};
1408 /* nopl 0(%[re]ax,%[re]ax,1) */
1409 static const unsigned char alt_5[] =
1410 {0x0f,0x1f,0x44,0x00,0x00};
1411 /* nopw 0(%[re]ax,%[re]ax,1) */
1412 static const unsigned char alt_6[] =
1413 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1414 /* nopl 0L(%[re]ax) */
1415 static const unsigned char alt_7[] =
1416 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1417 /* nopl 0L(%[re]ax,%[re]ax,1) */
1418 static const unsigned char alt_8[] =
1419 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1420 /* nopw 0L(%[re]ax,%[re]ax,1) */
1421 static const unsigned char alt_9[] =
1422 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1423 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1424 static const unsigned char alt_10[] =
1425 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1426 /* data16 nopw %cs:0L(%eax,%eax,1) */
1427 static const unsigned char alt_11[] =
1428 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1429 /* 32-bit and 64-bit NOPs patterns. */
1430 static const unsigned char *const alt_patt[] = {
1431 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1432 alt_9, alt_10, alt_11
1433 };
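/* E.g. a 7-byte padding request served from alt_patt is filled with
   alt_7, a single "nopl 0L(%[re]ax)", rather than with several shorter
   NOPs; see i386_output_nops below.  */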
1434
1435 /* Generate COUNT bytes of NOPs to WHERE from PATT with the maximum
1436 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1437
1438 static void
1439 i386_output_nops (char *where, const unsigned char *const *patt,
1440 int count, int max_single_nop_size)
1441
1442 {
1443 /* Place the longer NOP first. */
1444 int last;
1445 int offset;
1446 const unsigned char *nops;
1447
1448 if (max_single_nop_size < 1)
1449 {
1450 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1451 max_single_nop_size);
1452 return;
1453 }
1454
1455 nops = patt[max_single_nop_size - 1];
1456
1457   /* Use the smaller one if the requested one isn't available.  */
1458 if (nops == NULL)
1459 {
1460 max_single_nop_size--;
1461 nops = patt[max_single_nop_size - 1];
1462 }
1463
1464 last = count % max_single_nop_size;
1465
1466 count -= last;
1467 for (offset = 0; offset < count; offset += max_single_nop_size)
1468 memcpy (where + offset, nops, max_single_nop_size);
1469
1470 if (last)
1471 {
1472 nops = patt[last - 1];
1473 if (nops == NULL)
1474 {
1475 /* Use the smaller one plus one-byte NOP if the needed one
1476 isn't available. */
1477 last--;
1478 nops = patt[last - 1];
1479 memcpy (where + offset, nops, last);
1480 where[offset + last] = *patt[0];
1481 }
1482 else
1483 memcpy (where + offset, nops, last);
1484 }
1485 }
1486
1487 static INLINE int
1488 fits_in_imm7 (offsetT num)
1489 {
1490 return (num & 0x7f) == num;
1491 }
1492
1493 static INLINE int
1494 fits_in_imm31 (offsetT num)
1495 {
1496 return (num & 0x7fffffff) == num;
1497 }
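/* Note that these are unsigned range checks: fits_in_imm7 (127) is 1,
   but fits_in_imm7 (-1) is 0, since the masked value must equal NUM.  */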
1498
1499 /* Generate COUNT bytes of NOPs to WHERE with the maximum size of a
1500 single NOP instruction LIMIT. */
1501
1502 void
1503 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1504 {
1505 const unsigned char *const *patt = NULL;
1506 int max_single_nop_size;
1507 /* Maximum number of NOPs before switching to jump over NOPs. */
1508 int max_number_of_nops;
1509
1510 switch (fragP->fr_type)
1511 {
1512 case rs_fill_nop:
1513 case rs_align_code:
1514 break;
1515 case rs_machine_dependent:
1516 /* Allow NOP padding for jumps and calls. */
1517 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1518 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1519 break;
1520 /* Fall through. */
1521 default:
1522 return;
1523 }
1524
1525 /* We need to decide which NOP sequence to use for 32bit and
1526 64bit. When -mtune= is used:
1527
1528 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1529 PROCESSOR_GENERIC32, f32_patt will be used.
1530 2. For the rest, alt_patt will be used.
1531
1532 When -mtune= isn't used, alt_patt will be used if
1533 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1534 be used.
1535
1536 When -march= or .arch is used, we can't use anything beyond
1537 cpu_arch_isa_flags. */
1538
1539 if (flag_code == CODE_16BIT)
1540 {
1541 patt = f16_patt;
1542 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1543 /* Limit number of NOPs to 2 in 16-bit mode. */
1544 max_number_of_nops = 2;
1545 }
1546 else
1547 {
1548 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1549 {
1550 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1551 switch (cpu_arch_tune)
1552 {
1553 case PROCESSOR_UNKNOWN:
1554 /* We use cpu_arch_isa_flags to check if we SHOULD
1555 optimize with nops. */
1556 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1557 patt = alt_patt;
1558 else
1559 patt = f32_patt;
1560 break;
1561 case PROCESSOR_PENTIUM4:
1562 case PROCESSOR_NOCONA:
1563 case PROCESSOR_CORE:
1564 case PROCESSOR_CORE2:
1565 case PROCESSOR_COREI7:
1566 case PROCESSOR_L1OM:
1567 case PROCESSOR_K1OM:
1568 case PROCESSOR_GENERIC64:
1569 case PROCESSOR_K6:
1570 case PROCESSOR_ATHLON:
1571 case PROCESSOR_K8:
1572 case PROCESSOR_AMDFAM10:
1573 case PROCESSOR_BD:
1574 case PROCESSOR_ZNVER:
1575 case PROCESSOR_BT:
1576 patt = alt_patt;
1577 break;
1578 case PROCESSOR_I386:
1579 case PROCESSOR_I486:
1580 case PROCESSOR_PENTIUM:
1581 case PROCESSOR_PENTIUMPRO:
1582 case PROCESSOR_IAMCU:
1583 case PROCESSOR_GENERIC32:
1584 patt = f32_patt;
1585 break;
1586 }
1587 }
1588 else
1589 {
1590 switch (fragP->tc_frag_data.tune)
1591 {
1592 case PROCESSOR_UNKNOWN:
1593 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1594 PROCESSOR_UNKNOWN. */
1595 abort ();
1596 break;
1597
1598 case PROCESSOR_I386:
1599 case PROCESSOR_I486:
1600 case PROCESSOR_PENTIUM:
1601 case PROCESSOR_IAMCU:
1602 case PROCESSOR_K6:
1603 case PROCESSOR_ATHLON:
1604 case PROCESSOR_K8:
1605 case PROCESSOR_AMDFAM10:
1606 case PROCESSOR_BD:
1607 case PROCESSOR_ZNVER:
1608 case PROCESSOR_BT:
1609 case PROCESSOR_GENERIC32:
1610 /* We use cpu_arch_isa_flags to check if we CAN optimize
1611 with nops. */
1612 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1613 patt = alt_patt;
1614 else
1615 patt = f32_patt;
1616 break;
1617 case PROCESSOR_PENTIUMPRO:
1618 case PROCESSOR_PENTIUM4:
1619 case PROCESSOR_NOCONA:
1620 case PROCESSOR_CORE:
1621 case PROCESSOR_CORE2:
1622 case PROCESSOR_COREI7:
1623 case PROCESSOR_L1OM:
1624 case PROCESSOR_K1OM:
1625 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1626 patt = alt_patt;
1627 else
1628 patt = f32_patt;
1629 break;
1630 case PROCESSOR_GENERIC64:
1631 patt = alt_patt;
1632 break;
1633 }
1634 }
1635
1636 if (patt == f32_patt)
1637 {
1638 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1639 /* Limit number of NOPs to 2 for older processors. */
1640 max_number_of_nops = 2;
1641 }
1642 else
1643 {
1644 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1645 /* Limit number of NOPs to 7 for newer processors. */
1646 max_number_of_nops = 7;
1647 }
1648 }
1649
1650 if (limit == 0)
1651 limit = max_single_nop_size;
1652
1653 if (fragP->fr_type == rs_fill_nop)
1654 {
1655 /* Output NOPs for .nop directive. */
1656 if (limit > max_single_nop_size)
1657 {
1658 as_bad_where (fragP->fr_file, fragP->fr_line,
1659 _("invalid single nop size: %d "
1660 "(expect within [0, %d])"),
1661 limit, max_single_nop_size);
1662 return;
1663 }
1664 }
1665 else if (fragP->fr_type != rs_machine_dependent)
1666 fragP->fr_var = count;
1667
1668 if ((count / max_single_nop_size) > max_number_of_nops)
1669 {
1670 /* Generate jump over NOPs. */
1671 offsetT disp = count - 2;
1672 if (fits_in_imm7 (disp))
1673 {
1674 /* Use "jmp disp8" if possible. */
1675 count = disp;
1676 where[0] = jump_disp8[0];
1677 where[1] = count;
1678 where += 2;
1679 }
1680 else
1681 {
1682 unsigned int size_of_jump;
1683
1684 if (flag_code == CODE_16BIT)
1685 {
1686 where[0] = jump16_disp32[0];
1687 where[1] = jump16_disp32[1];
1688 size_of_jump = 2;
1689 }
1690 else
1691 {
1692 where[0] = jump32_disp32[0];
1693 size_of_jump = 1;
1694 }
1695
1696 count -= size_of_jump + 4;
1697 if (!fits_in_imm31 (count))
1698 {
1699 as_bad_where (fragP->fr_file, fragP->fr_line,
1700 _("jump over nop padding out of range"));
1701 return;
1702 }
1703
1704 md_number_to_chars (where + size_of_jump, count, 4);
1705 where += size_of_jump + 4;
1706 }
1707 }
1708
1709 /* Generate multiple NOPs. */
1710 i386_output_nops (where, patt, count, limit);
1711 }
1712
1713 static INLINE int
1714 operand_type_all_zero (const union i386_operand_type *x)
1715 {
1716 switch (ARRAY_SIZE(x->array))
1717 {
1718 case 3:
1719 if (x->array[2])
1720 return 0;
1721 /* Fall through. */
1722 case 2:
1723 if (x->array[1])
1724 return 0;
1725 /* Fall through. */
1726 case 1:
1727 return !x->array[0];
1728 default:
1729 abort ();
1730 }
1731 }
1732
1733 static INLINE void
1734 operand_type_set (union i386_operand_type *x, unsigned int v)
1735 {
1736 switch (ARRAY_SIZE(x->array))
1737 {
1738 case 3:
1739 x->array[2] = v;
1740 /* Fall through. */
1741 case 2:
1742 x->array[1] = v;
1743 /* Fall through. */
1744 case 1:
1745 x->array[0] = v;
1746 /* Fall through. */
1747 break;
1748 default:
1749 abort ();
1750 }
1751
1752 x->bitfield.class = ClassNone;
1753 x->bitfield.instance = InstanceNone;
1754 }
1755
1756 static INLINE int
1757 operand_type_equal (const union i386_operand_type *x,
1758 const union i386_operand_type *y)
1759 {
1760 switch (ARRAY_SIZE(x->array))
1761 {
1762 case 3:
1763 if (x->array[2] != y->array[2])
1764 return 0;
1765 /* Fall through. */
1766 case 2:
1767 if (x->array[1] != y->array[1])
1768 return 0;
1769 /* Fall through. */
1770 case 1:
1771 return x->array[0] == y->array[0];
1772 break;
1773 default:
1774 abort ();
1775 }
1776 }
1777
1778 static INLINE int
1779 cpu_flags_all_zero (const union i386_cpu_flags *x)
1780 {
1781   switch (ARRAY_SIZE (x->array))
1782 {
1783 case 4:
1784 if (x->array[3])
1785 return 0;
1786 /* Fall through. */
1787 case 3:
1788 if (x->array[2])
1789 return 0;
1790 /* Fall through. */
1791 case 2:
1792 if (x->array[1])
1793 return 0;
1794 /* Fall through. */
1795 case 1:
1796 return !x->array[0];
1797 default:
1798 abort ();
1799 }
1800 }
1801
1802 static INLINE int
1803 cpu_flags_equal (const union i386_cpu_flags *x,
1804 const union i386_cpu_flags *y)
1805 {
1806   switch (ARRAY_SIZE (x->array))
1807 {
1808 case 4:
1809 if (x->array[3] != y->array[3])
1810 return 0;
1811 /* Fall through. */
1812 case 3:
1813 if (x->array[2] != y->array[2])
1814 return 0;
1815 /* Fall through. */
1816 case 2:
1817 if (x->array[1] != y->array[1])
1818 return 0;
1819 /* Fall through. */
1820 case 1:
1821 return x->array[0] == y->array[0];
1822 break;
1823 default:
1824 abort ();
1825 }
1826 }
1827
1828 static INLINE int
1829 cpu_flags_check_cpu64 (i386_cpu_flags f)
1830 {
1831 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1832 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1833 }
1834
1835 static INLINE i386_cpu_flags
1836 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1837 {
1838 switch (ARRAY_SIZE (x.array))
1839 {
1840 case 4:
1841 x.array [3] &= y.array [3];
1842 /* Fall through. */
1843 case 3:
1844 x.array [2] &= y.array [2];
1845 /* Fall through. */
1846 case 2:
1847 x.array [1] &= y.array [1];
1848 /* Fall through. */
1849 case 1:
1850 x.array [0] &= y.array [0];
1851 break;
1852 default:
1853 abort ();
1854 }
1855 return x;
1856 }
1857
1858 static INLINE i386_cpu_flags
1859 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1860 {
1861 switch (ARRAY_SIZE (x.array))
1862 {
1863 case 4:
1864 x.array [3] |= y.array [3];
1865 /* Fall through. */
1866 case 3:
1867 x.array [2] |= y.array [2];
1868 /* Fall through. */
1869 case 2:
1870 x.array [1] |= y.array [1];
1871 /* Fall through. */
1872 case 1:
1873 x.array [0] |= y.array [0];
1874 break;
1875 default:
1876 abort ();
1877 }
1878 return x;
1879 }
1880
1881 static INLINE i386_cpu_flags
1882 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1883 {
1884 switch (ARRAY_SIZE (x.array))
1885 {
1886 case 4:
1887 x.array [3] &= ~y.array [3];
1888 /* Fall through. */
1889 case 3:
1890 x.array [2] &= ~y.array [2];
1891 /* Fall through. */
1892 case 2:
1893 x.array [1] &= ~y.array [1];
1894 /* Fall through. */
1895 case 1:
1896 x.array [0] &= ~y.array [0];
1897 break;
1898 default:
1899 abort ();
1900 }
1901 return x;
1902 }
1903
1904 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1905
1906 #define CPU_FLAGS_ARCH_MATCH 0x1
1907 #define CPU_FLAGS_64BIT_MATCH 0x2
1908
1909 #define CPU_FLAGS_PERFECT_MATCH \
1910 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1911
1912 /* Return CPU flags match bits. */
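/* For example, a template whose only requirement is Cpu64 yields
   CPU_FLAGS_PERFECT_MATCH in 64-bit mode: the 64-bit check passes and,
   once cpu64/cpuno64 are stripped, no feature bits remain.  Outside of
   64-bit mode the same template loses CPU_FLAGS_64BIT_MATCH.  */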
1913
1914 static int
1915 cpu_flags_match (const insn_template *t)
1916 {
1917 i386_cpu_flags x = t->cpu_flags;
1918 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1919
1920 x.bitfield.cpu64 = 0;
1921 x.bitfield.cpuno64 = 0;
1922
1923 if (cpu_flags_all_zero (&x))
1924 {
1925 /* This instruction is available on all archs. */
1926 match |= CPU_FLAGS_ARCH_MATCH;
1927 }
1928 else
1929 {
1930 /* This instruction is available only on some archs. */
1931 i386_cpu_flags cpu = cpu_arch_flags;
1932
1933 	  /* AVX512VL is not a standalone feature - match it and then strip it. */
1934 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1935 return match;
1936 x.bitfield.cpuavx512vl = 0;
1937
1938 cpu = cpu_flags_and (x, cpu);
1939 if (!cpu_flags_all_zero (&cpu))
1940 {
1941 if (x.bitfield.cpuavx)
1942 {
1943 /* We need to check a few extra flags with AVX. */
1944 if (cpu.bitfield.cpuavx
1945 && (!t->opcode_modifier.sse2avx || sse2avx)
1946 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1947 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1948 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1949 match |= CPU_FLAGS_ARCH_MATCH;
1950 }
1951 else if (x.bitfield.cpuavx512f)
1952 {
1953 /* We need to check a few extra flags with AVX512F. */
1954 if (cpu.bitfield.cpuavx512f
1955 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1956 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1957 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1958 match |= CPU_FLAGS_ARCH_MATCH;
1959 }
1960 else
1961 match |= CPU_FLAGS_ARCH_MATCH;
1962 }
1963 }
1964 return match;
1965 }
1966
1967 static INLINE i386_operand_type
1968 operand_type_and (i386_operand_type x, i386_operand_type y)
1969 {
1970 if (x.bitfield.class != y.bitfield.class)
1971 x.bitfield.class = ClassNone;
1972 if (x.bitfield.instance != y.bitfield.instance)
1973 x.bitfield.instance = InstanceNone;
1974
1975 switch (ARRAY_SIZE (x.array))
1976 {
1977 case 3:
1978 x.array [2] &= y.array [2];
1979 /* Fall through. */
1980 case 2:
1981 x.array [1] &= y.array [1];
1982 /* Fall through. */
1983 case 1:
1984 x.array [0] &= y.array [0];
1985 break;
1986 default:
1987 abort ();
1988 }
1989 return x;
1990 }
1991
1992 static INLINE i386_operand_type
1993 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1994 {
1995 gas_assert (y.bitfield.class == ClassNone);
1996 gas_assert (y.bitfield.instance == InstanceNone);
1997
1998 switch (ARRAY_SIZE (x.array))
1999 {
2000 case 3:
2001 x.array [2] &= ~y.array [2];
2002 /* Fall through. */
2003 case 2:
2004 x.array [1] &= ~y.array [1];
2005 /* Fall through. */
2006 case 1:
2007 x.array [0] &= ~y.array [0];
2008 break;
2009 default:
2010 abort ();
2011 }
2012 return x;
2013 }
2014
2015 static INLINE i386_operand_type
2016 operand_type_or (i386_operand_type x, i386_operand_type y)
2017 {
2018 gas_assert (x.bitfield.class == ClassNone ||
2019 y.bitfield.class == ClassNone ||
2020 x.bitfield.class == y.bitfield.class);
2021 gas_assert (x.bitfield.instance == InstanceNone ||
2022 y.bitfield.instance == InstanceNone ||
2023 x.bitfield.instance == y.bitfield.instance);
2024
2025 switch (ARRAY_SIZE (x.array))
2026 {
2027 case 3:
2028 x.array [2] |= y.array [2];
2029 /* Fall through. */
2030 case 2:
2031 x.array [1] |= y.array [1];
2032 /* Fall through. */
2033 case 1:
2034 x.array [0] |= y.array [0];
2035 break;
2036 default:
2037 abort ();
2038 }
2039 return x;
2040 }
2041
2042 static INLINE i386_operand_type
2043 operand_type_xor (i386_operand_type x, i386_operand_type y)
2044 {
2045 gas_assert (y.bitfield.class == ClassNone);
2046 gas_assert (y.bitfield.instance == InstanceNone);
2047
2048 switch (ARRAY_SIZE (x.array))
2049 {
2050 case 3:
2051 x.array [2] ^= y.array [2];
2052 /* Fall through. */
2053 case 2:
2054 x.array [1] ^= y.array [1];
2055 /* Fall through. */
2056 case 1:
2057 x.array [0] ^= y.array [0];
2058 break;
2059 default:
2060 abort ();
2061 }
2062 return x;
2063 }
2064
2065 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2066 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2067 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2068 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2069 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2070 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2071 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2072 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2073 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2074 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2075 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2076 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2077 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2078 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2079 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2080 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2081 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2082
2083 enum operand_type
2084 {
2085 reg,
2086 imm,
2087 disp,
2088 anymem
2089 };
2090
2091 static INLINE int
2092 operand_type_check (i386_operand_type t, enum operand_type c)
2093 {
2094 switch (c)
2095 {
2096 case reg:
2097 return t.bitfield.class == Reg;
2098
2099 case imm:
2100 return (t.bitfield.imm8
2101 || t.bitfield.imm8s
2102 || t.bitfield.imm16
2103 || t.bitfield.imm32
2104 || t.bitfield.imm32s
2105 || t.bitfield.imm64);
2106
2107 case disp:
2108 return (t.bitfield.disp8
2109 || t.bitfield.disp16
2110 || t.bitfield.disp32
2111 || t.bitfield.disp32s
2112 || t.bitfield.disp64);
2113
2114 case anymem:
2115 return (t.bitfield.disp8
2116 || t.bitfield.disp16
2117 || t.bitfield.disp32
2118 || t.bitfield.disp32s
2119 || t.bitfield.disp64
2120 || t.bitfield.baseindex);
2121
2122 default:
2123 abort ();
2124 }
2125
2126 return 0;
2127 }
2128
2129 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2130    between operand GIVEN and operand WANTED for instruction template T. */
2131
2132 static INLINE int
2133 match_operand_size (const insn_template *t, unsigned int wanted,
2134 unsigned int given)
2135 {
2136 return !((i.types[given].bitfield.byte
2137 && !t->operand_types[wanted].bitfield.byte)
2138 || (i.types[given].bitfield.word
2139 && !t->operand_types[wanted].bitfield.word)
2140 || (i.types[given].bitfield.dword
2141 && !t->operand_types[wanted].bitfield.dword)
2142 || (i.types[given].bitfield.qword
2143 && !t->operand_types[wanted].bitfield.qword)
2144 || (i.types[given].bitfield.tbyte
2145 && !t->operand_types[wanted].bitfield.tbyte));
2146 }
2147
2148 /* Return 1 if there is no conflict in SIMD register between operand
2149    GIVEN and operand WANTED for instruction template T. */
2150
2151 static INLINE int
2152 match_simd_size (const insn_template *t, unsigned int wanted,
2153 unsigned int given)
2154 {
2155 return !((i.types[given].bitfield.xmmword
2156 && !t->operand_types[wanted].bitfield.xmmword)
2157 || (i.types[given].bitfield.ymmword
2158 && !t->operand_types[wanted].bitfield.ymmword)
2159 || (i.types[given].bitfield.zmmword
2160 && !t->operand_types[wanted].bitfield.zmmword));
2161 }
2162
2163 /* Return 1 if there is no conflict in any size between operand GIVEN
2164    and operand WANTED for instruction template T. */
2165
2166 static INLINE int
2167 match_mem_size (const insn_template *t, unsigned int wanted,
2168 unsigned int given)
2169 {
2170 return (match_operand_size (t, wanted, given)
2171 && !((i.types[given].bitfield.unspecified
2172 && !i.broadcast
2173 && !t->operand_types[wanted].bitfield.unspecified)
2174 || (i.types[given].bitfield.fword
2175 && !t->operand_types[wanted].bitfield.fword)
2176 /* For scalar opcode templates to allow register and memory
2177 operands at the same time, some special casing is needed
2178 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2179 down-conversion vpmov*. */
2180 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2181 && t->operand_types[wanted].bitfield.byte
2182 + t->operand_types[wanted].bitfield.word
2183 + t->operand_types[wanted].bitfield.dword
2184 + t->operand_types[wanted].bitfield.qword
2185 > !!t->opcode_modifier.broadcast)
2186 ? (i.types[given].bitfield.xmmword
2187 || i.types[given].bitfield.ymmword
2188 || i.types[given].bitfield.zmmword)
2189 		  : !match_simd_size (t, wanted, given))));
2190 }
2191
2192 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2193 operands for instruction template T, and it has MATCH_REVERSE set if there
2194 is no size conflict on any operands for the template with operands reversed
2195 (and the template allows for reversing in the first place). */
2196
2197 #define MATCH_STRAIGHT 1
2198 #define MATCH_REVERSE 2
2199
2200 static INLINE unsigned int
2201 operand_size_match (const insn_template *t)
2202 {
2203 unsigned int j, match = MATCH_STRAIGHT;
2204
2205 /* Don't check non-absolute jump instructions. */
2206 if (t->opcode_modifier.jump
2207 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2208 return match;
2209
2210 /* Check memory and accumulator operand size. */
2211 for (j = 0; j < i.operands; j++)
2212 {
2213 if (i.types[j].bitfield.class != Reg
2214 && i.types[j].bitfield.class != RegSIMD
2215 && t->opcode_modifier.anysize)
2216 continue;
2217
2218 if (t->operand_types[j].bitfield.class == Reg
2219 && !match_operand_size (t, j, j))
2220 {
2221 match = 0;
2222 break;
2223 }
2224
2225 if (t->operand_types[j].bitfield.class == RegSIMD
2226 && !match_simd_size (t, j, j))
2227 {
2228 match = 0;
2229 break;
2230 }
2231
2232 if (t->operand_types[j].bitfield.instance == Accum
2233 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2234 {
2235 match = 0;
2236 break;
2237 }
2238
2239 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2240 {
2241 match = 0;
2242 break;
2243 }
2244 }
2245
2246 if (!t->opcode_modifier.d)
2247 {
2248 mismatch:
2249 if (!match)
2250 i.error = operand_size_mismatch;
2251 return match;
2252 }
2253
2254 /* Check reverse. */
2255 gas_assert (i.operands >= 2 && i.operands <= 3);
2256
2257 for (j = 0; j < i.operands; j++)
2258 {
2259 unsigned int given = i.operands - j - 1;
2260
2261 if (t->operand_types[j].bitfield.class == Reg
2262 && !match_operand_size (t, j, given))
2263 goto mismatch;
2264
2265 if (t->operand_types[j].bitfield.class == RegSIMD
2266 && !match_simd_size (t, j, given))
2267 goto mismatch;
2268
2269 if (t->operand_types[j].bitfield.instance == Accum
2270 && (!match_operand_size (t, j, given)
2271 || !match_simd_size (t, j, given)))
2272 goto mismatch;
2273
2274 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2275 goto mismatch;
2276 }
2277
2278 return match | MATCH_REVERSE;
2279 }
2280
2281 static INLINE int
2282 operand_type_match (i386_operand_type overlap,
2283 i386_operand_type given)
2284 {
2285 i386_operand_type temp = overlap;
2286
2287 temp.bitfield.unspecified = 0;
2288 temp.bitfield.byte = 0;
2289 temp.bitfield.word = 0;
2290 temp.bitfield.dword = 0;
2291 temp.bitfield.fword = 0;
2292 temp.bitfield.qword = 0;
2293 temp.bitfield.tbyte = 0;
2294 temp.bitfield.xmmword = 0;
2295 temp.bitfield.ymmword = 0;
2296 temp.bitfield.zmmword = 0;
2297 if (operand_type_all_zero (&temp))
2298 goto mismatch;
2299
2300 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2301 return 1;
2302
2303 mismatch:
2304 i.error = operand_type_mismatch;
2305 return 0;
2306 }
2307
2308 /* If the given types g0 and g1 are registers, they must be of the same
2309    type unless the expected operand type register overlap is null.
2310 Some Intel syntax memory operand size checking also happens here. */
2311
2312 static INLINE int
2313 operand_type_register_match (i386_operand_type g0,
2314 i386_operand_type t0,
2315 i386_operand_type g1,
2316 i386_operand_type t1)
2317 {
2318 if (g0.bitfield.class != Reg
2319 && g0.bitfield.class != RegSIMD
2320 && (!operand_type_check (g0, anymem)
2321 || g0.bitfield.unspecified
2322 || (t0.bitfield.class != Reg
2323 && t0.bitfield.class != RegSIMD)))
2324 return 1;
2325
2326 if (g1.bitfield.class != Reg
2327 && g1.bitfield.class != RegSIMD
2328 && (!operand_type_check (g1, anymem)
2329 || g1.bitfield.unspecified
2330 || (t1.bitfield.class != Reg
2331 && t1.bitfield.class != RegSIMD)))
2332 return 1;
2333
2334 if (g0.bitfield.byte == g1.bitfield.byte
2335 && g0.bitfield.word == g1.bitfield.word
2336 && g0.bitfield.dword == g1.bitfield.dword
2337 && g0.bitfield.qword == g1.bitfield.qword
2338 && g0.bitfield.xmmword == g1.bitfield.xmmword
2339 && g0.bitfield.ymmword == g1.bitfield.ymmword
2340 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2341 return 1;
2342
2343 if (!(t0.bitfield.byte & t1.bitfield.byte)
2344 && !(t0.bitfield.word & t1.bitfield.word)
2345 && !(t0.bitfield.dword & t1.bitfield.dword)
2346 && !(t0.bitfield.qword & t1.bitfield.qword)
2347 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2348 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2349 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2350 return 1;
2351
2352 i.error = register_type_mismatch;
2353
2354 return 0;
2355 }
2356
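/* For example %r9 (reg_num 1 with RegRex set) yields 9; assuming an
   upper-bank register like %xmm25 carries reg_num 1 with both RegRex
   and RegVRex set, it yields 1 + 8 + 16 = 25.  */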
2357 static INLINE unsigned int
2358 register_number (const reg_entry *r)
2359 {
2360 unsigned int nr = r->reg_num;
2361
2362 if (r->reg_flags & RegRex)
2363 nr += 8;
2364
2365 if (r->reg_flags & RegVRex)
2366 nr += 16;
2367
2368 return nr;
2369 }
2370
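/* The value returned here is used directly as the ModRM.mod field:
   1 selects disp8, 2 selects disp16/disp32, and 0 is returned when the
   type carries no displacement.  */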
2371 static INLINE unsigned int
2372 mode_from_disp_size (i386_operand_type t)
2373 {
2374 if (t.bitfield.disp8)
2375 return 1;
2376 else if (t.bitfield.disp16
2377 || t.bitfield.disp32
2378 || t.bitfield.disp32s)
2379 return 2;
2380 else
2381 return 0;
2382 }
2383
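/* The bias trick below relies on addressT being unsigned: adding 0x80
   wraps the signed range [-0x80, 0x7f] onto [0, 0xff], so one unsigned
   comparison checks both bounds.  */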
2384 static INLINE int
2385 fits_in_signed_byte (addressT num)
2386 {
2387 return num + 0x80 <= 0xff;
2388 }
2389
2390 static INLINE int
2391 fits_in_unsigned_byte (addressT num)
2392 {
2393 return num <= 0xff;
2394 }
2395
2396 static INLINE int
2397 fits_in_unsigned_word (addressT num)
2398 {
2399 return num <= 0xffff;
2400 }
2401
2402 static INLINE int
2403 fits_in_signed_word (addressT num)
2404 {
2405 return num + 0x8000 <= 0xffff;
2406 }
2407
2408 static INLINE int
2409 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2410 {
2411 #ifndef BFD64
2412 return 1;
2413 #else
2414 return num + 0x80000000 <= 0xffffffff;
2415 #endif
2416 } /* fits_in_signed_long() */
2417
2418 static INLINE int
2419 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2420 {
2421 #ifndef BFD64
2422 return 1;
2423 #else
2424 return num <= 0xffffffff;
2425 #endif
2426 } /* fits_in_unsigned_long() */
2427
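/* i.memshift holds log2 of the EVEX disp8*N scaling factor N.  For a
   64-byte memory operand (shift 6), a displacement of 0x100 encodes as
   the disp8 value 4, while 0x108 fails the alignment check below.  */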
2428 static INLINE int
2429 fits_in_disp8 (offsetT num)
2430 {
2431 int shift = i.memshift;
2432 unsigned int mask;
2433
2434 if (shift == -1)
2435 abort ();
2436
2437 mask = (1 << shift) - 1;
2438
2439 /* Return 0 if NUM isn't properly aligned. */
2440 if ((num & mask))
2441 return 0;
2442
2443 /* Check if NUM will fit in 8bit after shift. */
2444 return fits_in_signed_byte (num >> shift);
2445 }
2446
2447 static INLINE int
2448 fits_in_imm4 (offsetT num)
2449 {
2450 return (num & 0xf) == num;
2451 }
2452
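/* For example, 0x7f permits imm8/imm8s/imm16/imm32/imm32s (imm64 is
   always set), 0x80 drops just imm8s, and 0x12345678 leaves only
   imm32/imm32s besides imm64.  */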
2453 static i386_operand_type
2454 smallest_imm_type (offsetT num)
2455 {
2456 i386_operand_type t;
2457
2458 operand_type_set (&t, 0);
2459 t.bitfield.imm64 = 1;
2460
2461 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2462 {
2463 /* This code is disabled on the 486 because all the Imm1 forms
2464 in the opcode table are slower on the i486. They're the
2465 versions with the implicitly specified single-position
2466 displacement, which has another syntax if you really want to
2467 use that form. */
2468 t.bitfield.imm1 = 1;
2469 t.bitfield.imm8 = 1;
2470 t.bitfield.imm8s = 1;
2471 t.bitfield.imm16 = 1;
2472 t.bitfield.imm32 = 1;
2473 t.bitfield.imm32s = 1;
2474 }
2475 else if (fits_in_signed_byte (num))
2476 {
2477 t.bitfield.imm8 = 1;
2478 t.bitfield.imm8s = 1;
2479 t.bitfield.imm16 = 1;
2480 t.bitfield.imm32 = 1;
2481 t.bitfield.imm32s = 1;
2482 }
2483 else if (fits_in_unsigned_byte (num))
2484 {
2485 t.bitfield.imm8 = 1;
2486 t.bitfield.imm16 = 1;
2487 t.bitfield.imm32 = 1;
2488 t.bitfield.imm32s = 1;
2489 }
2490 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2491 {
2492 t.bitfield.imm16 = 1;
2493 t.bitfield.imm32 = 1;
2494 t.bitfield.imm32s = 1;
2495 }
2496 else if (fits_in_signed_long (num))
2497 {
2498 t.bitfield.imm32 = 1;
2499 t.bitfield.imm32s = 1;
2500 }
2501 else if (fits_in_unsigned_long (num))
2502 t.bitfield.imm32 = 1;
2503
2504 return t;
2505 }
2506
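/* For example, offset_in_range (0x12345, 1) warns that the value was
   shortened and returns 0x45.  */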
2507 static offsetT
2508 offset_in_range (offsetT val, int size)
2509 {
2510 addressT mask;
2511
2512 switch (size)
2513 {
2514 case 1: mask = ((addressT) 1 << 8) - 1; break;
2515 case 2: mask = ((addressT) 1 << 16) - 1; break;
2516 case 4: mask = ((addressT) 2 << 31) - 1; break;
2517 #ifdef BFD64
2518 case 8: mask = ((addressT) 2 << 63) - 1; break;
2519 #endif
2520 default: abort ();
2521 }
2522
2523 #ifdef BFD64
2524 /* If BFD64, sign extend val for 32bit address mode. */
2525 if (flag_code != CODE_64BIT
2526 || i.prefix[ADDR_PREFIX])
2527 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2528 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2529 #endif
2530
2531 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2532 {
2533 char buf1[40], buf2[40];
2534
2535 sprint_value (buf1, val);
2536 sprint_value (buf2, val & mask);
2537 as_warn (_("%s shortened to %s"), buf1, buf2);
2538 }
2539 return val & mask;
2540 }
2541
2542 enum PREFIX_GROUP
2543 {
2544 PREFIX_EXIST = 0,
2545 PREFIX_LOCK,
2546 PREFIX_REP,
2547 PREFIX_DS,
2548 PREFIX_OTHER
2549 };
2550
2551 /* Returns
2552 a. PREFIX_EXIST if attempting to add a prefix where one from the
2553 same class already exists.
2554 b. PREFIX_LOCK if lock prefix is added.
2555 c. PREFIX_REP if rep/repne prefix is added.
2556 d. PREFIX_DS if ds prefix is added.
2557 e. PREFIX_OTHER if other prefix is added.
2558 */
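/* For instance, adding LOCK_PREFIX_OPCODE twice to one insn returns
   PREFIX_LOCK the first time and PREFIX_EXIST (together with a "same
   type of prefix used twice" error) the second time.  */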
2559
2560 static enum PREFIX_GROUP
2561 add_prefix (unsigned int prefix)
2562 {
2563 enum PREFIX_GROUP ret = PREFIX_OTHER;
2564 unsigned int q;
2565
2566 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2567 && flag_code == CODE_64BIT)
2568 {
2569 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2570 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2571 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2572 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2573 ret = PREFIX_EXIST;
2574 q = REX_PREFIX;
2575 }
2576 else
2577 {
2578 switch (prefix)
2579 {
2580 default:
2581 abort ();
2582
2583 case DS_PREFIX_OPCODE:
2584 ret = PREFIX_DS;
2585 /* Fall through. */
2586 case CS_PREFIX_OPCODE:
2587 case ES_PREFIX_OPCODE:
2588 case FS_PREFIX_OPCODE:
2589 case GS_PREFIX_OPCODE:
2590 case SS_PREFIX_OPCODE:
2591 q = SEG_PREFIX;
2592 break;
2593
2594 case REPNE_PREFIX_OPCODE:
2595 case REPE_PREFIX_OPCODE:
2596 q = REP_PREFIX;
2597 ret = PREFIX_REP;
2598 break;
2599
2600 case LOCK_PREFIX_OPCODE:
2601 q = LOCK_PREFIX;
2602 ret = PREFIX_LOCK;
2603 break;
2604
2605 case FWAIT_OPCODE:
2606 q = WAIT_PREFIX;
2607 break;
2608
2609 case ADDR_PREFIX_OPCODE:
2610 q = ADDR_PREFIX;
2611 break;
2612
2613 case DATA_PREFIX_OPCODE:
2614 q = DATA_PREFIX;
2615 break;
2616 }
2617 if (i.prefix[q] != 0)
2618 ret = PREFIX_EXIST;
2619 }
2620
2621 if (ret)
2622 {
2623 if (!i.prefix[q])
2624 ++i.prefixes;
2625 i.prefix[q] |= prefix;
2626 }
2627 else
2628 as_bad (_("same type of prefix used twice"));
2629
2630 return ret;
2631 }
2632
2633 static void
2634 update_code_flag (int value, int check)
2635 {
2636 PRINTF_LIKE ((*as_error));
2637
2638 flag_code = (enum flag_code) value;
2639 if (flag_code == CODE_64BIT)
2640 {
2641 cpu_arch_flags.bitfield.cpu64 = 1;
2642 cpu_arch_flags.bitfield.cpuno64 = 0;
2643 }
2644 else
2645 {
2646 cpu_arch_flags.bitfield.cpu64 = 0;
2647 cpu_arch_flags.bitfield.cpuno64 = 1;
2648 }
2649   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2650 {
2651 if (check)
2652 as_error = as_fatal;
2653 else
2654 as_error = as_bad;
2655 (*as_error) (_("64bit mode not supported on `%s'."),
2656 cpu_arch_name ? cpu_arch_name : default_arch);
2657 }
2658 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2659 {
2660 if (check)
2661 as_error = as_fatal;
2662 else
2663 as_error = as_bad;
2664 (*as_error) (_("32bit mode not supported on `%s'."),
2665 cpu_arch_name ? cpu_arch_name : default_arch);
2666 }
2667 stackop_size = '\0';
2668 }
2669
2670 static void
2671 set_code_flag (int value)
2672 {
2673 update_code_flag (value, 0);
2674 }
2675
2676 static void
2677 set_16bit_gcc_code_flag (int new_code_flag)
2678 {
2679 flag_code = (enum flag_code) new_code_flag;
2680 if (flag_code != CODE_16BIT)
2681 abort ();
2682 cpu_arch_flags.bitfield.cpu64 = 0;
2683 cpu_arch_flags.bitfield.cpuno64 = 1;
2684 stackop_size = LONG_MNEM_SUFFIX;
2685 }
2686
2687 static void
2688 set_intel_syntax (int syntax_flag)
2689 {
2690 /* Find out if register prefixing is specified. */
2691 int ask_naked_reg = 0;
2692
2693 SKIP_WHITESPACE ();
2694 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2695 {
2696 char *string;
2697 int e = get_symbol_name (&string);
2698
2699 if (strcmp (string, "prefix") == 0)
2700 ask_naked_reg = 1;
2701 else if (strcmp (string, "noprefix") == 0)
2702 ask_naked_reg = -1;
2703 else
2704 as_bad (_("bad argument to syntax directive."));
2705 (void) restore_line_pointer (e);
2706 }
2707 demand_empty_rest_of_line ();
2708
2709 intel_syntax = syntax_flag;
2710
2711 if (ask_naked_reg == 0)
2712 allow_naked_reg = (intel_syntax
2713 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2714 else
2715 allow_naked_reg = (ask_naked_reg < 0);
2716
2717 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2718
2719 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2720 identifier_chars['$'] = intel_syntax ? '$' : 0;
2721 register_prefix = allow_naked_reg ? "" : "%";
2722 }
2723
2724 static void
2725 set_intel_mnemonic (int mnemonic_flag)
2726 {
2727 intel_mnemonic = mnemonic_flag;
2728 }
2729
2730 static void
2731 set_allow_index_reg (int flag)
2732 {
2733 allow_index_reg = flag;
2734 }
2735
2736 static void
2737 set_check (int what)
2738 {
2739 enum check_kind *kind;
2740 const char *str;
2741
2742 if (what)
2743 {
2744 kind = &operand_check;
2745 str = "operand";
2746 }
2747 else
2748 {
2749 kind = &sse_check;
2750 str = "sse";
2751 }
2752
2753 SKIP_WHITESPACE ();
2754
2755 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2756 {
2757 char *string;
2758 int e = get_symbol_name (&string);
2759
2760 if (strcmp (string, "none") == 0)
2761 *kind = check_none;
2762 else if (strcmp (string, "warning") == 0)
2763 *kind = check_warning;
2764 else if (strcmp (string, "error") == 0)
2765 *kind = check_error;
2766 else
2767 as_bad (_("bad argument to %s_check directive."), str);
2768 (void) restore_line_pointer (e);
2769 }
2770 else
2771 as_bad (_("missing argument for %s_check directive"), str);
2772
2773 demand_empty_rest_of_line ();
2774 }
2775
2776 static void
2777 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2778 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2779 {
2780 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2781 static const char *arch;
2782
2783   /* Intel MCU, L1OM and K1OM are only supported on ELF. */
2784 if (!IS_ELF)
2785 return;
2786
2787 if (!arch)
2788 {
2789 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2790 use default_arch. */
2791 arch = cpu_arch_name;
2792 if (!arch)
2793 arch = default_arch;
2794 }
2795
2796   /* If we are targeting Intel MCU, we must enable it.  */
2797   if (get_elf_backend_data (stdoutput)->elf_machine_code == EM_IAMCU
2798       && !new_flag.bitfield.cpuiamcu)
2799     as_bad (_("`%s' is not supported on `%s'"), name, arch);
2800
2801   /* If we are targeting Intel L1OM, we must enable it.  */
2802   if (get_elf_backend_data (stdoutput)->elf_machine_code == EM_L1OM
2803       && !new_flag.bitfield.cpul1om)
2804     as_bad (_("`%s' is not supported on `%s'"), name, arch);
2805
2806   /* If we are targeting Intel K1OM, we must enable it.  */
2807   if (get_elf_backend_data (stdoutput)->elf_machine_code == EM_K1OM
2808       && !new_flag.bitfield.cpuk1om)
2809     as_bad (_("`%s' is not supported on `%s'"), name, arch);
2810
2812 #endif
2813 }
2814
2815 static void
2816 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2817 {
2818 SKIP_WHITESPACE ();
2819
2820 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2821 {
2822 char *string;
2823 int e = get_symbol_name (&string);
2824 unsigned int j;
2825 i386_cpu_flags flags;
2826
2827 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2828 {
2829 if (strcmp (string, cpu_arch[j].name) == 0)
2830 {
2831 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2832
2833 if (*string != '.')
2834 {
2835 cpu_arch_name = cpu_arch[j].name;
2836 cpu_sub_arch_name = NULL;
2837 cpu_arch_flags = cpu_arch[j].flags;
2838 if (flag_code == CODE_64BIT)
2839 {
2840 cpu_arch_flags.bitfield.cpu64 = 1;
2841 cpu_arch_flags.bitfield.cpuno64 = 0;
2842 }
2843 else
2844 {
2845 cpu_arch_flags.bitfield.cpu64 = 0;
2846 cpu_arch_flags.bitfield.cpuno64 = 1;
2847 }
2848 cpu_arch_isa = cpu_arch[j].type;
2849 cpu_arch_isa_flags = cpu_arch[j].flags;
2850 if (!cpu_arch_tune_set)
2851 {
2852 cpu_arch_tune = cpu_arch_isa;
2853 cpu_arch_tune_flags = cpu_arch_isa_flags;
2854 }
2855 break;
2856 }
2857
2858 flags = cpu_flags_or (cpu_arch_flags,
2859 cpu_arch[j].flags);
2860
2861 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2862 {
2863 if (cpu_sub_arch_name)
2864 {
2865 char *name = cpu_sub_arch_name;
2866 cpu_sub_arch_name = concat (name,
2867 cpu_arch[j].name,
2868 (const char *) NULL);
2869 free (name);
2870 }
2871 else
2872 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2873 cpu_arch_flags = flags;
2874 cpu_arch_isa_flags = flags;
2875 }
2876 else
2877 cpu_arch_isa_flags
2878 = cpu_flags_or (cpu_arch_isa_flags,
2879 cpu_arch[j].flags);
2880 (void) restore_line_pointer (e);
2881 demand_empty_rest_of_line ();
2882 return;
2883 }
2884 }
2885
2886 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2887 {
2888 /* Disable an ISA extension. */
2889 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2890 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2891 {
2892 flags = cpu_flags_and_not (cpu_arch_flags,
2893 cpu_noarch[j].flags);
2894 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2895 {
2896 if (cpu_sub_arch_name)
2897 {
2898 char *name = cpu_sub_arch_name;
2899 cpu_sub_arch_name = concat (name, string,
2900 (const char *) NULL);
2901 free (name);
2902 }
2903 else
2904 cpu_sub_arch_name = xstrdup (string);
2905 cpu_arch_flags = flags;
2906 cpu_arch_isa_flags = flags;
2907 }
2908 (void) restore_line_pointer (e);
2909 demand_empty_rest_of_line ();
2910 return;
2911 }
2912
2913 j = ARRAY_SIZE (cpu_arch);
2914 }
2915
2916 if (j >= ARRAY_SIZE (cpu_arch))
2917 as_bad (_("no such architecture: `%s'"), string);
2918
2919 *input_line_pointer = e;
2920 }
2921 else
2922 as_bad (_("missing cpu architecture"));
2923
2924 no_cond_jump_promotion = 0;
2925 if (*input_line_pointer == ','
2926 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2927 {
2928 char *string;
2929 char e;
2930
2931 ++input_line_pointer;
2932 e = get_symbol_name (&string);
2933
2934 if (strcmp (string, "nojumps") == 0)
2935 no_cond_jump_promotion = 1;
2936 else if (strcmp (string, "jumps") == 0)
2937 ;
2938 else
2939 as_bad (_("no such architecture modifier: `%s'"), string);
2940
2941 (void) restore_line_pointer (e);
2942 }
2943
2944 demand_empty_rest_of_line ();
2945 }
2946
2947 enum bfd_architecture
2948 i386_arch (void)
2949 {
2950 if (cpu_arch_isa == PROCESSOR_L1OM)
2951 {
2952 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2953 || flag_code != CODE_64BIT)
2954 as_fatal (_("Intel L1OM is 64bit ELF only"));
2955 return bfd_arch_l1om;
2956 }
2957 else if (cpu_arch_isa == PROCESSOR_K1OM)
2958 {
2959 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2960 || flag_code != CODE_64BIT)
2961 as_fatal (_("Intel K1OM is 64bit ELF only"));
2962 return bfd_arch_k1om;
2963 }
2964 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2965 {
2966 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2967 || flag_code == CODE_64BIT)
2968 as_fatal (_("Intel MCU is 32bit ELF only"));
2969 return bfd_arch_iamcu;
2970 }
2971 else
2972 return bfd_arch_i386;
2973 }
2974
2975 unsigned long
2976 i386_mach (void)
2977 {
2978 if (!strncmp (default_arch, "x86_64", 6))
2979 {
2980 if (cpu_arch_isa == PROCESSOR_L1OM)
2981 {
2982 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2983 || default_arch[6] != '\0')
2984 as_fatal (_("Intel L1OM is 64bit ELF only"));
2985 return bfd_mach_l1om;
2986 }
2987 else if (cpu_arch_isa == PROCESSOR_K1OM)
2988 {
2989 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2990 || default_arch[6] != '\0')
2991 as_fatal (_("Intel K1OM is 64bit ELF only"));
2992 return bfd_mach_k1om;
2993 }
2994 else if (default_arch[6] == '\0')
2995 return bfd_mach_x86_64;
2996 else
2997 return bfd_mach_x64_32;
2998 }
2999 else if (!strcmp (default_arch, "i386")
3000 || !strcmp (default_arch, "iamcu"))
3001 {
3002 if (cpu_arch_isa == PROCESSOR_IAMCU)
3003 {
3004 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3005 as_fatal (_("Intel MCU is 32bit ELF only"));
3006 return bfd_mach_i386_iamcu;
3007 }
3008 else
3009 return bfd_mach_i386_i386;
3010 }
3011 else
3012 as_fatal (_("unknown architecture"));
3013 }
3014 \f
3015 void
3016 md_begin (void)
3017 {
3018 const char *hash_err;
3019
3020 /* Support pseudo prefixes like {disp32}. */
3021 lex_type ['{'] = LEX_BEGIN_NAME;
3022
3023 /* Initialize op_hash hash table. */
3024 op_hash = hash_new ();
3025
3026 {
3027 const insn_template *optab;
3028 templates *core_optab;
3029
3030 /* Setup for loop. */
3031 optab = i386_optab;
3032 core_optab = XNEW (templates);
3033 core_optab->start = optab;
3034
3035 while (1)
3036 {
3037 ++optab;
3038 if (optab->name == NULL
3039 || strcmp (optab->name, (optab - 1)->name) != 0)
3040 {
3041 /* different name --> ship out current template list;
3042 add to hash table; & begin anew. */
3043 core_optab->end = optab;
3044 hash_err = hash_insert (op_hash,
3045 (optab - 1)->name,
3046 (void *) core_optab);
3047 if (hash_err)
3048 {
3049 as_fatal (_("can't hash %s: %s"),
3050 (optab - 1)->name,
3051 hash_err);
3052 }
3053 if (optab->name == NULL)
3054 break;
3055 core_optab = XNEW (templates);
3056 core_optab->start = optab;
3057 }
3058 }
3059 }
3060
3061 /* Initialize reg_hash hash table. */
3062 reg_hash = hash_new ();
3063 {
3064 const reg_entry *regtab;
3065 unsigned int regtab_size = i386_regtab_size;
3066
3067 for (regtab = i386_regtab; regtab_size--; regtab++)
3068 {
3069 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3070 if (hash_err)
3071 as_fatal (_("can't hash %s: %s"),
3072 regtab->reg_name,
3073 hash_err);
3074 }
3075 }
3076
3077 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3078 {
3079 int c;
3080 char *p;
3081
3082 for (c = 0; c < 256; c++)
3083 {
3084 if (ISDIGIT (c))
3085 {
3086 digit_chars[c] = c;
3087 mnemonic_chars[c] = c;
3088 register_chars[c] = c;
3089 operand_chars[c] = c;
3090 }
3091 else if (ISLOWER (c))
3092 {
3093 mnemonic_chars[c] = c;
3094 register_chars[c] = c;
3095 operand_chars[c] = c;
3096 }
3097 else if (ISUPPER (c))
3098 {
3099 mnemonic_chars[c] = TOLOWER (c);
3100 register_chars[c] = mnemonic_chars[c];
3101 operand_chars[c] = c;
3102 }
3103 else if (c == '{' || c == '}')
3104 {
3105 mnemonic_chars[c] = c;
3106 operand_chars[c] = c;
3107 }
3108
3109 if (ISALPHA (c) || ISDIGIT (c))
3110 identifier_chars[c] = c;
3111 else if (c >= 128)
3112 {
3113 identifier_chars[c] = c;
3114 operand_chars[c] = c;
3115 }
3116 }
3117
3118 #ifdef LEX_AT
3119 identifier_chars['@'] = '@';
3120 #endif
3121 #ifdef LEX_QM
3122 identifier_chars['?'] = '?';
3123 operand_chars['?'] = '?';
3124 #endif
3125 digit_chars['-'] = '-';
3126 mnemonic_chars['_'] = '_';
3127 mnemonic_chars['-'] = '-';
3128 mnemonic_chars['.'] = '.';
3129 identifier_chars['_'] = '_';
3130 identifier_chars['.'] = '.';
3131
3132 for (p = operand_special_chars; *p != '\0'; p++)
3133 operand_chars[(unsigned char) *p] = *p;
3134 }
3135
3136 if (flag_code == CODE_64BIT)
3137 {
3138 #if defined (OBJ_COFF) && defined (TE_PE)
3139 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3140 ? 32 : 16);
3141 #else
3142 x86_dwarf2_return_column = 16;
3143 #endif
3144 x86_cie_data_alignment = -8;
3145 }
3146 else
3147 {
3148 x86_dwarf2_return_column = 8;
3149 x86_cie_data_alignment = -4;
3150 }
3151
3152 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3153      can be turned into a BRANCH_PREFIX frag. */
3154 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3155 abort ();
3156 }
3157
3158 void
3159 i386_print_statistics (FILE *file)
3160 {
3161 hash_print_statistics (file, "i386 opcode", op_hash);
3162 hash_print_statistics (file, "i386 register", reg_hash);
3163 }
3164 \f
3165 #ifdef DEBUG386
3166
3167 /* Debugging routines for md_assemble. */
3168 static void pte (insn_template *);
3169 static void pt (i386_operand_type);
3170 static void pe (expressionS *);
3171 static void ps (symbolS *);
3172
3173 static void
3174 pi (const char *line, i386_insn *x)
3175 {
3176 unsigned int j;
3177
3178 fprintf (stdout, "%s: template ", line);
3179 pte (&x->tm);
3180 fprintf (stdout, " address: base %s index %s scale %x\n",
3181 x->base_reg ? x->base_reg->reg_name : "none",
3182 x->index_reg ? x->index_reg->reg_name : "none",
3183 x->log2_scale_factor);
3184 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3185 x->rm.mode, x->rm.reg, x->rm.regmem);
3186 fprintf (stdout, " sib: base %x index %x scale %x\n",
3187 x->sib.base, x->sib.index, x->sib.scale);
3188 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3189 (x->rex & REX_W) != 0,
3190 (x->rex & REX_R) != 0,
3191 (x->rex & REX_X) != 0,
3192 (x->rex & REX_B) != 0);
3193 for (j = 0; j < x->operands; j++)
3194 {
3195 fprintf (stdout, " #%d: ", j + 1);
3196 pt (x->types[j]);
3197 fprintf (stdout, "\n");
3198 if (x->types[j].bitfield.class == Reg
3199 || x->types[j].bitfield.class == RegMMX
3200 || x->types[j].bitfield.class == RegSIMD
3201 || x->types[j].bitfield.class == SReg
3202 || x->types[j].bitfield.class == RegCR
3203 || x->types[j].bitfield.class == RegDR
3204 || x->types[j].bitfield.class == RegTR)
3205 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3206 if (operand_type_check (x->types[j], imm))
3207 pe (x->op[j].imms);
3208 if (operand_type_check (x->types[j], disp))
3209 pe (x->op[j].disps);
3210 }
3211 }
3212
3213 static void
3214 pte (insn_template *t)
3215 {
3216 unsigned int j;
3217 fprintf (stdout, " %d operands ", t->operands);
3218 fprintf (stdout, "opcode %x ", t->base_opcode);
3219 if (t->extension_opcode != None)
3220 fprintf (stdout, "ext %x ", t->extension_opcode);
3221 if (t->opcode_modifier.d)
3222 fprintf (stdout, "D");
3223 if (t->opcode_modifier.w)
3224 fprintf (stdout, "W");
3225 fprintf (stdout, "\n");
3226 for (j = 0; j < t->operands; j++)
3227 {
3228 fprintf (stdout, " #%d type ", j + 1);
3229 pt (t->operand_types[j]);
3230 fprintf (stdout, "\n");
3231 }
3232 }
3233
3234 static void
3235 pe (expressionS *e)
3236 {
3237 fprintf (stdout, " operation %d\n", e->X_op);
3238 fprintf (stdout, " add_number %ld (%lx)\n",
3239 (long) e->X_add_number, (long) e->X_add_number);
3240 if (e->X_add_symbol)
3241 {
3242 fprintf (stdout, " add_symbol ");
3243 ps (e->X_add_symbol);
3244 fprintf (stdout, "\n");
3245 }
3246 if (e->X_op_symbol)
3247 {
3248 fprintf (stdout, " op_symbol ");
3249 ps (e->X_op_symbol);
3250 fprintf (stdout, "\n");
3251 }
3252 }
3253
3254 static void
3255 ps (symbolS *s)
3256 {
3257 fprintf (stdout, "%s type %s%s",
3258 S_GET_NAME (s),
3259 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3260 segment_name (S_GET_SEGMENT (s)));
3261 }
3262
3263 static struct type_name
3264 {
3265 i386_operand_type mask;
3266 const char *name;
3267 }
3268 const type_names[] =
3269 {
3270 { OPERAND_TYPE_REG8, "r8" },
3271 { OPERAND_TYPE_REG16, "r16" },
3272 { OPERAND_TYPE_REG32, "r32" },
3273 { OPERAND_TYPE_REG64, "r64" },
3274 { OPERAND_TYPE_ACC8, "acc8" },
3275 { OPERAND_TYPE_ACC16, "acc16" },
3276 { OPERAND_TYPE_ACC32, "acc32" },
3277 { OPERAND_TYPE_ACC64, "acc64" },
3278 { OPERAND_TYPE_IMM8, "i8" },
3279   { OPERAND_TYPE_IMM8S, "i8s" },
3280 { OPERAND_TYPE_IMM16, "i16" },
3281 { OPERAND_TYPE_IMM32, "i32" },
3282 { OPERAND_TYPE_IMM32S, "i32s" },
3283 { OPERAND_TYPE_IMM64, "i64" },
3284 { OPERAND_TYPE_IMM1, "i1" },
3285 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3286 { OPERAND_TYPE_DISP8, "d8" },
3287 { OPERAND_TYPE_DISP16, "d16" },
3288 { OPERAND_TYPE_DISP32, "d32" },
3289 { OPERAND_TYPE_DISP32S, "d32s" },
3290 { OPERAND_TYPE_DISP64, "d64" },
3291 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3292 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3293 { OPERAND_TYPE_CONTROL, "control reg" },
3294 { OPERAND_TYPE_TEST, "test reg" },
3295 { OPERAND_TYPE_DEBUG, "debug reg" },
3296 { OPERAND_TYPE_FLOATREG, "FReg" },
3297 { OPERAND_TYPE_FLOATACC, "FAcc" },
3298 { OPERAND_TYPE_SREG, "SReg" },
3299 { OPERAND_TYPE_REGMMX, "rMMX" },
3300 { OPERAND_TYPE_REGXMM, "rXMM" },
3301 { OPERAND_TYPE_REGYMM, "rYMM" },
3302 { OPERAND_TYPE_REGZMM, "rZMM" },
3303 { OPERAND_TYPE_REGMASK, "Mask reg" },
3304 };
3305
3306 static void
3307 pt (i386_operand_type t)
3308 {
3309 unsigned int j;
3310 i386_operand_type a;
3311
3312 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3313 {
3314 a = operand_type_and (t, type_names[j].mask);
3315 if (operand_type_equal (&a, &type_names[j].mask))
3316 fprintf (stdout, "%s, ", type_names[j].name);
3317 }
3318 fflush (stdout);
3319 }
3320
3321 #endif /* DEBUG386 */
3322 \f
3323 static bfd_reloc_code_real_type
3324 reloc (unsigned int size,
3325 int pcrel,
3326 int sign,
3327 bfd_reloc_code_real_type other)
3328 {
3329 if (other != NO_RELOC)
3330 {
3331 reloc_howto_type *rel;
3332
3333 if (size == 8)
3334 switch (other)
3335 {
3336 case BFD_RELOC_X86_64_GOT32:
3337 return BFD_RELOC_X86_64_GOT64;
3338 break;
3339 case BFD_RELOC_X86_64_GOTPLT64:
3340 return BFD_RELOC_X86_64_GOTPLT64;
3341 break;
3342 case BFD_RELOC_X86_64_PLTOFF64:
3343 return BFD_RELOC_X86_64_PLTOFF64;
3344 break;
3345 case BFD_RELOC_X86_64_GOTPC32:
3346 other = BFD_RELOC_X86_64_GOTPC64;
3347 break;
3348 case BFD_RELOC_X86_64_GOTPCREL:
3349 other = BFD_RELOC_X86_64_GOTPCREL64;
3350 break;
3351 case BFD_RELOC_X86_64_TPOFF32:
3352 other = BFD_RELOC_X86_64_TPOFF64;
3353 break;
3354 case BFD_RELOC_X86_64_DTPOFF32:
3355 other = BFD_RELOC_X86_64_DTPOFF64;
3356 break;
3357 default:
3358 break;
3359 }
3360
3361 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3362 if (other == BFD_RELOC_SIZE32)
3363 {
3364 if (size == 8)
3365 other = BFD_RELOC_SIZE64;
3366 if (pcrel)
3367 {
3368 as_bad (_("there are no pc-relative size relocations"));
3369 return NO_RELOC;
3370 }
3371 }
3372 #endif
3373
3374 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3375 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3376 sign = -1;
3377
3378 rel = bfd_reloc_type_lookup (stdoutput, other);
3379 if (!rel)
3380 as_bad (_("unknown relocation (%u)"), other);
3381 else if (size != bfd_get_reloc_size (rel))
3382 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3383 bfd_get_reloc_size (rel),
3384 size);
3385 else if (pcrel && !rel->pc_relative)
3386 as_bad (_("non-pc-relative relocation for pc-relative field"));
3387 else if ((rel->complain_on_overflow == complain_overflow_signed
3388 && !sign)
3389 || (rel->complain_on_overflow == complain_overflow_unsigned
3390 && sign > 0))
3391 as_bad (_("relocated field and relocation type differ in signedness"));
3392 else
3393 return other;
3394 return NO_RELOC;
3395 }
3396
3397 if (pcrel)
3398 {
3399 if (!sign)
3400 as_bad (_("there are no unsigned pc-relative relocations"));
3401 switch (size)
3402 {
3403 case 1: return BFD_RELOC_8_PCREL;
3404 case 2: return BFD_RELOC_16_PCREL;
3405 case 4: return BFD_RELOC_32_PCREL;
3406 case 8: return BFD_RELOC_64_PCREL;
3407 }
3408 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3409 }
3410 else
3411 {
3412 if (sign > 0)
3413 switch (size)
3414 {
3415 case 4: return BFD_RELOC_X86_64_32S;
3416 }
3417 else
3418 switch (size)
3419 {
3420 case 1: return BFD_RELOC_8;
3421 case 2: return BFD_RELOC_16;
3422 case 4: return BFD_RELOC_32;
3423 case 8: return BFD_RELOC_64;
3424 }
3425 as_bad (_("cannot do %s %u byte relocation"),
3426 sign > 0 ? "signed" : "unsigned", size);
3427 }
3428
3429 return NO_RELOC;
3430 }
3431
3432 /* Here we decide which fixups can be adjusted to make them relative to
3433 the beginning of the section instead of the symbol. Basically we need
3434 to make sure that the dynamic relocations are done correctly, so in
3435 some cases we force the original symbol to be used. */
3436
3437 int
3438 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3439 {
3440 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3441 if (!IS_ELF)
3442 return 1;
3443
3444 /* Don't adjust pc-relative references to merge sections in 64-bit
3445 mode. */
3446 if (use_rela_relocations
3447 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3448 && fixP->fx_pcrel)
3449 return 0;
3450
3451 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3452 and changed later by validate_fix. */
3453 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3454 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3455 return 0;
3456
3457 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3458 for size relocations. */
3459 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3460 || fixP->fx_r_type == BFD_RELOC_SIZE64
3461 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3462 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3463 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3464 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3465 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3466 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3467 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3468 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3469 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3470 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3471 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3472 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3473 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3474 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3475 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3476 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3477 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3478 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3479 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3480 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3481 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3482 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3483 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3484 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3485 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3486 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3487 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3488 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3489 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3490 return 0;
3491 #endif
3492 return 1;
3493 }
3494
3495 static int
3496 intel_float_operand (const char *mnemonic)
3497 {
3498 /* Note that the value returned is meaningful only for opcodes with (memory)
3499 operands, hence the code here is free to improperly handle opcodes that
3500 have no operands (for better performance and smaller code). */
3501
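  /* Return values used below: 0 = not an FP math op (or one that never
     accesses memory as FP), 1 = generic FP op, 2 = integer FP op (fi*),
     3 = FPU control/state op.  */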
3502 if (mnemonic[0] != 'f')
3503 return 0; /* non-math */
3504
3505 switch (mnemonic[1])
3506 {
3507     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3508        the fs segment override prefix are not handled here because no
3509        call path can make opcodes without operands reach this code.  */
3510 case 'i':
3511 return 2 /* integer op */;
3512 case 'l':
3513 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3514 return 3; /* fldcw/fldenv */
3515 break;
3516 case 'n':
3517 if (mnemonic[2] != 'o' /* fnop */)
3518 return 3; /* non-waiting control op */
3519 break;
3520 case 'r':
3521 if (mnemonic[2] == 's')
3522 return 3; /* frstor/frstpm */
3523 break;
3524 case 's':
3525 if (mnemonic[2] == 'a')
3526 return 3; /* fsave */
3527 if (mnemonic[2] == 't')
3528 {
3529 switch (mnemonic[3])
3530 {
3531 case 'c': /* fstcw */
3532 case 'd': /* fstdw */
3533 case 'e': /* fstenv */
3534 case 's': /* fsts[gw] */
3535 return 3;
3536 }
3537 }
3538 break;
3539 case 'x':
3540 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3541 return 0; /* fxsave/fxrstor are not really math ops */
3542 break;
3543 }
3544
3545 return 1;
3546 }
3547
3548 /* Build the VEX prefix. */
3549
3550 static void
3551 build_vex_prefix (const insn_template *t)
3552 {
3553 unsigned int register_specifier;
3554 unsigned int implied_prefix;
3555 unsigned int vector_length;
3556 unsigned int w;
3557
3558 /* Check register specifier. */
3559 if (i.vex.register_specifier)
3560 {
3561 register_specifier =
3562 ~register_number (i.vex.register_specifier) & 0xf;
3563 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3564 }
3565 else
3566 register_specifier = 0xf;
3567
3568   /* Use the 2-byte VEX prefix by swapping destination and source operands
3569      if there is more than one register operand.  */
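  /* Only the REX_B-only case qualifies: after the swap the extended
     register ends up in ModRM.reg, where VEX.R - the sole extension
     bit present in the 2-byte prefix - can represent it.  */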
3570 if (i.reg_operands > 1
3571 && i.vec_encoding != vex_encoding_vex3
3572 && i.dir_encoding == dir_encoding_default
3573 && i.operands == i.reg_operands
3574 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3575 && i.tm.opcode_modifier.vexopcode == VEX0F
3576 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3577 && i.rex == REX_B)
3578 {
3579 unsigned int xchg = i.operands - 1;
3580 union i386_op temp_op;
3581 i386_operand_type temp_type;
3582
3583 temp_type = i.types[xchg];
3584 i.types[xchg] = i.types[0];
3585 i.types[0] = temp_type;
3586 temp_op = i.op[xchg];
3587 i.op[xchg] = i.op[0];
3588 i.op[0] = temp_op;
3589
3590 gas_assert (i.rm.mode == 3);
3591
3592 i.rex = REX_R;
3593 xchg = i.rm.regmem;
3594 i.rm.regmem = i.rm.reg;
3595 i.rm.reg = xchg;
3596
3597 if (i.tm.opcode_modifier.d)
3598 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3599 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3600 else /* Use the next insn. */
3601 i.tm = t[1];
3602 }
3603
3604 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3605 are no memory operands and at least 3 register ones. */
3606 if (i.reg_operands >= 3
3607 && i.vec_encoding != vex_encoding_vex3
3608 && i.reg_operands == i.operands - i.imm_operands
3609 && i.tm.opcode_modifier.vex
3610 && i.tm.opcode_modifier.commutative
3611 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3612 && i.rex == REX_B
3613 && i.vex.register_specifier
3614 && !(i.vex.register_specifier->reg_flags & RegRex))
3615 {
3616 unsigned int xchg = i.operands - i.reg_operands;
3617 union i386_op temp_op;
3618 i386_operand_type temp_type;
3619
3620 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3621 gas_assert (!i.tm.opcode_modifier.sae);
3622 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3623 &i.types[i.operands - 3]));
3624 gas_assert (i.rm.mode == 3);
3625
3626 temp_type = i.types[xchg];
3627 i.types[xchg] = i.types[xchg + 1];
3628 i.types[xchg + 1] = temp_type;
3629 temp_op = i.op[xchg];
3630 i.op[xchg] = i.op[xchg + 1];
3631 i.op[xchg + 1] = temp_op;
3632
3633 i.rex = 0;
3634 xchg = i.rm.regmem | 8;
3635 i.rm.regmem = ~register_specifier & 0xf;
3636 gas_assert (!(i.rm.regmem & 8));
3637 i.vex.register_specifier += xchg - i.rm.regmem;
3638 register_specifier = ~xchg & 0xf;
3639 }
3640
3641 if (i.tm.opcode_modifier.vex == VEXScalar)
3642 vector_length = avxscalar;
3643 else if (i.tm.opcode_modifier.vex == VEX256)
3644 vector_length = 1;
3645 else
3646 {
3647 unsigned int op;
3648
3649 /* Determine vector length from the last multi-length vector
3650 operand. */
3651 vector_length = 0;
3652 for (op = t->operands; op--;)
3653 if (t->operand_types[op].bitfield.xmmword
3654 && t->operand_types[op].bitfield.ymmword
3655 && i.types[op].bitfield.ymmword)
3656 {
3657 vector_length = 1;
3658 break;
3659 }
3660 }
3661
3662 switch ((i.tm.base_opcode >> 8) & 0xff)
3663 {
3664 case 0:
3665 implied_prefix = 0;
3666 break;
3667 case DATA_PREFIX_OPCODE:
3668 implied_prefix = 1;
3669 break;
3670 case REPE_PREFIX_OPCODE:
3671 implied_prefix = 2;
3672 break;
3673 case REPNE_PREFIX_OPCODE:
3674 implied_prefix = 3;
3675 break;
3676 default:
3677 abort ();
3678 }
3679
3680 /* Check the REX.W bit and VEXW. */
3681 if (i.tm.opcode_modifier.vexw == VEXWIG)
3682 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3683 else if (i.tm.opcode_modifier.vexw)
3684 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3685 else
3686 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3687
3688 /* Use 2-byte VEX prefix if possible. */
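  /* 2-byte VEX layout: 0xC5, then one byte holding R.vvvv.L.pp, with
     R being the inverted REX.R bit and vvvv the inverted register
     specifier.  */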
3689 if (w == 0
3690 && i.vec_encoding != vex_encoding_vex3
3691 && i.tm.opcode_modifier.vexopcode == VEX0F
3692 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3693 {
3694 /* 2-byte VEX prefix. */
3695 unsigned int r;
3696
3697 i.vex.length = 2;
3698 i.vex.bytes[0] = 0xc5;
3699
3700 /* Check the REX.R bit. */
3701 r = (i.rex & REX_R) ? 0 : 1;
3702 i.vex.bytes[1] = (r << 7
3703 | register_specifier << 3
3704 | vector_length << 2
3705 | implied_prefix);
3706 }
3707 else
3708 {
3709 /* 3-byte VEX prefix. */
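      /* Layout: 0xC4 (or 0x8F for XOP), then ~R.~X.~B.mmmmm, then
         W.vvvv.L.pp with vvvv stored inverted.  */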
3710 unsigned int m;
3711
3712 i.vex.length = 3;
3713
3714 switch (i.tm.opcode_modifier.vexopcode)
3715 {
3716 case VEX0F:
3717 m = 0x1;
3718 i.vex.bytes[0] = 0xc4;
3719 break;
3720 case VEX0F38:
3721 m = 0x2;
3722 i.vex.bytes[0] = 0xc4;
3723 break;
3724 case VEX0F3A:
3725 m = 0x3;
3726 i.vex.bytes[0] = 0xc4;
3727 break;
3728 case XOP08:
3729 m = 0x8;
3730 i.vex.bytes[0] = 0x8f;
3731 break;
3732 case XOP09:
3733 m = 0x9;
3734 i.vex.bytes[0] = 0x8f;
3735 break;
3736 case XOP0A:
3737 m = 0xa;
3738 i.vex.bytes[0] = 0x8f;
3739 break;
3740 default:
3741 abort ();
3742 }
3743
3744       /* The high 3 bits of the second VEX byte are the one's complement
3745 of RXB bits from REX. */
3746 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3747
3748 i.vex.bytes[2] = (w << 7
3749 | register_specifier << 3
3750 | vector_length << 2
3751 | implied_prefix);
3752 }
3753 }
3754
3755 static INLINE bfd_boolean
3756 is_evex_encoding (const insn_template *t)
3757 {
3758 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3759 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3760 || t->opcode_modifier.sae;
3761 }
3762
3763 static INLINE bfd_boolean
3764 is_any_vex_encoding (const insn_template *t)
3765 {
3766 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3767 || is_evex_encoding (t);
3768 }
3769
3770 /* Build the EVEX prefix. */
3771
3772 static void
3773 build_evex_prefix (void)
3774 {
3775 unsigned int register_specifier;
3776 unsigned int implied_prefix;
3777 unsigned int m, w;
3778 rex_byte vrex_used = 0;
3779
3780 /* Check register specifier. */
3781 if (i.vex.register_specifier)
3782 {
3783 gas_assert ((i.vrex & REX_X) == 0);
3784
3785 register_specifier = i.vex.register_specifier->reg_num;
3786 if ((i.vex.register_specifier->reg_flags & RegRex))
3787 register_specifier += 8;
3788 /* The upper 16 registers are encoded in the fourth byte of the
3789 EVEX prefix. */
3790 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3791 i.vex.bytes[3] = 0x8;
3792 register_specifier = ~register_specifier & 0xf;
3793 }
3794 else
3795 {
3796 register_specifier = 0xf;
3797
3798 /* Encode upper 16 vector index register in the fourth byte of
3799 the EVEX prefix. */
3800 if (!(i.vrex & REX_X))
3801 i.vex.bytes[3] = 0x8;
3802 else
3803 vrex_used |= REX_X;
3804 }
3805
3806 switch ((i.tm.base_opcode >> 8) & 0xff)
3807 {
3808 case 0:
3809 implied_prefix = 0;
3810 break;
3811 case DATA_PREFIX_OPCODE:
3812 implied_prefix = 1;
3813 break;
3814 case REPE_PREFIX_OPCODE:
3815 implied_prefix = 2;
3816 break;
3817 case REPNE_PREFIX_OPCODE:
3818 implied_prefix = 3;
3819 break;
3820 default:
3821 abort ();
3822 }
3823
3824 /* 4 byte EVEX prefix. */
3825 i.vex.length = 4;
3826 i.vex.bytes[0] = 0x62;
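  /* EVEX layout: 0x62, then P0 = ~R.~X.~B.~R'.00.mm, then
     P1 = W.vvvv.1.pp, then P2 = z.L'L.b.~V'.aaa, all filled in
     below.  */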
3827
3828 /* mmmm bits. */
3829 switch (i.tm.opcode_modifier.vexopcode)
3830 {
3831 case VEX0F:
3832 m = 1;
3833 break;
3834 case VEX0F38:
3835 m = 2;
3836 break;
3837 case VEX0F3A:
3838 m = 3;
3839 break;
3840 default:
3841 abort ();
3842 break;
3843 }
3844
3845   /* The high 3 bits of the second EVEX byte are the one's complement of RXB
3846 bits from REX. */
3847 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3848
3849   /* The fifth bit of the second EVEX byte is the one's complement of the
3850 REX_R bit in VREX. */
3851 if (!(i.vrex & REX_R))
3852 i.vex.bytes[1] |= 0x10;
3853 else
3854 vrex_used |= REX_R;
3855
3856 if ((i.reg_operands + i.imm_operands) == i.operands)
3857 {
3858 /* When all operands are registers, the REX_X bit in REX is not
3859 used. We reuse it to encode the upper 16 registers, which is
3860 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3861 	 as one's complement. */
3862 if ((i.vrex & REX_B))
3863 {
3864 vrex_used |= REX_B;
3865 i.vex.bytes[1] &= ~0x40;
3866 }
3867 }
3868
3869 /* EVEX instructions shouldn't need the REX prefix. */
3870 i.vrex &= ~vrex_used;
3871 gas_assert (i.vrex == 0);
3872
3873 /* Check the REX.W bit and VEXW. */
3874 if (i.tm.opcode_modifier.vexw == VEXWIG)
3875 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3876 else if (i.tm.opcode_modifier.vexw)
3877 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3878 else
3879 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3880
3881 /* Encode the U bit. */
3882 implied_prefix |= 0x4;
3883
3884 /* The third byte of the EVEX prefix. */
3885 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3886
3887 /* The fourth byte of the EVEX prefix. */
3888 /* The zeroing-masking bit. */
3889 if (i.mask && i.mask->zeroing)
3890 i.vex.bytes[3] |= 0x80;
3891
3892   /* The b and L'L bits double as rounding control; only encode the vector length and broadcast bit when there is no RC. */
3893 if (!i.rounding)
3894 {
3895 /* Encode the vector length. */
3896 unsigned int vec_length;
3897
3898 if (!i.tm.opcode_modifier.evex
3899 || i.tm.opcode_modifier.evex == EVEXDYN)
3900 {
3901 unsigned int op;
3902
3903 /* Determine vector length from the last multi-length vector
3904 operand. */
3905 vec_length = 0;
3906 for (op = i.operands; op--;)
3907 if (i.tm.operand_types[op].bitfield.xmmword
3908 + i.tm.operand_types[op].bitfield.ymmword
3909 + i.tm.operand_types[op].bitfield.zmmword > 1)
3910 {
3911 if (i.types[op].bitfield.zmmword)
3912 {
3913 i.tm.opcode_modifier.evex = EVEX512;
3914 break;
3915 }
3916 else if (i.types[op].bitfield.ymmword)
3917 {
3918 i.tm.opcode_modifier.evex = EVEX256;
3919 break;
3920 }
3921 else if (i.types[op].bitfield.xmmword)
3922 {
3923 i.tm.opcode_modifier.evex = EVEX128;
3924 break;
3925 }
3926 else if (i.broadcast && (int) op == i.broadcast->operand)
3927 {
3928 switch (i.broadcast->bytes)
3929 {
3930 case 64:
3931 i.tm.opcode_modifier.evex = EVEX512;
3932 break;
3933 case 32:
3934 i.tm.opcode_modifier.evex = EVEX256;
3935 break;
3936 case 16:
3937 i.tm.opcode_modifier.evex = EVEX128;
3938 break;
3939 default:
3940 abort ();
3941 }
3942 break;
3943 }
3944 }
3945
3946 if (op >= MAX_OPERANDS)
3947 abort ();
3948 }
3949
3950 switch (i.tm.opcode_modifier.evex)
3951 {
3952 case EVEXLIG: /* LL' is ignored */
3953 vec_length = evexlig << 5;
3954 break;
3955 case EVEX128:
3956 vec_length = 0 << 5;
3957 break;
3958 case EVEX256:
3959 vec_length = 1 << 5;
3960 break;
3961 case EVEX512:
3962 vec_length = 2 << 5;
3963 break;
3964 default:
3965 abort ();
3966 break;
3967 }
3968 i.vex.bytes[3] |= vec_length;
3969 /* Encode the broadcast bit. */
3970 if (i.broadcast)
3971 i.vex.bytes[3] |= 0x10;
3972 }
3973 else
3974 {
3975 if (i.rounding->type != saeonly)
3976 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3977 else
3978 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3979 }
3980
3981 if (i.mask && i.mask->mask)
3982 i.vex.bytes[3] |= i.mask->mask->reg_num;
3983 }
3984
3985 static void
3986 process_immext (void)
3987 {
3988 expressionS *exp;
3989
3990 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3991 which is coded in the same place as an 8-bit immediate field
3992 would be. Here we fake an 8-bit immediate operand from the
3993 opcode suffix stored in tm.extension_opcode.
3994
3995      AVX instructions also use this encoding for some of the
3996      3-operand instructions.  */
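  /* E.g. (illustrative): the 3DNow! insn "pfadd %mm1, %mm0" is encoded
     as 0F 0F /r 9E, where the 0x9E suffix kept in tm.extension_opcode
     is emitted as if it were an imm8 operand.  */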
3997
3998 gas_assert (i.imm_operands <= 1
3999 && (i.operands <= 2
4000 || (is_any_vex_encoding (&i.tm)
4001 && i.operands <= 4)));
4002
4003 exp = &im_expressions[i.imm_operands++];
4004 i.op[i.operands].imms = exp;
4005 i.types[i.operands] = imm8;
4006 i.operands++;
4007 exp->X_op = O_constant;
4008 exp->X_add_number = i.tm.extension_opcode;
4009 i.tm.extension_opcode = None;
4010 }
4011
4012
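/* Check that the active HLE prefix is legal for the matched insn.
   E.g. (illustrative): "xacquire lock incl (%rax)" is accepted, while
   "xrelease movl $0, %eax" is rejected because xrelease requires a
   memory destination here.  */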
4013 static int
4014 check_hle (void)
4015 {
4016 switch (i.tm.opcode_modifier.hleprefixok)
4017 {
4018 default:
4019 abort ();
4020 case HLEPrefixNone:
4021 as_bad (_("invalid instruction `%s' after `%s'"),
4022 i.tm.name, i.hle_prefix);
4023 return 0;
4024 case HLEPrefixLock:
4025 if (i.prefix[LOCK_PREFIX])
4026 return 1;
4027 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4028 return 0;
4029 case HLEPrefixAny:
4030 return 1;
4031 case HLEPrefixRelease:
4032 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4033 {
4034 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4035 i.tm.name);
4036 return 0;
4037 }
4038 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4039 {
4040 as_bad (_("memory destination needed for instruction `%s'"
4041 " after `xrelease'"), i.tm.name);
4042 return 0;
4043 }
4044 return 1;
4045 }
4046 }
4047
4048 /* Try the shortest encoding by shortening operand size. */
4049
4050 static void
4051 optimize_encoding (void)
4052 {
4053 unsigned int j;
4054
4055 if (optimize_for_space
4056 && !is_any_vex_encoding (&i.tm)
4057 && i.reg_operands == 1
4058 && i.imm_operands == 1
4059 && !i.types[1].bitfield.byte
4060 && i.op[0].imms->X_op == O_constant
4061 && fits_in_imm7 (i.op[0].imms->X_add_number)
4062 && (i.tm.base_opcode == 0xa8
4063 || (i.tm.base_opcode == 0xf6
4064 && i.tm.extension_opcode == 0x0)))
4065 {
4066 /* Optimize: -Os:
4067 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4068 */
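      /* E.g. (illustrative): "testl $0x40, %eax" (a9 40 00 00 00,
	 5 bytes) becomes "testb $0x40, %al" (a8 40, 2 bytes); with an
	 imm7 mask the resulting flags are identical.  */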
4069 unsigned int base_regnum = i.op[1].regs->reg_num;
4070 if (flag_code == CODE_64BIT || base_regnum < 4)
4071 {
4072 i.types[1].bitfield.byte = 1;
4073 /* Ignore the suffix. */
4074 i.suffix = 0;
4075 /* Convert to byte registers. */
4076 if (i.types[1].bitfield.word)
4077 j = 16;
4078 else if (i.types[1].bitfield.dword)
4079 j = 32;
4080 else
4081 j = 48;
4082 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4083 j += 8;
4084 i.op[1].regs -= j;
4085 }
4086 }
4087 else if (flag_code == CODE_64BIT
4088 && !is_any_vex_encoding (&i.tm)
4089 && ((i.types[1].bitfield.qword
4090 && i.reg_operands == 1
4091 && i.imm_operands == 1
4092 && i.op[0].imms->X_op == O_constant
4093 && ((i.tm.base_opcode == 0xb8
4094 && i.tm.extension_opcode == None
4095 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4096 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4097 && ((i.tm.base_opcode == 0x24
4098 || i.tm.base_opcode == 0xa8)
4099 || (i.tm.base_opcode == 0x80
4100 && i.tm.extension_opcode == 0x4)
4101 || ((i.tm.base_opcode == 0xf6
4102 || (i.tm.base_opcode | 1) == 0xc7)
4103 && i.tm.extension_opcode == 0x0)))
4104 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4105 && i.tm.base_opcode == 0x83
4106 && i.tm.extension_opcode == 0x4)))
4107 || (i.types[0].bitfield.qword
4108 && ((i.reg_operands == 2
4109 && i.op[0].regs == i.op[1].regs
4110 && (i.tm.base_opcode == 0x30
4111 || i.tm.base_opcode == 0x28))
4112 || (i.reg_operands == 1
4113 && i.operands == 1
4114 && i.tm.base_opcode == 0x30)))))
4115 {
4116 /* Optimize: -O:
4117 andq $imm31, %r64 -> andl $imm31, %r32
4118 andq $imm7, %r64 -> andl $imm7, %r32
4119 testq $imm31, %r64 -> testl $imm31, %r32
4120 xorq %r64, %r64 -> xorl %r32, %r32
4121 subq %r64, %r64 -> subl %r32, %r32
4122 movq $imm31, %r64 -> movl $imm31, %r32
4123 movq $imm32, %r64 -> movl $imm32, %r32
4124 */
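      /* E.g. (illustrative): "xorq %rax, %rax" (48 31 c0) becomes
	 "xorl %eax, %eax" (31 c0); the dword write zero-extends, so
	 dropping the REX.W byte changes nothing.  */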
4125 i.tm.opcode_modifier.norex64 = 1;
4126 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4127 {
4128 /* Handle
4129 movq $imm31, %r64 -> movl $imm31, %r32
4130 movq $imm32, %r64 -> movl $imm32, %r32
4131 */
4132 i.tm.operand_types[0].bitfield.imm32 = 1;
4133 i.tm.operand_types[0].bitfield.imm32s = 0;
4134 i.tm.operand_types[0].bitfield.imm64 = 0;
4135 i.types[0].bitfield.imm32 = 1;
4136 i.types[0].bitfield.imm32s = 0;
4137 i.types[0].bitfield.imm64 = 0;
4138 i.types[1].bitfield.dword = 1;
4139 i.types[1].bitfield.qword = 0;
4140 if ((i.tm.base_opcode | 1) == 0xc7)
4141 {
4142 /* Handle
4143 movq $imm31, %r64 -> movl $imm31, %r32
4144 */
4145 i.tm.base_opcode = 0xb8;
4146 i.tm.extension_opcode = None;
4147 i.tm.opcode_modifier.w = 0;
4148 i.tm.opcode_modifier.modrm = 0;
4149 }
4150 }
4151 }
4152 else if (optimize > 1
4153 && !optimize_for_space
4154 && !is_any_vex_encoding (&i.tm)
4155 && i.reg_operands == 2
4156 && i.op[0].regs == i.op[1].regs
4157 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4158 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4159 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4160 {
4161 /* Optimize: -O2:
4162 andb %rN, %rN -> testb %rN, %rN
4163 andw %rN, %rN -> testw %rN, %rN
4164 andq %rN, %rN -> testq %rN, %rN
4165 orb %rN, %rN -> testb %rN, %rN
4166 orw %rN, %rN -> testw %rN, %rN
4167 orq %rN, %rN -> testq %rN, %rN
4168
4169 and outside of 64-bit mode
4170
4171 andl %rN, %rN -> testl %rN, %rN
4172 orl %rN, %rN -> testl %rN, %rN
4173 */
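      /* E.g. (illustrative): "andl %eax, %eax" (21 c0) becomes
	 "testl %eax, %eax" (85 c0); the flag results are the same and
	 test avoids the register write.  */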
4174 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4175 }
4176 else if (i.reg_operands == 3
4177 && i.op[0].regs == i.op[1].regs
4178 && !i.types[2].bitfield.xmmword
4179 && (i.tm.opcode_modifier.vex
4180 || ((!i.mask || i.mask->zeroing)
4181 && !i.rounding
4182 && is_evex_encoding (&i.tm)
4183 && (i.vec_encoding != vex_encoding_evex
4184 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4185 || i.tm.cpu_flags.bitfield.cpuavx512vl
4186 || (i.tm.operand_types[2].bitfield.zmmword
4187 && i.types[2].bitfield.ymmword))))
4188 && ((i.tm.base_opcode == 0x55
4189 || i.tm.base_opcode == 0x6655
4190 || i.tm.base_opcode == 0x66df
4191 || i.tm.base_opcode == 0x57
4192 || i.tm.base_opcode == 0x6657
4193 || i.tm.base_opcode == 0x66ef
4194 || i.tm.base_opcode == 0x66f8
4195 || i.tm.base_opcode == 0x66f9
4196 || i.tm.base_opcode == 0x66fa
4197 || i.tm.base_opcode == 0x66fb
4198 || i.tm.base_opcode == 0x42
4199 || i.tm.base_opcode == 0x6642
4200 || i.tm.base_opcode == 0x47
4201 || i.tm.base_opcode == 0x6647)
4202 && i.tm.extension_opcode == None))
4203 {
4204 /* Optimize: -O1:
4205 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4206 vpsubq and vpsubw:
4207 EVEX VOP %zmmM, %zmmM, %zmmN
4208 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4209 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4210 EVEX VOP %ymmM, %ymmM, %ymmN
4211 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4212 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4213 VEX VOP %ymmM, %ymmM, %ymmN
4214 -> VEX VOP %xmmM, %xmmM, %xmmN
4215 VOP, one of vpandn and vpxor:
4216 VEX VOP %ymmM, %ymmM, %ymmN
4217 -> VEX VOP %xmmM, %xmmM, %xmmN
4218 VOP, one of vpandnd and vpandnq:
4219 EVEX VOP %zmmM, %zmmM, %zmmN
4220 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4221 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4222 EVEX VOP %ymmM, %ymmM, %ymmN
4223 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4224 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4225 VOP, one of vpxord and vpxorq:
4226 EVEX VOP %zmmM, %zmmM, %zmmN
4227 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4228 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4229 EVEX VOP %ymmM, %ymmM, %ymmN
4230 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4231 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4232 VOP, one of kxord and kxorq:
4233 VEX VOP %kM, %kM, %kN
4234 -> VEX kxorw %kM, %kM, %kN
4235 VOP, one of kandnd and kandnq:
4236 VEX VOP %kM, %kM, %kN
4237 -> VEX kandnw %kM, %kM, %kN
4238 */
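      /* E.g. (illustrative): the zeroing idiom "vpxord %zmm1, %zmm1,
	 %zmm1" shrinks to the VEX-encoded "vpxor %xmm1, %xmm1, %xmm1",
	 which clears all of %zmm1 anyway.  */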
4239 if (is_evex_encoding (&i.tm))
4240 {
4241 if (i.vec_encoding != vex_encoding_evex)
4242 {
4243 i.tm.opcode_modifier.vex = VEX128;
4244 i.tm.opcode_modifier.vexw = VEXW0;
4245 i.tm.opcode_modifier.evex = 0;
4246 }
4247 else if (optimize > 1)
4248 i.tm.opcode_modifier.evex = EVEX128;
4249 else
4250 return;
4251 }
4252 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4253 {
4254 i.tm.base_opcode &= 0xff;
4255 i.tm.opcode_modifier.vexw = VEXW0;
4256 }
4257 else
4258 i.tm.opcode_modifier.vex = VEX128;
4259
4260 if (i.tm.opcode_modifier.vex)
4261 for (j = 0; j < 3; j++)
4262 {
4263 i.types[j].bitfield.xmmword = 1;
4264 i.types[j].bitfield.ymmword = 0;
4265 }
4266 }
4267 else if (i.vec_encoding != vex_encoding_evex
4268 && !i.types[0].bitfield.zmmword
4269 && !i.types[1].bitfield.zmmword
4270 && !i.mask
4271 && !i.broadcast
4272 && is_evex_encoding (&i.tm)
4273 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4274 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4275 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4276 || (i.tm.base_opcode & ~4) == 0x66db
4277 || (i.tm.base_opcode & ~4) == 0x66eb)
4278 && i.tm.extension_opcode == None)
4279 {
4280 /* Optimize: -O1:
4281 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4282 vmovdqu32 and vmovdqu64:
4283 EVEX VOP %xmmM, %xmmN
4284 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4285 EVEX VOP %ymmM, %ymmN
4286 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4287 EVEX VOP %xmmM, mem
4288 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4289 EVEX VOP %ymmM, mem
4290 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4291 EVEX VOP mem, %xmmN
4292            -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4293 EVEX VOP mem, %ymmN
4294 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4295 VOP, one of vpand, vpandn, vpor, vpxor:
4296 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4297 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4298 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4299 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4300 EVEX VOP{d,q} mem, %xmmM, %xmmN
4301 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4302 EVEX VOP{d,q} mem, %ymmM, %ymmN
4303 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4304 */
4305 for (j = 0; j < i.operands; j++)
4306 if (operand_type_check (i.types[j], disp)
4307 && i.op[j].disps->X_op == O_constant)
4308 {
4309 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4310 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4311 bytes, we choose EVEX Disp8 over VEX Disp32. */
4312 int evex_disp8, vex_disp8;
4313 unsigned int memshift = i.memshift;
4314 offsetT n = i.op[j].disps->X_add_number;
4315
4316 evex_disp8 = fits_in_disp8 (n);
4317 i.memshift = 0;
4318 vex_disp8 = fits_in_disp8 (n);
4319 if (evex_disp8 != vex_disp8)
4320 {
4321 i.memshift = memshift;
4322 return;
4323 }
4324
4325 i.types[j].bitfield.disp8 = vex_disp8;
4326 break;
4327 }
4328 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4329 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4330 i.tm.opcode_modifier.vex
4331 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4332 i.tm.opcode_modifier.vexw = VEXW0;
4333 /* VPAND, VPOR, and VPXOR are commutative. */
4334 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4335 i.tm.opcode_modifier.commutative = 1;
4336 i.tm.opcode_modifier.evex = 0;
4337 i.tm.opcode_modifier.masking = 0;
4338 i.tm.opcode_modifier.broadcast = 0;
4339 i.tm.opcode_modifier.disp8memshift = 0;
4340 i.memshift = 0;
4341 if (j < i.operands)
4342 i.types[j].bitfield.disp8
4343 = fits_in_disp8 (i.op[j].disps->X_add_number);
4344 }
4345 }
4346
4347 /* Return non-zero for load instruction. */
4348
4349 static int
4350 load_insn_p (void)
4351 {
4352 unsigned int dest;
4353 int any_vex_p = is_any_vex_encoding (&i.tm);
4354 unsigned int base_opcode = i.tm.base_opcode | 1;
4355
4356 if (!any_vex_p)
4357 {
4358 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4359          prefetcht1, prefetcht2, prefetchw, bndmk, bndcl, bndcu, bndcn,
4360 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4361 if (i.tm.opcode_modifier.anysize)
4362 return 0;
4363
4364 /* pop, popf, popa. */
4365 if (strcmp (i.tm.name, "pop") == 0
4366 || i.tm.base_opcode == 0x9d
4367 || i.tm.base_opcode == 0x61)
4368 return 1;
4369
4370 /* movs, cmps, lods, scas. */
4371 if ((i.tm.base_opcode | 0xb) == 0xaf)
4372 return 1;
4373
4374 /* outs, xlatb. */
4375 if (base_opcode == 0x6f
4376 || i.tm.base_opcode == 0xd7)
4377 return 1;
4378       /* NB: AMD-specific insns with implicit memory operands are
4379          intentionally not covered.  */
4380 }
4381
4382 /* No memory operand. */
4383 if (!i.mem_operands)
4384 return 0;
4385
4386 if (any_vex_p)
4387 {
4388 /* vldmxcsr. */
4389 if (i.tm.base_opcode == 0xae
4390 && i.tm.opcode_modifier.vex
4391 && i.tm.opcode_modifier.vexopcode == VEX0F
4392 && i.tm.extension_opcode == 2)
4393 return 1;
4394 }
4395 else
4396 {
4397 /* test, not, neg, mul, imul, div, idiv. */
4398 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4399 && i.tm.extension_opcode != 1)
4400 return 1;
4401
4402 /* inc, dec. */
4403 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4404 return 1;
4405
4406 /* add, or, adc, sbb, and, sub, xor, cmp. */
4407 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4408 return 1;
4409
4410 /* bt, bts, btr, btc. */
4411 if (i.tm.base_opcode == 0xfba
4412 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4413 return 1;
4414
4415 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4416 if ((base_opcode == 0xc1
4417 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4418 && i.tm.extension_opcode != 6)
4419 return 1;
4420
4421 /* cmpxchg8b, cmpxchg16b, xrstors. */
4422 if (i.tm.base_opcode == 0xfc7
4423 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4424 return 1;
4425
4426 /* fxrstor, ldmxcsr, xrstor. */
4427 if (i.tm.base_opcode == 0xfae
4428 && (i.tm.extension_opcode == 1
4429 || i.tm.extension_opcode == 2
4430 || i.tm.extension_opcode == 5))
4431 return 1;
4432
4433 /* lgdt, lidt, lmsw. */
4434 if (i.tm.base_opcode == 0xf01
4435 && (i.tm.extension_opcode == 2
4436 || i.tm.extension_opcode == 3
4437 || i.tm.extension_opcode == 6))
4438 return 1;
4439
4440 /* vmptrld */
4441 if (i.tm.base_opcode == 0xfc7
4442 && i.tm.extension_opcode == 6)
4443 return 1;
4444
4445 /* Check for x87 instructions. */
4446 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4447 {
4448 /* Skip fst, fstp, fstenv, fstcw. */
4449 if (i.tm.base_opcode == 0xd9
4450 && (i.tm.extension_opcode == 2
4451 || i.tm.extension_opcode == 3
4452 || i.tm.extension_opcode == 6
4453 || i.tm.extension_opcode == 7))
4454 return 0;
4455
4456 /* Skip fisttp, fist, fistp, fstp. */
4457 if (i.tm.base_opcode == 0xdb
4458 && (i.tm.extension_opcode == 1
4459 || i.tm.extension_opcode == 2
4460 || i.tm.extension_opcode == 3
4461 || i.tm.extension_opcode == 7))
4462 return 0;
4463
4464 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4465 if (i.tm.base_opcode == 0xdd
4466 && (i.tm.extension_opcode == 1
4467 || i.tm.extension_opcode == 2
4468 || i.tm.extension_opcode == 3
4469 || i.tm.extension_opcode == 6
4470 || i.tm.extension_opcode == 7))
4471 return 0;
4472
4473 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4474 if (i.tm.base_opcode == 0xdf
4475 && (i.tm.extension_opcode == 1
4476 || i.tm.extension_opcode == 2
4477 || i.tm.extension_opcode == 3
4478 || i.tm.extension_opcode == 6
4479 || i.tm.extension_opcode == 7))
4480 return 0;
4481
4482 return 1;
4483 }
4484 }
4485
4486 dest = i.operands - 1;
4487
4488 /* Check fake imm8 operand and 3 source operands. */
4489 if ((i.tm.opcode_modifier.immext
4490 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4491 && i.types[dest].bitfield.imm8)
4492 dest--;
4493
4494 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4495 if (!any_vex_p
4496 && (base_opcode == 0x1
4497 || base_opcode == 0x9
4498 || base_opcode == 0x11
4499 || base_opcode == 0x19
4500 || base_opcode == 0x21
4501 || base_opcode == 0x29
4502 || base_opcode == 0x31
4503 || base_opcode == 0x39
4504 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4505 || base_opcode == 0xfc1))
4506 return 1;
4507
4508 /* Check for load instruction. */
4509 return (i.types[dest].bitfield.class != ClassNone
4510 || i.types[dest].bitfield.instance == Accum);
4511 }
4512
4513 /* Output lfence (0x0f 0xae 0xe8) after the instruction.  */
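/* E.g. (illustrative), with -mlfence-after-load=yes:
     movq (%rdi), %rax   ->   movq (%rdi), %rax
                              lfence                */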
4514
4515 static void
4516 insert_lfence_after (void)
4517 {
4518 if (lfence_after_load && load_insn_p ())
4519 {
4520 /* There are also two REP string instructions that require
4521 special treatment. Specifically, the compare string (CMPS)
4522 and scan string (SCAS) instructions set EFLAGS in a manner
4523 that depends on the data being compared/scanned. When used
4524 with a REP prefix, the number of iterations may therefore
4525 vary depending on this data. If the data is a program secret
4526 chosen by the adversary using an LVI method,
4527 then this data-dependent behavior may leak some aspect
4528 of the secret. */
4529 if (((i.tm.base_opcode | 0x1) == 0xa7
4530 || (i.tm.base_opcode | 0x1) == 0xaf)
4531 && i.prefix[REP_PREFIX])
4532 {
4533 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4534 i.tm.name);
4535 }
4536 char *p = frag_more (3);
4537 *p++ = 0xf;
4538 *p++ = 0xae;
4539 *p = 0xe8;
4540 }
4541 }
4542
4543 /* Output lfence (0x0f 0xae 0xe8) before the instruction.  */
4544
4545 static void
4546 insert_lfence_before (void)
4547 {
4548 char *p;
4549
4550 if (is_any_vex_encoding (&i.tm))
4551 return;
4552
4553 if (i.tm.base_opcode == 0xff
4554 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4555 {
4556 /* Insert lfence before indirect branch if needed. */
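      /* E.g. (illustrative), with -mlfence-before-indirect-branch=register
	 and no -mlfence-after-load:
	   call *%rax   ->   lfence; call *%rax  */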
4557
4558 if (lfence_before_indirect_branch == lfence_branch_none)
4559 return;
4560
4561 if (i.operands != 1)
4562 abort ();
4563
4564 if (i.reg_operands == 1)
4565 {
4566 /* Indirect branch via register. Don't insert lfence with
4567 -mlfence-after-load=yes. */
4568 if (lfence_after_load
4569 || lfence_before_indirect_branch == lfence_branch_memory)
4570 return;
4571 }
4572 else if (i.mem_operands == 1
4573 && lfence_before_indirect_branch != lfence_branch_register)
4574 {
4575 as_warn (_("indirect `%s` with memory operand should be avoided"),
4576 i.tm.name);
4577 return;
4578 }
4579 else
4580 return;
4581
4582 if (last_insn.kind != last_insn_other
4583 && last_insn.seg == now_seg)
4584 {
4585 as_warn_where (last_insn.file, last_insn.line,
4586 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4587 last_insn.name, i.tm.name);
4588 return;
4589 }
4590
4591 p = frag_more (3);
4592 *p++ = 0xf;
4593 *p++ = 0xae;
4594 *p = 0xe8;
4595 return;
4596 }
4597
4598 /* Output or/not/shl and lfence before near ret. */
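  /* E.g. (illustrative), with -mlfence-before-ret=or in 64-bit code:
       ret   ->   orq $0x0, (%rsp); lfence; ret  */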
4599 if (lfence_before_ret != lfence_before_ret_none
4600 && (i.tm.base_opcode == 0xc2
4601 || i.tm.base_opcode == 0xc3))
4602 {
4603 if (last_insn.kind != last_insn_other
4604 && last_insn.seg == now_seg)
4605 {
4606 as_warn_where (last_insn.file, last_insn.line,
4607 _("`%s` skips -mlfence-before-ret on `%s`"),
4608 last_insn.name, i.tm.name);
4609 return;
4610 }
4611
4612       /* A near ret ignores the operand size override under CPU64.  */
4613 char prefix = flag_code == CODE_64BIT
4614 ? 0x48
4615 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4616
4617 if (lfence_before_ret == lfence_before_ret_not)
4618 {
4619 /* not: 0xf71424, may add prefix
4620 for operand size override or 64-bit code. */
4621 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4622 if (prefix)
4623 *p++ = prefix;
4624 *p++ = 0xf7;
4625 *p++ = 0x14;
4626 *p++ = 0x24;
4627 if (prefix)
4628 *p++ = prefix;
4629 *p++ = 0xf7;
4630 *p++ = 0x14;
4631 *p++ = 0x24;
4632 }
4633 else
4634 {
4635 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4636 if (prefix)
4637 *p++ = prefix;
4638 if (lfence_before_ret == lfence_before_ret_or)
4639 {
4640 /* or: 0x830c2400, may add prefix
4641 for operand size override or 64-bit code. */
4642 *p++ = 0x83;
4643 *p++ = 0x0c;
4644 }
4645 else
4646 {
4647 /* shl: 0xc1242400, may add prefix
4648 for operand size override or 64-bit code. */
4649 *p++ = 0xc1;
4650 *p++ = 0x24;
4651 }
4652
4653 *p++ = 0x24;
4654 *p++ = 0x0;
4655 }
4656
4657 *p++ = 0xf;
4658 *p++ = 0xae;
4659 *p = 0xe8;
4660 }
4661 }
4662
4663 /* This is the guts of the machine-dependent assembler. LINE points to a
4664 machine dependent instruction. This function is supposed to emit
4665 the frags/bytes it assembles to. */
4666
4667 void
4668 md_assemble (char *line)
4669 {
4670 unsigned int j;
4671 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4672 const insn_template *t;
4673
4674 /* Initialize globals. */
4675 memset (&i, '\0', sizeof (i));
4676 for (j = 0; j < MAX_OPERANDS; j++)
4677 i.reloc[j] = NO_RELOC;
4678 memset (disp_expressions, '\0', sizeof (disp_expressions));
4679 memset (im_expressions, '\0', sizeof (im_expressions));
4680 save_stack_p = save_stack;
4681
4682 /* First parse an instruction mnemonic & call i386_operand for the operands.
4683 We assume that the scrubber has arranged it so that line[0] is the valid
4684 start of a (possibly prefixed) mnemonic. */
4685
4686 line = parse_insn (line, mnemonic);
4687 if (line == NULL)
4688 return;
4689 mnem_suffix = i.suffix;
4690
4691 line = parse_operands (line, mnemonic);
4692 this_operand = -1;
4693 xfree (i.memop1_string);
4694 i.memop1_string = NULL;
4695 if (line == NULL)
4696 return;
4697
4698 /* Now we've parsed the mnemonic into a set of templates, and have the
4699 operands at hand. */
4700
4701 /* All Intel opcodes have reversed operands except for "bound", "enter",
4702 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4703 intersegment "jmp" and "call" instructions with 2 immediate operands so
4704 that the immediate segment precedes the offset, as it does when in AT&T
4705 mode. */
4706 if (intel_syntax
4707 && i.operands > 1
4708 && (strcmp (mnemonic, "bound") != 0)
4709 && (strcmp (mnemonic, "invlpga") != 0)
4710 && (strncmp (mnemonic, "monitor", 7) != 0)
4711 && (strncmp (mnemonic, "mwait", 5) != 0)
4712 && (strcmp (mnemonic, "tpause") != 0)
4713 && (strcmp (mnemonic, "umwait") != 0)
4714 && !(operand_type_check (i.types[0], imm)
4715 && operand_type_check (i.types[1], imm)))
4716 swap_operands ();
4717
4718   /* The order of the immediates should be reversed for the
4719      2-immediate extrq and insertq instructions.  */
4720 if (i.imm_operands == 2
4721 && (strcmp (mnemonic, "extrq") == 0
4722 || strcmp (mnemonic, "insertq") == 0))
4723 swap_2_operands (0, 1);
4724
4725 if (i.imm_operands)
4726 optimize_imm ();
4727
4728 /* Don't optimize displacement for movabs since it only takes 64bit
4729 displacement. */
4730 if (i.disp_operands
4731 && i.disp_encoding != disp_encoding_32bit
4732 && (flag_code != CODE_64BIT
4733 || strcmp (mnemonic, "movabs") != 0))
4734 optimize_disp ();
4735
4736 /* Next, we find a template that matches the given insn,
4737 making sure the overlap of the given operands types is consistent
4738 with the template operand types. */
4739
4740 if (!(t = match_template (mnem_suffix)))
4741 return;
4742
4743 if (sse_check != check_none
4744 && !i.tm.opcode_modifier.noavx
4745 && !i.tm.cpu_flags.bitfield.cpuavx
4746 && !i.tm.cpu_flags.bitfield.cpuavx512f
4747 && (i.tm.cpu_flags.bitfield.cpusse
4748 || i.tm.cpu_flags.bitfield.cpusse2
4749 || i.tm.cpu_flags.bitfield.cpusse3
4750 || i.tm.cpu_flags.bitfield.cpussse3
4751 || i.tm.cpu_flags.bitfield.cpusse4_1
4752 || i.tm.cpu_flags.bitfield.cpusse4_2
4753 || i.tm.cpu_flags.bitfield.cpusse4a
4754 || i.tm.cpu_flags.bitfield.cpupclmul
4755 || i.tm.cpu_flags.bitfield.cpuaes
4756 || i.tm.cpu_flags.bitfield.cpusha
4757 || i.tm.cpu_flags.bitfield.cpugfni))
4758 {
4759 (sse_check == check_warning
4760 ? as_warn
4761 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4762 }
4763
4764 if (i.tm.opcode_modifier.fwait)
4765 if (!add_prefix (FWAIT_OPCODE))
4766 return;
4767
4768 /* Check if REP prefix is OK. */
4769 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4770 {
4771 as_bad (_("invalid instruction `%s' after `%s'"),
4772 i.tm.name, i.rep_prefix);
4773 return;
4774 }
4775
4776 /* Check for lock without a lockable instruction. Destination operand
4777 must be memory unless it is xchg (0x86). */
4778 if (i.prefix[LOCK_PREFIX]
4779 && (!i.tm.opcode_modifier.islockable
4780 || i.mem_operands == 0
4781 || (i.tm.base_opcode != 0x86
4782 && !(i.flags[i.operands - 1] & Operand_Mem))))
4783 {
4784 as_bad (_("expecting lockable instruction after `lock'"));
4785 return;
4786 }
4787
4788 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4789 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4790 {
4791 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4792 return;
4793 }
4794
4795 /* Check if HLE prefix is OK. */
4796 if (i.hle_prefix && !check_hle ())
4797 return;
4798
4799 /* Check BND prefix. */
4800 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4801 as_bad (_("expecting valid branch instruction after `bnd'"));
4802
4803 /* Check NOTRACK prefix. */
4804 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4805 as_bad (_("expecting indirect branch instruction after `notrack'"));
4806
4807 if (i.tm.cpu_flags.bitfield.cpumpx)
4808 {
4809 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4810 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4811 else if (flag_code != CODE_16BIT
4812 ? i.prefix[ADDR_PREFIX]
4813 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4814 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4815 }
4816
4817 /* Insert BND prefix. */
4818 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4819 {
4820 if (!i.prefix[BND_PREFIX])
4821 add_prefix (BND_PREFIX_OPCODE);
4822 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4823 {
4824 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4825 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4826 }
4827 }
4828
4829 /* Check string instruction segment overrides. */
4830 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4831 {
4832 gas_assert (i.mem_operands);
4833 if (!check_string ())
4834 return;
4835 i.disp_operands = 0;
4836 }
4837
4838 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4839 optimize_encoding ();
4840
4841 if (!process_suffix ())
4842 return;
4843
4844 /* Update operand types. */
4845 for (j = 0; j < i.operands; j++)
4846 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4847
4848 /* Make still unresolved immediate matches conform to size of immediate
4849 given in i.suffix. */
4850 if (!finalize_imm ())
4851 return;
4852
4853 if (i.types[0].bitfield.imm1)
4854 i.imm_operands = 0; /* kludge for shift insns. */
4855
4856 /* We only need to check those implicit registers for instructions
4857 with 3 operands or less. */
4858 if (i.operands <= 3)
4859 for (j = 0; j < i.operands; j++)
4860 if (i.types[j].bitfield.instance != InstanceNone
4861 && !i.types[j].bitfield.xmmword)
4862 i.reg_operands--;
4863
4864 /* ImmExt should be processed after SSE2AVX. */
4865 if (!i.tm.opcode_modifier.sse2avx
4866 && i.tm.opcode_modifier.immext)
4867 process_immext ();
4868
4869 /* For insns with operands there are more diddles to do to the opcode. */
4870 if (i.operands)
4871 {
4872 if (!process_operands ())
4873 return;
4874 }
4875 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4876 {
4877 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4878 as_warn (_("translating to `%sp'"), i.tm.name);
4879 }
4880
4881 if (is_any_vex_encoding (&i.tm))
4882 {
4883 if (!cpu_arch_flags.bitfield.cpui286)
4884 {
4885 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4886 i.tm.name);
4887 return;
4888 }
4889
4890 if (i.tm.opcode_modifier.vex)
4891 build_vex_prefix (t);
4892 else
4893 build_evex_prefix ();
4894 }
4895
4896 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4897 instructions may define INT_OPCODE as well, so avoid this corner
4898 case for those instructions that use MODRM. */
4899 if (i.tm.base_opcode == INT_OPCODE
4900 && !i.tm.opcode_modifier.modrm
4901 && i.op[0].imms->X_add_number == 3)
4902 {
4903 i.tm.base_opcode = INT3_OPCODE;
4904 i.imm_operands = 0;
4905 }
4906
4907 if ((i.tm.opcode_modifier.jump == JUMP
4908 || i.tm.opcode_modifier.jump == JUMP_BYTE
4909 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4910 && i.op[0].disps->X_op == O_constant)
4911 {
4912 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4913 the absolute address given by the constant. Since ix86 jumps and
4914 calls are pc relative, we need to generate a reloc. */
4915 i.op[0].disps->X_add_symbol = &abs_symbol;
4916 i.op[0].disps->X_op = O_symbol;
4917 }
4918
4919   /* For 8 bit registers we need an empty rex prefix.  Also if the
4920      instruction already has a REX prefix, we need to convert legacy
4921      byte registers to their REX forms.  */
4922
4923 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4924 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4925 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4926 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4927 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4928 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4929 && i.rex != 0))
4930 {
4931 int x;
4932
4933 i.rex |= REX_OPCODE;
4934 for (x = 0; x < 2; x++)
4935 {
4936 /* Look for 8 bit operand that uses old registers. */
4937 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4938 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4939 {
4940 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4941 /* In case it is "hi" register, give up. */
4942 if (i.op[x].regs->reg_num > 3)
4943 as_bad (_("can't encode register '%s%s' in an "
4944 "instruction requiring REX prefix."),
4945 register_prefix, i.op[x].regs->reg_name);
4946
4947 /* Otherwise it is equivalent to the extended register.
4948 		 Since the encoding doesn't change, this is merely
4949 cosmetic cleanup for debug output. */
4950
4951 i.op[x].regs = i.op[x].regs + 8;
4952 }
4953 }
4954 }
4955
4956 if (i.rex == 0 && i.rex_encoding)
4957 {
4958       /* Check if we can add a REX_OPCODE byte.  Look for an 8 bit operand
4959 	 that uses a legacy register.  If it is a "hi" register, don't add
4960 the REX_OPCODE byte. */
4961 int x;
4962 for (x = 0; x < 2; x++)
4963 if (i.types[x].bitfield.class == Reg
4964 && i.types[x].bitfield.byte
4965 && (i.op[x].regs->reg_flags & RegRex64) == 0
4966 && i.op[x].regs->reg_num > 3)
4967 {
4968 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4969 i.rex_encoding = FALSE;
4970 break;
4971 }
4972
4973 if (i.rex_encoding)
4974 i.rex = REX_OPCODE;
4975 }
4976
4977 if (i.rex != 0)
4978 add_prefix (REX_OPCODE | i.rex);
4979
4980 insert_lfence_before ();
4981
4982 /* We are ready to output the insn. */
4983 output_insn ();
4984
4985 insert_lfence_after ();
4986
4987 last_insn.seg = now_seg;
4988
4989 if (i.tm.opcode_modifier.isprefix)
4990 {
4991 last_insn.kind = last_insn_prefix;
4992 last_insn.name = i.tm.name;
4993 last_insn.file = as_where (&last_insn.line);
4994 }
4995 else
4996 last_insn.kind = last_insn_other;
4997 }
4998
4999 static char *
5000 parse_insn (char *line, char *mnemonic)
5001 {
5002 char *l = line;
5003 char *token_start = l;
5004 char *mnem_p;
5005 int supported;
5006 const insn_template *t;
5007 char *dot_p = NULL;
5008
5009 while (1)
5010 {
5011 mnem_p = mnemonic;
5012 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5013 {
5014 if (*mnem_p == '.')
5015 dot_p = mnem_p;
5016 mnem_p++;
5017 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5018 {
5019 as_bad (_("no such instruction: `%s'"), token_start);
5020 return NULL;
5021 }
5022 l++;
5023 }
5024 if (!is_space_char (*l)
5025 && *l != END_OF_INSN
5026 && (intel_syntax
5027 || (*l != PREFIX_SEPARATOR
5028 && *l != ',')))
5029 {
5030 as_bad (_("invalid character %s in mnemonic"),
5031 output_invalid (*l));
5032 return NULL;
5033 }
5034 if (token_start == l)
5035 {
5036 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5037 as_bad (_("expecting prefix; got nothing"));
5038 else
5039 as_bad (_("expecting mnemonic; got nothing"));
5040 return NULL;
5041 }
5042
5043 /* Look up instruction (or prefix) via hash table. */
5044 current_templates = (const templates *) hash_find (op_hash, mnemonic);
5045
5046 if (*l != END_OF_INSN
5047 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5048 && current_templates
5049 && current_templates->start->opcode_modifier.isprefix)
5050 {
5051 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5052 {
5053 as_bad ((flag_code != CODE_64BIT
5054 ? _("`%s' is only supported in 64-bit mode")
5055 : _("`%s' is not supported in 64-bit mode")),
5056 current_templates->start->name);
5057 return NULL;
5058 }
5059 /* If we are in 16-bit mode, do not allow addr16 or data16.
5060 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5061 if ((current_templates->start->opcode_modifier.size == SIZE16
5062 || current_templates->start->opcode_modifier.size == SIZE32)
5063 && flag_code != CODE_64BIT
5064 && ((current_templates->start->opcode_modifier.size == SIZE32)
5065 ^ (flag_code == CODE_16BIT)))
5066 {
5067 as_bad (_("redundant %s prefix"),
5068 current_templates->start->name);
5069 return NULL;
5070 }
5071 if (current_templates->start->opcode_length == 0)
5072 {
5073 /* Handle pseudo prefixes. */
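		  /* A pseudo prefix is written right before the mnemonic,
		     e.g. (illustrative):
		       {vex3} vpaddd %xmm1, %xmm2, %xmm3
		       {disp32} movl 4(%rax), %ebx  */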
5074 switch (current_templates->start->base_opcode)
5075 {
5076 case 0x0:
5077 /* {disp8} */
5078 i.disp_encoding = disp_encoding_8bit;
5079 break;
5080 case 0x1:
5081 /* {disp32} */
5082 i.disp_encoding = disp_encoding_32bit;
5083 break;
5084 case 0x2:
5085 /* {load} */
5086 i.dir_encoding = dir_encoding_load;
5087 break;
5088 case 0x3:
5089 /* {store} */
5090 i.dir_encoding = dir_encoding_store;
5091 break;
5092 case 0x4:
5093 /* {vex} */
5094 i.vec_encoding = vex_encoding_vex;
5095 break;
5096 case 0x5:
5097 /* {vex3} */
5098 i.vec_encoding = vex_encoding_vex3;
5099 break;
5100 case 0x6:
5101 /* {evex} */
5102 i.vec_encoding = vex_encoding_evex;
5103 break;
5104 case 0x7:
5105 /* {rex} */
5106 i.rex_encoding = TRUE;
5107 break;
5108 case 0x8:
5109 /* {nooptimize} */
5110 i.no_optimize = TRUE;
5111 break;
5112 default:
5113 abort ();
5114 }
5115 }
5116 else
5117 {
5118 /* Add prefix, checking for repeated prefixes. */
5119 switch (add_prefix (current_templates->start->base_opcode))
5120 {
5121 case PREFIX_EXIST:
5122 return NULL;
5123 case PREFIX_DS:
5124 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5125 i.notrack_prefix = current_templates->start->name;
5126 break;
5127 case PREFIX_REP:
5128 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5129 i.hle_prefix = current_templates->start->name;
5130 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5131 i.bnd_prefix = current_templates->start->name;
5132 else
5133 i.rep_prefix = current_templates->start->name;
5134 break;
5135 default:
5136 break;
5137 }
5138 }
5139 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5140 token_start = ++l;
5141 }
5142 else
5143 break;
5144 }
5145
5146 if (!current_templates)
5147 {
5148       /* Deprecated functionality (new code should use pseudo-prefixes instead):
5149          Check if we should swap operands or force a 32bit displacement in
5150          the encoding.  */
5151 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5152 i.dir_encoding = dir_encoding_swap;
5153 else if (mnem_p - 3 == dot_p
5154 && dot_p[1] == 'd'
5155 && dot_p[2] == '8')
5156 i.disp_encoding = disp_encoding_8bit;
5157 else if (mnem_p - 4 == dot_p
5158 && dot_p[1] == 'd'
5159 && dot_p[2] == '3'
5160 && dot_p[3] == '2')
5161 i.disp_encoding = disp_encoding_32bit;
5162 else
5163 goto check_suffix;
5164 mnem_p = dot_p;
5165 *dot_p = '\0';
5166 current_templates = (const templates *) hash_find (op_hash, mnemonic);
5167 }
5168
5169 if (!current_templates)
5170 {
5171 check_suffix:
5172 if (mnem_p > mnemonic)
5173 {
5174 /* See if we can get a match by trimming off a suffix. */
5175 switch (mnem_p[-1])
5176 {
5177 case WORD_MNEM_SUFFIX:
5178 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5179 i.suffix = SHORT_MNEM_SUFFIX;
5180 else
5181 /* Fall through. */
5182 case BYTE_MNEM_SUFFIX:
5183 case QWORD_MNEM_SUFFIX:
5184 i.suffix = mnem_p[-1];
5185 mnem_p[-1] = '\0';
5186 current_templates = (const templates *) hash_find (op_hash,
5187 mnemonic);
5188 break;
5189 case SHORT_MNEM_SUFFIX:
5190 case LONG_MNEM_SUFFIX:
5191 if (!intel_syntax)
5192 {
5193 i.suffix = mnem_p[-1];
5194 mnem_p[-1] = '\0';
5195 current_templates = (const templates *) hash_find (op_hash,
5196 mnemonic);
5197 }
5198 break;
5199
5200 /* Intel Syntax. */
5201 case 'd':
5202 if (intel_syntax)
5203 {
5204 if (intel_float_operand (mnemonic) == 1)
5205 i.suffix = SHORT_MNEM_SUFFIX;
5206 else
5207 i.suffix = LONG_MNEM_SUFFIX;
5208 mnem_p[-1] = '\0';
5209 current_templates = (const templates *) hash_find (op_hash,
5210 mnemonic);
5211 }
5212 break;
5213 }
5214 }
5215
5216 if (!current_templates)
5217 {
5218 as_bad (_("no such instruction: `%s'"), token_start);
5219 return NULL;
5220 }
5221 }
5222
5223 if (current_templates->start->opcode_modifier.jump == JUMP
5224 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5225 {
5226 /* Check for a branch hint. We allow ",pt" and ",pn" for
5227 predict taken and predict not taken respectively.
5228 I'm not sure that branch hints actually do anything on loop
5229 and jcxz insns (JumpByte) for current Pentium4 chips. They
5230 may work in the future and it doesn't hurt to accept them
5231 now. */
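      /* E.g. (illustrative): "jne,pt target" adds the 0x3e (DS) prefix
	 and "jne,pn target" the 0x2e (CS) one.  */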
5232 if (l[0] == ',' && l[1] == 'p')
5233 {
5234 if (l[2] == 't')
5235 {
5236 if (!add_prefix (DS_PREFIX_OPCODE))
5237 return NULL;
5238 l += 3;
5239 }
5240 else if (l[2] == 'n')
5241 {
5242 if (!add_prefix (CS_PREFIX_OPCODE))
5243 return NULL;
5244 l += 3;
5245 }
5246 }
5247 }
5248 /* Any other comma loses. */
5249 if (*l == ',')
5250 {
5251 as_bad (_("invalid character %s in mnemonic"),
5252 output_invalid (*l));
5253 return NULL;
5254 }
5255
5256 /* Check if instruction is supported on specified architecture. */
5257 supported = 0;
5258 for (t = current_templates->start; t < current_templates->end; ++t)
5259 {
5260 supported |= cpu_flags_match (t);
5261 if (supported == CPU_FLAGS_PERFECT_MATCH)
5262 {
5263 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5264 as_warn (_("use .code16 to ensure correct addressing mode"));
5265
5266 return l;
5267 }
5268 }
5269
5270 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5271 as_bad (flag_code == CODE_64BIT
5272 ? _("`%s' is not supported in 64-bit mode")
5273 : _("`%s' is only supported in 64-bit mode"),
5274 current_templates->start->name);
5275 else
5276 as_bad (_("`%s' is not supported on `%s%s'"),
5277 current_templates->start->name,
5278 cpu_arch_name ? cpu_arch_name : default_arch,
5279 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5280
5281 return NULL;
5282 }
5283
5284 static char *
5285 parse_operands (char *l, const char *mnemonic)
5286 {
5287 char *token_start;
5288
5289 /* 1 if operand is pending after ','. */
5290 unsigned int expecting_operand = 0;
5291
5292 /* Non-zero if operand parens not balanced. */
5293 unsigned int paren_not_balanced;
5294
5295 while (*l != END_OF_INSN)
5296 {
5297 /* Skip optional white space before operand. */
5298 if (is_space_char (*l))
5299 ++l;
5300 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5301 {
5302 as_bad (_("invalid character %s before operand %d"),
5303 output_invalid (*l),
5304 i.operands + 1);
5305 return NULL;
5306 }
5307 token_start = l; /* After white space. */
5308 paren_not_balanced = 0;
5309 while (paren_not_balanced || *l != ',')
5310 {
5311 if (*l == END_OF_INSN)
5312 {
5313 if (paren_not_balanced)
5314 {
5315 if (!intel_syntax)
5316 as_bad (_("unbalanced parenthesis in operand %d."),
5317 i.operands + 1);
5318 else
5319 as_bad (_("unbalanced brackets in operand %d."),
5320 i.operands + 1);
5321 return NULL;
5322 }
5323 else
5324 break; /* we are done */
5325 }
5326 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5327 {
5328 as_bad (_("invalid character %s in operand %d"),
5329 output_invalid (*l),
5330 i.operands + 1);
5331 return NULL;
5332 }
5333 if (!intel_syntax)
5334 {
5335 if (*l == '(')
5336 ++paren_not_balanced;
5337 if (*l == ')')
5338 --paren_not_balanced;
5339 }
5340 else
5341 {
5342 if (*l == '[')
5343 ++paren_not_balanced;
5344 if (*l == ']')
5345 --paren_not_balanced;
5346 }
5347 l++;
5348 }
5349 if (l != token_start)
5350 { /* Yes, we've read in another operand. */
5351 unsigned int operand_ok;
5352 this_operand = i.operands++;
5353 if (i.operands > MAX_OPERANDS)
5354 {
5355 as_bad (_("spurious operands; (%d operands/instruction max)"),
5356 MAX_OPERANDS);
5357 return NULL;
5358 }
5359 i.types[this_operand].bitfield.unspecified = 1;
5360 /* Now parse operand adding info to 'i' as we go along. */
5361 END_STRING_AND_SAVE (l);
5362
5363 if (i.mem_operands > 1)
5364 {
5365 as_bad (_("too many memory references for `%s'"),
5366 mnemonic);
5367 return 0;
5368 }
5369
5370 if (intel_syntax)
5371 operand_ok =
5372 i386_intel_operand (token_start,
5373 intel_float_operand (mnemonic));
5374 else
5375 operand_ok = i386_att_operand (token_start);
5376
5377 RESTORE_END_STRING (l);
5378 if (!operand_ok)
5379 return NULL;
5380 }
5381 else
5382 {
5383 if (expecting_operand)
5384 {
5385 expecting_operand_after_comma:
5386 as_bad (_("expecting operand after ','; got nothing"));
5387 return NULL;
5388 }
5389 if (*l == ',')
5390 {
5391 as_bad (_("expecting operand before ','; got nothing"));
5392 return NULL;
5393 }
5394 }
5395
5396 /* Now *l must be either ',' or END_OF_INSN. */
5397 if (*l == ',')
5398 {
5399 if (*++l == END_OF_INSN)
5400 {
5401 	      /* The comma has been skipped; nothing follows it, so complain.  */
5402 goto expecting_operand_after_comma;
5403 }
5404 expecting_operand = 1;
5405 }
5406 }
5407 return l;
5408 }
5409
5410 static void
5411 swap_2_operands (int xchg1, int xchg2)
5412 {
5413 union i386_op temp_op;
5414 i386_operand_type temp_type;
5415 unsigned int temp_flags;
5416 enum bfd_reloc_code_real temp_reloc;
5417
5418 temp_type = i.types[xchg2];
5419 i.types[xchg2] = i.types[xchg1];
5420 i.types[xchg1] = temp_type;
5421
5422 temp_flags = i.flags[xchg2];
5423 i.flags[xchg2] = i.flags[xchg1];
5424 i.flags[xchg1] = temp_flags;
5425
5426 temp_op = i.op[xchg2];
5427 i.op[xchg2] = i.op[xchg1];
5428 i.op[xchg1] = temp_op;
5429
5430 temp_reloc = i.reloc[xchg2];
5431 i.reloc[xchg2] = i.reloc[xchg1];
5432 i.reloc[xchg1] = temp_reloc;
5433
5434 if (i.mask)
5435 {
5436 if (i.mask->operand == xchg1)
5437 i.mask->operand = xchg2;
5438 else if (i.mask->operand == xchg2)
5439 i.mask->operand = xchg1;
5440 }
5441 if (i.broadcast)
5442 {
5443 if (i.broadcast->operand == xchg1)
5444 i.broadcast->operand = xchg2;
5445 else if (i.broadcast->operand == xchg2)
5446 i.broadcast->operand = xchg1;
5447 }
5448 if (i.rounding)
5449 {
5450 if (i.rounding->operand == xchg1)
5451 i.rounding->operand = xchg2;
5452 else if (i.rounding->operand == xchg2)
5453 i.rounding->operand = xchg1;
5454 }
5455 }
5456
5457 static void
5458 swap_operands (void)
5459 {
5460 switch (i.operands)
5461 {
5462 case 5:
5463 case 4:
5464 swap_2_operands (1, i.operands - 2);
5465 /* Fall through. */
5466 case 3:
5467 case 2:
5468 swap_2_operands (0, i.operands - 1);
5469 break;
5470 default:
5471 abort ();
5472 }
5473
5474 if (i.mem_operands == 2)
5475 {
5476 const seg_entry *temp_seg;
5477 temp_seg = i.seg[0];
5478 i.seg[0] = i.seg[1];
5479 i.seg[1] = temp_seg;
5480 }
5481 }
5482
5483 /* Try to ensure constant immediates are represented in the smallest
5484 opcode possible. */
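/* E.g. (illustrative): classifying $3 as Imm8S lets "addl $3, %eax"
   match the sign-extended imm8 form (83 c0 03) instead of the imm32
   form (05 03 00 00 00).  */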
5485 static void
5486 optimize_imm (void)
5487 {
5488 char guess_suffix = 0;
5489 int op;
5490
5491 if (i.suffix)
5492 guess_suffix = i.suffix;
5493 else if (i.reg_operands)
5494 {
5495 /* Figure out a suffix from the last register operand specified.
5496 We can't do this properly yet, i.e. excluding special register
5497 instances, but the following works for instructions with
5498 immediates. In any case, we can't set i.suffix yet. */
5499 for (op = i.operands; --op >= 0;)
5500 if (i.types[op].bitfield.class != Reg)
5501 continue;
5502 else if (i.types[op].bitfield.byte)
5503 {
5504 guess_suffix = BYTE_MNEM_SUFFIX;
5505 break;
5506 }
5507 else if (i.types[op].bitfield.word)
5508 {
5509 guess_suffix = WORD_MNEM_SUFFIX;
5510 break;
5511 }
5512 else if (i.types[op].bitfield.dword)
5513 {
5514 guess_suffix = LONG_MNEM_SUFFIX;
5515 break;
5516 }
5517 else if (i.types[op].bitfield.qword)
5518 {
5519 guess_suffix = QWORD_MNEM_SUFFIX;
5520 break;
5521 }
5522 }
5523 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5524 guess_suffix = WORD_MNEM_SUFFIX;
5525
5526 for (op = i.operands; --op >= 0;)
5527 if (operand_type_check (i.types[op], imm))
5528 {
5529 switch (i.op[op].imms->X_op)
5530 {
5531 case O_constant:
5532 /* If a suffix is given, this operand may be shortened. */
5533 switch (guess_suffix)
5534 {
5535 case LONG_MNEM_SUFFIX:
5536 i.types[op].bitfield.imm32 = 1;
5537 i.types[op].bitfield.imm64 = 1;
5538 break;
5539 case WORD_MNEM_SUFFIX:
5540 i.types[op].bitfield.imm16 = 1;
5541 i.types[op].bitfield.imm32 = 1;
5542 i.types[op].bitfield.imm32s = 1;
5543 i.types[op].bitfield.imm64 = 1;
5544 break;
5545 case BYTE_MNEM_SUFFIX:
5546 i.types[op].bitfield.imm8 = 1;
5547 i.types[op].bitfield.imm8s = 1;
5548 i.types[op].bitfield.imm16 = 1;
5549 i.types[op].bitfield.imm32 = 1;
5550 i.types[op].bitfield.imm32s = 1;
5551 i.types[op].bitfield.imm64 = 1;
5552 break;
5553 }
5554
5555 /* If this operand is at most 16 bits, convert it
5556 to a signed 16 bit number before trying to see
5557 whether it will fit in an even smaller size.
5558 This allows a 16-bit operand such as $0xffe0 to
5559 be recognised as within Imm8S range. */
5560 if ((i.types[op].bitfield.imm16)
5561 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5562 {
5563 i.op[op].imms->X_add_number =
5564 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5565 }
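	      /* Worked example (illustrative): $0xffe0 with a 'w' suffix
		 gives (0xffe0 ^ 0x8000) - 0x8000 = -0x20, which fits
		 Imm8S for smallest_imm_type below.  */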
5566 #ifdef BFD64
5567 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5568 if ((i.types[op].bitfield.imm32)
5569 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5570 == 0))
5571 {
5572 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5573 ^ ((offsetT) 1 << 31))
5574 - ((offsetT) 1 << 31));
5575 }
5576 #endif
5577 i.types[op]
5578 = operand_type_or (i.types[op],
5579 smallest_imm_type (i.op[op].imms->X_add_number));
5580
5581 /* We must avoid matching of Imm32 templates when 64bit
5582 only immediate is available. */
5583 if (guess_suffix == QWORD_MNEM_SUFFIX)
5584 i.types[op].bitfield.imm32 = 0;
5585 break;
5586
5587 case O_absent:
5588 case O_register:
5589 abort ();
5590
5591 /* Symbols and expressions. */
5592 default:
5593 /* Convert symbolic operand to proper sizes for matching, but don't
5594 prevent matching a set of insns that only supports sizes other
5595 than those matching the insn suffix. */
5596 {
5597 i386_operand_type mask, allowed;
5598 const insn_template *t;
5599
5600 operand_type_set (&mask, 0);
5601 operand_type_set (&allowed, 0);
5602
5603 for (t = current_templates->start;
5604 t < current_templates->end;
5605 ++t)
5606 {
5607 allowed = operand_type_or (allowed, t->operand_types[op]);
5608 allowed = operand_type_and (allowed, anyimm);
5609 }
5610 switch (guess_suffix)
5611 {
5612 case QWORD_MNEM_SUFFIX:
5613 mask.bitfield.imm64 = 1;
5614 mask.bitfield.imm32s = 1;
5615 break;
5616 case LONG_MNEM_SUFFIX:
5617 mask.bitfield.imm32 = 1;
5618 break;
5619 case WORD_MNEM_SUFFIX:
5620 mask.bitfield.imm16 = 1;
5621 break;
5622 case BYTE_MNEM_SUFFIX:
5623 mask.bitfield.imm8 = 1;
5624 break;
5625 default:
5626 break;
5627 }
5628 allowed = operand_type_and (mask, allowed);
5629 if (!operand_type_all_zero (&allowed))
5630 i.types[op] = operand_type_and (i.types[op], mask);
5631 }
5632 break;
5633 }
5634 }
5635 }
5636
5637 /* Try to use the smallest displacement type too. */
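/* E.g. (illustrative): "movl 0x7f(%rax), %ebx" can then use a single
   disp8 byte rather than a 4-byte disp32.  */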
5638 static void
5639 optimize_disp (void)
5640 {
5641 int op;
5642
5643 for (op = i.operands; --op >= 0;)
5644 if (operand_type_check (i.types[op], disp))
5645 {
5646 if (i.op[op].disps->X_op == O_constant)
5647 {
5648 offsetT op_disp = i.op[op].disps->X_add_number;
5649
5650 if (i.types[op].bitfield.disp16
5651 && (op_disp & ~(offsetT) 0xffff) == 0)
5652 {
5653 /* If this operand is at most 16 bits, convert
5654 to a signed 16 bit number and don't use 64bit
5655 displacement. */
5656 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5657 i.types[op].bitfield.disp64 = 0;
5658 }
5659 #ifdef BFD64
5660 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5661 if (i.types[op].bitfield.disp32
5662 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5663 {
5664 /* If this operand is at most 32 bits, convert
5665 to a signed 32 bit number and don't use 64bit
5666 displacement. */
5667 op_disp &= (((offsetT) 2 << 31) - 1);
5668 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5669 i.types[op].bitfield.disp64 = 0;
5670 }
5671 #endif
5672 if (!op_disp && i.types[op].bitfield.baseindex)
5673 {
5674 i.types[op].bitfield.disp8 = 0;
5675 i.types[op].bitfield.disp16 = 0;
5676 i.types[op].bitfield.disp32 = 0;
5677 i.types[op].bitfield.disp32s = 0;
5678 i.types[op].bitfield.disp64 = 0;
5679 i.op[op].disps = 0;
5680 i.disp_operands--;
5681 }
5682 else if (flag_code == CODE_64BIT)
5683 {
5684 if (fits_in_signed_long (op_disp))
5685 {
5686 i.types[op].bitfield.disp64 = 0;
5687 i.types[op].bitfield.disp32s = 1;
5688 }
5689 if (i.prefix[ADDR_PREFIX]
5690 && fits_in_unsigned_long (op_disp))
5691 i.types[op].bitfield.disp32 = 1;
5692 }
5693 if ((i.types[op].bitfield.disp32
5694 || i.types[op].bitfield.disp32s
5695 || i.types[op].bitfield.disp16)
5696 && fits_in_disp8 (op_disp))
5697 i.types[op].bitfield.disp8 = 1;
5698 }
5699 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5700 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5701 {
5702 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5703 i.op[op].disps, 0, i.reloc[op]);
5704 i.types[op].bitfield.disp8 = 0;
5705 i.types[op].bitfield.disp16 = 0;
5706 i.types[op].bitfield.disp32 = 0;
5707 i.types[op].bitfield.disp32s = 0;
5708 i.types[op].bitfield.disp64 = 0;
5709 }
5710 else
5711 /* We only support 64bit displacement on constants. */
5712 i.types[op].bitfield.disp64 = 0;
5713 }
5714 }
5715
5716 /* Return 1 if there is a match in broadcast bytes between operand
5717 GIVEN and instruction template T. */
5718
5719 static INLINE int
5720 match_broadcast_size (const insn_template *t, unsigned int given)
5721 {
5722 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5723 && i.types[given].bitfield.byte)
5724 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5725 && i.types[given].bitfield.word)
5726 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5727 && i.types[given].bitfield.dword)
5728 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5729 && i.types[given].bitfield.qword));
5730 }
5731
5732 /* Check if operands are valid for the instruction. */
5733
5734 static int
5735 check_VecOperands (const insn_template *t)
5736 {
5737 unsigned int op;
5738 i386_cpu_flags cpu;
5739
5740 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5741      any one operand are implicitly requiring AVX512VL support if the actual
5742 operand size is YMMword or XMMword. Since this function runs after
5743 template matching, there's no need to check for YMMword/XMMword in
5744 the template. */
5745 cpu = cpu_flags_and (t->cpu_flags, avx512);
5746 if (!cpu_flags_all_zero (&cpu)
5747 && !t->cpu_flags.bitfield.cpuavx512vl
5748 && !cpu_arch_flags.bitfield.cpuavx512vl)
5749 {
5750 for (op = 0; op < t->operands; ++op)
5751 {
5752 if (t->operand_types[op].bitfield.zmmword
5753 && (i.types[op].bitfield.ymmword
5754 || i.types[op].bitfield.xmmword))
5755 {
5756 i.error = unsupported;
5757 return 1;
5758 }
5759 }
5760 }
5761
5762 /* Without VSIB byte, we can't have a vector register for index. */
5763 if (!t->opcode_modifier.vecsib
5764 && i.index_reg
5765 && (i.index_reg->reg_type.bitfield.xmmword
5766 || i.index_reg->reg_type.bitfield.ymmword
5767 || i.index_reg->reg_type.bitfield.zmmword))
5768 {
5769 i.error = unsupported_vector_index_register;
5770 return 1;
5771 }
5772
5773 /* Check if default mask is allowed. */
5774 if (t->opcode_modifier.nodefmask
5775 && (!i.mask || i.mask->mask->reg_num == 0))
5776 {
5777 i.error = no_default_mask;
5778 return 1;
5779 }
5780
5781 /* For VSIB byte, we need a vector register for index, and all vector
5782 registers must be distinct. */
5783 if (t->opcode_modifier.vecsib)
5784 {
5785 if (!i.index_reg
5786 || !((t->opcode_modifier.vecsib == VecSIB128
5787 && i.index_reg->reg_type.bitfield.xmmword)
5788 || (t->opcode_modifier.vecsib == VecSIB256
5789 && i.index_reg->reg_type.bitfield.ymmword)
5790 || (t->opcode_modifier.vecsib == VecSIB512
5791 && i.index_reg->reg_type.bitfield.zmmword)))
5792 {
5793 i.error = invalid_vsib_address;
5794 return 1;
5795 }
5796
5797 gas_assert (i.reg_operands == 2 || i.mask);
5798 if (i.reg_operands == 2 && !i.mask)
5799 {
5800 gas_assert (i.types[0].bitfield.class == RegSIMD);
5801 gas_assert (i.types[0].bitfield.xmmword
5802 || i.types[0].bitfield.ymmword);
5803 gas_assert (i.types[2].bitfield.class == RegSIMD);
5804 gas_assert (i.types[2].bitfield.xmmword
5805 || i.types[2].bitfield.ymmword);
5806 if (operand_check == check_none)
5807 return 0;
5808 if (register_number (i.op[0].regs)
5809 != register_number (i.index_reg)
5810 && register_number (i.op[2].regs)
5811 != register_number (i.index_reg)
5812 && register_number (i.op[0].regs)
5813 != register_number (i.op[2].regs))
5814 return 0;
5815 if (operand_check == check_error)
5816 {
5817 i.error = invalid_vector_register_set;
5818 return 1;
5819 }
5820 as_warn (_("mask, index, and destination registers should be distinct"));
5821 }
5822 else if (i.reg_operands == 1 && i.mask)
5823 {
5824 if (i.types[1].bitfield.class == RegSIMD
5825 && (i.types[1].bitfield.xmmword
5826 || i.types[1].bitfield.ymmword
5827 || i.types[1].bitfield.zmmword)
5828 && (register_number (i.op[1].regs)
5829 == register_number (i.index_reg)))
5830 {
5831 if (operand_check == check_error)
5832 {
5833 i.error = invalid_vector_register_set;
5834 return 1;
5835 }
5836 if (operand_check != check_none)
5837 as_warn (_("index and destination registers should be distinct"));
5838 }
5839 }
5840 }
5841
5842 /* Check if broadcast is supported by the instruction and is applied
5843 to the memory operand. */
5844 if (i.broadcast)
5845 {
5846 i386_operand_type type, overlap;
5847
5848 /* Check if specified broadcast is supported in this instruction,
5849 and its broadcast bytes match the memory operand. */
5850 op = i.broadcast->operand;
5851 if (!t->opcode_modifier.broadcast
5852 || !(i.flags[op] & Operand_Mem)
5853 || (!i.types[op].bitfield.unspecified
5854 && !match_broadcast_size (t, op)))
5855 {
5856 bad_broadcast:
5857 i.error = unsupported_broadcast;
5858 return 1;
5859 }
5860
5861 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5862 * i.broadcast->type);
5863 operand_type_set (&type, 0);
5864 switch (i.broadcast->bytes)
5865 {
5866 case 2:
5867 type.bitfield.word = 1;
5868 break;
5869 case 4:
5870 type.bitfield.dword = 1;
5871 break;
5872 case 8:
5873 type.bitfield.qword = 1;
5874 break;
5875 case 16:
5876 type.bitfield.xmmword = 1;
5877 break;
5878 case 32:
5879 type.bitfield.ymmword = 1;
5880 break;
5881 case 64:
5882 type.bitfield.zmmword = 1;
5883 break;
5884 default:
5885 goto bad_broadcast;
5886 }
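/* I.e. the broadcast size is the element size scaled by the {1toN}
   multiplier: for "vaddps (%rax){1to16}, %zmm1, %zmm2" that is
   4 * 16 == 64 bytes, ZMMword, which must overlap the template's
   operand type below.  */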
5887
5888 overlap = operand_type_and (type, t->operand_types[op]);
5889 if (t->operand_types[op].bitfield.class == RegSIMD
5890 && t->operand_types[op].bitfield.byte
5891 + t->operand_types[op].bitfield.word
5892 + t->operand_types[op].bitfield.dword
5893 + t->operand_types[op].bitfield.qword > 1)
5894 {
5895 overlap.bitfield.xmmword = 0;
5896 overlap.bitfield.ymmword = 0;
5897 overlap.bitfield.zmmword = 0;
5898 }
5899 if (operand_type_all_zero (&overlap))
5900 goto bad_broadcast;
5901
5902 if (t->opcode_modifier.checkregsize)
5903 {
5904 unsigned int j;
5905
5906 type.bitfield.baseindex = 1;
5907 for (j = 0; j < i.operands; ++j)
5908 {
5909 if (j != op
5910 && !operand_type_register_match (i.types[j],
5911 t->operand_types[j],
5912 type,
5913 t->operand_types[op]))
5914 goto bad_broadcast;
5915 }
5916 }
5917 }
5918 /* If broadcast is supported in this instruction, we need to check that
5919 an operand of one-element size isn't specified without broadcast. */
5920 else if (t->opcode_modifier.broadcast && i.mem_operands)
5921 {
5922 /* Find memory operand. */
5923 for (op = 0; op < i.operands; op++)
5924 if (i.flags[op] & Operand_Mem)
5925 break;
5926 gas_assert (op < i.operands);
5927 /* Check size of the memory operand. */
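/* A one-element memory operand on a broadcast-capable template is only
   meaningful with a {1toN} specifier; e.g. Intel syntax
   "vaddps zmm0, zmm1, DWORD PTR [rax]" is rejected below.  */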
5928 if (match_broadcast_size (t, op))
5929 {
5930 i.error = broadcast_needed;
5931 return 1;
5932 }
5933 }
5934 else
5935 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5936
5937 /* Check if requested masking is supported. */
5938 if (i.mask)
5939 {
5940 switch (t->opcode_modifier.masking)
5941 {
5942 case BOTH_MASKING:
5943 break;
5944 case MERGING_MASKING:
5945 if (i.mask->zeroing)
5946 {
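/* NB: the "case 0:" label below deliberately sits inside this if body:
   templates without any masking support jump straight to the error,
   while merging-only templates fall into it when zeroing masking was
   requested.  */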
5947 case 0:
5948 i.error = unsupported_masking;
5949 return 1;
5950 }
5951 break;
5952 case DYNAMIC_MASKING:
5953 /* Memory destinations allow only merging masking. */
5954 if (i.mask->zeroing && i.mem_operands)
5955 {
5956 /* Find memory operand. */
5957 for (op = 0; op < i.operands; op++)
5958 if (i.flags[op] & Operand_Mem)
5959 break;
5960 gas_assert (op < i.operands);
5961 if (op == i.operands - 1)
5962 {
5963 i.error = unsupported_masking;
5964 return 1;
5965 }
5966 }
5967 break;
5968 default:
5969 abort ();
5970 }
5971 }
5972
5973 /* Check if masking is applied to dest operand. */
5974 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5975 {
5976 i.error = mask_not_on_destination;
5977 return 1;
5978 }
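/* E.g. "vaddps %zmm0, %zmm1, %zmm2{%k1}{z}" is accepted, whereas
   attaching {%k1} to one of the source operands is rejected here.  */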
5979
5980 /* Check RC/SAE. */
5981 if (i.rounding)
5982 {
5983 if (!t->opcode_modifier.sae
5984 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5985 {
5986 i.error = unsupported_rc_sae;
5987 return 1;
5988 }
5989 /* If the instruction has several immediate operands and one of
5990 them is rounding, the rounding operand should be the last
5991 immediate operand. */
5992 if (i.imm_operands > 1
5993 && i.rounding->operand != (int) (i.imm_operands - 1))
5994 {
5995 i.error = rc_sae_operand_not_last_imm;
5996 return 1;
5997 }
5998 }
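/* E.g. a bare "{sae}" operand needs a template with the SAE attribute,
   and a rounding-control form like "vaddps {rn-sae}, %zmm0, %zmm1, %zmm2"
   additionally needs StaticRounding.  */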
5999
6000 /* Check vector Disp8 operand. */
6001 if (t->opcode_modifier.disp8memshift
6002 && i.disp_encoding != disp_encoding_32bit)
6003 {
6004 if (i.broadcast)
6005 i.memshift = t->opcode_modifier.broadcast - 1;
6006 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6007 i.memshift = t->opcode_modifier.disp8memshift;
6008 else
6009 {
6010 const i386_operand_type *type = NULL;
6011
6012 i.memshift = 0;
6013 for (op = 0; op < i.operands; op++)
6014 if (i.flags[op] & Operand_Mem)
6015 {
6016 if (t->opcode_modifier.evex == EVEXLIG)
6017 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6018 else if (t->operand_types[op].bitfield.xmmword
6019 + t->operand_types[op].bitfield.ymmword
6020 + t->operand_types[op].bitfield.zmmword <= 1)
6021 type = &t->operand_types[op];
6022 else if (!i.types[op].bitfield.unspecified)
6023 type = &i.types[op];
6024 }
6025 else if (i.types[op].bitfield.class == RegSIMD
6026 && t->opcode_modifier.evex != EVEXLIG)
6027 {
6028 if (i.types[op].bitfield.zmmword)
6029 i.memshift = 6;
6030 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6031 i.memshift = 5;
6032 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6033 i.memshift = 4;
6034 }
6035
6036 if (type)
6037 {
6038 if (type->bitfield.zmmword)
6039 i.memshift = 6;
6040 else if (type->bitfield.ymmword)
6041 i.memshift = 5;
6042 else if (type->bitfield.xmmword)
6043 i.memshift = 4;
6044 }
6045
6046 /* For the check in fits_in_disp8(). */
6047 if (i.memshift == 0)
6048 i.memshift = -1;
6049 }
6050
6051 for (op = 0; op < i.operands; op++)
6052 if (operand_type_check (i.types[op], disp)
6053 && i.op[op].disps->X_op == O_constant)
6054 {
6055 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6056 {
6057 i.types[op].bitfield.disp8 = 1;
6058 return 0;
6059 }
6060 i.types[op].bitfield.disp8 = 0;
6061 }
6062 }
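/* The net effect is the EVEX compressed displacement: with
   i.memshift == 6 (a full ZMM access), the 0x100 in
   "vmovaps 0x100(%rax), %zmm0" is representable as the single Disp8
   byte 4 (0x100 >> 6).  */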
6063
6064 i.memshift = 0;
6065
6066 return 0;
6067 }
6068
6069 /* Check if operands are valid for the instruction. Update VEX
6070 operand types. */
6071
6072 static int
6073 VEX_check_operands (const insn_template *t)
6074 {
6075 if (i.vec_encoding == vex_encoding_evex)
6076 {
6077 /* This instruction must be encoded with EVEX prefix. */
6078 if (!is_evex_encoding (t))
6079 {
6080 i.error = unsupported;
6081 return 1;
6082 }
6083 return 0;
6084 }
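/* vex_encoding_evex is set by the "{evex}" pseudo prefix; e.g.
   "{evex} vpaddd %xmm0, %xmm1, %xmm2" forces the EVEX form and is
   rejected for insns without one.  */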
6085
6086 if (!t->opcode_modifier.vex)
6087 {
6088 /* This instruction template doesn't have VEX prefix. */
6089 if (i.vec_encoding != vex_encoding_default)
6090 {
6091 i.error = unsupported;
6092 return 1;
6093 }
6094 return 0;
6095 }
6096
6097 /* Check the special Imm4 cases; must be the first operand. */
6098 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6099 {
6100 if (i.op[0].imms->X_op != O_constant
6101 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6102 {
6103 i.error = bad_imm4;
6104 return 1;
6105 }
6106
6107 /* Turn off Imm<N> so that update_imm won't complain. */
6108 operand_type_set (&i.types[0], 0);
6109 }
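/* This covers 5-operand XOP insns such as
   "vpermil2ps $2, %xmm3, %xmm2, %xmm1, %xmm0", where the immediate
   shares its byte with a register number and so must fit in 4 bits.  */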
6110
6111 return 0;
6112 }
6113
6114 static const insn_template *
6115 match_template (char mnem_suffix)
6116 {
6117 /* Points to template once we've found it. */
6118 const insn_template *t;
6119 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6120 i386_operand_type overlap4;
6121 unsigned int found_reverse_match;
6122 i386_opcode_modifier suffix_check;
6123 i386_operand_type operand_types [MAX_OPERANDS];
6124 int addr_prefix_disp;
6125 unsigned int j, size_match, check_register;
6126 enum i386_error specific_error = 0;
6127
6128 #if MAX_OPERANDS != 5
6129 # error "MAX_OPERANDS must be 5."
6130 #endif
6131
6132 found_reverse_match = 0;
6133 addr_prefix_disp = -1;
6134
6135 /* Prepare for mnemonic suffix check. */
6136 memset (&suffix_check, 0, sizeof (suffix_check));
6137 switch (mnem_suffix)
6138 {
6139 case BYTE_MNEM_SUFFIX:
6140 suffix_check.no_bsuf = 1;
6141 break;
6142 case WORD_MNEM_SUFFIX:
6143 suffix_check.no_wsuf = 1;
6144 break;
6145 case SHORT_MNEM_SUFFIX:
6146 suffix_check.no_ssuf = 1;
6147 break;
6148 case LONG_MNEM_SUFFIX:
6149 suffix_check.no_lsuf = 1;
6150 break;
6151 case QWORD_MNEM_SUFFIX:
6152 suffix_check.no_qsuf = 1;
6153 break;
6154 default:
6155 /* NB: In Intel syntax, normally we can check for memory operand
6156 size when there is no mnemonic suffix. But jmp and call have
6157 2 different encodings with Dword memory operand size, one with
6158 No_ldSuf and the other without. i.suffix is set to
6159 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6160 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6161 suffix_check.no_ldsuf = 1;
6162 }
6163
6164 /* Must have right number of operands. */
6165 i.error = number_of_operands_mismatch;
6166
6167 for (t = current_templates->start; t < current_templates->end; t++)
6168 {
6169 addr_prefix_disp = -1;
6170 found_reverse_match = 0;
6171
6172 if (i.operands != t->operands)
6173 continue;
6174
6175 /* Check processor support. */
6176 i.error = unsupported;
6177 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6178 continue;
6179
6180 /* Check AT&T mnemonic. */
6181 i.error = unsupported_with_intel_mnemonic;
6182 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6183 continue;
6184
6185 /* Check AT&T/Intel syntax. */
6186 i.error = unsupported_syntax;
6187 if ((intel_syntax && t->opcode_modifier.attsyntax)
6188 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6189 continue;
6190
6191 /* Check Intel64/AMD64 ISA. */
6192 switch (isa64)
6193 {
6194 default:
6195 /* Default: Don't accept Intel64. */
6196 if (t->opcode_modifier.isa64 == INTEL64)
6197 continue;
6198 break;
6199 case amd64:
6200 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6201 if (t->opcode_modifier.isa64 >= INTEL64)
6202 continue;
6203 break;
6204 case intel64:
6205 /* -mintel64: Don't accept AMD64. */
6206 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6207 continue;
6208 break;
6209 }
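/* E.g. sysenter/sysexit are Intel64-only in 64-bit mode, so their
   64-bit templates are skipped here unless -mintel64 is in effect.  */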
6210
6211 /* Check the suffix. */
6212 i.error = invalid_instruction_suffix;
6213 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6214 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6215 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6216 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6217 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6218 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6219 continue;
6220
6221 size_match = operand_size_match (t);
6222 if (!size_match)
6223 continue;
6224
6225 /* This is intentionally not
6226
6227 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6228
6229 as the case of a missing * on the operand is accepted (perhaps with
6230 a warning, issued further down). */
6231 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6232 {
6233 i.error = operand_type_mismatch;
6234 continue;
6235 }
6236
6237 for (j = 0; j < MAX_OPERANDS; j++)
6238 operand_types[j] = t->operand_types[j];
6239
6240 /* In general, don't allow
6241 - 64-bit operands outside of 64-bit mode,
6242 - 32-bit operands on pre-386. */
6243 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6244 if (((i.suffix == QWORD_MNEM_SUFFIX
6245 && flag_code != CODE_64BIT
6246 && (t->base_opcode != 0x0fc7
6247 || t->extension_opcode != 1 /* cmpxchg8b */))
6248 || (i.suffix == LONG_MNEM_SUFFIX
6249 && !cpu_arch_flags.bitfield.cpui386))
6250 && (intel_syntax
6251 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6252 && !intel_float_operand (t->name))
6253 : intel_float_operand (t->name) != 2)
6254 && (t->operands == i.imm_operands
6255 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6256 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6257 && operand_types[i.imm_operands].bitfield.class != RegMask)
6258 || (operand_types[j].bitfield.class != RegMMX
6259 && operand_types[j].bitfield.class != RegSIMD
6260 && operand_types[j].bitfield.class != RegMask))
6261 && !t->opcode_modifier.vecsib)
6262 continue;
6263
6264 /* Do not verify operands when there are none. */
6265 if (!t->operands)
6266 /* We've found a match; break out of loop. */
6267 break;
6268
6269 if (!t->opcode_modifier.jump
6270 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6271 {
6272 /* There should be only one Disp operand. */
6273 for (j = 0; j < MAX_OPERANDS; j++)
6274 if (operand_type_check (operand_types[j], disp))
6275 break;
6276 if (j < MAX_OPERANDS)
6277 {
6278 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6279
6280 addr_prefix_disp = j;
6281
6282 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6283 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6284 switch (flag_code)
6285 {
6286 case CODE_16BIT:
6287 override = !override;
6288 /* Fall through. */
6289 case CODE_32BIT:
6290 if (operand_types[j].bitfield.disp32
6291 && operand_types[j].bitfield.disp16)
6292 {
6293 operand_types[j].bitfield.disp16 = override;
6294 operand_types[j].bitfield.disp32 = !override;
6295 }
6296 operand_types[j].bitfield.disp32s = 0;
6297 operand_types[j].bitfield.disp64 = 0;
6298 break;
6299
6300 case CODE_64BIT:
6301 if (operand_types[j].bitfield.disp32s
6302 || operand_types[j].bitfield.disp64)
6303 {
6304 operand_types[j].bitfield.disp64 &= !override;
6305 operand_types[j].bitfield.disp32s &= !override;
6306 operand_types[j].bitfield.disp32 = override;
6307 }
6308 operand_types[j].bitfield.disp16 = 0;
6309 break;
6310 }
6311 }
6312 }
6313
6314 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6315 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6316 continue;
6317
6318 /* We check register size if needed. */
6319 if (t->opcode_modifier.checkregsize)
6320 {
6321 check_register = (1 << t->operands) - 1;
6322 if (i.broadcast)
6323 check_register &= ~(1 << i.broadcast->operand);
6324 }
6325 else
6326 check_register = 0;
6327
6328 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6329 switch (t->operands)
6330 {
6331 case 1:
6332 if (!operand_type_match (overlap0, i.types[0]))
6333 continue;
6334 break;
6335 case 2:
6336 /* xchg %eax, %eax is a special case. It is an alias for nop
6337 only in 32bit mode and we can use opcode 0x90. In 64bit
6338 mode, we can't use 0x90 for xchg %eax, %eax since it should
6339 zero-extend %eax to %rax. */
6340 if (flag_code == CODE_64BIT
6341 && t->base_opcode == 0x90
6342 && i.types[0].bitfield.instance == Accum
6343 && i.types[0].bitfield.dword
6344 && i.types[1].bitfield.instance == Accum
6345 && i.types[1].bitfield.dword)
6346 continue;
6347 /* xrelease mov %eax, <disp> is another special case. It must not
6348 match the accumulator-only encoding of mov. */
6349 if (flag_code != CODE_64BIT
6350 && i.hle_prefix
6351 && t->base_opcode == 0xa0
6352 && i.types[0].bitfield.instance == Accum
6353 && (i.flags[1] & Operand_Mem))
6354 continue;
6355 /* Fall through. */
6356
6357 case 3:
6358 if (!(size_match & MATCH_STRAIGHT))
6359 goto check_reverse;
6360 /* Reverse direction of operands if swapping is possible in the first
6361 place (operands need to be symmetric) and
6362 - the load form is requested, and the template is a store form,
6363 - the store form is requested, and the template is a load form,
6364 - the non-default (swapped) form is requested. */
6365 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6366 if (t->opcode_modifier.d && i.reg_operands == i.operands
6367 && !operand_type_all_zero (&overlap1))
6368 switch (i.dir_encoding)
6369 {
6370 case dir_encoding_load:
6371 if (operand_type_check (operand_types[i.operands - 1], anymem)
6372 || t->opcode_modifier.regmem)
6373 goto check_reverse;
6374 break;
6375
6376 case dir_encoding_store:
6377 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6378 && !t->opcode_modifier.regmem)
6379 goto check_reverse;
6380 break;
6381
6382 case dir_encoding_swap:
6383 goto check_reverse;
6384
6385 case dir_encoding_default:
6386 break;
6387 }
6388 /* If we want store form, we skip the current load. */
6389 if ((i.dir_encoding == dir_encoding_store
6390 || i.dir_encoding == dir_encoding_swap)
6391 && i.mem_operands == 0
6392 && t->opcode_modifier.load)
6393 continue;
6394 /* Fall through. */
6395 case 4:
6396 case 5:
6397 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6398 if (!operand_type_match (overlap0, i.types[0])
6399 || !operand_type_match (overlap1, i.types[1])
6400 || ((check_register & 3) == 3
6401 && !operand_type_register_match (i.types[0],
6402 operand_types[0],
6403 i.types[1],
6404 operand_types[1])))
6405 {
6406 /* Check if other direction is valid ... */
6407 if (!t->opcode_modifier.d)
6408 continue;
6409
6410 check_reverse:
6411 if (!(size_match & MATCH_REVERSE))
6412 continue;
6413 /* Try reversing direction of operands. */
6414 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6415 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6416 if (!operand_type_match (overlap0, i.types[0])
6417 || !operand_type_match (overlap1, i.types[i.operands - 1])
6418 || (check_register
6419 && !operand_type_register_match (i.types[0],
6420 operand_types[i.operands - 1],
6421 i.types[i.operands - 1],
6422 operand_types[0])))
6423 {
6424 /* Does not match either direction. */
6425 continue;
6426 }
6427 /* found_reverse_match holds which of D or FloatR
6428 we've found. */
6429 if (!t->opcode_modifier.d)
6430 found_reverse_match = 0;
6431 else if (operand_types[0].bitfield.tbyte)
6432 found_reverse_match = Opcode_FloatD;
6433 else if (operand_types[0].bitfield.xmmword
6434 || operand_types[i.operands - 1].bitfield.xmmword
6435 || operand_types[0].bitfield.class == RegMMX
6436 || operand_types[i.operands - 1].bitfield.class == RegMMX
6437 || is_any_vex_encoding (t))
6438 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6439 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6440 else
6441 found_reverse_match = Opcode_D;
6442 if (t->opcode_modifier.floatr)
6443 found_reverse_match |= Opcode_FloatR;
6444 }
6445 else
6446 {
6447 /* Found a forward 2 operand match here. */
6448 switch (t->operands)
6449 {
6450 case 5:
6451 overlap4 = operand_type_and (i.types[4],
6452 operand_types[4]);
6453 /* Fall through. */
6454 case 4:
6455 overlap3 = operand_type_and (i.types[3],
6456 operand_types[3]);
6457 /* Fall through. */
6458 case 3:
6459 overlap2 = operand_type_and (i.types[2],
6460 operand_types[2]);
6461 break;
6462 }
6463
6464 switch (t->operands)
6465 {
6466 case 5:
6467 if (!operand_type_match (overlap4, i.types[4])
6468 || !operand_type_register_match (i.types[3],
6469 operand_types[3],
6470 i.types[4],
6471 operand_types[4]))
6472 continue;
6473 /* Fall through. */
6474 case 4:
6475 if (!operand_type_match (overlap3, i.types[3])
6476 || ((check_register & 0xa) == 0xa
6477 && !operand_type_register_match (i.types[1],
6478 operand_types[1],
6479 i.types[3],
6480 operand_types[3]))
6481 || ((check_register & 0xc) == 0xc
6482 && !operand_type_register_match (i.types[2],
6483 operand_types[2],
6484 i.types[3],
6485 operand_types[3])))
6486 continue;
6487 /* Fall through. */
6488 case 3:
6489 /* Here we make use of the fact that there are no
6490 reverse match 3 operand instructions. */
6491 if (!operand_type_match (overlap2, i.types[2])
6492 || ((check_register & 5) == 5
6493 && !operand_type_register_match (i.types[0],
6494 operand_types[0],
6495 i.types[2],
6496 operand_types[2]))
6497 || ((check_register & 6) == 6
6498 && !operand_type_register_match (i.types[1],
6499 operand_types[1],
6500 i.types[2],
6501 operand_types[2])))
6502 continue;
6503 break;
6504 }
6505 }
6506 /* Found either forward/reverse 2, 3 or 4 operand match here:
6507 slip through to break. */
6508 }
6509
6510 /* Check if vector and VEX operands are valid. */
6511 if (check_VecOperands (t) || VEX_check_operands (t))
6512 {
6513 specific_error = i.error;
6514 continue;
6515 }
6516
6517 /* We've found a match; break out of loop. */
6518 break;
6519 }
6520
6521 if (t == current_templates->end)
6522 {
6523 /* We found no match. */
6524 const char *err_msg;
6525 switch (specific_error ? specific_error : i.error)
6526 {
6527 default:
6528 abort ();
6529 case operand_size_mismatch:
6530 err_msg = _("operand size mismatch");
6531 break;
6532 case operand_type_mismatch:
6533 err_msg = _("operand type mismatch");
6534 break;
6535 case register_type_mismatch:
6536 err_msg = _("register type mismatch");
6537 break;
6538 case number_of_operands_mismatch:
6539 err_msg = _("number of operands mismatch");
6540 break;
6541 case invalid_instruction_suffix:
6542 err_msg = _("invalid instruction suffix");
6543 break;
6544 case bad_imm4:
6545 err_msg = _("constant doesn't fit in 4 bits");
6546 break;
6547 case unsupported_with_intel_mnemonic:
6548 err_msg = _("unsupported with Intel mnemonic");
6549 break;
6550 case unsupported_syntax:
6551 err_msg = _("unsupported syntax");
6552 break;
6553 case unsupported:
6554 as_bad (_("unsupported instruction `%s'"),
6555 current_templates->start->name);
6556 return NULL;
6557 case invalid_vsib_address:
6558 err_msg = _("invalid VSIB address");
6559 break;
6560 case invalid_vector_register_set:
6561 err_msg = _("mask, index, and destination registers must be distinct");
6562 break;
6563 case unsupported_vector_index_register:
6564 err_msg = _("unsupported vector index register");
6565 break;
6566 case unsupported_broadcast:
6567 err_msg = _("unsupported broadcast");
6568 break;
6569 case broadcast_needed:
6570 err_msg = _("broadcast is needed for operand of such type");
6571 break;
6572 case unsupported_masking:
6573 err_msg = _("unsupported masking");
6574 break;
6575 case mask_not_on_destination:
6576 err_msg = _("mask not on destination operand");
6577 break;
6578 case no_default_mask:
6579 err_msg = _("default mask isn't allowed");
6580 break;
6581 case unsupported_rc_sae:
6582 err_msg = _("unsupported static rounding/sae");
6583 break;
6584 case rc_sae_operand_not_last_imm:
6585 if (intel_syntax)
6586 err_msg = _("RC/SAE operand must precede immediate operands");
6587 else
6588 err_msg = _("RC/SAE operand must follow immediate operands");
6589 break;
6590 case invalid_register_operand:
6591 err_msg = _("invalid register operand");
6592 break;
6593 }
6594 as_bad (_("%s for `%s'"), err_msg,
6595 current_templates->start->name);
6596 return NULL;
6597 }
6598
6599 if (!quiet_warnings)
6600 {
6601 if (!intel_syntax
6602 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6603 as_warn (_("indirect %s without `*'"), t->name);
6604
6605 if (t->opcode_modifier.isprefix
6606 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6607 {
6608 /* Warn them that a data or address size prefix doesn't
6609 affect assembly of the next line of code. */
6610 as_warn (_("stand-alone `%s' prefix"), t->name);
6611 }
6612 }
6613
6614 /* Copy the template we found. */
6615 i.tm = *t;
6616
6617 if (addr_prefix_disp != -1)
6618 i.tm.operand_types[addr_prefix_disp]
6619 = operand_types[addr_prefix_disp];
6620
6621 if (found_reverse_match)
6622 {
6623 /* If we found a reverse match we must alter the opcode direction
6624 bit and clear/flip the regmem modifier one. found_reverse_match
6625 holds bits to change (different for int & float insns). */
6626
6627 i.tm.base_opcode ^= found_reverse_match;
6628
6629 i.tm.operand_types[0] = operand_types[i.operands - 1];
6630 i.tm.operand_types[i.operands - 1] = operand_types[0];
6631
6632 /* Certain SIMD insns have their load forms specified in the opcode
6633 table, and hence we need to _set_ RegMem instead of clearing it.
6634 We need to avoid setting the bit though on insns like KMOVW. */
6635 i.tm.opcode_modifier.regmem
6636 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6637 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6638 && !i.tm.opcode_modifier.regmem;
6639 }
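/* For example, "{store} movaps %xmm1, %xmm2" matches the 0x0f28 load
   template in reverse; the XOR above then flips the direction bit to
   produce the 0x0f29 store form, with operand types swapped to match.  */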
6640
6641 return t;
6642 }
6643
6644 static int
6645 check_string (void)
6646 {
6647 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6648 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6649
6650 if (i.seg[op] != NULL && i.seg[op] != &es)
6651 {
6652 as_bad (_("`%s' operand %u must use `%ses' segment"),
6653 i.tm.name,
6654 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6655 register_prefix);
6656 return 0;
6657 }
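/* E.g. "movsb %ds:(%esi), %ss:(%edi)" is rejected above, since the
   destination of a string move must use %es.  */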
6658
6659 /* There's only ever one segment override allowed per instruction.
6660 This instruction possibly has a legal segment override on the
6661 second operand, so copy the segment to where non-string
6662 instructions store it, allowing common code. */
6663 i.seg[op] = i.seg[1];
6664
6665 return 1;
6666 }
6667
6668 static int
6669 process_suffix (void)
6670 {
6671 /* If matched instruction specifies an explicit instruction mnemonic
6672 suffix, use it. */
6673 if (i.tm.opcode_modifier.size == SIZE16)
6674 i.suffix = WORD_MNEM_SUFFIX;
6675 else if (i.tm.opcode_modifier.size == SIZE32)
6676 i.suffix = LONG_MNEM_SUFFIX;
6677 else if (i.tm.opcode_modifier.size == SIZE64)
6678 i.suffix = QWORD_MNEM_SUFFIX;
6679 else if (i.reg_operands
6680 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6681 && !i.tm.opcode_modifier.addrprefixopreg)
6682 {
6683 unsigned int numop = i.operands;
6684
6685 /* movsx/movzx want only their source operand considered here, for the
6686 ambiguity checking below. The suffix will be replaced afterwards
6687 to represent the destination (register). */
6688 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6689 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6690 --i.operands;
6691
6692 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6693 if (i.tm.base_opcode == 0xf20f38f0
6694 && i.tm.operand_types[1].bitfield.qword)
6695 i.rex |= REX_W;
6696
6697 /* If there's no instruction mnemonic suffix we try to invent one
6698 based on GPR operands. */
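/* E.g. plain "mov $1, %ebx" carries no suffix; the loop below derives
   'l' from the 32-bit destination register, as if "movl" had been
   written.  */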
6699 if (!i.suffix)
6700 {
6701 /* We take i.suffix from the last register operand specified,
6702 Destination register type is more significant than source
6703 register type. crc32 in SSE4.2 prefers source register
6704 type. */
6705 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6706
6707 while (op--)
6708 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6709 || i.tm.operand_types[op].bitfield.instance == Accum)
6710 {
6711 if (i.types[op].bitfield.class != Reg)
6712 continue;
6713 if (i.types[op].bitfield.byte)
6714 i.suffix = BYTE_MNEM_SUFFIX;
6715 else if (i.types[op].bitfield.word)
6716 i.suffix = WORD_MNEM_SUFFIX;
6717 else if (i.types[op].bitfield.dword)
6718 i.suffix = LONG_MNEM_SUFFIX;
6719 else if (i.types[op].bitfield.qword)
6720 i.suffix = QWORD_MNEM_SUFFIX;
6721 else
6722 continue;
6723 break;
6724 }
6725
6726 /* As an exception, movsx/movzx silently default to a byte source
6727 in AT&T mode. */
6728 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6729 && !i.suffix && !intel_syntax)
6730 i.suffix = BYTE_MNEM_SUFFIX;
6731 }
6732 else if (i.suffix == BYTE_MNEM_SUFFIX)
6733 {
6734 if (intel_syntax
6735 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6736 && i.tm.opcode_modifier.no_bsuf)
6737 i.suffix = 0;
6738 else if (!check_byte_reg ())
6739 return 0;
6740 }
6741 else if (i.suffix == LONG_MNEM_SUFFIX)
6742 {
6743 if (intel_syntax
6744 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6745 && i.tm.opcode_modifier.no_lsuf
6746 && !i.tm.opcode_modifier.todword
6747 && !i.tm.opcode_modifier.toqword)
6748 i.suffix = 0;
6749 else if (!check_long_reg ())
6750 return 0;
6751 }
6752 else if (i.suffix == QWORD_MNEM_SUFFIX)
6753 {
6754 if (intel_syntax
6755 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6756 && i.tm.opcode_modifier.no_qsuf
6757 && !i.tm.opcode_modifier.todword
6758 && !i.tm.opcode_modifier.toqword)
6759 i.suffix = 0;
6760 else if (!check_qword_reg ())
6761 return 0;
6762 }
6763 else if (i.suffix == WORD_MNEM_SUFFIX)
6764 {
6765 if (intel_syntax
6766 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6767 && i.tm.opcode_modifier.no_wsuf)
6768 i.suffix = 0;
6769 else if (!check_word_reg ())
6770 return 0;
6771 }
6772 else if (intel_syntax
6773 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6774 /* Do nothing if the instruction is going to ignore the prefix. */
6775 ;
6776 else
6777 abort ();
6778
6779 /* Undo the movsx/movzx change done above. */
6780 i.operands = numop;
6781 }
6782 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6783 && !i.suffix)
6784 {
6785 i.suffix = stackop_size;
6786 if (stackop_size == LONG_MNEM_SUFFIX)
6787 {
6788 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6789 .code16gcc directive to support 16-bit mode with
6790 32-bit address. For IRET without a suffix, generate
6791 16-bit IRET (opcode 0xcf) to return from an interrupt
6792 handler. */
6793 if (i.tm.base_opcode == 0xcf)
6794 {
6795 i.suffix = WORD_MNEM_SUFFIX;
6796 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6797 }
6798 /* Warn about changed behavior for segment register push/pop. */
6799 else if ((i.tm.base_opcode | 1) == 0x07)
6800 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6801 i.tm.name);
6802 }
6803 }
6804 else if (!i.suffix
6805 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6806 || i.tm.opcode_modifier.jump == JUMP_BYTE
6807 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6808 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6809 && i.tm.extension_opcode <= 3)))
6810 {
6811 switch (flag_code)
6812 {
6813 case CODE_64BIT:
6814 if (!i.tm.opcode_modifier.no_qsuf)
6815 {
6816 i.suffix = QWORD_MNEM_SUFFIX;
6817 break;
6818 }
6819 /* Fall through. */
6820 case CODE_32BIT:
6821 if (!i.tm.opcode_modifier.no_lsuf)
6822 i.suffix = LONG_MNEM_SUFFIX;
6823 break;
6824 case CODE_16BIT:
6825 if (!i.tm.opcode_modifier.no_wsuf)
6826 i.suffix = WORD_MNEM_SUFFIX;
6827 break;
6828 }
6829 }
6830
6831 if (!i.suffix
6832 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6833 /* Also cover lret/retf/iret in 64-bit mode. */
6834 || (flag_code == CODE_64BIT
6835 && !i.tm.opcode_modifier.no_lsuf
6836 && !i.tm.opcode_modifier.no_qsuf))
6837 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6838 /* Accept FLDENV et al without suffix. */
6839 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6840 {
6841 unsigned int suffixes, evex = 0;
6842
6843 suffixes = !i.tm.opcode_modifier.no_bsuf;
6844 if (!i.tm.opcode_modifier.no_wsuf)
6845 suffixes |= 1 << 1;
6846 if (!i.tm.opcode_modifier.no_lsuf)
6847 suffixes |= 1 << 2;
6848 if (!i.tm.opcode_modifier.no_ldsuf)
6849 suffixes |= 1 << 3;
6850 if (!i.tm.opcode_modifier.no_ssuf)
6851 suffixes |= 1 << 4;
6852 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6853 suffixes |= 1 << 5;
6854
6855 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6856 also suitable for AT&T syntax mode, it was requested that this be
6857 restricted to just Intel syntax. */
6858 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6859 {
6860 unsigned int op;
6861
6862 for (op = 0; op < i.tm.operands; ++op)
6863 {
6864 if (is_evex_encoding (&i.tm)
6865 && !cpu_arch_flags.bitfield.cpuavx512vl)
6866 {
6867 if (i.tm.operand_types[op].bitfield.ymmword)
6868 i.tm.operand_types[op].bitfield.xmmword = 0;
6869 if (i.tm.operand_types[op].bitfield.zmmword)
6870 i.tm.operand_types[op].bitfield.ymmword = 0;
6871 if (!i.tm.opcode_modifier.evex
6872 || i.tm.opcode_modifier.evex == EVEXDYN)
6873 i.tm.opcode_modifier.evex = EVEX512;
6874 }
6875
6876 if (i.tm.operand_types[op].bitfield.xmmword
6877 + i.tm.operand_types[op].bitfield.ymmword
6878 + i.tm.operand_types[op].bitfield.zmmword < 2)
6879 continue;
6880
6881 /* Any properly sized operand disambiguates the insn. */
6882 if (i.types[op].bitfield.xmmword
6883 || i.types[op].bitfield.ymmword
6884 || i.types[op].bitfield.zmmword)
6885 {
6886 suffixes &= ~(7 << 6);
6887 evex = 0;
6888 break;
6889 }
6890
6891 if ((i.flags[op] & Operand_Mem)
6892 && i.tm.operand_types[op].bitfield.unspecified)
6893 {
6894 if (i.tm.operand_types[op].bitfield.xmmword)
6895 suffixes |= 1 << 6;
6896 if (i.tm.operand_types[op].bitfield.ymmword)
6897 suffixes |= 1 << 7;
6898 if (i.tm.operand_types[op].bitfield.zmmword)
6899 suffixes |= 1 << 8;
6900 if (is_evex_encoding (&i.tm))
6901 evex = EVEX512;
6902 }
6903 }
6904 }
6905
6906 /* Are multiple suffixes / operand sizes allowed? */
6907 if (suffixes & (suffixes - 1))
6908 {
6909 if (intel_syntax
6910 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6911 || operand_check == check_error))
6912 {
6913 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6914 return 0;
6915 }
6916 if (operand_check == check_error)
6917 {
6918 as_bad (_("no instruction mnemonic suffix given and "
6919 "no register operands; can't size `%s'"), i.tm.name);
6920 return 0;
6921 }
6922 if (operand_check == check_warning)
6923 as_warn (_("%s; using default for `%s'"),
6924 intel_syntax
6925 ? _("ambiguous operand size")
6926 : _("no instruction mnemonic suffix given and "
6927 "no register operands"),
6928 i.tm.name);
6929
6930 if (i.tm.opcode_modifier.floatmf)
6931 i.suffix = SHORT_MNEM_SUFFIX;
6932 else if ((i.tm.base_opcode | 8) == 0xfbe
6933 || (i.tm.base_opcode == 0x63
6934 && i.tm.cpu_flags.bitfield.cpu64))
6935 /* handled below */;
6936 else if (evex)
6937 i.tm.opcode_modifier.evex = evex;
6938 else if (flag_code == CODE_16BIT)
6939 i.suffix = WORD_MNEM_SUFFIX;
6940 else if (!i.tm.opcode_modifier.no_lsuf)
6941 i.suffix = LONG_MNEM_SUFFIX;
6942 else
6943 i.suffix = QWORD_MNEM_SUFFIX;
6944 }
6945 }
6946
6947 if ((i.tm.base_opcode | 8) == 0xfbe
6948 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6949 {
6950 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6951 In AT&T syntax, if there is no suffix (warned about above), the default
6952 will be byte extension. */
6953 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6954 i.tm.base_opcode |= 1;
6955
6956 /* For further processing, the suffix should represent the destination
6957 (register). This is already the case when one was used with
6958 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6959 no suffix to begin with. */
6960 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
6961 {
6962 if (i.types[1].bitfield.word)
6963 i.suffix = WORD_MNEM_SUFFIX;
6964 else if (i.types[1].bitfield.qword)
6965 i.suffix = QWORD_MNEM_SUFFIX;
6966 else
6967 i.suffix = LONG_MNEM_SUFFIX;
6968
6969 i.tm.opcode_modifier.w = 0;
6970 }
6971 }
6972
6973 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
6974 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
6975 != (i.tm.operand_types[1].bitfield.class == Reg);
6976
6977 /* Change the opcode based on the operand size given by i.suffix. */
6978 switch (i.suffix)
6979 {
6980 /* Size floating point instruction. */
6981 case LONG_MNEM_SUFFIX:
6982 if (i.tm.opcode_modifier.floatmf)
6983 {
6984 i.tm.base_opcode ^= 4;
6985 break;
6986 }
6987 /* fall through */
6988 case WORD_MNEM_SUFFIX:
6989 case QWORD_MNEM_SUFFIX:
6990 /* It's not a byte, select word/dword operation. */
6991 if (i.tm.opcode_modifier.w)
6992 {
6993 if (i.short_form)
6994 i.tm.base_opcode |= 8;
6995 else
6996 i.tm.base_opcode |= 1;
6997 }
6998 /* fall through */
6999 case SHORT_MNEM_SUFFIX:
7000 /* Now select between word & dword operations via the operand
7001 size prefix, except for instructions that will ignore this
7002 prefix anyway. */
7003 if (i.suffix != QWORD_MNEM_SUFFIX
7004 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7005 && !i.tm.opcode_modifier.floatmf
7006 && !is_any_vex_encoding (&i.tm)
7007 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7008 || (flag_code == CODE_64BIT
7009 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7010 {
7011 unsigned int prefix = DATA_PREFIX_OPCODE;
7012
7013 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7014 prefix = ADDR_PREFIX_OPCODE;
7015
7016 if (!add_prefix (prefix))
7017 return 0;
7018 }
7019
7020 /* Set mode64 for an operand. */
7021 if (i.suffix == QWORD_MNEM_SUFFIX
7022 && flag_code == CODE_64BIT
7023 && !i.tm.opcode_modifier.norex64
7024 && !i.tm.opcode_modifier.vexw
7025 /* Special case for xchg %rax,%rax. It is a NOP and doesn't
7026 need rex64. */
7027 && ! (i.operands == 2
7028 && i.tm.base_opcode == 0x90
7029 && i.tm.extension_opcode == None
7030 && i.types[0].bitfield.instance == Accum
7031 && i.types[0].bitfield.qword
7032 && i.types[1].bitfield.instance == Accum
7033 && i.types[1].bitfield.qword))
7034 i.rex |= REX_W;
7035
7036 break;
7037 }
7038
7039 if (i.tm.opcode_modifier.addrprefixopreg)
7040 {
7041 gas_assert (!i.suffix);
7042 gas_assert (i.reg_operands);
7043
7044 if (i.tm.operand_types[0].bitfield.instance == Accum
7045 || i.operands == 1)
7046 {
7047 /* The address size override prefix changes the size of the
7048 first operand. */
7049 if (flag_code == CODE_64BIT
7050 && i.op[0].regs->reg_type.bitfield.word)
7051 {
7052 as_bad (_("16-bit addressing unavailable for `%s'"),
7053 i.tm.name);
7054 return 0;
7055 }
7056
7057 if ((flag_code == CODE_32BIT
7058 ? i.op[0].regs->reg_type.bitfield.word
7059 : i.op[0].regs->reg_type.bitfield.dword)
7060 && !add_prefix (ADDR_PREFIX_OPCODE))
7061 return 0;
7062 }
7063 else
7064 {
7065 /* Check invalid register operand when the address size override
7066 prefix changes the size of register operands. */
7067 unsigned int op;
7068 enum { need_word, need_dword, need_qword } need;
7069
7070 if (flag_code == CODE_32BIT)
7071 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7072 else if (i.prefix[ADDR_PREFIX])
7073 need = need_dword;
7074 else
7075 need = flag_code == CODE_64BIT ? need_qword : need_word;
7076
7077 for (op = 0; op < i.operands; op++)
7078 {
7079 if (i.types[op].bitfield.class != Reg)
7080 continue;
7081
7082 switch (need)
7083 {
7084 case need_word:
7085 if (i.op[op].regs->reg_type.bitfield.word)
7086 continue;
7087 break;
7088 case need_dword:
7089 if (i.op[op].regs->reg_type.bitfield.dword)
7090 continue;
7091 break;
7092 case need_qword:
7093 if (i.op[op].regs->reg_type.bitfield.qword)
7094 continue;
7095 break;
7096 }
7097
7098 as_bad (_("invalid register operand size for `%s'"),
7099 i.tm.name);
7100 return 0;
7101 }
7102 }
7103 }
7104
7105 return 1;
7106 }
7107
7108 static int
7109 check_byte_reg (void)
7110 {
7111 int op;
7112
7113 for (op = i.operands; --op >= 0;)
7114 {
7115 /* Skip non-register operands. */
7116 if (i.types[op].bitfield.class != Reg)
7117 continue;
7118
7119 /* If this is an eight bit register, it's OK. If it's the 16 or
7120 32 bit version of an eight bit register, we will just use the
7121 low portion, and that's OK too. */
7122 if (i.types[op].bitfield.byte)
7123 continue;
7124
7125 /* I/O port address operands are OK too. */
7126 if (i.tm.operand_types[op].bitfield.instance == RegD
7127 && i.tm.operand_types[op].bitfield.word)
7128 continue;
7129
7130 /* crc32 only wants its source operand checked here. */
7131 if (i.tm.base_opcode == 0xf20f38f0 && op)
7132 continue;
7133
7134 /* Any other register is bad. */
7135 if (i.types[op].bitfield.class == Reg
7136 || i.types[op].bitfield.class == RegMMX
7137 || i.types[op].bitfield.class == RegSIMD
7138 || i.types[op].bitfield.class == SReg
7139 || i.types[op].bitfield.class == RegCR
7140 || i.types[op].bitfield.class == RegDR
7141 || i.types[op].bitfield.class == RegTR)
7142 {
7143 as_bad (_("`%s%s' not allowed with `%s%c'"),
7144 register_prefix,
7145 i.op[op].regs->reg_name,
7146 i.tm.name,
7147 i.suffix);
7148 return 0;
7149 }
7150 }
7151 return 1;
7152 }
7153
7154 static int
7155 check_long_reg (void)
7156 {
7157 int op;
7158
7159 for (op = i.operands; --op >= 0;)
7160 /* Skip non-register operands. */
7161 if (i.types[op].bitfield.class != Reg)
7162 continue;
7163 /* Reject eight bit registers, except where the template requires
7164 them. (eg. movzb) */
7165 else if (i.types[op].bitfield.byte
7166 && (i.tm.operand_types[op].bitfield.class == Reg
7167 || i.tm.operand_types[op].bitfield.instance == Accum)
7168 && (i.tm.operand_types[op].bitfield.word
7169 || i.tm.operand_types[op].bitfield.dword))
7170 {
7171 as_bad (_("`%s%s' not allowed with `%s%c'"),
7172 register_prefix,
7173 i.op[op].regs->reg_name,
7174 i.tm.name,
7175 i.suffix);
7176 return 0;
7177 }
7178 /* Error if the e prefix on a general reg is missing. */
7179 else if (i.types[op].bitfield.word
7180 && (i.tm.operand_types[op].bitfield.class == Reg
7181 || i.tm.operand_types[op].bitfield.instance == Accum)
7182 && i.tm.operand_types[op].bitfield.dword)
7183 {
7184 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7185 register_prefix, i.op[op].regs->reg_name,
7186 i.suffix);
7187 return 0;
7188 }
7189 /* Warn if the r prefix on a general reg is present. */
7190 else if (i.types[op].bitfield.qword
7191 && (i.tm.operand_types[op].bitfield.class == Reg
7192 || i.tm.operand_types[op].bitfield.instance == Accum)
7193 && i.tm.operand_types[op].bitfield.dword)
7194 {
7195 if (intel_syntax
7196 && i.tm.opcode_modifier.toqword
7197 && i.types[0].bitfield.class != RegSIMD)
7198 {
7199 /* Convert to QWORD. We want REX byte. */
7200 i.suffix = QWORD_MNEM_SUFFIX;
7201 }
7202 else
7203 {
7204 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7205 register_prefix, i.op[op].regs->reg_name,
7206 i.suffix);
7207 return 0;
7208 }
7209 }
7210 return 1;
7211 }
7212
7213 static int
7214 check_qword_reg (void)
7215 {
7216 int op;
7217
7218 for (op = i.operands; --op >= 0; )
7219 /* Skip non-register operands. */
7220 if (i.types[op].bitfield.class != Reg)
7221 continue;
7222 /* Reject eight bit registers, except where the template requires
7223 them. (eg. movzb) */
7224 else if (i.types[op].bitfield.byte
7225 && (i.tm.operand_types[op].bitfield.class == Reg
7226 || i.tm.operand_types[op].bitfield.instance == Accum)
7227 && (i.tm.operand_types[op].bitfield.word
7228 || i.tm.operand_types[op].bitfield.dword))
7229 {
7230 as_bad (_("`%s%s' not allowed with `%s%c'"),
7231 register_prefix,
7232 i.op[op].regs->reg_name,
7233 i.tm.name,
7234 i.suffix);
7235 return 0;
7236 }
7237 /* Warn if the r prefix on a general reg is missing. */
7238 else if ((i.types[op].bitfield.word
7239 || i.types[op].bitfield.dword)
7240 && (i.tm.operand_types[op].bitfield.class == Reg
7241 || i.tm.operand_types[op].bitfield.instance == Accum)
7242 && i.tm.operand_types[op].bitfield.qword)
7243 {
7244 /* Prohibit these changes in the 64bit mode, since the
7245 lowering is more complicated. */
7246 if (intel_syntax
7247 && i.tm.opcode_modifier.todword
7248 && i.types[0].bitfield.class != RegSIMD)
7249 {
7250 /* Convert to DWORD. We don't want REX byte. */
7251 i.suffix = LONG_MNEM_SUFFIX;
7252 }
7253 else
7254 {
7255 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7256 register_prefix, i.op[op].regs->reg_name,
7257 i.suffix);
7258 return 0;
7259 }
7260 }
7261 return 1;
7262 }
7263
7264 static int
7265 check_word_reg (void)
7266 {
7267 int op;
7268 for (op = i.operands; --op >= 0;)
7269 /* Skip non-register operands. */
7270 if (i.types[op].bitfield.class != Reg)
7271 continue;
7272 /* Reject eight bit registers, except where the template requires
7273 them. (eg. movzb) */
7274 else if (i.types[op].bitfield.byte
7275 && (i.tm.operand_types[op].bitfield.class == Reg
7276 || i.tm.operand_types[op].bitfield.instance == Accum)
7277 && (i.tm.operand_types[op].bitfield.word
7278 || i.tm.operand_types[op].bitfield.dword))
7279 {
7280 as_bad (_("`%s%s' not allowed with `%s%c'"),
7281 register_prefix,
7282 i.op[op].regs->reg_name,
7283 i.tm.name,
7284 i.suffix);
7285 return 0;
7286 }
7287 /* Error if the e or r prefix on a general reg is present. */
7288 else if ((i.types[op].bitfield.dword
7289 || i.types[op].bitfield.qword)
7290 && (i.tm.operand_types[op].bitfield.class == Reg
7291 || i.tm.operand_types[op].bitfield.instance == Accum)
7292 && i.tm.operand_types[op].bitfield.word)
7293 {
7294 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7295 register_prefix, i.op[op].regs->reg_name,
7296 i.suffix);
7297 return 0;
7298 }
7299 return 1;
7300 }
7301
7302 static int
7303 update_imm (unsigned int j)
7304 {
7305 i386_operand_type overlap = i.types[j];
7306 if ((overlap.bitfield.imm8
7307 || overlap.bitfield.imm8s
7308 || overlap.bitfield.imm16
7309 || overlap.bitfield.imm32
7310 || overlap.bitfield.imm32s
7311 || overlap.bitfield.imm64)
7312 && !operand_type_equal (&overlap, &imm8)
7313 && !operand_type_equal (&overlap, &imm8s)
7314 && !operand_type_equal (&overlap, &imm16)
7315 && !operand_type_equal (&overlap, &imm32)
7316 && !operand_type_equal (&overlap, &imm32s)
7317 && !operand_type_equal (&overlap, &imm64))
7318 {
7319 if (i.suffix)
7320 {
7321 i386_operand_type temp;
7322
7323 operand_type_set (&temp, 0);
7324 if (i.suffix == BYTE_MNEM_SUFFIX)
7325 {
7326 temp.bitfield.imm8 = overlap.bitfield.imm8;
7327 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7328 }
7329 else if (i.suffix == WORD_MNEM_SUFFIX)
7330 temp.bitfield.imm16 = overlap.bitfield.imm16;
7331 else if (i.suffix == QWORD_MNEM_SUFFIX)
7332 {
7333 temp.bitfield.imm64 = overlap.bitfield.imm64;
7334 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7335 }
7336 else
7337 temp.bitfield.imm32 = overlap.bitfield.imm32;
7338 overlap = temp;
7339 }
7340 else if (operand_type_equal (&overlap, &imm16_32_32s)
7341 || operand_type_equal (&overlap, &imm16_32)
7342 || operand_type_equal (&overlap, &imm16_32s))
7343 {
7344 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7345 overlap = imm16;
7346 else
7347 overlap = imm32s;
7348 }
7349 if (!operand_type_equal (&overlap, &imm8)
7350 && !operand_type_equal (&overlap, &imm8s)
7351 && !operand_type_equal (&overlap, &imm16)
7352 && !operand_type_equal (&overlap, &imm32)
7353 && !operand_type_equal (&overlap, &imm32s)
7354 && !operand_type_equal (&overlap, &imm64))
7355 {
7356 as_bad (_("no instruction mnemonic suffix given; "
7357 "can't determine immediate size"));
7358 return 0;
7359 }
7360 }
7361 i.types[j] = overlap;
7362
7363 return 1;
7364 }
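/* E.g. for "mov $0x12, %ax" the constant alone would fit anything from
   Imm8 up; the 'w' suffix derived from %ax makes update_imm narrow this
   to Imm16, so a two-byte immediate is emitted.  */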
7365
7366 static int
7367 finalize_imm (void)
7368 {
7369 unsigned int j, n;
7370
7371 /* Update the first 2 immediate operands. */
7372 n = i.operands > 2 ? 2 : i.operands;
7373 if (n)
7374 {
7375 for (j = 0; j < n; j++)
7376 if (update_imm (j) == 0)
7377 return 0;
7378
7379 /* The 3rd operand can't be immediate operand. */
7380 gas_assert (operand_type_check (i.types[2], imm) == 0);
7381 }
7382
7383 return 1;
7384 }
7385
7386 static int
7387 process_operands (void)
7388 {
7389 /* Default segment register this instruction will use for memory
7390 accesses. 0 means unknown. This is only for optimizing out
7391 unnecessary segment overrides. */
7392 const seg_entry *default_seg = 0;
7393
7394 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7395 {
7396 unsigned int dupl = i.operands;
7397 unsigned int dest = dupl - 1;
7398 unsigned int j;
7399
7400 /* The destination must be an xmm register. */
7401 gas_assert (i.reg_operands
7402 && MAX_OPERANDS > dupl
7403 && operand_type_equal (&i.types[dest], &regxmm));
7404
7405 if (i.tm.operand_types[0].bitfield.instance == Accum
7406 && i.tm.operand_types[0].bitfield.xmmword)
7407 {
7408 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7409 {
7410 /* Keep xmm0 for instructions with VEX prefix and 3
7411 sources. */
7412 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7413 i.tm.operand_types[0].bitfield.class = RegSIMD;
7414 goto duplicate;
7415 }
7416 else
7417 {
7418 /* We remove the first xmm0 and keep the number of
7419 operands unchanged, which in fact duplicates the
7420 destination. */
7421 for (j = 1; j < i.operands; j++)
7422 {
7423 i.op[j - 1] = i.op[j];
7424 i.types[j - 1] = i.types[j];
7425 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7426 i.flags[j - 1] = i.flags[j];
7427 }
7428 }
7429 }
7430 else if (i.tm.opcode_modifier.implicit1stxmm0)
7431 {
7432 gas_assert ((MAX_OPERANDS - 1) > dupl
7433 && (i.tm.opcode_modifier.vexsources
7434 == VEX3SOURCES));
7435
7436 /* Add the implicit xmm0 for instructions with VEX prefix
7437 and 3 sources. */
7438 for (j = i.operands; j > 0; j--)
7439 {
7440 i.op[j] = i.op[j - 1];
7441 i.types[j] = i.types[j - 1];
7442 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7443 i.flags[j] = i.flags[j - 1];
7444 }
7445 i.op[0].regs
7446 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7447 i.types[0] = regxmm;
7448 i.tm.operand_types[0] = regxmm;
7449
7450 i.operands += 2;
7451 i.reg_operands += 2;
7452 i.tm.operands += 2;
7453
7454 dupl++;
7455 dest++;
7456 i.op[dupl] = i.op[dest];
7457 i.types[dupl] = i.types[dest];
7458 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7459 i.flags[dupl] = i.flags[dest];
7460 }
7461 else
7462 {
7463 duplicate:
7464 i.operands++;
7465 i.reg_operands++;
7466 i.tm.operands++;
7467
7468 i.op[dupl] = i.op[dest];
7469 i.types[dupl] = i.types[dest];
7470 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7471 i.flags[dupl] = i.flags[dest];
7472 }
7473
7474 if (i.tm.opcode_modifier.immext)
7475 process_immext ();
7476 }
7477 else if (i.tm.operand_types[0].bitfield.instance == Accum
7478 && i.tm.operand_types[0].bitfield.xmmword)
7479 {
7480 unsigned int j;
7481
7482 for (j = 1; j < i.operands; j++)
7483 {
7484 i.op[j - 1] = i.op[j];
7485 i.types[j - 1] = i.types[j];
7486
7487 /* We need to adjust fields in i.tm since they are used by
7488 build_modrm_byte. */
7489 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7490
7491 i.flags[j - 1] = i.flags[j];
7492 }
7493
7494 i.operands--;
7495 i.reg_operands--;
7496 i.tm.operands--;
7497 }
7498 else if (i.tm.opcode_modifier.implicitquadgroup)
7499 {
7500 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7501
7502 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7503 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7504 regnum = register_number (i.op[1].regs);
7505 first_reg_in_group = regnum & ~3;
7506 last_reg_in_group = first_reg_in_group + 3;
7507 if (regnum != first_reg_in_group)
7508 as_warn (_("source register `%s%s' implicitly denotes"
7509 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7510 register_prefix, i.op[1].regs->reg_name,
7511 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7512 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7513 i.tm.name);
7514 }
7515 else if (i.tm.opcode_modifier.regkludge)
7516 {
7517 /* The imul $imm, %reg instruction is converted into
7518 imul $imm, %reg, %reg, and the clr %reg instruction
7519 is converted into xor %reg, %reg. */
7520
7521 unsigned int first_reg_op;
7522
7523 if (operand_type_check (i.types[0], reg))
7524 first_reg_op = 0;
7525 else
7526 first_reg_op = 1;
7527 /* Pretend we saw the extra register operand. */
7528 gas_assert (i.reg_operands == 1
7529 && i.op[first_reg_op + 1].regs == 0);
7530 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7531 i.types[first_reg_op + 1] = i.types[first_reg_op];
7532 i.operands++;
7533 i.reg_operands++;
7534 }
7535
7536 if (i.tm.opcode_modifier.modrm)
7537 {
7538 /* The opcode is completed (modulo i.tm.extension_opcode which
7539 must be put into the modrm byte). Now, we make the modrm and
7540 index base bytes based on all the info we've collected. */
7541
7542 default_seg = build_modrm_byte ();
7543 }
7544 else if (i.types[0].bitfield.class == SReg)
7545 {
7546 if (flag_code != CODE_64BIT
7547 ? i.tm.base_opcode == POP_SEG_SHORT
7548 && i.op[0].regs->reg_num == 1
7549 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7550 && i.op[0].regs->reg_num < 4)
7551 {
7552 as_bad (_("you can't `%s %s%s'"),
7553 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7554 return 0;
7555 }
7556 if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7557 {
7558 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7559 i.tm.opcode_length = 2;
7560 }
7561 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
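/* E.g. "pop %ss" yields the one-byte 0x17 (0x07 | 2 << 3), while
   "pop %fs" was switched above to the two-byte 0x0f 0xa1 form.  */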
7562 }
7563 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7564 {
7565 default_seg = &ds;
7566 }
7567 else if (i.tm.opcode_modifier.isstring)
7568 {
7569 /* For the string instructions that allow a segment override
7570 on one of their operands, the default segment is ds. */
7571 default_seg = &ds;
7572 }
7573 else if (i.short_form)
7574 {
7575 /* The register or float register operand is in operand
7576 0 or 1. */
7577 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7578
7579 /* Register goes in low 3 bits of opcode. */
7580 i.tm.base_opcode |= i.op[op].regs->reg_num;
7581 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7582 i.rex |= REX_B;
7583 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7584 {
7585 /* Warn about some common errors, but press on regardless.
7586 The first case can be generated by gcc (<= 2.8.1). */
7587 if (i.operands == 2)
7588 {
7589 /* Reversed arguments on faddp, fsubp, etc. */
7590 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7591 register_prefix, i.op[!intel_syntax].regs->reg_name,
7592 register_prefix, i.op[intel_syntax].regs->reg_name);
7593 }
7594 else
7595 {
7596 /* Extraneous `l' suffix on fp insn. */
7597 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7598 register_prefix, i.op[0].regs->reg_name);
7599 }
7600 }
7601 }
7602
7603 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7604 && i.tm.base_opcode == 0x8d /* lea */
7605 && !is_any_vex_encoding (&i.tm))
7606 {
7607 if (!quiet_warnings)
7608 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7609 if (optimize)
7610 {
7611 i.seg[0] = NULL;
7612 i.prefix[SEG_PREFIX] = 0;
7613 }
7614 }
7615
7616 /* If a segment was explicitly specified, and the specified segment
7617 is neither the default nor the one already recorded from a prefix,
7618 use an opcode prefix to select it. If we never figured out what
7619 the default segment is, then default_seg will be zero at this
7620 point, and the specified segment prefix will always be used. */
7621 if (i.seg[0]
7622 && i.seg[0] != default_seg
7623 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7624 {
7625 if (!add_prefix (i.seg[0]->seg_prefix))
7626 return 0;
7627 }
7628 return 1;
7629 }
7630
7631 static const seg_entry *
7632 build_modrm_byte (void)
7633 {
7634 const seg_entry *default_seg = 0;
7635 unsigned int source, dest;
7636 int vex_3_sources;
7637
7638 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7639 if (vex_3_sources)
7640 {
7641 unsigned int nds, reg_slot;
7642 expressionS *exp;
7643
7644 dest = i.operands - 1;
7645 nds = dest - 1;
7646
7647 /* There are 2 kinds of instructions:
7648 1. 5 operands: 4 register operands or 3 register operands
7649 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7650 VexW0 or VexW1. The destination must be either XMM, YMM or
7651 ZMM register.
7652 2. 4 operands: 4 register operands or 3 register operands
7653 plus 1 memory operand, with VexXDS. */
7654 gas_assert ((i.reg_operands == 4
7655 || (i.reg_operands == 3 && i.mem_operands == 1))
7656 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7657 && i.tm.opcode_modifier.vexw
7658 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7659
7660 /* If VexW1 is set, the first non-immediate operand is the source and
7661 the second non-immediate one is encoded in the immediate operand. */
7662 if (i.tm.opcode_modifier.vexw == VEXW1)
7663 {
7664 source = i.imm_operands;
7665 reg_slot = i.imm_operands + 1;
7666 }
7667 else
7668 {
7669 source = i.imm_operands + 1;
7670 reg_slot = i.imm_operands;
7671 }
7672
7673 if (i.imm_operands == 0)
7674 {
7675 /* When there is no immediate operand, generate an 8bit
7676 immediate operand to encode the first operand. */
7677 exp = &im_expressions[i.imm_operands++];
7678 i.op[i.operands].imms = exp;
7679 i.types[i.operands] = imm8;
7680 i.operands++;
7681
7682 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7683 exp->X_op = O_constant;
7684 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7685 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7686 }
7687 else
7688 {
7689 gas_assert (i.imm_operands == 1);
7690 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7691 gas_assert (!i.tm.opcode_modifier.immext);
7692
7693 /* Turn on Imm8 again so that output_imm will generate it. */
7694 i.types[0].bitfield.imm8 = 1;
7695
7696 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7697 i.op[0].imms->X_add_number
7698 |= register_number (i.op[reg_slot].regs) << 4;
7699 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7700 }
7701
7702 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7703 i.vex.register_specifier = i.op[nds].regs;
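/* E.g. for "vblendvps %xmm3, %xmm2, %xmm1, %xmm0" the first source
   (%xmm3) has just been placed in bits 7:4 of the trailing immediate,
   which is also why registers 16-31 (RegVRex) cannot appear there.  */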
7704 }
7705 else
7706 source = dest = 0;
7707
7708 /* i.reg_operands MUST be the number of real register operands;
7709 implicit registers do not count. If there are 3 register
7710 operands, it must be an instruction with VexNDS. For an
7711 instruction with VexNDD, the destination register is encoded
7712 in the VEX prefix. If there are 4 register operands, it must be
7713 an instruction with a VEX prefix and 3 sources. */
7714 if (i.mem_operands == 0
7715 && ((i.reg_operands == 2
7716 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7717 || (i.reg_operands == 3
7718 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7719 || (i.reg_operands == 4 && vex_3_sources)))
7720 {
7721 switch (i.operands)
7722 {
7723 case 2:
7724 source = 0;
7725 break;
7726 case 3:
7727 	  /* When there are 3 operands, one of them may be an immediate,
7728 	     which may be the first or the last operand.  Otherwise,
7729 	     the first operand must be the shift count register (%cl),
7730 	     or it must be an instruction with VexNDS.  */
7731 gas_assert (i.imm_operands == 1
7732 || (i.imm_operands == 0
7733 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7734 || (i.types[0].bitfield.instance == RegC
7735 && i.types[0].bitfield.byte))));
7736 if (operand_type_check (i.types[0], imm)
7737 || (i.types[0].bitfield.instance == RegC
7738 && i.types[0].bitfield.byte))
7739 source = 1;
7740 else
7741 source = 0;
7742 break;
7743 case 4:
7744 	  /* When there are 4 operands, the first two must be 8bit
7745 	     immediate operands.  The source operand will be the 3rd
7746 	     one.
7747 
7748 	     For instructions with VexNDS, if the first operand is
7749 	     an imm8, the source operand is the 2nd one.  If the last
7750 	     operand is imm8, the source operand is the first one.  */
7751 gas_assert ((i.imm_operands == 2
7752 && i.types[0].bitfield.imm8
7753 && i.types[1].bitfield.imm8)
7754 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7755 && i.imm_operands == 1
7756 && (i.types[0].bitfield.imm8
7757 || i.types[i.operands - 1].bitfield.imm8
7758 || i.rounding)));
7759 if (i.imm_operands == 2)
7760 source = 2;
7761 else
7762 {
7763 if (i.types[0].bitfield.imm8)
7764 source = 1;
7765 else
7766 source = 0;
7767 }
7768 break;
7769 case 5:
7770 if (is_evex_encoding (&i.tm))
7771 {
7772 	      /* For EVEX instructions, when there are 5 operands, the
7773 		 first one must be an immediate operand.  If the second one
7774 		 is an immediate operand, the source operand is the 3rd
7775 		 one.  If the last one is an immediate operand, the source
7776 		 operand is the 2nd one.  */
7777 gas_assert (i.imm_operands == 2
7778 && i.tm.opcode_modifier.sae
7779 && operand_type_check (i.types[0], imm));
7780 if (operand_type_check (i.types[1], imm))
7781 source = 2;
7782 else if (operand_type_check (i.types[4], imm))
7783 source = 1;
7784 else
7785 abort ();
7786 }
7787 break;
7788 default:
7789 abort ();
7790 }
7791
7792 if (!vex_3_sources)
7793 {
7794 dest = source + 1;
7795
7796 	  /* The RC/SAE operand could sit between DEST and SRC.  That
7797 	     happens when one operand is a GPR and the other one is an
7798 	     XMM/YMM/ZMM register.  */
7799 if (i.rounding && i.rounding->operand == (int) dest)
7800 dest++;
7801
7802 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7803 {
7804 /* For instructions with VexNDS, the register-only source
7805 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7806 register. It is encoded in VEX prefix. */
7807
7808 i386_operand_type op;
7809 unsigned int vvvv;
7810
7811 /* Check register-only source operand when two source
7812 operands are swapped. */
7813 if (!i.tm.operand_types[source].bitfield.baseindex
7814 && i.tm.operand_types[dest].bitfield.baseindex)
7815 {
7816 vvvv = source;
7817 source = dest;
7818 }
7819 else
7820 vvvv = dest;
7821
7822 op = i.tm.operand_types[vvvv];
7823 if ((dest + 1) >= i.operands
7824 || ((op.bitfield.class != Reg
7825 || (!op.bitfield.dword && !op.bitfield.qword))
7826 && op.bitfield.class != RegSIMD
7827 && !operand_type_equal (&op, &regmask)))
7828 abort ();
7829 i.vex.register_specifier = i.op[vvvv].regs;
7830 dest++;
7831 }
7832 }
7833
7834 i.rm.mode = 3;
7835 /* One of the register operands will be encoded in the i.rm.reg
7836 field, the other in the combined i.rm.mode and i.rm.regmem
7837 fields. If no form of this instruction supports a memory
7838 destination operand, then we assume the source operand may
7839 sometimes be a memory operand and so we need to store the
7840 destination in the i.rm.reg field. */
7841 if (!i.tm.opcode_modifier.regmem
7842 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7843 {
7844 i.rm.reg = i.op[dest].regs->reg_num;
7845 i.rm.regmem = i.op[source].regs->reg_num;
7846 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7847 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7848 i.has_regmmx = TRUE;
7849 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7850 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7851 {
7852 if (i.types[dest].bitfield.zmmword
7853 || i.types[source].bitfield.zmmword)
7854 i.has_regzmm = TRUE;
7855 else if (i.types[dest].bitfield.ymmword
7856 || i.types[source].bitfield.ymmword)
7857 i.has_regymm = TRUE;
7858 else
7859 i.has_regxmm = TRUE;
7860 }
7861 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7862 i.rex |= REX_R;
7863 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7864 i.vrex |= REX_R;
7865 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7866 i.rex |= REX_B;
7867 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7868 i.vrex |= REX_B;
7869 }
7870 else
7871 {
7872 i.rm.reg = i.op[source].regs->reg_num;
7873 i.rm.regmem = i.op[dest].regs->reg_num;
7874 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7875 i.rex |= REX_B;
7876 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7877 i.vrex |= REX_B;
7878 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7879 i.rex |= REX_R;
7880 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7881 i.vrex |= REX_R;
7882 }
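      /* Outside of 64-bit mode a REX prefix cannot be emitted, so the
	 only way REX_R can be set here is via %cr8..%cr15.  The block
	 below uses the (AMD-defined) alternative encoding: a LOCK
	 prefix on the control-register move selects the high control
	 registers.  */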
7883 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7884 {
7885 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7886 abort ();
7887 i.rex &= ~REX_R;
7888 add_prefix (LOCK_PREFIX_OPCODE);
7889 }
7890 }
7891 else
7892 { /* If it's not 2 reg operands... */
7893 unsigned int mem;
7894
7895 if (i.mem_operands)
7896 {
7897 unsigned int fake_zero_displacement = 0;
7898 unsigned int op;
7899
7900 for (op = 0; op < i.operands; op++)
7901 if (i.flags[op] & Operand_Mem)
7902 break;
7903 gas_assert (op < i.operands);
7904
7905 if (i.tm.opcode_modifier.vecsib)
7906 {
7907 if (i.index_reg->reg_num == RegIZ)
7908 abort ();
7909
7910 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7911 if (!i.base_reg)
7912 {
7913 i.sib.base = NO_BASE_REGISTER;
7914 i.sib.scale = i.log2_scale_factor;
7915 i.types[op].bitfield.disp8 = 0;
7916 i.types[op].bitfield.disp16 = 0;
7917 i.types[op].bitfield.disp64 = 0;
7918 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7919 {
7920 /* Must be 32 bit */
7921 i.types[op].bitfield.disp32 = 1;
7922 i.types[op].bitfield.disp32s = 0;
7923 }
7924 else
7925 {
7926 i.types[op].bitfield.disp32 = 0;
7927 i.types[op].bitfield.disp32s = 1;
7928 }
7929 }
7930 i.sib.index = i.index_reg->reg_num;
7931 if ((i.index_reg->reg_flags & RegRex) != 0)
7932 i.rex |= REX_X;
7933 if ((i.index_reg->reg_flags & RegVRex) != 0)
7934 i.vrex |= REX_X;
7935 }
7936
7937 default_seg = &ds;
7938
7939 if (i.base_reg == 0)
7940 {
7941 i.rm.mode = 0;
7942 if (!i.disp_operands)
7943 fake_zero_displacement = 1;
7944 if (i.index_reg == 0)
7945 {
7946 i386_operand_type newdisp;
7947
7948 gas_assert (!i.tm.opcode_modifier.vecsib);
7949 /* Operand is just <disp> */
7950 if (flag_code == CODE_64BIT)
7951 {
7952 /* 64bit mode overwrites the 32bit absolute
7953 addressing by RIP relative addressing and
7954 absolute addressing is encoded by one of the
7955 redundant SIB forms. */
7956 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7957 i.sib.base = NO_BASE_REGISTER;
7958 i.sib.index = NO_INDEX_REGISTER;
7959 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7960 }
7961 else if ((flag_code == CODE_16BIT)
7962 ^ (i.prefix[ADDR_PREFIX] != 0))
7963 {
7964 i.rm.regmem = NO_BASE_REGISTER_16;
7965 newdisp = disp16;
7966 }
7967 else
7968 {
7969 i.rm.regmem = NO_BASE_REGISTER;
7970 newdisp = disp32;
7971 }
7972 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7973 i.types[op] = operand_type_or (i.types[op], newdisp);
7974 }
7975 else if (!i.tm.opcode_modifier.vecsib)
7976 {
7977 /* !i.base_reg && i.index_reg */
7978 if (i.index_reg->reg_num == RegIZ)
7979 i.sib.index = NO_INDEX_REGISTER;
7980 else
7981 i.sib.index = i.index_reg->reg_num;
7982 i.sib.base = NO_BASE_REGISTER;
7983 i.sib.scale = i.log2_scale_factor;
7984 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7985 i.types[op].bitfield.disp8 = 0;
7986 i.types[op].bitfield.disp16 = 0;
7987 i.types[op].bitfield.disp64 = 0;
7988 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7989 {
7990 /* Must be 32 bit */
7991 i.types[op].bitfield.disp32 = 1;
7992 i.types[op].bitfield.disp32s = 0;
7993 }
7994 else
7995 {
7996 i.types[op].bitfield.disp32 = 0;
7997 i.types[op].bitfield.disp32s = 1;
7998 }
7999 if ((i.index_reg->reg_flags & RegRex) != 0)
8000 i.rex |= REX_X;
8001 }
8002 }
8003 /* RIP addressing for 64bit mode. */
8004 else if (i.base_reg->reg_num == RegIP)
8005 {
8006 gas_assert (!i.tm.opcode_modifier.vecsib);
8007 i.rm.regmem = NO_BASE_REGISTER;
8008 i.types[op].bitfield.disp8 = 0;
8009 i.types[op].bitfield.disp16 = 0;
8010 i.types[op].bitfield.disp32 = 0;
8011 i.types[op].bitfield.disp32s = 1;
8012 i.types[op].bitfield.disp64 = 0;
8013 i.flags[op] |= Operand_PCrel;
8014 if (! i.disp_operands)
8015 fake_zero_displacement = 1;
8016 }
8017 else if (i.base_reg->reg_type.bitfield.word)
8018 {
8019 gas_assert (!i.tm.opcode_modifier.vecsib);
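	      /* For reference, in 16-bit addressing the r/m field
		 selects the base/index pair:
		   0 (%bx,%si)  1 (%bx,%di)  2 (%bp,%si)  3 (%bp,%di)
		   4 (%si)      5 (%di)      6 (%bp)/disp16  7 (%bx)
		 which is what the arithmetic in the switch below
		 reproduces.  */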
8020 switch (i.base_reg->reg_num)
8021 {
8022 case 3: /* (%bx) */
8023 if (i.index_reg == 0)
8024 i.rm.regmem = 7;
8025 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8026 i.rm.regmem = i.index_reg->reg_num - 6;
8027 break;
8028 case 5: /* (%bp) */
8029 default_seg = &ss;
8030 if (i.index_reg == 0)
8031 {
8032 i.rm.regmem = 6;
8033 if (operand_type_check (i.types[op], disp) == 0)
8034 {
8035 /* fake (%bp) into 0(%bp) */
8036 i.types[op].bitfield.disp8 = 1;
8037 fake_zero_displacement = 1;
8038 }
8039 }
8040 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8041 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8042 break;
8043 default: /* (%si) -> 4 or (%di) -> 5 */
8044 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8045 }
8046 i.rm.mode = mode_from_disp_size (i.types[op]);
8047 }
8048 else /* i.base_reg and 32/64 bit mode */
8049 {
8050 if (flag_code == CODE_64BIT
8051 && operand_type_check (i.types[op], disp))
8052 {
8053 i.types[op].bitfield.disp16 = 0;
8054 i.types[op].bitfield.disp64 = 0;
8055 if (i.prefix[ADDR_PREFIX] == 0)
8056 {
8057 i.types[op].bitfield.disp32 = 0;
8058 i.types[op].bitfield.disp32s = 1;
8059 }
8060 else
8061 {
8062 i.types[op].bitfield.disp32 = 1;
8063 i.types[op].bitfield.disp32s = 0;
8064 }
8065 }
8066
8067 if (!i.tm.opcode_modifier.vecsib)
8068 i.rm.regmem = i.base_reg->reg_num;
8069 if ((i.base_reg->reg_flags & RegRex) != 0)
8070 i.rex |= REX_B;
8071 i.sib.base = i.base_reg->reg_num;
8072 /* x86-64 ignores REX prefix bit here to avoid decoder
8073 complications. */
8074 if (!(i.base_reg->reg_flags & RegRex)
8075 && (i.base_reg->reg_num == EBP_REG_NUM
8076 || i.base_reg->reg_num == ESP_REG_NUM))
8077 default_seg = &ss;
8078 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8079 {
8080 fake_zero_displacement = 1;
8081 i.types[op].bitfield.disp8 = 1;
8082 }
8083 i.sib.scale = i.log2_scale_factor;
8084 if (i.index_reg == 0)
8085 {
8086 gas_assert (!i.tm.opcode_modifier.vecsib);
8087 		  /* <disp>(%esp) becomes a two-byte modrm with no index
8088 		     register.  We've already stored the code for esp
8089 		     in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8090 		     Any base register besides %esp will not use the
8091 		     extra modrm byte.  */
8092 i.sib.index = NO_INDEX_REGISTER;
8093 }
8094 else if (!i.tm.opcode_modifier.vecsib)
8095 {
8096 if (i.index_reg->reg_num == RegIZ)
8097 i.sib.index = NO_INDEX_REGISTER;
8098 else
8099 i.sib.index = i.index_reg->reg_num;
8100 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8101 if ((i.index_reg->reg_flags & RegRex) != 0)
8102 i.rex |= REX_X;
8103 }
8104
8105 if (i.disp_operands
8106 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8107 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8108 i.rm.mode = 0;
8109 else
8110 {
8111 if (!fake_zero_displacement
8112 && !i.disp_operands
8113 && i.disp_encoding)
8114 {
8115 fake_zero_displacement = 1;
8116 if (i.disp_encoding == disp_encoding_8bit)
8117 i.types[op].bitfield.disp8 = 1;
8118 else
8119 i.types[op].bitfield.disp32 = 1;
8120 }
8121 i.rm.mode = mode_from_disp_size (i.types[op]);
8122 }
8123 }
8124
8125 if (fake_zero_displacement)
8126 {
8127 /* Fakes a zero displacement assuming that i.types[op]
8128 holds the correct displacement size. */
8129 expressionS *exp;
8130
8131 gas_assert (i.op[op].disps == 0);
8132 exp = &disp_expressions[i.disp_operands++];
8133 i.op[op].disps = exp;
8134 exp->X_op = O_constant;
8135 exp->X_add_number = 0;
8136 exp->X_add_symbol = (symbolS *) 0;
8137 exp->X_op_symbol = (symbolS *) 0;
8138 }
8139
8140 mem = op;
8141 }
8142 else
8143 mem = ~0;
8144
8145 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8146 {
8147 if (operand_type_check (i.types[0], imm))
8148 i.vex.register_specifier = NULL;
8149 else
8150 {
8151 /* VEX.vvvv encodes one of the sources when the first
8152 operand is not an immediate. */
8153 if (i.tm.opcode_modifier.vexw == VEXW0)
8154 i.vex.register_specifier = i.op[0].regs;
8155 else
8156 i.vex.register_specifier = i.op[1].regs;
8157 }
8158
8159 	  /* Destination is an XMM register encoded in the ModRM.reg
8160 	     field and the VEX.R bit.  */
8161 i.rm.reg = i.op[2].regs->reg_num;
8162 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8163 i.rex |= REX_R;
8164
8165 	  /* ModRM.rm and VEX.B encode the other source.  */
8166 if (!i.mem_operands)
8167 {
8168 i.rm.mode = 3;
8169
8170 if (i.tm.opcode_modifier.vexw == VEXW0)
8171 i.rm.regmem = i.op[1].regs->reg_num;
8172 else
8173 i.rm.regmem = i.op[0].regs->reg_num;
8174
8175 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8176 i.rex |= REX_B;
8177 }
8178 }
8179 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8180 {
8181 i.vex.register_specifier = i.op[2].regs;
8182 if (!i.mem_operands)
8183 {
8184 i.rm.mode = 3;
8185 i.rm.regmem = i.op[1].regs->reg_num;
8186 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8187 i.rex |= REX_B;
8188 }
8189 }
8190 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8191 (if any) based on i.tm.extension_opcode. Again, we must be
8192 careful to make sure that segment/control/debug/test/MMX
8193 registers are coded into the i.rm.reg field. */
8194 else if (i.reg_operands)
8195 {
8196 unsigned int op;
8197 unsigned int vex_reg = ~0;
8198
8199 for (op = 0; op < i.operands; op++)
8200 {
8201 if (i.types[op].bitfield.class == Reg
8202 || i.types[op].bitfield.class == RegBND
8203 || i.types[op].bitfield.class == RegMask
8204 || i.types[op].bitfield.class == SReg
8205 || i.types[op].bitfield.class == RegCR
8206 || i.types[op].bitfield.class == RegDR
8207 || i.types[op].bitfield.class == RegTR)
8208 break;
8209 if (i.types[op].bitfield.class == RegSIMD)
8210 {
8211 if (i.types[op].bitfield.zmmword)
8212 i.has_regzmm = TRUE;
8213 else if (i.types[op].bitfield.ymmword)
8214 i.has_regymm = TRUE;
8215 else
8216 i.has_regxmm = TRUE;
8217 break;
8218 }
8219 if (i.types[op].bitfield.class == RegMMX)
8220 {
8221 i.has_regmmx = TRUE;
8222 break;
8223 }
8224 }
8225
8226 if (vex_3_sources)
8227 op = dest;
8228 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8229 {
8230 /* For instructions with VexNDS, the register-only
8231 source operand is encoded in VEX prefix. */
8232 gas_assert (mem != (unsigned int) ~0);
8233
8234 if (op > mem)
8235 {
8236 vex_reg = op++;
8237 gas_assert (op < i.operands);
8238 }
8239 else
8240 {
8241 /* Check register-only source operand when two source
8242 operands are swapped. */
8243 if (!i.tm.operand_types[op].bitfield.baseindex
8244 && i.tm.operand_types[op + 1].bitfield.baseindex)
8245 {
8246 vex_reg = op;
8247 op += 2;
8248 gas_assert (mem == (vex_reg + 1)
8249 && op < i.operands);
8250 }
8251 else
8252 {
8253 vex_reg = op + 1;
8254 gas_assert (vex_reg < i.operands);
8255 }
8256 }
8257 }
8258 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8259 {
8260 /* For instructions with VexNDD, the register destination
8261 is encoded in VEX prefix. */
8262 if (i.mem_operands == 0)
8263 {
8264 /* There is no memory operand. */
8265 gas_assert ((op + 2) == i.operands);
8266 vex_reg = op + 1;
8267 }
8268 else
8269 {
8270 /* There are only 2 non-immediate operands. */
8271 gas_assert (op < i.imm_operands + 2
8272 && i.operands == i.imm_operands + 2);
8273 vex_reg = i.imm_operands + 1;
8274 }
8275 }
8276 else
8277 gas_assert (op < i.operands);
8278
8279 if (vex_reg != (unsigned int) ~0)
8280 {
8281 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8282
8283 if ((type->bitfield.class != Reg
8284 || (!type->bitfield.dword && !type->bitfield.qword))
8285 && type->bitfield.class != RegSIMD
8286 && !operand_type_equal (type, &regmask))
8287 abort ();
8288
8289 i.vex.register_specifier = i.op[vex_reg].regs;
8290 }
8291
8292 /* Don't set OP operand twice. */
8293 if (vex_reg != op)
8294 {
8295 /* If there is an extension opcode to put here, the
8296 register number must be put into the regmem field. */
8297 if (i.tm.extension_opcode != None)
8298 {
8299 i.rm.regmem = i.op[op].regs->reg_num;
8300 if ((i.op[op].regs->reg_flags & RegRex) != 0)
8301 i.rex |= REX_B;
8302 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
8303 i.vrex |= REX_B;
8304 }
8305 else
8306 {
8307 i.rm.reg = i.op[op].regs->reg_num;
8308 if ((i.op[op].regs->reg_flags & RegRex) != 0)
8309 i.rex |= REX_R;
8310 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
8311 i.vrex |= REX_R;
8312 }
8313 }
8314
8315 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8316 must set it to 3 to indicate this is a register operand
8317 in the regmem field. */
8318 if (!i.mem_operands)
8319 i.rm.mode = 3;
8320 }
8321
8322 /* Fill in i.rm.reg field with extension opcode (if any). */
8323 if (i.tm.extension_opcode != None)
8324 i.rm.reg = i.tm.extension_opcode;
8325 }
8326 return default_seg;
8327 }
8328
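/* Given the current CODE16 state of a one-operand branch, return
   CODE16 if a data-size prefix genuinely toggles the displacement
   size -- i.e. REX.W is not in effect and the template supports the
   other size -- and 0 otherwise.  Callers XOR the result into their
   local code16 flag.  */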
8329 static unsigned int
8330 flip_code16 (unsigned int code16)
8331 {
8332 gas_assert (i.tm.operands == 1);
8333
8334 return !(i.prefix[REX_PREFIX] & REX_W)
8335 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8336 || i.tm.operand_types[0].bitfield.disp32s
8337 : i.tm.operand_types[0].bitfield.disp16)
8338 ? CODE16 : 0;
8339 }
8340
8341 static void
8342 output_branch (void)
8343 {
8344 char *p;
8345 int size;
8346 int code16;
8347 int prefix;
8348 relax_substateT subtype;
8349 symbolS *sym;
8350 offsetT off;
8351
8352 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8353 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8354
8355 prefix = 0;
8356 if (i.prefix[DATA_PREFIX] != 0)
8357 {
8358 prefix = 1;
8359 i.prefixes -= 1;
8360 code16 ^= flip_code16(code16);
8361 }
8362 /* Pentium4 branch hints. */
8363 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8364 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8365 {
8366 prefix++;
8367 i.prefixes--;
8368 }
8369 if (i.prefix[REX_PREFIX] != 0)
8370 {
8371 prefix++;
8372 i.prefixes--;
8373 }
8374
8375 /* BND prefixed jump. */
8376 if (i.prefix[BND_PREFIX] != 0)
8377 {
8378 prefix++;
8379 i.prefixes--;
8380 }
8381
8382 if (i.prefixes != 0)
8383 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8384
8385   /* It's always a symbol; end the frag and set up for relaxation.
8386      Make sure there is enough room in this frag for the largest
8387      instruction we may generate in md_convert_frag.  This is 2
8388      bytes for the opcode and room for the prefix and largest
8389      displacement.  */
8390 frag_grow (prefix + 2 + 4);
8391 /* Prefix and 1 opcode byte go in fr_fix. */
8392 p = frag_more (prefix + 1);
8393 if (i.prefix[DATA_PREFIX] != 0)
8394 *p++ = DATA_PREFIX_OPCODE;
8395 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8396 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8397 *p++ = i.prefix[SEG_PREFIX];
8398 if (i.prefix[BND_PREFIX] != 0)
8399 *p++ = BND_PREFIX_OPCODE;
8400 if (i.prefix[REX_PREFIX] != 0)
8401 *p++ = i.prefix[REX_PREFIX];
8402 *p = i.tm.base_opcode;
8403
8404 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8405 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8406 else if (cpu_arch_flags.bitfield.cpui386)
8407 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8408 else
8409 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8410 subtype |= code16;
8411
8412 sym = i.op[0].disps->X_add_symbol;
8413 off = i.op[0].disps->X_add_number;
8414
8415 if (i.op[0].disps->X_op != O_constant
8416 && i.op[0].disps->X_op != O_symbol)
8417 {
8418 /* Handle complex expressions. */
8419 sym = make_expr_symbol (i.op[0].disps);
8420 off = 0;
8421 }
8422
8423 /* 1 possible extra opcode + 4 byte displacement go in var part.
8424 Pass reloc in fr_var. */
8425 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8426 }
8427
8428 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8429 /* Return TRUE iff PLT32 relocation should be used for branching to
8430 symbol S. */
8431
8432 static bfd_boolean
8433 need_plt32_p (symbolS *s)
8434 {
8435 /* PLT32 relocation is ELF only. */
8436 if (!IS_ELF)
8437 return FALSE;
8438
8439 #ifdef TE_SOLARIS
8440   /* Don't emit a PLT32 relocation on Solaris: neither the native
8441      linker nor krtld supports it.  */
8442 return FALSE;
8443 #endif
8444
8445 /* Since there is no need to prepare for PLT branch on x86-64, we
8446 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8447 be used as a marker for 32-bit PC-relative branches. */
8448 if (!object_64bit)
8449 return FALSE;
8450
8451   /* Weak or undefined symbols need a PLT32 relocation.  */
8452 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8453 return TRUE;
8454
8455   /* A non-global symbol doesn't need a PLT32 relocation.  */
8456 if (! S_IS_EXTERNAL (s))
8457 return FALSE;
8458
8459   /* Other global symbols need a PLT32 relocation.  NB: Symbols with
8460      non-default visibility are treated as normal global symbols so
8461      that the PLT32 relocation can be used as a marker for 32-bit
8462      PC-relative branches.  That is useful for linker relaxation.  */
8463 return TRUE;
8464 }
8465 #endif
8466
8467 static void
8468 output_jump (void)
8469 {
8470 char *p;
8471 int size;
8472 fixS *fixP;
8473 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8474
8475 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8476 {
8477 /* This is a loop or jecxz type instruction. */
8478 size = 1;
8479 if (i.prefix[ADDR_PREFIX] != 0)
8480 {
8481 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8482 i.prefixes -= 1;
8483 }
8484 /* Pentium4 branch hints. */
8485 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8486 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8487 {
8488 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8489 i.prefixes--;
8490 }
8491 }
8492 else
8493 {
8494 int code16;
8495
8496 code16 = 0;
8497 if (flag_code == CODE_16BIT)
8498 code16 = CODE16;
8499
8500 if (i.prefix[DATA_PREFIX] != 0)
8501 {
8502 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8503 i.prefixes -= 1;
8504 code16 ^= flip_code16(code16);
8505 }
8506
8507 size = 4;
8508 if (code16)
8509 size = 2;
8510 }
8511
8512 /* BND prefixed jump. */
8513 if (i.prefix[BND_PREFIX] != 0)
8514 {
8515 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8516 i.prefixes -= 1;
8517 }
8518
8519 if (i.prefix[REX_PREFIX] != 0)
8520 {
8521 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8522 i.prefixes -= 1;
8523 }
8524
8525 if (i.prefixes != 0)
8526 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8527
8528 p = frag_more (i.tm.opcode_length + size);
8529 switch (i.tm.opcode_length)
8530 {
8531 case 2:
8532 *p++ = i.tm.base_opcode >> 8;
8533 /* Fall through. */
8534 case 1:
8535 *p++ = i.tm.base_opcode;
8536 break;
8537 default:
8538 abort ();
8539 }
8540
8541 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8542 if (size == 4
8543 && jump_reloc == NO_RELOC
8544 && need_plt32_p (i.op[0].disps->X_add_symbol))
8545 jump_reloc = BFD_RELOC_X86_64_PLT32;
8546 #endif
8547
8548 jump_reloc = reloc (size, 1, 1, jump_reloc);
8549
8550 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8551 i.op[0].disps, 1, jump_reloc);
8552
8553 /* All jumps handled here are signed, but don't use a signed limit
8554 check for 32 and 16 bit jumps as we want to allow wrap around at
8555 4G and 64k respectively. */
8556 if (size == 1)
8557 fixP->fx_signed = 1;
8558 }
8559
8560 static void
8561 output_interseg_jump (void)
8562 {
8563 char *p;
8564 int size;
8565 int prefix;
8566 int code16;
8567
8568 code16 = 0;
8569 if (flag_code == CODE_16BIT)
8570 code16 = CODE16;
8571
8572 prefix = 0;
8573 if (i.prefix[DATA_PREFIX] != 0)
8574 {
8575 prefix = 1;
8576 i.prefixes -= 1;
8577 code16 ^= CODE16;
8578 }
8579
8580 gas_assert (!i.prefix[REX_PREFIX]);
8581
8582 size = 4;
8583 if (code16)
8584 size = 2;
8585
8586 if (i.prefixes != 0)
8587 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8588
8589 /* 1 opcode; 2 segment; offset */
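  /* E.g. in 32-bit code, `ljmp $0x8,$0x1000' assembles to
     ea 00 10 00 00 08 00: opcode, 4-byte offset, then the 2-byte
     selector written at the end of this function.  */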
8590 p = frag_more (prefix + 1 + 2 + size);
8591
8592 if (i.prefix[DATA_PREFIX] != 0)
8593 *p++ = DATA_PREFIX_OPCODE;
8594
8595 if (i.prefix[REX_PREFIX] != 0)
8596 *p++ = i.prefix[REX_PREFIX];
8597
8598 *p++ = i.tm.base_opcode;
8599 if (i.op[1].imms->X_op == O_constant)
8600 {
8601 offsetT n = i.op[1].imms->X_add_number;
8602
8603 if (size == 2
8604 && !fits_in_unsigned_word (n)
8605 && !fits_in_signed_word (n))
8606 {
8607 as_bad (_("16-bit jump out of range"));
8608 return;
8609 }
8610 md_number_to_chars (p, n, size);
8611 }
8612 else
8613 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8614 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8615 if (i.op[0].imms->X_op != O_constant)
8616 as_bad (_("can't handle non absolute segment in `%s'"),
8617 i.tm.name);
8618 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8619 }
8620
8621 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8622 void
8623 x86_cleanup (void)
8624 {
8625 char *p;
8626 asection *seg = now_seg;
8627 subsegT subseg = now_subseg;
8628 asection *sec;
8629 unsigned int alignment, align_size_1;
8630 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8631 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8632 unsigned int padding;
8633
8634 if (!IS_ELF || !x86_used_note)
8635 return;
8636
8637 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8638
8639 /* The .note.gnu.property section layout:
8640
8641 Field Length Contents
8642 ---- ---- ----
8643 n_namsz 4 4
8644 n_descsz 4 The note descriptor size
8645 n_type 4 NT_GNU_PROPERTY_TYPE_0
8646 n_name 4 "GNU"
8647 n_desc n_descsz The program property array
8648 .... .... ....
8649 */
8650
8651 /* Create the .note.gnu.property section. */
8652 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8653 bfd_set_section_flags (sec,
8654 (SEC_ALLOC
8655 | SEC_LOAD
8656 | SEC_DATA
8657 | SEC_HAS_CONTENTS
8658 | SEC_READONLY));
8659
8660 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8661 {
8662 align_size_1 = 7;
8663 alignment = 3;
8664 }
8665 else
8666 {
8667 align_size_1 = 3;
8668 alignment = 2;
8669 }
8670
8671 bfd_set_section_alignment (sec, alignment);
8672 elf_section_type (sec) = SHT_NOTE;
8673
8674 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8675 + 4-byte data */
8676 isa_1_descsz_raw = 4 + 4 + 4;
8677 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8678 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8679
8680 feature_2_descsz_raw = isa_1_descsz;
8681 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8682 + 4-byte data */
8683 feature_2_descsz_raw += 4 + 4 + 4;
8684 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8685 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8686 & ~align_size_1);
8687
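  /* A worked example for ELFCLASS64 (align_size_1 == 7): the 12 raw
     ISA_1 bytes pad to 16, the FEATURE_2 property adds another 12 raw
     bytes (28 total) padding to 32, so descsz is 32 and the whole
     note occupies 16 header bytes + 32 = 48 bytes.  */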
8688 descsz = feature_2_descsz;
8689 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8690 p = frag_more (4 + 4 + 4 + 4 + descsz);
8691
8692 /* Write n_namsz. */
8693 md_number_to_chars (p, (valueT) 4, 4);
8694
8695 /* Write n_descsz. */
8696 md_number_to_chars (p + 4, (valueT) descsz, 4);
8697
8698 /* Write n_type. */
8699 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8700
8701 /* Write n_name. */
8702 memcpy (p + 4 * 3, "GNU", 4);
8703
8704 /* Write 4-byte type. */
8705 md_number_to_chars (p + 4 * 4,
8706 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8707
8708 /* Write 4-byte data size. */
8709 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8710
8711 /* Write 4-byte data. */
8712 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8713
8714 /* Zero out paddings. */
8715 padding = isa_1_descsz - isa_1_descsz_raw;
8716 if (padding)
8717 memset (p + 4 * 7, 0, padding);
8718
8719 /* Write 4-byte type. */
8720 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8721 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8722
8723 /* Write 4-byte data size. */
8724 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8725
8726 /* Write 4-byte data. */
8727 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8728 (valueT) x86_feature_2_used, 4);
8729
8730 /* Zero out paddings. */
8731 padding = feature_2_descsz - feature_2_descsz_raw;
8732 if (padding)
8733 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8734
8735 /* We probably can't restore the current segment, for there likely
8736 isn't one yet... */
8737 if (seg && subseg)
8738 subseg_set (seg, subseg);
8739 }
8740 #endif
8741
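/* Return the number of instruction bytes emitted so far for the
   current insn: everything between START_FRAG/START_OFF and
   FRAG_NOW_PTR, summing the fixed parts of any intervening frags.  */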
8742 static unsigned int
8743 encoding_length (const fragS *start_frag, offsetT start_off,
8744 const char *frag_now_ptr)
8745 {
8746 unsigned int len = 0;
8747
8748 if (start_frag != frag_now)
8749 {
8750 const fragS *fr = start_frag;
8751
8752 do {
8753 len += fr->fr_fix;
8754 fr = fr->fr_next;
8755 } while (fr && fr != frag_now);
8756 }
8757
8758 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8759 }
8760
8761 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8762    be macro-fused with conditional jumps.
8763    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP-relative address,
8764    or has one of the following formats:
8765 
8766     cmp m, imm
8767     add m, imm
8768     sub m, imm
8769     test m, imm
8770     and m, imm
8771     inc m
8772     dec m
8773 
8774    it is not fusible.  */
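/* A minimal illustration (assuming a fusion-capable CPU): the pair

     cmpl $1, %eax
     je   .L1

   can retire as a single macro-fused uop, whereas

     cmpl $1, (%eax)

   uses both a memory and an immediate operand, which the checks
   below reject.  */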
8775
8776 static int
8777 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8778 {
8779 /* No RIP address. */
8780 if (i.base_reg && i.base_reg->reg_num == RegIP)
8781 return 0;
8782
8783 /* No VEX/EVEX encoding. */
8784 if (is_any_vex_encoding (&i.tm))
8785 return 0;
8786
8787 /* add, sub without add/sub m, imm. */
8788 if (i.tm.base_opcode <= 5
8789 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8790 || ((i.tm.base_opcode | 3) == 0x83
8791 && (i.tm.extension_opcode == 0x5
8792 || i.tm.extension_opcode == 0x0)))
8793 {
8794 *mf_cmp_p = mf_cmp_alu_cmp;
8795 return !(i.mem_operands && i.imm_operands);
8796 }
8797
8798 /* and without and m, imm. */
8799 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8800 || ((i.tm.base_opcode | 3) == 0x83
8801 && i.tm.extension_opcode == 0x4))
8802 {
8803 *mf_cmp_p = mf_cmp_test_and;
8804 return !(i.mem_operands && i.imm_operands);
8805 }
8806
8807   /* test without test m, imm.  */
8808 if ((i.tm.base_opcode | 1) == 0x85
8809 || (i.tm.base_opcode | 1) == 0xa9
8810 || ((i.tm.base_opcode | 1) == 0xf7
8811 && i.tm.extension_opcode == 0))
8812 {
8813 *mf_cmp_p = mf_cmp_test_and;
8814 return !(i.mem_operands && i.imm_operands);
8815 }
8816
8817 /* cmp without cmp m, imm. */
8818 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8819 || ((i.tm.base_opcode | 3) == 0x83
8820 && (i.tm.extension_opcode == 0x7)))
8821 {
8822 *mf_cmp_p = mf_cmp_alu_cmp;
8823 return !(i.mem_operands && i.imm_operands);
8824 }
8825
8826 /* inc, dec without inc/dec m. */
8827 if ((i.tm.cpu_flags.bitfield.cpuno64
8828 && (i.tm.base_opcode | 0xf) == 0x4f)
8829 || ((i.tm.base_opcode | 1) == 0xff
8830 && i.tm.extension_opcode <= 0x1))
8831 {
8832 *mf_cmp_p = mf_cmp_incdec;
8833 return !i.mem_operands;
8834 }
8835
8836 return 0;
8837 }
8838
8839 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8840
8841 static int
8842 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
8843 {
8844   /* NB: This doesn't work with COND_JUMP86 without i386.  */
8845 if (!align_branch_power
8846 || now_seg == absolute_section
8847 || !cpu_arch_flags.bitfield.cpui386
8848 || !(align_branch & align_branch_fused_bit))
8849 return 0;
8850
8851 if (maybe_fused_with_jcc_p (mf_cmp_p))
8852 {
8853 if (last_insn.kind == last_insn_other
8854 || last_insn.seg != now_seg)
8855 return 1;
8856 if (flag_debug)
8857 as_warn_where (last_insn.file, last_insn.line,
8858 _("`%s` skips -malign-branch-boundary on `%s`"),
8859 last_insn.name, i.tm.name);
8860 }
8861
8862 return 0;
8863 }
8864
8865 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8866
8867 static int
8868 add_branch_prefix_frag_p (void)
8869 {
8870   /* NB: This doesn't work with COND_JUMP86 without i386.  Don't add a
8871      prefix to PadLock instructions, since they include prefixes in the opcode.  */
8872 if (!align_branch_power
8873 || !align_branch_prefix_size
8874 || now_seg == absolute_section
8875 || i.tm.cpu_flags.bitfield.cpupadlock
8876 || !cpu_arch_flags.bitfield.cpui386)
8877 return 0;
8878
8879   /* Don't add a prefix if the insn is itself a prefix or has no
8880      operands, in which case the segment prefix may be special.  */
8881 if (!i.operands || i.tm.opcode_modifier.isprefix)
8882 return 0;
8883
8884 if (last_insn.kind == last_insn_other
8885 || last_insn.seg != now_seg)
8886 return 1;
8887
8888 if (flag_debug)
8889 as_warn_where (last_insn.file, last_insn.line,
8890 _("`%s` skips -malign-branch-boundary on `%s`"),
8891 last_insn.name, i.tm.name);
8892
8893 return 0;
8894 }
8895
8896 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8897
8898 static int
8899 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
8900 enum mf_jcc_kind *mf_jcc_p)
8901 {
8902 int add_padding;
8903
8904   /* NB: This doesn't work with COND_JUMP86 without i386.  */
8905 if (!align_branch_power
8906 || now_seg == absolute_section
8907 || !cpu_arch_flags.bitfield.cpui386)
8908 return 0;
8909
8910 add_padding = 0;
8911
8912 /* Check for jcc and direct jmp. */
8913 if (i.tm.opcode_modifier.jump == JUMP)
8914 {
8915 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8916 {
8917 *branch_p = align_branch_jmp;
8918 add_padding = align_branch & align_branch_jmp_bit;
8919 }
8920 else
8921 {
8922 	  /* Because J<cc> and JN<cc> share the same group in the
8923 	     macro-fusible table, ignore the lowest bit.  */
8924 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
8925 *branch_p = align_branch_jcc;
8926 if ((align_branch & align_branch_jcc_bit))
8927 add_padding = 1;
8928 }
8929 }
8930 else if (is_any_vex_encoding (&i.tm))
8931 return 0;
8932 else if ((i.tm.base_opcode | 1) == 0xc3)
8933 {
8934 /* Near ret. */
8935 *branch_p = align_branch_ret;
8936 if ((align_branch & align_branch_ret_bit))
8937 add_padding = 1;
8938 }
8939 else
8940 {
8941 /* Check for indirect jmp, direct and indirect calls. */
8942 if (i.tm.base_opcode == 0xe8)
8943 {
8944 /* Direct call. */
8945 *branch_p = align_branch_call;
8946 if ((align_branch & align_branch_call_bit))
8947 add_padding = 1;
8948 }
8949 else if (i.tm.base_opcode == 0xff
8950 && (i.tm.extension_opcode == 2
8951 || i.tm.extension_opcode == 4))
8952 {
8953 /* Indirect call and jmp. */
8954 *branch_p = align_branch_indirect;
8955 if ((align_branch & align_branch_indirect_bit))
8956 add_padding = 1;
8957 }
8958
8959 if (add_padding
8960 && i.disp_operands
8961 && tls_get_addr
8962 && (i.op[0].disps->X_op == O_symbol
8963 || (i.op[0].disps->X_op == O_subtract
8964 && i.op[0].disps->X_op_symbol == GOT_symbol)))
8965 {
8966 symbolS *s = i.op[0].disps->X_add_symbol;
8967 /* No padding to call to global or undefined tls_get_addr. */
8968 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8969 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8970 return 0;
8971 }
8972 }
8973
8974 if (add_padding
8975 && last_insn.kind != last_insn_other
8976 && last_insn.seg == now_seg)
8977 {
8978 if (flag_debug)
8979 as_warn_where (last_insn.file, last_insn.line,
8980 _("`%s` skips -malign-branch-boundary on `%s`"),
8981 last_insn.name, i.tm.name);
8982 return 0;
8983 }
8984
8985 return add_padding;
8986 }
8987
8988 static void
8989 output_insn (void)
8990 {
8991 fragS *insn_start_frag;
8992 offsetT insn_start_off;
8993 fragS *fragP = NULL;
8994 enum align_branch_kind branch = align_branch_none;
8995   /* The initializer is arbitrary, just to avoid an uninitialized-use
8996      error; it is actually either assigned in add_branch_padding_frag_p
8997      or never used.  */
8998 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
8999
9000 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9001 if (IS_ELF && x86_used_note)
9002 {
9003 if (i.tm.cpu_flags.bitfield.cpucmov)
9004 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9005 if (i.tm.cpu_flags.bitfield.cpusse)
9006 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9007 if (i.tm.cpu_flags.bitfield.cpusse2)
9008 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9009 if (i.tm.cpu_flags.bitfield.cpusse3)
9010 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9011 if (i.tm.cpu_flags.bitfield.cpussse3)
9012 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9013 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9014 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9015 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9016 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9017 if (i.tm.cpu_flags.bitfield.cpuavx)
9018 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9019 if (i.tm.cpu_flags.bitfield.cpuavx2)
9020 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9021 if (i.tm.cpu_flags.bitfield.cpufma)
9022 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9023 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9024 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9025 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9026 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9027 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9028 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9029 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9030 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9031 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9032 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9033 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9034 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9035 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9036 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9037 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9038 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9039 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9040 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9041 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9042 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9043 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9044 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9045 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9046 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9047 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9048 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9049 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9050 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
9051 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9052 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
9053
9054 if (i.tm.cpu_flags.bitfield.cpu8087
9055 || i.tm.cpu_flags.bitfield.cpu287
9056 || i.tm.cpu_flags.bitfield.cpu387
9057 || i.tm.cpu_flags.bitfield.cpu687
9058 || i.tm.cpu_flags.bitfield.cpufisttp)
9059 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9060 if (i.has_regmmx
9061 || i.tm.base_opcode == 0xf77 /* emms */
9062 || i.tm.base_opcode == 0xf0e /* femms */
9063 || i.tm.base_opcode == 0xf2a /* cvtpi2ps */
9064 || i.tm.base_opcode == 0x660f2a /* cvtpi2pd */)
9065 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9066 if (i.has_regxmm)
9067 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9068 if (i.has_regymm)
9069 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9070 if (i.has_regzmm)
9071 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9072 if (i.tm.cpu_flags.bitfield.cpufxsr)
9073 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9074 if (i.tm.cpu_flags.bitfield.cpuxsave)
9075 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9076 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9077 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9078 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9079 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9080 }
9081 #endif
9082
9083 /* Tie dwarf2 debug info to the address at the start of the insn.
9084 We can't do this after the insn has been output as the current
9085 frag may have been closed off. eg. by frag_var. */
9086 dwarf2_emit_insn (0);
9087
9088 insn_start_frag = frag_now;
9089 insn_start_off = frag_now_fix ();
9090
9091 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9092 {
9093 char *p;
9094 /* Branch can be 8 bytes. Leave some room for prefixes. */
9095 unsigned int max_branch_padding_size = 14;
9096
9097 /* Align section to boundary. */
9098 record_alignment (now_seg, align_branch_power);
9099
9100 /* Make room for padding. */
9101 frag_grow (max_branch_padding_size);
9102
9103 /* Start of the padding. */
9104 p = frag_more (0);
9105
9106 fragP = frag_now;
9107
9108 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9109 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9110 NULL, 0, p);
9111
9112 fragP->tc_frag_data.mf_type = mf_jcc;
9113 fragP->tc_frag_data.branch_type = branch;
9114 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9115 }
9116
9117 /* Output jumps. */
9118 if (i.tm.opcode_modifier.jump == JUMP)
9119 output_branch ();
9120 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9121 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9122 output_jump ();
9123 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9124 output_interseg_jump ();
9125 else
9126 {
9127 /* Output normal instructions here. */
9128 char *p;
9129 unsigned char *q;
9130 unsigned int j;
9131 unsigned int prefix;
9132 enum mf_cmp_kind mf_cmp;
9133
9134 if (avoid_fence
9135 && (i.tm.base_opcode == 0xfaee8
9136 || i.tm.base_opcode == 0xfaef0
9137 || i.tm.base_opcode == 0xfaef8))
9138 {
9139 /* Encode lfence, mfence, and sfence as
9140 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9141 offsetT val = 0x240483f0ULL;
9142 p = frag_more (5);
9143 md_number_to_chars (p, val, 5);
9144 return;
9145 }
9146
9147       /* Some processors fail on the LOCK prefix.  This option makes the
9148 	 assembler ignore the LOCK prefix and serves as a workaround.  */
9149 if (omit_lock_prefix)
9150 {
9151 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9152 return;
9153 i.prefix[LOCK_PREFIX] = 0;
9154 }
9155
9156 if (branch)
9157 /* Skip if this is a branch. */
9158 ;
9159 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9160 {
9161 /* Make room for padding. */
9162 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9163 p = frag_more (0);
9164
9165 fragP = frag_now;
9166
9167 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9168 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9169 NULL, 0, p);
9170
9171 fragP->tc_frag_data.mf_type = mf_cmp;
9172 fragP->tc_frag_data.branch_type = align_branch_fused;
9173 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9174 }
9175 else if (add_branch_prefix_frag_p ())
9176 {
9177 unsigned int max_prefix_size = align_branch_prefix_size;
9178
9179 /* Make room for padding. */
9180 frag_grow (max_prefix_size);
9181 p = frag_more (0);
9182
9183 fragP = frag_now;
9184
9185 frag_var (rs_machine_dependent, max_prefix_size, 0,
9186 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9187 NULL, 0, p);
9188
9189 fragP->tc_frag_data.max_bytes = max_prefix_size;
9190 }
9191
9192 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9193 don't need the explicit prefix. */
9194 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9195 {
9196 switch (i.tm.opcode_length)
9197 {
9198 case 3:
9199 if (i.tm.base_opcode & 0xff000000)
9200 {
9201 prefix = (i.tm.base_opcode >> 24) & 0xff;
9202 if (!i.tm.cpu_flags.bitfield.cpupadlock
9203 || prefix != REPE_PREFIX_OPCODE
9204 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9205 add_prefix (prefix);
9206 }
9207 break;
9208 case 2:
9209 if ((i.tm.base_opcode & 0xff0000) != 0)
9210 {
9211 prefix = (i.tm.base_opcode >> 16) & 0xff;
9212 add_prefix (prefix);
9213 }
9214 break;
9215 case 1:
9216 break;
9217 case 0:
9218 /* Check for pseudo prefixes. */
9219 as_bad_where (insn_start_frag->fr_file,
9220 insn_start_frag->fr_line,
9221 _("pseudo prefix without instruction"));
9222 return;
9223 default:
9224 abort ();
9225 }
9226
9227 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9228 	  /* For x32, add a dummy REX_OPCODE prefix for mov/add with the
9229 	     R_X86_64_GOTTPOFF relocation so that the linker can safely
9230 	     perform IE->LE optimization.  A dummy REX_OPCODE prefix
9231 	     is also needed for lea with the R_X86_64_GOTPC32_TLSDESC
9232 	     relocation for GDesc -> IE/LE optimization.  */
9233 if (x86_elf_abi == X86_64_X32_ABI
9234 && i.operands == 2
9235 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9236 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9237 && i.prefix[REX_PREFIX] == 0)
9238 add_prefix (REX_OPCODE);
9239 #endif
9240
9241 /* The prefix bytes. */
9242 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9243 if (*q)
9244 FRAG_APPEND_1_CHAR (*q);
9245 }
9246 else
9247 {
9248 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9249 if (*q)
9250 switch (j)
9251 {
9252 case REX_PREFIX:
9253 /* REX byte is encoded in VEX prefix. */
9254 break;
9255 case SEG_PREFIX:
9256 case ADDR_PREFIX:
9257 FRAG_APPEND_1_CHAR (*q);
9258 break;
9259 default:
9260 /* There should be no other prefixes for instructions
9261 with VEX prefix. */
9262 abort ();
9263 }
9264
9265 	  /* For EVEX instructions i.vrex should become 0 after
9266 	     build_evex_prefix.  For VEX instructions the upper 16
9267 	     registers aren't available, so VREX should be 0.  */
9268 if (i.vrex)
9269 abort ();
9270 /* Now the VEX prefix. */
9271 p = frag_more (i.vex.length);
9272 for (j = 0; j < i.vex.length; j++)
9273 p[j] = i.vex.bytes[j];
9274 }
9275
9276 /* Now the opcode; be careful about word order here! */
9277 if (i.tm.opcode_length == 1)
9278 {
9279 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9280 }
9281 else
9282 {
9283 switch (i.tm.opcode_length)
9284 {
9285 case 4:
9286 p = frag_more (4);
9287 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9288 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9289 break;
9290 case 3:
9291 p = frag_more (3);
9292 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9293 break;
9294 case 2:
9295 p = frag_more (2);
9296 break;
9297 default:
9298 abort ();
9299 break;
9300 }
9301
9302 /* Put out high byte first: can't use md_number_to_chars! */
9303 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9304 *p = i.tm.base_opcode & 0xff;
9305 }
9306
9307 /* Now the modrm byte and sib byte (if present). */
9308 if (i.tm.opcode_modifier.modrm)
9309 {
9310 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
9311 | i.rm.reg << 3
9312 | i.rm.mode << 6));
9313 /* If i.rm.regmem == ESP (4)
9314 && i.rm.mode != (Register mode)
9315 && not 16 bit
9316 ==> need second modrm byte. */
9317 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9318 && i.rm.mode != 3
9319 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9320 FRAG_APPEND_1_CHAR ((i.sib.base << 0
9321 | i.sib.index << 3
9322 | i.sib.scale << 6));
9323 }
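      /* For reference, the bytes just emitted are laid out as
	   ModRM: mode(7:6) reg(5:3) rm(2:0)
	   SIB:   scale(7:6) index(5:3) base(2:0)
	 matching the shifts above.  */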
9324
9325 if (i.disp_operands)
9326 output_disp (insn_start_frag, insn_start_off);
9327
9328 if (i.imm_operands)
9329 output_imm (insn_start_frag, insn_start_off);
9330
9331       /*
9332        * frag_now_fix () returns plain abs_section_offset when we're in
9333        * the absolute section, and abs_section_offset does not get
9334        * updated as data is added to the frag; that breaks the logic below.
9335        */
9336 if (now_seg != absolute_section)
9337 {
9338 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9339 if (j > 15)
9340 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9341 j);
9342 else if (fragP)
9343 {
9344 	      /* NB: Don't add a prefix with a GOTPC relocation, since
9345 		 output_disp() above depends on the fixed encoding
9346 		 length.  We also can't add a prefix with a TLS relocation,
9347 		 since that breaks TLS linker optimization.  */
9348 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9349 /* Prefix count on the current instruction. */
9350 unsigned int count = i.vex.length;
9351 unsigned int k;
9352 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9353 /* REX byte is encoded in VEX/EVEX prefix. */
9354 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9355 count++;
9356
9357 /* Count prefixes for extended opcode maps. */
9358 if (!i.vex.length)
9359 switch (i.tm.opcode_length)
9360 {
9361 case 3:
9362 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9363 {
9364 count++;
9365 switch ((i.tm.base_opcode >> 8) & 0xff)
9366 {
9367 case 0x38:
9368 case 0x3a:
9369 count++;
9370 break;
9371 default:
9372 break;
9373 }
9374 }
9375 break;
9376 case 2:
9377 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9378 count++;
9379 break;
9380 case 1:
9381 break;
9382 default:
9383 abort ();
9384 }
9385
9386 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9387 == BRANCH_PREFIX)
9388 {
9389 /* Set the maximum prefix size in BRANCH_PREFIX
9390 frag. */
9391 if (fragP->tc_frag_data.max_bytes > max)
9392 fragP->tc_frag_data.max_bytes = max;
9393 if (fragP->tc_frag_data.max_bytes > count)
9394 fragP->tc_frag_data.max_bytes -= count;
9395 else
9396 fragP->tc_frag_data.max_bytes = 0;
9397 }
9398 else
9399 {
9400 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9401 frag. */
9402 unsigned int max_prefix_size;
9403 if (align_branch_prefix_size > max)
9404 max_prefix_size = max;
9405 else
9406 max_prefix_size = align_branch_prefix_size;
9407 if (max_prefix_size > count)
9408 fragP->tc_frag_data.max_prefix_length
9409 = max_prefix_size - count;
9410 }
9411
9412 /* Use existing segment prefix if possible. Use CS
9413 segment prefix in 64-bit mode. In 32-bit mode, use SS
9414 segment prefix with ESP/EBP base register and use DS
9415 segment prefix without ESP/EBP base register. */
9416 if (i.prefix[SEG_PREFIX])
9417 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9418 else if (flag_code == CODE_64BIT)
9419 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9420 else if (i.base_reg
9421 && (i.base_reg->reg_num == 4
9422 || i.base_reg->reg_num == 5))
9423 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9424 else
9425 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9426 }
9427 }
9428 }
9429
9430   /* NB: This doesn't work with COND_JUMP86 without i386.  */
9431 if (align_branch_power
9432 && now_seg != absolute_section
9433 && cpu_arch_flags.bitfield.cpui386)
9434 {
9435 /* Terminate each frag so that we can add prefix and check for
9436 fused jcc. */
9437 frag_wane (frag_now);
9438 frag_new (0);
9439 }
9440
9441 #ifdef DEBUG386
9442 if (flag_debug)
9443 {
9444 pi ("" /*line*/, &i);
9445 }
9446 #endif /* DEBUG386 */
9447 }
9448
9449 /* Return the size of the displacement operand N. */
9450
9451 static int
9452 disp_size (unsigned int n)
9453 {
9454 int size = 4;
9455
9456 if (i.types[n].bitfield.disp64)
9457 size = 8;
9458 else if (i.types[n].bitfield.disp8)
9459 size = 1;
9460 else if (i.types[n].bitfield.disp16)
9461 size = 2;
9462 return size;
9463 }
9464
9465 /* Return the size of the immediate operand N. */
9466
9467 static int
9468 imm_size (unsigned int n)
9469 {
9470 int size = 4;
9471 if (i.types[n].bitfield.imm64)
9472 size = 8;
9473 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9474 size = 1;
9475 else if (i.types[n].bitfield.imm16)
9476 size = 2;
9477 return size;
9478 }
9479
9480 static void
9481 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9482 {
9483 char *p;
9484 unsigned int n;
9485
9486 for (n = 0; n < i.operands; n++)
9487 {
9488 if (operand_type_check (i.types[n], disp))
9489 {
9490 if (i.op[n].disps->X_op == O_constant)
9491 {
9492 int size = disp_size (n);
9493 offsetT val = i.op[n].disps->X_add_number;
9494
9495 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9496 size);
9497 p = frag_more (size);
9498 md_number_to_chars (p, val, size);
9499 }
9500 else
9501 {
9502 enum bfd_reloc_code_real reloc_type;
9503 int size = disp_size (n);
9504 int sign = i.types[n].bitfield.disp32s;
9505 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9506 fixS *fixP;
9507
9508 /* We can't have 8 bit displacement here. */
9509 gas_assert (!i.types[n].bitfield.disp8);
9510
9511 	      /* The PC relative address is computed relative
9512 		 to the instruction boundary, so in case immediate
9513 		 fields follow, we need to adjust the value.  */
9514 if (pcrel && i.imm_operands)
9515 {
9516 unsigned int n1;
9517 int sz = 0;
9518
9519 for (n1 = 0; n1 < i.operands; n1++)
9520 if (operand_type_check (i.types[n1], imm))
9521 {
9522 /* Only one immediate is allowed for PC
9523 relative address. */
9524 gas_assert (sz == 0);
9525 sz = imm_size (n1);
9526 i.op[n].disps->X_add_number -= sz;
9527 }
9528 /* We should find the immediate. */
9529 gas_assert (sz != 0);
9530 }
9531
9532 p = frag_more (size);
9533 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9534 if (GOT_symbol
9535 && GOT_symbol == i.op[n].disps->X_add_symbol
9536 && (((reloc_type == BFD_RELOC_32
9537 || reloc_type == BFD_RELOC_X86_64_32S
9538 || (reloc_type == BFD_RELOC_64
9539 && object_64bit))
9540 && (i.op[n].disps->X_op == O_symbol
9541 || (i.op[n].disps->X_op == O_add
9542 && ((symbol_get_value_expression
9543 (i.op[n].disps->X_op_symbol)->X_op)
9544 == O_subtract))))
9545 || reloc_type == BFD_RELOC_32_PCREL))
9546 {
9547 if (!object_64bit)
9548 {
9549 reloc_type = BFD_RELOC_386_GOTPC;
9550 i.has_gotpc_tls_reloc = TRUE;
9551 i.op[n].imms->X_add_number +=
9552 encoding_length (insn_start_frag, insn_start_off, p);
9553 }
9554 else if (reloc_type == BFD_RELOC_64)
9555 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9556 else
9557 /* Don't do the adjustment for x86-64, as there
9558 the pcrel addressing is relative to the _next_
9559 insn, and that is taken care of in other code. */
9560 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9561 }
9562 else if (align_branch_power)
9563 {
9564 switch (reloc_type)
9565 {
9566 case BFD_RELOC_386_TLS_GD:
9567 case BFD_RELOC_386_TLS_LDM:
9568 case BFD_RELOC_386_TLS_IE:
9569 case BFD_RELOC_386_TLS_IE_32:
9570 case BFD_RELOC_386_TLS_GOTIE:
9571 case BFD_RELOC_386_TLS_GOTDESC:
9572 case BFD_RELOC_386_TLS_DESC_CALL:
9573 case BFD_RELOC_X86_64_TLSGD:
9574 case BFD_RELOC_X86_64_TLSLD:
9575 case BFD_RELOC_X86_64_GOTTPOFF:
9576 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9577 case BFD_RELOC_X86_64_TLSDESC_CALL:
9578 i.has_gotpc_tls_reloc = TRUE;
9579 default:
9580 break;
9581 }
9582 }
9583 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9584 size, i.op[n].disps, pcrel,
9585 reloc_type);
9586 /* Check for "call/jmp *mem", "mov mem, %reg",
9587 "test %reg, mem" and "binop mem, %reg" where binop
9588 is one of adc, add, and, cmp, or, sbb, sub, xor
9589 instructions without data prefix. Always generate
9590 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9591 if (i.prefix[DATA_PREFIX] == 0
9592 && (generate_relax_relocations
9593 || (!object_64bit
9594 && i.rm.mode == 0
9595 && i.rm.regmem == 5))
9596 && (i.rm.mode == 2
9597 || (i.rm.mode == 0 && i.rm.regmem == 5))
9598 && !is_any_vex_encoding(&i.tm)
9599 && ((i.operands == 1
9600 && i.tm.base_opcode == 0xff
9601 && (i.rm.reg == 2 || i.rm.reg == 4))
9602 || (i.operands == 2
9603 && (i.tm.base_opcode == 0x8b
9604 || i.tm.base_opcode == 0x85
9605 || (i.tm.base_opcode & ~0x38) == 0x03))))
9606 {
9607 if (object_64bit)
9608 {
9609 fixP->fx_tcbit = i.rex != 0;
9610 if (i.base_reg
9611 && (i.base_reg->reg_num == RegIP))
9612 fixP->fx_tcbit2 = 1;
9613 }
9614 else
9615 fixP->fx_tcbit2 = 1;
9616 }
9617 }
9618 }
9619 }
9620 }
9621
9622 static void
9623 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9624 {
9625 char *p;
9626 unsigned int n;
9627
9628 for (n = 0; n < i.operands; n++)
9629 {
9630 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9631 if (i.rounding && (int) n == i.rounding->operand)
9632 continue;
9633
9634 if (operand_type_check (i.types[n], imm))
9635 {
9636 if (i.op[n].imms->X_op == O_constant)
9637 {
9638 int size = imm_size (n);
9639 offsetT val;
9640
9641 val = offset_in_range (i.op[n].imms->X_add_number,
9642 size);
9643 p = frag_more (size);
9644 md_number_to_chars (p, val, size);
9645 }
9646 else
9647 {
9648 /* Not absolute_section.
9649 Need a 32-bit fixup (don't support 8bit
9650 non-absolute imms). Try to support other
9651 sizes ... */
9652 enum bfd_reloc_code_real reloc_type;
9653 int size = imm_size (n);
9654 int sign;
9655
9656 if (i.types[n].bitfield.imm32s
9657 && (i.suffix == QWORD_MNEM_SUFFIX
9658 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9659 sign = 1;
9660 else
9661 sign = 0;
9662
9663 p = frag_more (size);
9664 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9665
9666 /* This is tough to explain. We end up with this one if we
9667 * have operands that look like
9668 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9669 * obtain the absolute address of the GOT, and it is strongly
9670 * preferable from a performance point of view to avoid using
9671 * a runtime relocation for this. The actual sequence of
9672 	       * instructions often looks something like:
9673 *
9674 * call .L66
9675 * .L66:
9676 * popl %ebx
9677 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9678 *
9679 * The call and pop essentially return the absolute address
9680 * of the label .L66 and store it in %ebx. The linker itself
9681 * will ultimately change the first operand of the addl so
9682 * that %ebx points to the GOT, but to keep things simple, the
9683 * .o file must have this operand set so that it generates not
9684 * the absolute address of .L66, but the absolute address of
9685 * itself. This allows the linker to simply treat a GOTPC
9686 * relocation as asking for a pcrel offset to the GOT to be
9687 * added in, and the addend of the relocation is stored in the
9688 * operand field for the instruction itself.
9689 *
9690 * Our job here is to fix the operand so that it would add
9691 * the correct offset so that %ebx would point to itself. The
9692 * thing that is tricky is that .-.L66 will point to the
9693 * beginning of the instruction, so we need to further modify
9694 * the operand so that it will point to itself. There are
9695 * other cases where you have something like:
9696 *
9697 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9698 *
9699 * and here no correction would be required. Internally in
9700 * the assembler we treat operands of this form as not being
9701 * pcrel since the '.' is explicitly mentioned, and I wonder
9702 * whether it would simplify matters to do it this way. Who
9703 * knows. In earlier versions of the PIC patches, the
9704 * pcrel_adjust field was used to store the correction, but
9705 * since the expression is not pcrel, I felt it would be
9706 * confusing to do it this way. */
9707
9708 if ((reloc_type == BFD_RELOC_32
9709 || reloc_type == BFD_RELOC_X86_64_32S
9710 || reloc_type == BFD_RELOC_64)
9711 && GOT_symbol
9712 && GOT_symbol == i.op[n].imms->X_add_symbol
9713 && (i.op[n].imms->X_op == O_symbol
9714 || (i.op[n].imms->X_op == O_add
9715 && ((symbol_get_value_expression
9716 (i.op[n].imms->X_op_symbol)->X_op)
9717 == O_subtract))))
9718 {
9719 if (!object_64bit)
9720 reloc_type = BFD_RELOC_386_GOTPC;
9721 else if (size == 4)
9722 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9723 else if (size == 8)
9724 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9725 i.has_gotpc_tls_reloc = TRUE;
9726 i.op[n].imms->X_add_number +=
9727 encoding_length (insn_start_frag, insn_start_off, p);
9728 }
9729 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9730 i.op[n].imms, 0, reloc_type);
9731 }
9732 }
9733 }
9734 }
9735 \f
9736 /* x86_cons_fix_new is called via the expression parsing code when a
9737 reloc is needed. We use this hook to get the correct .got reloc. */
9738 static int cons_sign = -1;
9739
9740 void
9741 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9742 expressionS *exp, bfd_reloc_code_real_type r)
9743 {
9744 r = reloc (len, 0, cons_sign, r);
9745
9746 #ifdef TE_PE
9747 if (exp->X_op == O_secrel)
9748 {
9749 exp->X_op = O_symbol;
9750 r = BFD_RELOC_32_SECREL;
9751 }
9752 #endif
9753
9754 fix_new_exp (frag, off, len, exp, 0, r);
9755 }
9756
9757 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9758 purpose of the `.dc.a' internal pseudo-op. */
9759
9760 int
9761 x86_address_bytes (void)
9762 {
9763 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9764 return 4;
9765 return stdoutput->arch_info->bits_per_address / 8;
9766 }
9767
9768 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9769 || defined (LEX_AT)
9770 # define lex_got(reloc, adjust, types) NULL
9771 #else
9772 /* Parse operands of the form
9773 <symbol>@GOTOFF+<nnn>
9774 and similar .plt or .got references.
9775
9776 If we find one, set up the correct relocation in RELOC and copy the
9777 input string, minus the `@GOTOFF' into a malloc'd buffer for
9778 parsing by the calling routine. Return this buffer, and if ADJUST
9779 is non-null set it to the length of the string we removed from the
9780 input line. Otherwise return NULL. */
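/* For example (derived from the code below): given the input
   "foo@GOTOFF+4" in 32-bit ELF mode, *rel becomes
   BFD_RELOC_386_GOTOFF and the returned buffer holds "foo +4";
   the reloc token is overwritten with a space so that trailing
   junk such as "foo@GOTOFF1" is still diagnosed.  */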
9781 static char *
9782 lex_got (enum bfd_reloc_code_real *rel,
9783 int *adjust,
9784 i386_operand_type *types)
9785 {
9786 /* Some of the relocations depend on the size of the field to be
9787 relocated. But in our callers i386_immediate and i386_displacement
9788 we don't yet know the operand size (this will be set by insn
9789 matching). Hence we record the word32 relocation here,
9790 and adjust the reloc according to the real size in reloc(). */
9791 static const struct {
9792 const char *str;
9793 int len;
9794 const enum bfd_reloc_code_real rel[2];
9795 const i386_operand_type types64;
9796 } gotrel[] = {
9797 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9798 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9799 BFD_RELOC_SIZE32 },
9800 OPERAND_TYPE_IMM32_64 },
9801 #endif
9802 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9803 BFD_RELOC_X86_64_PLTOFF64 },
9804 OPERAND_TYPE_IMM64 },
9805 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9806 BFD_RELOC_X86_64_PLT32 },
9807 OPERAND_TYPE_IMM32_32S_DISP32 },
9808 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9809 BFD_RELOC_X86_64_GOTPLT64 },
9810 OPERAND_TYPE_IMM64_DISP64 },
9811 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9812 BFD_RELOC_X86_64_GOTOFF64 },
9813 OPERAND_TYPE_IMM64_DISP64 },
9814 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9815 BFD_RELOC_X86_64_GOTPCREL },
9816 OPERAND_TYPE_IMM32_32S_DISP32 },
9817 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9818 BFD_RELOC_X86_64_TLSGD },
9819 OPERAND_TYPE_IMM32_32S_DISP32 },
9820 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9821 _dummy_first_bfd_reloc_code_real },
9822 OPERAND_TYPE_NONE },
9823 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9824 BFD_RELOC_X86_64_TLSLD },
9825 OPERAND_TYPE_IMM32_32S_DISP32 },
9826 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9827 BFD_RELOC_X86_64_GOTTPOFF },
9828 OPERAND_TYPE_IMM32_32S_DISP32 },
9829 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9830 BFD_RELOC_X86_64_TPOFF32 },
9831 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9832 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9833 _dummy_first_bfd_reloc_code_real },
9834 OPERAND_TYPE_NONE },
9835 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9836 BFD_RELOC_X86_64_DTPOFF32 },
9837 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9838 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9839 _dummy_first_bfd_reloc_code_real },
9840 OPERAND_TYPE_NONE },
9841 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9842 _dummy_first_bfd_reloc_code_real },
9843 OPERAND_TYPE_NONE },
9844 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9845 BFD_RELOC_X86_64_GOT32 },
9846 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9847 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9848 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9849 OPERAND_TYPE_IMM32_32S_DISP32 },
9850 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9851 BFD_RELOC_X86_64_TLSDESC_CALL },
9852 OPERAND_TYPE_IMM32_32S_DISP32 },
9853 };
9854 char *cp;
9855 unsigned int j;
9856
9857 #if defined (OBJ_MAYBE_ELF)
9858 if (!IS_ELF)
9859 return NULL;
9860 #endif
9861
9862 for (cp = input_line_pointer; *cp != '@'; cp++)
9863 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9864 return NULL;
9865
9866 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9867 {
9868 int len = gotrel[j].len;
9869 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9870 {
9871 if (gotrel[j].rel[object_64bit] != 0)
9872 {
9873 int first, second;
9874 char *tmpbuf, *past_reloc;
9875
9876 *rel = gotrel[j].rel[object_64bit];
9877
9878 if (types)
9879 {
9880 if (flag_code != CODE_64BIT)
9881 {
9882 types->bitfield.imm32 = 1;
9883 types->bitfield.disp32 = 1;
9884 }
9885 else
9886 *types = gotrel[j].types64;
9887 }
9888
9889 if (j != 0 && GOT_symbol == NULL)
9890 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9891
9892 /* The length of the first part of our input line. */
9893 first = cp - input_line_pointer;
9894
9895 /* The second part goes from after the reloc token until
9896 (and including) an end_of_line char or comma. */
9897 past_reloc = cp + 1 + len;
9898 cp = past_reloc;
9899 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9900 ++cp;
9901 second = cp + 1 - past_reloc;
9902
9903 /* Allocate and copy string. The trailing NUL shouldn't
9904 be necessary, but be safe. */
9905 tmpbuf = XNEWVEC (char, first + second + 2);
9906 memcpy (tmpbuf, input_line_pointer, first);
9907 if (second != 0 && *past_reloc != ' ')
9908 /* Replace the relocation token with ' ', so that
9909 errors like foo@GOTOFF1 will be detected. */
9910 tmpbuf[first++] = ' ';
9911 else
9912 /* Increment length by 1 if the relocation token is
9913 removed. */
9914 len++;
9915 if (adjust)
9916 *adjust = len;
9917 memcpy (tmpbuf + first, past_reloc, second);
9918 tmpbuf[first + second] = '\0';
9919 return tmpbuf;
9920 }
9921
9922 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9923 gotrel[j].str, 1 << (5 + object_64bit));
9924 return NULL;
9925 }
9926 }
9927
9928 /* Might be a symbol version string. Don't as_bad here. */
9929 return NULL;
9930 }
9931 #endif
9932
9933 #ifdef TE_PE
9934 #ifdef lex_got
9935 #undef lex_got
9936 #endif
9937 /* Parse operands of the form
9938 <symbol>@SECREL32+<nnn>
9939
9940 If we find one, set up the correct relocation in RELOC and copy the
9941 input string, minus the `@SECREL32' into a malloc'd buffer for
9942 parsing by the calling routine. Return this buffer, and if ADJUST
9943 is non-null set it to the length of the string we removed from the
9944 input line. Otherwise return NULL.
9945
9946 This function is copied from the ELF version above, adjusted for PE targets. */
9947
9948 static char *
9949 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9950 int *adjust ATTRIBUTE_UNUSED,
9951 i386_operand_type *types)
9952 {
9953 static const struct
9954 {
9955 const char *str;
9956 int len;
9957 const enum bfd_reloc_code_real rel[2];
9958 const i386_operand_type types64;
9959 }
9960 gotrel[] =
9961 {
9962 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
9963 BFD_RELOC_32_SECREL },
9964 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9965 };
9966
9967 char *cp;
9968 unsigned j;
9969
9970 for (cp = input_line_pointer; *cp != '@'; cp++)
9971 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9972 return NULL;
9973
9974 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9975 {
9976 int len = gotrel[j].len;
9977
9978 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9979 {
9980 if (gotrel[j].rel[object_64bit] != 0)
9981 {
9982 int first, second;
9983 char *tmpbuf, *past_reloc;
9984
9985 *rel = gotrel[j].rel[object_64bit];
9986 if (adjust)
9987 *adjust = len;
9988
9989 if (types)
9990 {
9991 if (flag_code != CODE_64BIT)
9992 {
9993 types->bitfield.imm32 = 1;
9994 types->bitfield.disp32 = 1;
9995 }
9996 else
9997 *types = gotrel[j].types64;
9998 }
9999
10000 /* The length of the first part of our input line. */
10001 first = cp - input_line_pointer;
10002
10003 /* The second part goes from after the reloc token until
10004 (and including) an end_of_line char or comma. */
10005 past_reloc = cp + 1 + len;
10006 cp = past_reloc;
10007 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10008 ++cp;
10009 second = cp + 1 - past_reloc;
10010
10011 /* Allocate and copy string. The trailing NUL shouldn't
10012 be necessary, but be safe. */
10013 tmpbuf = XNEWVEC (char, first + second + 2);
10014 memcpy (tmpbuf, input_line_pointer, first);
10015 if (second != 0 && *past_reloc != ' ')
10016 /* Replace the relocation token with ' ', so that
10017 errors like foo@SECREL321 will be detected. */
10018 tmpbuf[first++] = ' ';
10019 memcpy (tmpbuf + first, past_reloc, second);
10020 tmpbuf[first + second] = '\0';
10021 return tmpbuf;
10022 }
10023
10024 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10025 gotrel[j].str, 1 << (5 + object_64bit));
10026 return NULL;
10027 }
10028 }
10029
10030 /* Might be a symbol version string. Don't as_bad here. */
10031 return NULL;
10032 }
10033
10034 #endif /* TE_PE */
10035
10036 bfd_reloc_code_real_type
10037 x86_cons (expressionS *exp, int size)
10038 {
10039 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10040
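/* Flip the sign of intel_syntax while parsing, presumably so that
   Intel-syntax helpers can tell (via a negative value) that we are
   inside a data directive rather than an insn operand; the original
   value is restored further down.  */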
10041 intel_syntax = -intel_syntax;
10042
10043 exp->X_md = 0;
10044 if (size == 4 || (object_64bit && size == 8))
10045 {
10046 /* Handle @GOTOFF and the like in an expression. */
10047 char *save;
10048 char *gotfree_input_line;
10049 int adjust = 0;
10050
10051 save = input_line_pointer;
10052 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10053 if (gotfree_input_line)
10054 input_line_pointer = gotfree_input_line;
10055
10056 expression (exp);
10057
10058 if (gotfree_input_line)
10059 {
10060 /* expression () has merrily parsed up to the end of line,
10061 or a comma - in the wrong buffer. Transfer how far
10062 input_line_pointer has moved to the right buffer. */
10063 input_line_pointer = (save
10064 + (input_line_pointer - gotfree_input_line)
10065 + adjust);
10066 free (gotfree_input_line);
10067 if (exp->X_op == O_constant
10068 || exp->X_op == O_absent
10069 || exp->X_op == O_illegal
10070 || exp->X_op == O_register
10071 || exp->X_op == O_big)
10072 {
10073 char c = *input_line_pointer;
10074 *input_line_pointer = 0;
10075 as_bad (_("missing or invalid expression `%s'"), save);
10076 *input_line_pointer = c;
10077 }
10078 else if ((got_reloc == BFD_RELOC_386_PLT32
10079 || got_reloc == BFD_RELOC_X86_64_PLT32)
10080 && exp->X_op != O_symbol)
10081 {
10082 char c = *input_line_pointer;
10083 *input_line_pointer = 0;
10084 as_bad (_("invalid PLT expression `%s'"), save);
10085 *input_line_pointer = c;
10086 }
10087 }
10088 }
10089 else
10090 expression (exp);
10091
10092 intel_syntax = -intel_syntax;
10093
10094 if (intel_syntax)
10095 i386_intel_simplify (exp);
10096
10097 return got_reloc;
10098 }
10099
10100 static void
10101 signed_cons (int size)
10102 {
10103 if (flag_code == CODE_64BIT)
10104 cons_sign = 1;
10105 cons (size);
10106 cons_sign = -1;
10107 }
10108
10109 #ifdef TE_PE
10110 static void
10111 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10112 {
10113 expressionS exp;
10114
10115 do
10116 {
10117 expression (&exp);
10118 if (exp.X_op == O_symbol)
10119 exp.X_op = O_secrel;
10120
10121 emit_expr (&exp, 4);
10122 }
10123 while (*input_line_pointer++ == ',');
10124
10125 input_line_pointer--;
10126 demand_empty_rest_of_line ();
10127 }
10128 #endif
10129
10130 /* Handle Vector operations. */
10131
10132 static char *
10133 check_VecOperations (char *op_string, char *op_end)
10134 {
10135 const reg_entry *mask;
10136 const char *saved;
10137 char *end_op;
10138
10139 while (*op_string
10140 && (op_end == NULL || op_string < op_end))
10141 {
10142 saved = op_string;
10143 if (*op_string == '{')
10144 {
10145 op_string++;
10146
10147 /* Check broadcasts. */
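/* E.g. the "{1to8}" in "vaddpd (%rax){1to8}, %zmm1, %zmm2"
   (illustrative) requests an 8-element embedded broadcast.  */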
10148 if (strncmp (op_string, "1to", 3) == 0)
10149 {
10150 int bcst_type;
10151
10152 if (i.broadcast)
10153 goto duplicated_vec_op;
10154
10155 op_string += 3;
10156 if (*op_string == '8')
10157 bcst_type = 8;
10158 else if (*op_string == '4')
10159 bcst_type = 4;
10160 else if (*op_string == '2')
10161 bcst_type = 2;
10162 else if (*op_string == '1'
10163 && *(op_string+1) == '6')
10164 {
10165 bcst_type = 16;
10166 op_string++;
10167 }
10168 else
10169 {
10170 as_bad (_("Unsupported broadcast: `%s'"), saved);
10171 return NULL;
10172 }
10173 op_string++;
10174
10175 broadcast_op.type = bcst_type;
10176 broadcast_op.operand = this_operand;
10177 broadcast_op.bytes = 0;
10178 i.broadcast = &broadcast_op;
10179 }
10180 /* Check masking operation. */
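/* E.g. the "{%k1}" in "vmovaps %zmm0, %zmm1{%k1}" (illustrative)
   selects %k1 as the write mask; %k0 is rejected below since its
   encoding means "no masking".  */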
10181 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10182 {
10183 if (mask == &bad_reg)
10184 return NULL;
10185
10186 /* k0 can't be used for write mask. */
10187 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10188 {
10189 as_bad (_("`%s%s' can't be used for write mask"),
10190 register_prefix, mask->reg_name);
10191 return NULL;
10192 }
10193
10194 if (!i.mask)
10195 {
10196 mask_op.mask = mask;
10197 mask_op.zeroing = 0;
10198 mask_op.operand = this_operand;
10199 i.mask = &mask_op;
10200 }
10201 else
10202 {
10203 if (i.mask->mask)
10204 goto duplicated_vec_op;
10205
10206 i.mask->mask = mask;
10207
10208 /* Only "{z}" is allowed here. No need to check
10209 zeroing mask explicitly. */
10210 if (i.mask->operand != this_operand)
10211 {
10212 as_bad (_("invalid write mask `%s'"), saved);
10213 return NULL;
10214 }
10215 }
10216
10217 op_string = end_op;
10218 }
10219 /* Check zeroing-flag for masking operation. */
10220 else if (*op_string == 'z')
10221 {
10222 if (!i.mask)
10223 {
10224 mask_op.mask = NULL;
10225 mask_op.zeroing = 1;
10226 mask_op.operand = this_operand;
10227 i.mask = &mask_op;
10228 }
10229 else
10230 {
10231 if (i.mask->zeroing)
10232 {
10233 duplicated_vec_op:
10234 as_bad (_("duplicated `%s'"), saved);
10235 return NULL;
10236 }
10237
10238 i.mask->zeroing = 1;
10239
10240 /* Only "{%k}" is allowed here. No need to check mask
10241 register explicitly. */
10242 if (i.mask->operand != this_operand)
10243 {
10244 as_bad (_("invalid zeroing-masking `%s'"),
10245 saved);
10246 return NULL;
10247 }
10248 }
10249
10250 op_string++;
10251 }
10252 else
10253 goto unknown_vec_op;
10254
10255 if (*op_string != '}')
10256 {
10257 as_bad (_("missing `}' in `%s'"), saved);
10258 return NULL;
10259 }
10260 op_string++;
10261
10262 /* Strip whitespace since the addition of pseudo prefixes
10263 changed how the scrubber treats '{'. */
10264 if (is_space_char (*op_string))
10265 ++op_string;
10266
10267 continue;
10268 }
10269 unknown_vec_op:
10270 /* We don't know this one. */
10271 as_bad (_("unknown vector operation: `%s'"), saved);
10272 return NULL;
10273 }
10274
10275 if (i.mask && i.mask->zeroing && !i.mask->mask)
10276 {
10277 as_bad (_("zeroing-masking only allowed with write mask"));
10278 return NULL;
10279 }
10280
10281 return op_string;
10282 }
10283
10284 static int
10285 i386_immediate (char *imm_start)
10286 {
10287 char *save_input_line_pointer;
10288 char *gotfree_input_line;
10289 segT exp_seg = 0;
10290 expressionS *exp;
10291 i386_operand_type types;
10292
10293 operand_type_set (&types, ~0);
10294
10295 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10296 {
10297 as_bad (_("at most %d immediate operands are allowed"),
10298 MAX_IMMEDIATE_OPERANDS);
10299 return 0;
10300 }
10301
10302 exp = &im_expressions[i.imm_operands++];
10303 i.op[this_operand].imms = exp;
10304
10305 if (is_space_char (*imm_start))
10306 ++imm_start;
10307
10308 save_input_line_pointer = input_line_pointer;
10309 input_line_pointer = imm_start;
10310
10311 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10312 if (gotfree_input_line)
10313 input_line_pointer = gotfree_input_line;
10314
10315 exp_seg = expression (exp);
10316
10317 SKIP_WHITESPACE ();
10318
10319 /* Handle vector operations. */
10320 if (*input_line_pointer == '{')
10321 {
10322 input_line_pointer = check_VecOperations (input_line_pointer,
10323 NULL);
10324 if (input_line_pointer == NULL)
10325 return 0;
10326 }
10327
10328 if (*input_line_pointer)
10329 as_bad (_("junk `%s' after expression"), input_line_pointer);
10330
10331 input_line_pointer = save_input_line_pointer;
10332 if (gotfree_input_line)
10333 {
10334 free (gotfree_input_line);
10335
10336 if (exp->X_op == O_constant || exp->X_op == O_register)
10337 exp->X_op = O_illegal;
10338 }
10339
10340 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10341 }
10342
10343 static int
10344 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10345 i386_operand_type types, const char *imm_start)
10346 {
10347 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10348 {
10349 if (imm_start)
10350 as_bad (_("missing or invalid immediate expression `%s'"),
10351 imm_start);
10352 return 0;
10353 }
10354 else if (exp->X_op == O_constant)
10355 {
10356 /* Size it properly later. */
10357 i.types[this_operand].bitfield.imm64 = 1;
10358 /* If not 64bit, sign extend val. */
10359 if (flag_code != CODE_64BIT
10360 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10361 exp->X_add_number
10362 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10363 }
10364 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10365 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10366 && exp_seg != absolute_section
10367 && exp_seg != text_section
10368 && exp_seg != data_section
10369 && exp_seg != bss_section
10370 && exp_seg != undefined_section
10371 && !bfd_is_com_section (exp_seg))
10372 {
10373 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10374 return 0;
10375 }
10376 #endif
10377 else if (!intel_syntax && exp_seg == reg_section)
10378 {
10379 if (imm_start)
10380 as_bad (_("illegal immediate register operand %s"), imm_start);
10381 return 0;
10382 }
10383 else
10384 {
10385 /* This is an address. The size of the address will be
10386 determined later, depending on destination register,
10387 suffix, or the default for the section. */
10388 i.types[this_operand].bitfield.imm8 = 1;
10389 i.types[this_operand].bitfield.imm16 = 1;
10390 i.types[this_operand].bitfield.imm32 = 1;
10391 i.types[this_operand].bitfield.imm32s = 1;
10392 i.types[this_operand].bitfield.imm64 = 1;
10393 i.types[this_operand] = operand_type_and (i.types[this_operand],
10394 types);
10395 }
10396
10397 return 1;
10398 }
10399
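/* Parse the scale factor of a base/index memory operand, e.g. the
   "8" in "(%rax,%rbx,8)", which is stored as a log2 value (here 3).
   Return the updated scan position, or NULL for an invalid scale.  */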
10400 static char *
10401 i386_scale (char *scale)
10402 {
10403 offsetT val;
10404 char *save = input_line_pointer;
10405
10406 input_line_pointer = scale;
10407 val = get_absolute_expression ();
10408
10409 switch (val)
10410 {
10411 case 1:
10412 i.log2_scale_factor = 0;
10413 break;
10414 case 2:
10415 i.log2_scale_factor = 1;
10416 break;
10417 case 4:
10418 i.log2_scale_factor = 2;
10419 break;
10420 case 8:
10421 i.log2_scale_factor = 3;
10422 break;
10423 default:
10424 {
10425 char sep = *input_line_pointer;
10426
10427 *input_line_pointer = '\0';
10428 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10429 scale);
10430 *input_line_pointer = sep;
10431 input_line_pointer = save;
10432 return NULL;
10433 }
10434 }
10435 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10436 {
10437 as_warn (_("scale factor of %d without an index register"),
10438 1 << i.log2_scale_factor);
10439 i.log2_scale_factor = 0;
10440 }
10441 scale = input_line_pointer;
10442 input_line_pointer = save;
10443 return scale;
10444 }
10445
10446 static int
10447 i386_displacement (char *disp_start, char *disp_end)
10448 {
10449 expressionS *exp;
10450 segT exp_seg = 0;
10451 char *save_input_line_pointer;
10452 char *gotfree_input_line;
10453 int override;
10454 i386_operand_type bigdisp, types = anydisp;
10455 int ret;
10456
10457 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10458 {
10459 as_bad (_("at most %d displacement operands are allowed"),
10460 MAX_MEMORY_OPERANDS);
10461 return 0;
10462 }
10463
10464 operand_type_set (&bigdisp, 0);
10465 if (i.jumpabsolute
10466 || i.types[this_operand].bitfield.baseindex
10467 || (current_templates->start->opcode_modifier.jump != JUMP
10468 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10469 {
10470 i386_addressing_mode ();
10471 override = (i.prefix[ADDR_PREFIX] != 0);
10472 if (flag_code == CODE_64BIT)
10473 {
10474 if (!override)
10475 {
10476 bigdisp.bitfield.disp32s = 1;
10477 bigdisp.bitfield.disp64 = 1;
10478 }
10479 else
10480 bigdisp.bitfield.disp32 = 1;
10481 }
10482 else if ((flag_code == CODE_16BIT) ^ override)
10483 bigdisp.bitfield.disp16 = 1;
10484 else
10485 bigdisp.bitfield.disp32 = 1;
10486 }
10487 else
10488 {
10489 /* For PC-relative branches, the width of the displacement may be
10490 dependent upon data size, but is never dependent upon address size.
10491 Also make sure to not unintentionally match against a non-PC-relative
10492 branch template. */
10493 static templates aux_templates;
10494 const insn_template *t = current_templates->start;
10495 bfd_boolean has_intel64 = FALSE;
10496
10497 aux_templates.start = t;
10498 while (++t < current_templates->end)
10499 {
10500 if (t->opcode_modifier.jump
10501 != current_templates->start->opcode_modifier.jump)
10502 break;
10503 if ((t->opcode_modifier.isa64 >= INTEL64))
10504 has_intel64 = TRUE;
10505 }
10506 if (t < current_templates->end)
10507 {
10508 aux_templates.end = t;
10509 current_templates = &aux_templates;
10510 }
10511
10512 override = (i.prefix[DATA_PREFIX] != 0);
10513 if (flag_code == CODE_64BIT)
10514 {
10515 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10516 && (!intel64 || !has_intel64))
10517 bigdisp.bitfield.disp16 = 1;
10518 else
10519 bigdisp.bitfield.disp32s = 1;
10520 }
10521 else
10522 {
10523 if (!override)
10524 override = (i.suffix == (flag_code != CODE_16BIT
10525 ? WORD_MNEM_SUFFIX
10526 : LONG_MNEM_SUFFIX));
10527 bigdisp.bitfield.disp32 = 1;
10528 if ((flag_code == CODE_16BIT) ^ override)
10529 {
10530 bigdisp.bitfield.disp32 = 0;
10531 bigdisp.bitfield.disp16 = 1;
10532 }
10533 }
10534 }
10535 i.types[this_operand] = operand_type_or (i.types[this_operand],
10536 bigdisp);
10537
10538 exp = &disp_expressions[i.disp_operands];
10539 i.op[this_operand].disps = exp;
10540 i.disp_operands++;
10541 save_input_line_pointer = input_line_pointer;
10542 input_line_pointer = disp_start;
10543 END_STRING_AND_SAVE (disp_end);
10544
10545 #ifndef GCC_ASM_O_HACK
10546 #define GCC_ASM_O_HACK 0
10547 #endif
10548 #if GCC_ASM_O_HACK
10549 END_STRING_AND_SAVE (disp_end + 1);
10550 if (i.types[this_operand].bitfield.baseindex
10551 && disp_end[-1] == '+')
10552 {
10553 /* This hack is to avoid a warning when using the "o"
10554 constraint within gcc asm statements.
10555 For instance:
10556
10557 #define _set_tssldt_desc(n,addr,limit,type) \
10558 __asm__ __volatile__ ( \
10559 "movw %w2,%0\n\t" \
10560 "movw %w1,2+%0\n\t" \
10561 "rorl $16,%1\n\t" \
10562 "movb %b1,4+%0\n\t" \
10563 "movb %4,5+%0\n\t" \
10564 "movb $0,6+%0\n\t" \
10565 "movb %h1,7+%0\n\t" \
10566 "rorl $16,%1" \
10567 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10568
10569 This works great except that the output assembler ends
10570 up looking a bit weird if it turns out that there is
10571 no offset. You end up producing code that looks like:
10572
10573 #APP
10574 movw $235,(%eax)
10575 movw %dx,2+(%eax)
10576 rorl $16,%edx
10577 movb %dl,4+(%eax)
10578 movb $137,5+(%eax)
10579 movb $0,6+(%eax)
10580 movb %dh,7+(%eax)
10581 rorl $16,%edx
10582 #NO_APP
10583
10584 So here we provide the missing zero. */
10585
10586 *disp_end = '0';
10587 }
10588 #endif
10589 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10590 if (gotfree_input_line)
10591 input_line_pointer = gotfree_input_line;
10592
10593 exp_seg = expression (exp);
10594
10595 SKIP_WHITESPACE ();
10596 if (*input_line_pointer)
10597 as_bad (_("junk `%s' after expression"), input_line_pointer);
10598 #if GCC_ASM_O_HACK
10599 RESTORE_END_STRING (disp_end + 1);
10600 #endif
10601 input_line_pointer = save_input_line_pointer;
10602 if (gotfree_input_line)
10603 {
10604 free (gotfree_input_line);
10605
10606 if (exp->X_op == O_constant || exp->X_op == O_register)
10607 exp->X_op = O_illegal;
10608 }
10609
10610 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10611
10612 RESTORE_END_STRING (disp_end);
10613
10614 return ret;
10615 }
10616
10617 static int
10618 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10619 i386_operand_type types, const char *disp_start)
10620 {
10621 i386_operand_type bigdisp;
10622 int ret = 1;
10623
10624 /* We do this to make sure that the section symbol is in
10625 the symbol table. We will ultimately change the relocation
10626 to be relative to the beginning of the section. */
10627 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10628 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10629 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10630 {
10631 if (exp->X_op != O_symbol)
10632 goto inv_disp;
10633
10634 if (S_IS_LOCAL (exp->X_add_symbol)
10635 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10636 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10637 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10638 exp->X_op = O_subtract;
10639 exp->X_op_symbol = GOT_symbol;
10640 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10641 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10642 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10643 i.reloc[this_operand] = BFD_RELOC_64;
10644 else
10645 i.reloc[this_operand] = BFD_RELOC_32;
10646 }
10647
10648 else if (exp->X_op == O_absent
10649 || exp->X_op == O_illegal
10650 || exp->X_op == O_big)
10651 {
10652 inv_disp:
10653 as_bad (_("missing or invalid displacement expression `%s'"),
10654 disp_start);
10655 ret = 0;
10656 }
10657
10658 else if (flag_code == CODE_64BIT
10659 && !i.prefix[ADDR_PREFIX]
10660 && exp->X_op == O_constant)
10661 {
10662 /* Since the displacement is sign-extended to 64 bits, don't allow
10663 disp32, and turn off disp32s if the value is out of range. */
10664 i.types[this_operand].bitfield.disp32 = 0;
10665 if (!fits_in_signed_long (exp->X_add_number))
10666 {
10667 i.types[this_operand].bitfield.disp32s = 0;
10668 if (i.types[this_operand].bitfield.baseindex)
10669 {
10670 as_bad (_("0x%lx out of range of signed 32bit displacement"),
10671 (long) exp->X_add_number);
10672 ret = 0;
10673 }
10674 }
10675 }
10676
10677 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10678 else if (exp->X_op != O_constant
10679 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10680 && exp_seg != absolute_section
10681 && exp_seg != text_section
10682 && exp_seg != data_section
10683 && exp_seg != bss_section
10684 && exp_seg != undefined_section
10685 && !bfd_is_com_section (exp_seg))
10686 {
10687 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10688 ret = 0;
10689 }
10690 #endif
10691
10692 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10693 /* Constants get taken care of by optimize_disp(). */
10694 && exp->X_op != O_constant)
10695 i.types[this_operand].bitfield.disp8 = 1;
10696
10697 /* Check if this is a displacement only operand. */
10698 bigdisp = i.types[this_operand];
10699 bigdisp.bitfield.disp8 = 0;
10700 bigdisp.bitfield.disp16 = 0;
10701 bigdisp.bitfield.disp32 = 0;
10702 bigdisp.bitfield.disp32s = 0;
10703 bigdisp.bitfield.disp64 = 0;
10704 if (operand_type_all_zero (&bigdisp))
10705 i.types[this_operand] = operand_type_and (i.types[this_operand],
10706 types);
10707
10708 return ret;
10709 }
10710
10711 /* Return the active addressing mode, taking address override and
10712 registers forming the address into consideration. Update the
10713 address override prefix if necessary. */
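/* For instance (illustrative), "movl (%eax), %ebx" assembled in
   64-bit mode has a 32-bit base register, so addr_mode becomes
   CODE_32BIT and an address-size override prefix is inferred
   below.  */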
10714
10715 static enum flag_code
10716 i386_addressing_mode (void)
10717 {
10718 enum flag_code addr_mode;
10719
10720 if (i.prefix[ADDR_PREFIX])
10721 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10722 else if (flag_code == CODE_16BIT
10723 && current_templates->start->cpu_flags.bitfield.cpumpx
10724 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10725 from md_assemble() by "is not a valid base/index expression"
10726 when there is a base and/or index. */
10727 && !i.types[this_operand].bitfield.baseindex)
10728 {
10729 /* MPX insn memory operands with neither base nor index must be forced
10730 to use 32-bit addressing in 16-bit mode. */
10731 addr_mode = CODE_32BIT;
10732 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10733 ++i.prefixes;
10734 gas_assert (!i.types[this_operand].bitfield.disp16);
10735 gas_assert (!i.types[this_operand].bitfield.disp32);
10736 }
10737 else
10738 {
10739 addr_mode = flag_code;
10740
10741 #if INFER_ADDR_PREFIX
10742 if (i.mem_operands == 0)
10743 {
10744 /* Infer address prefix from the first memory operand. */
10745 const reg_entry *addr_reg = i.base_reg;
10746
10747 if (addr_reg == NULL)
10748 addr_reg = i.index_reg;
10749
10750 if (addr_reg)
10751 {
10752 if (addr_reg->reg_type.bitfield.dword)
10753 addr_mode = CODE_32BIT;
10754 else if (flag_code != CODE_64BIT
10755 && addr_reg->reg_type.bitfield.word)
10756 addr_mode = CODE_16BIT;
10757
10758 if (addr_mode != flag_code)
10759 {
10760 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10761 i.prefixes += 1;
10762 /* Change the size of any displacement too. At most one
10763 of Disp16 or Disp32 is set.
10764 FIXME. There doesn't seem to be any real need for
10765 separate Disp16 and Disp32 flags. The same goes for
10766 Imm16 and Imm32. Removing them would probably clean
10767 up the code quite a lot. */
10768 if (flag_code != CODE_64BIT
10769 && (i.types[this_operand].bitfield.disp16
10770 || i.types[this_operand].bitfield.disp32))
10771 i.types[this_operand]
10772 = operand_type_xor (i.types[this_operand], disp16_32);
10773 }
10774 }
10775 }
10776 #endif
10777 }
10778
10779 return addr_mode;
10780 }
10781
10782 /* Make sure the memory operand we've been dealt is valid.
10783 Return 1 on success, 0 on a failure. */
10784
10785 static int
10786 i386_index_check (const char *operand_string)
10787 {
10788 const char *kind = "base/index";
10789 enum flag_code addr_mode = i386_addressing_mode ();
10790
10791 if (current_templates->start->opcode_modifier.isstring
10792 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10793 && (current_templates->end[-1].opcode_modifier.isstring
10794 || i.mem_operands))
10795 {
10796 /* Memory operands of string insns are special in that they only allow
10797 a single register (rDI, rSI, or rBX) as their memory address. */
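/* E.g. "movsb" implicitly uses %ds:(%rsi) and %es:(%rdi) while
   "xlat" uses (%rbx); an explicit memory operand must name exactly
   the expected register (illustrative).  */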
10798 const reg_entry *expected_reg;
10799 static const char *di_si[][2] =
10800 {
10801 { "esi", "edi" },
10802 { "si", "di" },
10803 { "rsi", "rdi" }
10804 };
10805 static const char *bx[] = { "ebx", "bx", "rbx" };
10806
10807 kind = "string address";
10808
10809 if (current_templates->start->opcode_modifier.repprefixok)
10810 {
10811 int es_op = current_templates->end[-1].opcode_modifier.isstring
10812 - IS_STRING_ES_OP0;
10813 int op = 0;
10814
10815 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10816 || ((!i.mem_operands != !intel_syntax)
10817 && current_templates->end[-1].operand_types[1]
10818 .bitfield.baseindex))
10819 op = 1;
10820 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10821 }
10822 else
10823 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10824
10825 if (i.base_reg != expected_reg
10826 || i.index_reg
10827 || operand_type_check (i.types[this_operand], disp))
10828 {
10829 /* The second memory operand must have the same size as
10830 the first one. */
10831 if (i.mem_operands
10832 && i.base_reg
10833 && !((addr_mode == CODE_64BIT
10834 && i.base_reg->reg_type.bitfield.qword)
10835 || (addr_mode == CODE_32BIT
10836 ? i.base_reg->reg_type.bitfield.dword
10837 : i.base_reg->reg_type.bitfield.word)))
10838 goto bad_address;
10839
10840 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10841 operand_string,
10842 intel_syntax ? '[' : '(',
10843 register_prefix,
10844 expected_reg->reg_name,
10845 intel_syntax ? ']' : ')');
10846 return 1;
10847 }
10848 else
10849 return 1;
10850
10851 bad_address:
10852 as_bad (_("`%s' is not a valid %s expression"),
10853 operand_string, kind);
10854 return 0;
10855 }
10856 else
10857 {
10858 if (addr_mode != CODE_16BIT)
10859 {
10860 /* 32-bit/64-bit checks. */
10861 if ((i.base_reg
10862 && ((addr_mode == CODE_64BIT
10863 ? !i.base_reg->reg_type.bitfield.qword
10864 : !i.base_reg->reg_type.bitfield.dword)
10865 || (i.index_reg && i.base_reg->reg_num == RegIP)
10866 || i.base_reg->reg_num == RegIZ))
10867 || (i.index_reg
10868 && !i.index_reg->reg_type.bitfield.xmmword
10869 && !i.index_reg->reg_type.bitfield.ymmword
10870 && !i.index_reg->reg_type.bitfield.zmmword
10871 && ((addr_mode == CODE_64BIT
10872 ? !i.index_reg->reg_type.bitfield.qword
10873 : !i.index_reg->reg_type.bitfield.dword)
10874 || !i.index_reg->reg_type.bitfield.baseindex)))
10875 goto bad_address;
10876
10877 /* bndmk, bndldx, and bndstx have special restrictions. */
10878 if (current_templates->start->base_opcode == 0xf30f1b
10879 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10880 {
10881 /* They cannot use RIP-relative addressing. */
10882 if (i.base_reg && i.base_reg->reg_num == RegIP)
10883 {
10884 as_bad (_("`%s' cannot be used here"), operand_string);
10885 return 0;
10886 }
10887
10888 /* bndldx and bndstx ignore their scale factor. */
10889 if (current_templates->start->base_opcode != 0xf30f1b
10890 && i.log2_scale_factor)
10891 as_warn (_("register scaling is being ignored here"));
10892 }
10893 }
10894 else
10895 {
10896 /* 16-bit checks. */
10897 if ((i.base_reg
10898 && (!i.base_reg->reg_type.bitfield.word
10899 || !i.base_reg->reg_type.bitfield.baseindex))
10900 || (i.index_reg
10901 && (!i.index_reg->reg_type.bitfield.word
10902 || !i.index_reg->reg_type.bitfield.baseindex
10903 || !(i.base_reg
10904 && i.base_reg->reg_num < 6
10905 && i.index_reg->reg_num >= 6
10906 && i.log2_scale_factor == 0))))
10907 goto bad_address;
10908 }
10909 }
10910 return 1;
10911 }
10912
10913 /* Handle vector immediates. */
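/* These are the rounding-control / suppress-all-exceptions pseudo
   operands, e.g. the "{rn-sae}" in "vaddpd {rn-sae}, %zmm1, %zmm2,
   %zmm3" (illustrative).  The parsed choice is recorded in
   i.rounding and a dummy zero imm8 operand is created below.  */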
10914
10915 static int
10916 RC_SAE_immediate (const char *imm_start)
10917 {
10918 unsigned int match_found, j;
10919 const char *pstr = imm_start;
10920 expressionS *exp;
10921
10922 if (*pstr != '{')
10923 return 0;
10924
10925 pstr++;
10926 match_found = 0;
10927 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10928 {
10929 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10930 {
10931 if (!i.rounding)
10932 {
10933 rc_op.type = RC_NamesTable[j].type;
10934 rc_op.operand = this_operand;
10935 i.rounding = &rc_op;
10936 }
10937 else
10938 {
10939 as_bad (_("duplicated `%s'"), imm_start);
10940 return 0;
10941 }
10942 pstr += RC_NamesTable[j].len;
10943 match_found = 1;
10944 break;
10945 }
10946 }
10947 if (!match_found)
10948 return 0;
10949
10950 if (*pstr++ != '}')
10951 {
10952 as_bad (_("Missing '}': '%s'"), imm_start);
10953 return 0;
10954 }
10955 /* RC/SAE immediate string should contain nothing more. */
10956 if (*pstr != 0)
10957 {
10958 as_bad (_("Junk after '}': '%s'"), imm_start);
10959 return 0;
10960 }
10961
10962 exp = &im_expressions[i.imm_operands++];
10963 i.op[this_operand].imms = exp;
10964
10965 exp->X_op = O_constant;
10966 exp->X_add_number = 0;
10967 exp->X_add_symbol = (symbolS *) 0;
10968 exp->X_op_symbol = (symbolS *) 0;
10969
10970 i.types[this_operand].bitfield.imm8 = 1;
10971 return 1;
10972 }
10973
10974 /* Only string instructions can have a second memory operand, so
10975 reduce current_templates to just those if it contains any. */
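/* E.g. "movsl %ds:(%esi), %es:(%edi)" (illustrative) legitimately
   carries two memory operands, which only the string templates
   allow.  */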
10976 static int
10977 maybe_adjust_templates (void)
10978 {
10979 const insn_template *t;
10980
10981 gas_assert (i.mem_operands == 1);
10982
10983 for (t = current_templates->start; t < current_templates->end; ++t)
10984 if (t->opcode_modifier.isstring)
10985 break;
10986
10987 if (t < current_templates->end)
10988 {
10989 static templates aux_templates;
10990 bfd_boolean recheck;
10991
10992 aux_templates.start = t;
10993 for (; t < current_templates->end; ++t)
10994 if (!t->opcode_modifier.isstring)
10995 break;
10996 aux_templates.end = t;
10997
10998 /* Determine whether to re-check the first memory operand. */
10999 recheck = (aux_templates.start != current_templates->start
11000 || t != current_templates->end);
11001
11002 current_templates = &aux_templates;
11003
11004 if (recheck)
11005 {
11006 i.mem_operands = 0;
11007 if (i.memop1_string != NULL
11008 && i386_index_check (i.memop1_string) == 0)
11009 return 0;
11010 i.mem_operands = 1;
11011 }
11012 }
11013
11014 return 1;
11015 }
11016
11017 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11018 on error. */
11019
11020 static int
11021 i386_att_operand (char *operand_string)
11022 {
11023 const reg_entry *r;
11024 char *end_op;
11025 char *op_string = operand_string;
11026
11027 if (is_space_char (*op_string))
11028 ++op_string;
11029
11030 /* We check for an absolute prefix (differentiating,
11031 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'). */
11032 if (*op_string == ABSOLUTE_PREFIX)
11033 {
11034 ++op_string;
11035 if (is_space_char (*op_string))
11036 ++op_string;
11037 i.jumpabsolute = TRUE;
11038 }
11039
11040 /* Check if operand is a register. */
11041 if ((r = parse_register (op_string, &end_op)) != NULL)
11042 {
11043 i386_operand_type temp;
11044
11045 if (r == &bad_reg)
11046 return 0;
11047
11048 /* Check for a segment override by searching for ':' after a
11049 segment register. */
11050 op_string = end_op;
11051 if (is_space_char (*op_string))
11052 ++op_string;
11053 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11054 {
11055 switch (r->reg_num)
11056 {
11057 case 0:
11058 i.seg[i.mem_operands] = &es;
11059 break;
11060 case 1:
11061 i.seg[i.mem_operands] = &cs;
11062 break;
11063 case 2:
11064 i.seg[i.mem_operands] = &ss;
11065 break;
11066 case 3:
11067 i.seg[i.mem_operands] = &ds;
11068 break;
11069 case 4:
11070 i.seg[i.mem_operands] = &fs;
11071 break;
11072 case 5:
11073 i.seg[i.mem_operands] = &gs;
11074 break;
11075 }
11076
11077 /* Skip the ':' and whitespace. */
11078 ++op_string;
11079 if (is_space_char (*op_string))
11080 ++op_string;
11081
11082 if (!is_digit_char (*op_string)
11083 && !is_identifier_char (*op_string)
11084 && *op_string != '('
11085 && *op_string != ABSOLUTE_PREFIX)
11086 {
11087 as_bad (_("bad memory operand `%s'"), op_string);
11088 return 0;
11089 }
11090 /* Handle case of %es:*foo. */
11091 if (*op_string == ABSOLUTE_PREFIX)
11092 {
11093 ++op_string;
11094 if (is_space_char (*op_string))
11095 ++op_string;
11096 i.jumpabsolute = TRUE;
11097 }
11098 goto do_memory_reference;
11099 }
11100
11101 /* Handle vector operations. */
11102 if (*op_string == '{')
11103 {
11104 op_string = check_VecOperations (op_string, NULL);
11105 if (op_string == NULL)
11106 return 0;
11107 }
11108
11109 if (*op_string)
11110 {
11111 as_bad (_("junk `%s' after register"), op_string);
11112 return 0;
11113 }
11114 temp = r->reg_type;
11115 temp.bitfield.baseindex = 0;
11116 i.types[this_operand] = operand_type_or (i.types[this_operand],
11117 temp);
11118 i.types[this_operand].bitfield.unspecified = 0;
11119 i.op[this_operand].regs = r;
11120 i.reg_operands++;
11121 }
11122 else if (*op_string == REGISTER_PREFIX)
11123 {
11124 as_bad (_("bad register name `%s'"), op_string);
11125 return 0;
11126 }
11127 else if (*op_string == IMMEDIATE_PREFIX)
11128 {
11129 ++op_string;
11130 if (i.jumpabsolute)
11131 {
11132 as_bad (_("immediate operand illegal with absolute jump"));
11133 return 0;
11134 }
11135 if (!i386_immediate (op_string))
11136 return 0;
11137 }
11138 else if (RC_SAE_immediate (operand_string))
11139 {
11140 /* If it is a RC or SAE immediate, do nothing. */
11141 ;
11142 }
11143 else if (is_digit_char (*op_string)
11144 || is_identifier_char (*op_string)
11145 || *op_string == '"'
11146 || *op_string == '(')
11147 {
11148 /* This is a memory reference of some sort. */
11149 char *base_string;
11150
11151 /* Start and end of displacement string expression (if found). */
11152 char *displacement_string_start;
11153 char *displacement_string_end;
11154 char *vop_start;
11155
11156 do_memory_reference:
11157 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11158 return 0;
11159 if ((i.mem_operands == 1
11160 && !current_templates->start->opcode_modifier.isstring)
11161 || i.mem_operands == 2)
11162 {
11163 as_bad (_("too many memory references for `%s'"),
11164 current_templates->start->name);
11165 return 0;
11166 }
11167
11168 /* Check for base index form. We detect the base index form by
11169 looking for an ')' at the end of the operand, searching
11170 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11171 after the '('. */
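/* E.g. for "-4(%ebp,%esi,2)" (illustrative) the displacement part
   is "-4", the base register %ebp, the index %esi, and the scale
   factor 2.  */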
11172 base_string = op_string + strlen (op_string);
11173
11174 /* Handle vector operations. */
11175 vop_start = strchr (op_string, '{');
11176 if (vop_start && vop_start < base_string)
11177 {
11178 if (check_VecOperations (vop_start, base_string) == NULL)
11179 return 0;
11180 base_string = vop_start;
11181 }
11182
11183 --base_string;
11184 if (is_space_char (*base_string))
11185 --base_string;
11186
11187 /* If we only have a displacement, set up for it to be parsed later. */
11188 displacement_string_start = op_string;
11189 displacement_string_end = base_string + 1;
11190
11191 if (*base_string == ')')
11192 {
11193 char *temp_string;
11194 unsigned int parens_balanced = 1;
11195 /* We've already checked that the numbers of left & right ()'s
11196 match, so this loop will not be infinite. */
11197 do
11198 {
11199 base_string--;
11200 if (*base_string == ')')
11201 parens_balanced++;
11202 if (*base_string == '(')
11203 parens_balanced--;
11204 }
11205 while (parens_balanced);
11206
11207 temp_string = base_string;
11208
11209 /* Skip past '(' and whitespace. */
11210 ++base_string;
11211 if (is_space_char (*base_string))
11212 ++base_string;
11213
11214 if (*base_string == ','
11215 || ((i.base_reg = parse_register (base_string, &end_op))
11216 != NULL))
11217 {
11218 displacement_string_end = temp_string;
11219
11220 i.types[this_operand].bitfield.baseindex = 1;
11221
11222 if (i.base_reg)
11223 {
11224 if (i.base_reg == &bad_reg)
11225 return 0;
11226 base_string = end_op;
11227 if (is_space_char (*base_string))
11228 ++base_string;
11229 }
11230
11231 /* There may be an index reg or scale factor here. */
11232 if (*base_string == ',')
11233 {
11234 ++base_string;
11235 if (is_space_char (*base_string))
11236 ++base_string;
11237
11238 if ((i.index_reg = parse_register (base_string, &end_op))
11239 != NULL)
11240 {
11241 if (i.index_reg == &bad_reg)
11242 return 0;
11243 base_string = end_op;
11244 if (is_space_char (*base_string))
11245 ++base_string;
11246 if (*base_string == ',')
11247 {
11248 ++base_string;
11249 if (is_space_char (*base_string))
11250 ++base_string;
11251 }
11252 else if (*base_string != ')')
11253 {
11254 as_bad (_("expecting `,' or `)' "
11255 "after index register in `%s'"),
11256 operand_string);
11257 return 0;
11258 }
11259 }
11260 else if (*base_string == REGISTER_PREFIX)
11261 {
11262 end_op = strchr (base_string, ',');
11263 if (end_op)
11264 *end_op = '\0';
11265 as_bad (_("bad register name `%s'"), base_string);
11266 return 0;
11267 }
11268
11269 /* Check for scale factor. */
11270 if (*base_string != ')')
11271 {
11272 char *end_scale = i386_scale (base_string);
11273
11274 if (!end_scale)
11275 return 0;
11276
11277 base_string = end_scale;
11278 if (is_space_char (*base_string))
11279 ++base_string;
11280 if (*base_string != ')')
11281 {
11282 as_bad (_("expecting `)' "
11283 "after scale factor in `%s'"),
11284 operand_string);
11285 return 0;
11286 }
11287 }
11288 else if (!i.index_reg)
11289 {
11290 as_bad (_("expecting index register or scale factor "
11291 "after `,'; got '%c'"),
11292 *base_string);
11293 return 0;
11294 }
11295 }
11296 else if (*base_string != ')')
11297 {
11298 as_bad (_("expecting `,' or `)' "
11299 "after base register in `%s'"),
11300 operand_string);
11301 return 0;
11302 }
11303 }
11304 else if (*base_string == REGISTER_PREFIX)
11305 {
11306 end_op = strchr (base_string, ',');
11307 if (end_op)
11308 *end_op = '\0';
11309 as_bad (_("bad register name `%s'"), base_string);
11310 return 0;
11311 }
11312 }
11313
11314 /* If there's an expression beginning the operand, parse it,
11315 assuming displacement_string_start and
11316 displacement_string_end are meaningful. */
11317 if (displacement_string_start != displacement_string_end)
11318 {
11319 if (!i386_displacement (displacement_string_start,
11320 displacement_string_end))
11321 return 0;
11322 }
11323
11324 /* Special case for (%dx) while doing input/output op. */
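/* E.g. in "outb %al, (%dx)" (illustrative) the (%dx) operand is an
   I/O port, not a memory reference, so type it as the register
   itself and skip the memory-operand bookkeeping.  */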
11325 if (i.base_reg
11326 && i.base_reg->reg_type.bitfield.instance == RegD
11327 && i.base_reg->reg_type.bitfield.word
11328 && i.index_reg == 0
11329 && i.log2_scale_factor == 0
11330 && i.seg[i.mem_operands] == 0
11331 && !operand_type_check (i.types[this_operand], disp))
11332 {
11333 i.types[this_operand] = i.base_reg->reg_type;
11334 return 1;
11335 }
11336
11337 if (i386_index_check (operand_string) == 0)
11338 return 0;
11339 i.flags[this_operand] |= Operand_Mem;
11340 if (i.mem_operands == 0)
11341 i.memop1_string = xstrdup (operand_string);
11342 i.mem_operands++;
11343 }
11344 else
11345 {
11346 /* It's not a memory operand; argh! */
11347 as_bad (_("invalid char %s beginning operand %d `%s'"),
11348 output_invalid (*op_string),
11349 this_operand + 1,
11350 op_string);
11351 return 0;
11352 }
11353 return 1; /* Normal return. */
11354 }
11355 \f
11356 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11357 that an rs_machine_dependent frag may reach. */
11358
11359 unsigned int
11360 i386_frag_max_var (fragS *frag)
11361 {
11362 /* The only relaxable frags are for jumps.
11363 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11364 gas_assert (frag->fr_type == rs_machine_dependent);
11365 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11366 }
11367
11368 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11369 static int
11370 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11371 {
11372 /* STT_GNU_IFUNC symbol must go through PLT. */
11373 if ((symbol_get_bfdsym (fr_symbol)->flags
11374 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11375 return 0;
11376
11377 if (!S_IS_EXTERNAL (fr_symbol))
11378 /* Symbol may be weak or local. */
11379 return !S_IS_WEAK (fr_symbol);
11380
11381 /* Global symbols with non-default visibility can't be preempted. */
11382 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11383 return 1;
11384
11385 if (fr_var != NO_RELOC)
11386 switch ((enum bfd_reloc_code_real) fr_var)
11387 {
11388 case BFD_RELOC_386_PLT32:
11389 case BFD_RELOC_X86_64_PLT32:
11390 /* Symbol with PLT relocation may be preempted. */
11391 return 0;
11392 default:
11393 abort ();
11394 }
11395
11396 /* Global symbols with default visibility in a shared library may be
11397 preempted by another definition. */
11398 return !shared;
11399 }
11400 #endif
11401
11402 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11403 Note: this also holds for Skylake and Cascade Lake.
11404 ---------------------------------------------------------------------
11405 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11406 | ------ | ----------- | ------- | -------- |
11407 | Jo | N | N | Y |
11408 | Jno | N | N | Y |
11409 | Jc/Jb | Y | N | Y |
11410 | Jae/Jnb | Y | N | Y |
11411 | Je/Jz | Y | Y | Y |
11412 | Jne/Jnz | Y | Y | Y |
11413 | Jna/Jbe | Y | N | Y |
11414 | Ja/Jnbe | Y | N | Y |
11415 | Js | N | N | Y |
11416 | Jns | N | N | Y |
11417 | Jp/Jpe | N | N | Y |
11418 | Jnp/Jpo | N | N | Y |
11419 | Jl/Jnge | Y | Y | Y |
11420 | Jge/Jnl | Y | Y | Y |
11421 | Jle/Jng | Y | Y | Y |
11422 | Jg/Jnle | Y | Y | Y |
11423 --------------------------------------------------------------------- */
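/* E.g. cmp+je is fusible while inc+jc is not, per the table
   above.  */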
11424 static int
11425 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11426 {
11427 if (mf_cmp == mf_cmp_alu_cmp)
11428 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11429 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11430 if (mf_cmp == mf_cmp_incdec)
11431 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11432 || mf_jcc == mf_jcc_jle);
11433 if (mf_cmp == mf_cmp_test_and)
11434 return 1;
11435 return 0;
11436 }
11437
11438 /* Return the next non-empty frag. */
11439
11440 static fragS *
11441 i386_next_non_empty_frag (fragS *fragP)
11442 {
11443 /* There may be a frag with a ".fill 0" when there is no room in
11444 the current frag for frag_grow in output_insn. */
11445 for (fragP = fragP->fr_next;
11446 (fragP != NULL
11447 && fragP->fr_type == rs_fill
11448 && fragP->fr_fix == 0);
11449 fragP = fragP->fr_next)
11450 ;
11451 return fragP;
11452 }
11453
11454 /* Return the next jcc frag after BRANCH_PADDING. */
11455
11456 static fragS *
11457 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11458 {
11459 fragS *branch_fragP;
11460 if (!pad_fragP)
11461 return NULL;
11462
11463 if (pad_fragP->fr_type == rs_machine_dependent
11464 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11465 == BRANCH_PADDING))
11466 {
11467 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11468 if (branch_fragP->fr_type != rs_machine_dependent)
11469 return NULL;
11470 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11471 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11472 pad_fragP->tc_frag_data.mf_type))
11473 return branch_fragP;
11474 }
11475
11476 return NULL;
11477 }
11478
11479 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11480
11481 static void
11482 i386_classify_machine_dependent_frag (fragS *fragP)
11483 {
11484 fragS *cmp_fragP;
11485 fragS *pad_fragP;
11486 fragS *branch_fragP;
11487 fragS *next_fragP;
11488 unsigned int max_prefix_length;
11489
11490 if (fragP->tc_frag_data.classified)
11491 return;
11492
11493 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11494 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11495 for (next_fragP = fragP;
11496 next_fragP != NULL;
11497 next_fragP = next_fragP->fr_next)
11498 {
11499 next_fragP->tc_frag_data.classified = 1;
11500 if (next_fragP->fr_type == rs_machine_dependent)
11501 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11502 {
11503 case BRANCH_PADDING:
11504 /* The BRANCH_PADDING frag must be followed by a branch
11505 frag. */
11506 branch_fragP = i386_next_non_empty_frag (next_fragP);
11507 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11508 break;
11509 case FUSED_JCC_PADDING:
11510 /* Check if this is a fused jcc:
11511 FUSED_JCC_PADDING
11512 CMP like instruction
11513 BRANCH_PADDING
11514 COND_JUMP
11515 */
11516 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11517 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11518 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11519 if (branch_fragP)
11520 {
11521 /* The BRANCH_PADDING frag is merged with the
11522 FUSED_JCC_PADDING frag. */
11523 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11524 /* CMP like instruction size. */
11525 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11526 frag_wane (pad_fragP);
11527 /* Skip to branch_fragP. */
11528 next_fragP = branch_fragP;
11529 }
11530 else if (next_fragP->tc_frag_data.max_prefix_length)
11531 {
11532 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11533 a fused jcc. */
11534 next_fragP->fr_subtype
11535 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11536 next_fragP->tc_frag_data.max_bytes
11537 = next_fragP->tc_frag_data.max_prefix_length;
11538 /* This will be updated in the BRANCH_PREFIX scan. */
11539 next_fragP->tc_frag_data.max_prefix_length = 0;
11540 }
11541 else
11542 frag_wane (next_fragP);
11543 break;
11544 }
11545 }
11546
11547 /* Stop if there is no BRANCH_PREFIX. */
11548 if (!align_branch_prefix_size)
11549 return;
11550
11551 /* Scan for BRANCH_PREFIX. */
11552 for (; fragP != NULL; fragP = fragP->fr_next)
11553 {
11554 if (fragP->fr_type != rs_machine_dependent
11555 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11556 != BRANCH_PREFIX))
11557 continue;
11558
11559 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11560 COND_JUMP_PREFIX. */
11561 max_prefix_length = 0;
11562 for (next_fragP = fragP;
11563 next_fragP != NULL;
11564 next_fragP = next_fragP->fr_next)
11565 {
11566 if (next_fragP->fr_type == rs_fill)
11567 /* Skip rs_fill frags. */
11568 continue;
11569 else if (next_fragP->fr_type != rs_machine_dependent)
11570 /* Stop for all other frags. */
11571 break;
11572
11573 /* rs_machine_dependent frags. */
11574 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11575 == BRANCH_PREFIX)
11576 {
11577 /* Count BRANCH_PREFIX frags. */
11578 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11579 {
11580 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11581 frag_wane (next_fragP);
11582 }
11583 else
11584 max_prefix_length
11585 += next_fragP->tc_frag_data.max_bytes;
11586 }
11587 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11588 == BRANCH_PADDING)
11589 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11590 == FUSED_JCC_PADDING))
11591 {
11592 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11593 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11594 break;
11595 }
11596 else
11597 /* Stop for other rs_machine_dependent frags. */
11598 break;
11599 }
11600
11601 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11602
11603 /* Skip to the next frag. */
11604 fragP = next_fragP;
11605 }
11606 }
11607
11608 /* Compute padding size for
11609
11610 FUSED_JCC_PADDING
11611 CMP like instruction
11612 BRANCH_PADDING
11613 COND_JUMP/UNCOND_JUMP
11614
11615 or
11616
11617 BRANCH_PADDING
11618 COND_JUMP/UNCOND_JUMP
11619 */
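/* Worked example (illustrative): with align_branch_power == 5,
   i.e. a 32-byte boundary, a 4-byte fused sequence starting at
   offset 30 within the boundary gives 30 + 4 >= 32, so
   padding_size is 32 - 30 = 2 bytes.  */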
11620
11621 static int
11622 i386_branch_padding_size (fragS *fragP, offsetT address)
11623 {
11624 unsigned int offset, size, padding_size;
11625 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11626
11627 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11628 if (!address)
11629 address = fragP->fr_address;
11630 address += fragP->fr_fix;
11631
11632 /* CMP like instruction size.  */
11633 size = fragP->tc_frag_data.cmp_size;
11634
11635 /* The base size of the branch frag. */
11636 size += branch_fragP->fr_fix;
11637
11638 /* Add opcode and displacement bytes for the rs_machine_dependent
11639 branch frag. */
11640 if (branch_fragP->fr_type == rs_machine_dependent)
11641 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11642
11643 /* Check if branch is within boundary and doesn't end at the last
11644 byte. */
11645 offset = address & ((1U << align_branch_power) - 1);
11646 if ((offset + size) >= (1U << align_branch_power))
11647 /* Padding needed to avoid crossing boundary. */
11648 padding_size = (1U << align_branch_power) - offset;
11649 else
11650 /* No padding needed. */
11651 padding_size = 0;
11652
11653 /* The return value may be saved in tc_frag_data.length, which is
11654 an unsigned byte.  */
11655 if (!fits_in_unsigned_byte (padding_size))
11656 abort ();
11657
11658 return padding_size;
11659 }
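/* Worked example with illustrative numbers: given
   align_branch_power == 5 (a 32-byte boundary), a branch whose frag
   starts at offset 28 within the boundary (address & 31 == 28) and
   whose size is 6 gives offset + size == 34 >= 32, so the branch
   would cross or end at the boundary and padding_size becomes
   32 - 28 == 4.  The same branch at offset 4 needs no padding.  */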
11660
11661 /* i386_generic_table_relax_frag()
11662
11663 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11664 grow/shrink padding to align branch frags. Hand others to
11665 relax_frag(). */
11666
11667 long
11668 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11669 {
11670 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11671 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11672 {
11673 long padding_size = i386_branch_padding_size (fragP, 0);
11674 long grow = padding_size - fragP->tc_frag_data.length;
11675
11676 /* When the BRANCH_PREFIX frag is used, the computed address
11677 must match the actual address and there should be no padding. */
11678 if (fragP->tc_frag_data.padding_address
11679 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11680 || padding_size))
11681 abort ();
11682
11683 /* Update the padding size. */
11684 if (grow)
11685 fragP->tc_frag_data.length = padding_size;
11686
11687 return grow;
11688 }
11689 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11690 {
11691 fragS *padding_fragP, *next_fragP;
11692 long padding_size, left_size, last_size;
11693
11694 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11695 if (!padding_fragP)
11696 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11697 return (fragP->tc_frag_data.length
11698 - fragP->tc_frag_data.last_length);
11699
11700 /* Compute the relative address of the padding frag the very
11701 first time, when the BRANCH_PREFIX frag sizes are all zero.  */
11702 if (!fragP->tc_frag_data.padding_address)
11703 fragP->tc_frag_data.padding_address
11704 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11705
11706 /* First update the last length from the previous iteration.  */
11707 left_size = fragP->tc_frag_data.prefix_length;
11708 for (next_fragP = fragP;
11709 next_fragP != padding_fragP;
11710 next_fragP = next_fragP->fr_next)
11711 if (next_fragP->fr_type == rs_machine_dependent
11712 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11713 == BRANCH_PREFIX))
11714 {
11715 if (left_size)
11716 {
11717 int max = next_fragP->tc_frag_data.max_bytes;
11718 if (max)
11719 {
11720 int size;
11721 if (max > left_size)
11722 size = left_size;
11723 else
11724 size = max;
11725 left_size -= size;
11726 next_fragP->tc_frag_data.last_length = size;
11727 }
11728 }
11729 else
11730 next_fragP->tc_frag_data.last_length = 0;
11731 }
11732
11733 /* Check the padding size for the padding frag. */
11734 padding_size = i386_branch_padding_size
11735 (padding_fragP, (fragP->fr_address
11736 + fragP->tc_frag_data.padding_address));
11737
11738 last_size = fragP->tc_frag_data.prefix_length;
11739 /* Check if there is any change from the last iteration.  */
11740 if (padding_size == last_size)
11741 {
11742 /* Update the expected address of the padding frag. */
11743 padding_fragP->tc_frag_data.padding_address
11744 = (fragP->fr_address + padding_size
11745 + fragP->tc_frag_data.padding_address);
11746 return 0;
11747 }
11748
11749 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11750 {
11751 /* No padding if there is insufficient room.  Clear the
11752 expected address of the padding frag.  */
11753 padding_fragP->tc_frag_data.padding_address = 0;
11754 padding_size = 0;
11755 }
11756 else
11757 /* Store the expected address of the padding frag. */
11758 padding_fragP->tc_frag_data.padding_address
11759 = (fragP->fr_address + padding_size
11760 + fragP->tc_frag_data.padding_address);
11761
11762 fragP->tc_frag_data.prefix_length = padding_size;
11763
11764 /* Update the length for the current iteration.  */
11765 left_size = padding_size;
11766 for (next_fragP = fragP;
11767 next_fragP != padding_fragP;
11768 next_fragP = next_fragP->fr_next)
11769 if (next_fragP->fr_type == rs_machine_dependent
11770 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11771 == BRANCH_PREFIX))
11772 {
11773 if (left_size)
11774 {
11775 int max = next_fragP->tc_frag_data.max_bytes;
11776 if (max)
11777 {
11778 int size;
11779 if (max > left_size)
11780 size = left_size;
11781 else
11782 size = max;
11783 left_size -= size;
11784 next_fragP->tc_frag_data.length = size;
11785 }
11786 }
11787 else
11788 next_fragP->tc_frag_data.length = 0;
11789 }
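/* Example with hypothetical sizes: if padding_size == 7 and the
   chain has two BRANCH_PREFIX frags with max_bytes of 5 each, the
   loop above assigns length 5 to the first frag and 2 to the second,
   leaving left_size == 0.  */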
11790
11791 return (fragP->tc_frag_data.length
11792 - fragP->tc_frag_data.last_length);
11793 }
11794 return relax_frag (segment, fragP, stretch);
11795 }
11796
11797 /* md_estimate_size_before_relax()
11798
11799 Called just before relax() for rs_machine_dependent frags. The x86
11800 assembler uses these frags to handle variable size jump
11801 instructions.
11802
11803 Any symbol that is now undefined will not become defined.
11804 Return the correct fr_subtype in the frag.
11805 Return the initial "guess for variable size of frag" to caller.
11806 The guess is actually the growth beyond the fixed part. Whatever
11807 we do to grow the fixed or variable part contributes to our
11808 returned value. */
11809
11810 int
11811 md_estimate_size_before_relax (fragS *fragP, segT segment)
11812 {
11813 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11814 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11815 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11816 {
11817 i386_classify_machine_dependent_frag (fragP);
11818 return fragP->tc_frag_data.length;
11819 }
11820
11821 /* We've already got fragP->fr_subtype right; all we have to do is
11822 check for un-relaxable symbols. On an ELF system, we can't relax
11823 an externally visible symbol, because it may be overridden by a
11824 shared library. */
11825 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11826 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11827 || (IS_ELF
11828 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11829 fragP->fr_var))
11830 #endif
11831 #if defined (OBJ_COFF) && defined (TE_PE)
11832 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11833 && S_IS_WEAK (fragP->fr_symbol))
11834 #endif
11835 )
11836 {
11837 /* Symbol is undefined in this segment, or we need to keep a
11838 reloc so that weak symbols can be overridden. */
11839 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11840 enum bfd_reloc_code_real reloc_type;
11841 unsigned char *opcode;
11842 int old_fr_fix;
11843
11844 if (fragP->fr_var != NO_RELOC)
11845 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11846 else if (size == 2)
11847 reloc_type = BFD_RELOC_16_PCREL;
11848 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11849 else if (need_plt32_p (fragP->fr_symbol))
11850 reloc_type = BFD_RELOC_X86_64_PLT32;
11851 #endif
11852 else
11853 reloc_type = BFD_RELOC_32_PCREL;
11854
11855 old_fr_fix = fragP->fr_fix;
11856 opcode = (unsigned char *) fragP->fr_opcode;
11857
11858 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11859 {
11860 case UNCOND_JUMP:
11861 /* Make jmp (0xeb) a (d)word displacement jump. */
11862 opcode[0] = 0xe9;
11863 fragP->fr_fix += size;
11864 fix_new (fragP, old_fr_fix, size,
11865 fragP->fr_symbol,
11866 fragP->fr_offset, 1,
11867 reloc_type);
11868 break;
11869
11870 case COND_JUMP86:
11871 if (size == 2
11872 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11873 {
11874 /* Negate the condition, and branch past an
11875 unconditional jump. */
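/* Illustrative bytes: a 16-bit "je" (0x74) becomes 0x75 0x03,
   i.e. "jne" past the 3-byte jump inserted below (0xe9 plus a
   2-byte displacement).  */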
11876 opcode[0] ^= 1;
11877 opcode[1] = 3;
11878 /* Insert an unconditional jump. */
11879 opcode[2] = 0xe9;
11880 /* We added two extra opcode bytes, and have a two byte
11881 offset. */
11882 fragP->fr_fix += 2 + 2;
11883 fix_new (fragP, old_fr_fix + 2, 2,
11884 fragP->fr_symbol,
11885 fragP->fr_offset, 1,
11886 reloc_type);
11887 break;
11888 }
11889 /* Fall through. */
11890
11891 case COND_JUMP:
11892 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11893 {
11894 fixS *fixP;
11895
11896 fragP->fr_fix += 1;
11897 fixP = fix_new (fragP, old_fr_fix, 1,
11898 fragP->fr_symbol,
11899 fragP->fr_offset, 1,
11900 BFD_RELOC_8_PCREL);
11901 fixP->fx_signed = 1;
11902 break;
11903 }
11904
11905 /* This changes the byte-displacement jump 0x7N
11906 to the (d)word-displacement jump 0x0f,0x8N. */
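/* Illustrative bytes: "jne" (0x75) becomes 0x0f 0x85, followed
   by a 2- or 4-byte displacement.  */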
11907 opcode[1] = opcode[0] + 0x10;
11908 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11909 /* We've added an opcode byte. */
11910 fragP->fr_fix += 1 + size;
11911 fix_new (fragP, old_fr_fix + 1, size,
11912 fragP->fr_symbol,
11913 fragP->fr_offset, 1,
11914 reloc_type);
11915 break;
11916
11917 default:
11918 BAD_CASE (fragP->fr_subtype);
11919 break;
11920 }
11921 frag_wane (fragP);
11922 return fragP->fr_fix - old_fr_fix;
11923 }
11924
11925 /* Guess size depending on current relax state. Initially the relax
11926 state will correspond to a short jump and we return 1, because
11927 the variable part of the frag (the branch offset) is one byte
11928 long. However, we can relax a section more than once and in that
11929 case we must either set fr_subtype back to the unrelaxed state,
11930 or return the value for the appropriate branch. */
11931 return md_relax_table[fragP->fr_subtype].rlx_length;
11932 }
11933
11934 /* Called after relax() is finished.
11935
11936 In: Address of frag.
11937 fr_type == rs_machine_dependent.
11938 fr_subtype is what the address relaxed to.
11939
11940 Out: Any fixSs and constants are set up.
11941 Caller will turn frag into a ".space 0". */
11942
11943 void
11944 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11945 fragS *fragP)
11946 {
11947 unsigned char *opcode;
11948 unsigned char *where_to_put_displacement = NULL;
11949 offsetT target_address;
11950 offsetT opcode_address;
11951 unsigned int extension = 0;
11952 offsetT displacement_from_opcode_start;
11953
11954 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11955 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11956 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11957 {
11958 /* Generate nop padding. */
11959 unsigned int size = fragP->tc_frag_data.length;
11960 if (size)
11961 {
11962 if (size > fragP->tc_frag_data.max_bytes)
11963 abort ();
11964
11965 if (flag_debug)
11966 {
11967 const char *msg;
11968 const char *branch = "branch";
11969 const char *prefix = "";
11970 fragS *padding_fragP;
11971 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11972 == BRANCH_PREFIX)
11973 {
11974 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11975 switch (fragP->tc_frag_data.default_prefix)
11976 {
11977 default:
11978 abort ();
11979 break;
11980 case CS_PREFIX_OPCODE:
11981 prefix = " cs";
11982 break;
11983 case DS_PREFIX_OPCODE:
11984 prefix = " ds";
11985 break;
11986 case ES_PREFIX_OPCODE:
11987 prefix = " es";
11988 break;
11989 case FS_PREFIX_OPCODE:
11990 prefix = " fs";
11991 break;
11992 case GS_PREFIX_OPCODE:
11993 prefix = " gs";
11994 break;
11995 case SS_PREFIX_OPCODE:
11996 prefix = " ss";
11997 break;
11998 }
11999 if (padding_fragP)
12000 msg = _("%s:%u: add %d%s at 0x%llx to align "
12001 "%s within %d-byte boundary\n");
12002 else
12003 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12004 "align %s within %d-byte boundary\n");
12005 }
12006 else
12007 {
12008 padding_fragP = fragP;
12009 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12010 "%s within %d-byte boundary\n");
12011 }
12012
12013 if (padding_fragP)
12014 switch (padding_fragP->tc_frag_data.branch_type)
12015 {
12016 case align_branch_jcc:
12017 branch = "jcc";
12018 break;
12019 case align_branch_fused:
12020 branch = "fused jcc";
12021 break;
12022 case align_branch_jmp:
12023 branch = "jmp";
12024 break;
12025 case align_branch_call:
12026 branch = "call";
12027 break;
12028 case align_branch_indirect:
12029 branch = "indirect branch";
12030 break;
12031 case align_branch_ret:
12032 branch = "ret";
12033 break;
12034 default:
12035 break;
12036 }
12037
12038 fprintf (stdout, msg,
12039 fragP->fr_file, fragP->fr_line, size, prefix,
12040 (long long) fragP->fr_address, branch,
12041 1 << align_branch_power);
12042 }
12043 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12044 memset (fragP->fr_opcode,
12045 fragP->tc_frag_data.default_prefix, size);
12046 else
12047 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12048 size, 0);
12049 fragP->fr_fix += size;
12050 }
12051 return;
12052 }
12053
12054 opcode = (unsigned char *) fragP->fr_opcode;
12055
12056 /* Address we want to reach in file space. */
12057 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12058
12059 /* Address opcode resides at in file space. */
12060 opcode_address = fragP->fr_address + fragP->fr_fix;
12061
12062 /* Displacement from opcode start to fill into instruction. */
12063 displacement_from_opcode_start = target_address - opcode_address;
12064
12065 if ((fragP->fr_subtype & BIG) == 0)
12066 {
12067 /* Don't have to change opcode. */
12068 extension = 1; /* 1 opcode + 1 displacement */
12069 where_to_put_displacement = &opcode[1];
12070 }
12071 else
12072 {
12073 if (no_cond_jump_promotion
12074 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12075 as_warn_where (fragP->fr_file, fragP->fr_line,
12076 _("long jump required"));
12077
12078 switch (fragP->fr_subtype)
12079 {
12080 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12081 extension = 4; /* 1 opcode + 4 displacement */
12082 opcode[0] = 0xe9;
12083 where_to_put_displacement = &opcode[1];
12084 break;
12085
12086 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12087 extension = 2; /* 1 opcode + 2 displacement */
12088 opcode[0] = 0xe9;
12089 where_to_put_displacement = &opcode[1];
12090 break;
12091
12092 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12093 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12094 extension = 5; /* 2 opcode + 4 displacement */
12095 opcode[1] = opcode[0] + 0x10;
12096 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12097 where_to_put_displacement = &opcode[2];
12098 break;
12099
12100 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12101 extension = 3; /* 2 opcode + 2 displacement */
12102 opcode[1] = opcode[0] + 0x10;
12103 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12104 where_to_put_displacement = &opcode[2];
12105 break;
12106
12107 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12108 extension = 4;
12109 opcode[0] ^= 1;
12110 opcode[1] = 3;
12111 opcode[2] = 0xe9;
12112 where_to_put_displacement = &opcode[3];
12113 break;
12114
12115 default:
12116 BAD_CASE (fragP->fr_subtype);
12117 break;
12118 }
12119 }
12120
12121 /* If the size is less than four we are sure that the operand fits,
12122 but if it's 4, then it could be that the displacement is larger
12123 than +/- 2GB.  */
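/* Worked example with illustrative values: if
   displacement_from_opcode_start - extension were 0x100000000, the
   biased value 0x100000000 + 0x80000000 exceeds 0xffffffff and the
   check below fires; any difference within [-2^31, 2^31 - 1] maps
   into [0, 0xffffffff] after the +2^31 bias and passes.  */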
12124 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12125 && object_64bit
12126 && ((addressT) (displacement_from_opcode_start - extension
12127 + ((addressT) 1 << 31))
12128 > (((addressT) 2 << 31) - 1)))
12129 {
12130 as_bad_where (fragP->fr_file, fragP->fr_line,
12131 _("jump target out of range"));
12132 /* Make us emit 0. */
12133 displacement_from_opcode_start = extension;
12134 }
12135 /* Now put displacement after opcode. */
12136 md_number_to_chars ((char *) where_to_put_displacement,
12137 (valueT) (displacement_from_opcode_start - extension),
12138 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12139 fragP->fr_fix += extension;
12140 }
12141 \f
12142 /* Apply a fixup (fixP) to segment data, once it has been determined
12143 by our caller that we have all the info we need to fix it up.
12144
12145 Parameter valP is the pointer to the value of the bits.
12146
12147 On the 386, immediates, displacements, and data pointers are all in
12148 the same (little-endian) format, so we don't need to care about which
12149 we are handling. */
12150
12151 void
12152 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12153 {
12154 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12155 valueT value = *valP;
12156
12157 #if !defined (TE_Mach)
12158 if (fixP->fx_pcrel)
12159 {
12160 switch (fixP->fx_r_type)
12161 {
12162 default:
12163 break;
12164
12165 case BFD_RELOC_64:
12166 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12167 break;
12168 case BFD_RELOC_32:
12169 case BFD_RELOC_X86_64_32S:
12170 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12171 break;
12172 case BFD_RELOC_16:
12173 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12174 break;
12175 case BFD_RELOC_8:
12176 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12177 break;
12178 }
12179 }
12180
12181 if (fixP->fx_addsy != NULL
12182 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12183 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12184 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12185 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12186 && !use_rela_relocations)
12187 {
12188 /* This is a hack. There should be a better way to handle this.
12189 This covers for the fact that bfd_install_relocation will
12190 subtract the current location (for partial_inplace, PC relative
12191 relocations); see more below. */
12192 #ifndef OBJ_AOUT
12193 if (IS_ELF
12194 #ifdef TE_PE
12195 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12196 #endif
12197 )
12198 value += fixP->fx_where + fixP->fx_frag->fr_address;
12199 #endif
12200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12201 if (IS_ELF)
12202 {
12203 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12204
12205 if ((sym_seg == seg
12206 || (symbol_section_p (fixP->fx_addsy)
12207 && sym_seg != absolute_section))
12208 && !generic_force_reloc (fixP))
12209 {
12210 /* Yes, we add the values in twice. This is because
12211 bfd_install_relocation subtracts them out again. I think
12212 bfd_install_relocation is broken, but I don't dare change
12213 it. FIXME. */
12214 value += fixP->fx_where + fixP->fx_frag->fr_address;
12215 }
12216 }
12217 #endif
12218 #if defined (OBJ_COFF) && defined (TE_PE)
12219 /* For some reason, the PE format does not store a
12220 section address offset for a PC relative symbol. */
12221 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12222 || S_IS_WEAK (fixP->fx_addsy))
12223 value += md_pcrel_from (fixP);
12224 #endif
12225 }
12226 #if defined (OBJ_COFF) && defined (TE_PE)
12227 if (fixP->fx_addsy != NULL
12228 && S_IS_WEAK (fixP->fx_addsy)
12229 /* PR 16858: Do not modify weak function references. */
12230 && ! fixP->fx_pcrel)
12231 {
12232 #if !defined (TE_PEP)
12233 /* For x86 PE weak function symbols are neither PC-relative
12234 nor do they set S_IS_FUNCTION. So the only reliable way
12235 to detect them is to check the flags of their containing
12236 section. */
12237 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12238 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12239 ;
12240 else
12241 #endif
12242 value -= S_GET_VALUE (fixP->fx_addsy);
12243 }
12244 #endif
12245
12246 /* Fix a few things - the dynamic linker expects certain values here,
12247 and we must not disappoint it. */
12248 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12249 if (IS_ELF && fixP->fx_addsy)
12250 switch (fixP->fx_r_type)
12251 {
12252 case BFD_RELOC_386_PLT32:
12253 case BFD_RELOC_X86_64_PLT32:
12254 /* Make the jump instruction point to the address of the operand.
12255 At runtime we merely add the offset to the actual PLT entry.
12256 NB: Subtract the offset size only for jump instructions. */
12257 if (fixP->fx_pcrel)
12258 value = -4;
12259 break;
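/* For instance, "call foo@PLT" is encoded as 0xe8 followed by a
   4-byte PC-relative field; the -4 addend compensates for the
   field being relative to its own start rather than to the end
   of the instruction.  (Illustrative example.)  */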
12260
12261 case BFD_RELOC_386_TLS_GD:
12262 case BFD_RELOC_386_TLS_LDM:
12263 case BFD_RELOC_386_TLS_IE_32:
12264 case BFD_RELOC_386_TLS_IE:
12265 case BFD_RELOC_386_TLS_GOTIE:
12266 case BFD_RELOC_386_TLS_GOTDESC:
12267 case BFD_RELOC_X86_64_TLSGD:
12268 case BFD_RELOC_X86_64_TLSLD:
12269 case BFD_RELOC_X86_64_GOTTPOFF:
12270 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12271 value = 0; /* Fully resolved at runtime. No addend. */
12272 /* Fallthrough */
12273 case BFD_RELOC_386_TLS_LE:
12274 case BFD_RELOC_386_TLS_LDO_32:
12275 case BFD_RELOC_386_TLS_LE_32:
12276 case BFD_RELOC_X86_64_DTPOFF32:
12277 case BFD_RELOC_X86_64_DTPOFF64:
12278 case BFD_RELOC_X86_64_TPOFF32:
12279 case BFD_RELOC_X86_64_TPOFF64:
12280 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12281 break;
12282
12283 case BFD_RELOC_386_TLS_DESC_CALL:
12284 case BFD_RELOC_X86_64_TLSDESC_CALL:
12285 value = 0; /* Fully resolved at runtime. No addend. */
12286 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12287 fixP->fx_done = 0;
12288 return;
12289
12290 case BFD_RELOC_VTABLE_INHERIT:
12291 case BFD_RELOC_VTABLE_ENTRY:
12292 fixP->fx_done = 0;
12293 return;
12294
12295 default:
12296 break;
12297 }
12298 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12299 *valP = value;
12300 #endif /* !defined (TE_Mach) */
12301
12302 /* Are we finished with this relocation now? */
12303 if (fixP->fx_addsy == NULL)
12304 fixP->fx_done = 1;
12305 #if defined (OBJ_COFF) && defined (TE_PE)
12306 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12307 {
12308 fixP->fx_done = 0;
12309 /* Remember value for tc_gen_reloc. */
12310 fixP->fx_addnumber = value;
12311 /* Clear out the frag for now. */
12312 value = 0;
12313 }
12314 #endif
12315 else if (use_rela_relocations)
12316 {
12317 fixP->fx_no_overflow = 1;
12318 /* Remember value for tc_gen_reloc. */
12319 fixP->fx_addnumber = value;
12320 value = 0;
12321 }
12322
12323 md_number_to_chars (p, value, fixP->fx_size);
12324 }
12325 \f
12326 const char *
12327 md_atof (int type, char *litP, int *sizeP)
12328 {
12329 /* This outputs the LITTLENUMs in REVERSE order;
12330 in accord with the little-endian 386.  */
12331 return ieee_md_atof (type, litP, sizeP, FALSE);
12332 }
12333 \f
12334 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12335
12336 static char *
12337 output_invalid (int c)
12338 {
12339 if (ISPRINT (c))
12340 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12341 "'%c'", c);
12342 else
12343 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12344 "(0x%x)", (unsigned char) c);
12345 return output_invalid_buf;
12346 }
12347
12348 /* Verify that @r can be used in the current context. */
12349
12350 static bfd_boolean check_register (const reg_entry *r)
12351 {
12352 if (allow_pseudo_reg)
12353 return TRUE;
12354
12355 if (operand_type_all_zero (&r->reg_type))
12356 return FALSE;
12357
12358 if ((r->reg_type.bitfield.dword
12359 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12360 || r->reg_type.bitfield.class == RegCR
12361 || r->reg_type.bitfield.class == RegDR
12362 || r->reg_type.bitfield.class == RegTR)
12363 && !cpu_arch_flags.bitfield.cpui386)
12364 return FALSE;
12365
12366 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12367 return FALSE;
12368
12369 if (!cpu_arch_flags.bitfield.cpuavx512f)
12370 {
12371 if (r->reg_type.bitfield.zmmword
12372 || r->reg_type.bitfield.class == RegMask)
12373 return FALSE;
12374
12375 if (!cpu_arch_flags.bitfield.cpuavx)
12376 {
12377 if (r->reg_type.bitfield.ymmword)
12378 return FALSE;
12379
12380 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12381 return FALSE;
12382 }
12383 }
12384
12385 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12386 return FALSE;
12387
12388 /* Don't allow the fake index register unless allow_index_reg is non-zero.  */
12389 if (!allow_index_reg && r->reg_num == RegIZ)
12390 return FALSE;
12391
12392 /* Upper 16 vector registers are only available with VREX in 64bit
12393 mode, and require EVEX encoding. */
12394 if (r->reg_flags & RegVRex)
12395 {
12396 if (!cpu_arch_flags.bitfield.cpuavx512f
12397 || flag_code != CODE_64BIT)
12398 return FALSE;
12399
12400 i.vec_encoding = vex_encoding_evex;
12401 }
12402
12403 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12404 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12405 && flag_code != CODE_64BIT)
12406 return FALSE;
12407
12408 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12409 && !intel_syntax)
12410 return FALSE;
12411
12412 return TRUE;
12413 }
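/* Illustrative rejections: with a pre-i386 -march, "%eax" fails the
   cpui386 check above; outside of 64-bit mode "%r8" fails the RegRex
   check; and "%ymm0" is rejected unless at least AVX is enabled.  */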
12414
12415 /* REG_STRING starts *before* REGISTER_PREFIX. */
12416
12417 static const reg_entry *
12418 parse_real_register (char *reg_string, char **end_op)
12419 {
12420 char *s = reg_string;
12421 char *p;
12422 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12423 const reg_entry *r;
12424
12425 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12426 if (*s == REGISTER_PREFIX)
12427 ++s;
12428
12429 if (is_space_char (*s))
12430 ++s;
12431
12432 p = reg_name_given;
12433 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12434 {
12435 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12436 return (const reg_entry *) NULL;
12437 s++;
12438 }
12439
12440 /* For naked regs, make sure that we are not dealing with an identifier.
12441 This prevents confusing an identifier like `eax_var' with register
12442 `eax'. */
12443 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12444 return (const reg_entry *) NULL;
12445
12446 *end_op = s;
12447
12448 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
12449
12450 /* Handle floating point regs, allowing spaces in the (i) part. */
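/* Illustrative inputs: "%st", "%st(3)" and "%st ( 3 )" are all
   accepted by the code below.  */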
12451 if (r == i386_regtab /* %st is first entry of table */)
12452 {
12453 if (!cpu_arch_flags.bitfield.cpu8087
12454 && !cpu_arch_flags.bitfield.cpu287
12455 && !cpu_arch_flags.bitfield.cpu387)
12456 return (const reg_entry *) NULL;
12457
12458 if (is_space_char (*s))
12459 ++s;
12460 if (*s == '(')
12461 {
12462 ++s;
12463 if (is_space_char (*s))
12464 ++s;
12465 if (*s >= '0' && *s <= '7')
12466 {
12467 int fpr = *s - '0';
12468 ++s;
12469 if (is_space_char (*s))
12470 ++s;
12471 if (*s == ')')
12472 {
12473 *end_op = s + 1;
12474 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
12475 know (r);
12476 return r + fpr;
12477 }
12478 }
12479 /* We have "%st(" then garbage. */
12480 return (const reg_entry *) NULL;
12481 }
12482 }
12483
12484 return r && check_register (r) ? r : NULL;
12485 }
12486
12487 /* REG_STRING starts *before* REGISTER_PREFIX. */
12488
12489 static const reg_entry *
12490 parse_register (char *reg_string, char **end_op)
12491 {
12492 const reg_entry *r;
12493
12494 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12495 r = parse_real_register (reg_string, end_op);
12496 else
12497 r = NULL;
12498 if (!r)
12499 {
12500 char *save = input_line_pointer;
12501 char c;
12502 symbolS *symbolP;
12503
12504 input_line_pointer = reg_string;
12505 c = get_symbol_name (&reg_string);
12506 symbolP = symbol_find (reg_string);
12507 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12508 {
12509 const expressionS *e = symbol_get_value_expression (symbolP);
12510
12511 know (e->X_op == O_register);
12512 know (e->X_add_number >= 0
12513 && (valueT) e->X_add_number < i386_regtab_size);
12514 r = i386_regtab + e->X_add_number;
12515 if (!check_register (r))
12516 {
12517 as_bad (_("register '%s%s' cannot be used here"),
12518 register_prefix, r->reg_name);
12519 r = &bad_reg;
12520 }
12521 *end_op = input_line_pointer;
12522 }
12523 *input_line_pointer = c;
12524 input_line_pointer = save;
12525 }
12526 return r;
12527 }
12528
12529 int
12530 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12531 {
12532 const reg_entry *r;
12533 char *end = input_line_pointer;
12534
12535 *end = *nextcharP;
12536 r = parse_register (name, &input_line_pointer);
12537 if (r && end <= input_line_pointer)
12538 {
12539 *nextcharP = *input_line_pointer;
12540 *input_line_pointer = 0;
12541 if (r != &bad_reg)
12542 {
12543 e->X_op = O_register;
12544 e->X_add_number = r - i386_regtab;
12545 }
12546 else
12547 e->X_op = O_illegal;
12548 return 1;
12549 }
12550 input_line_pointer = end;
12551 *end = 0;
12552 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12553 }
12554
12555 void
12556 md_operand (expressionS *e)
12557 {
12558 char *end;
12559 const reg_entry *r;
12560
12561 switch (*input_line_pointer)
12562 {
12563 case REGISTER_PREFIX:
12564 r = parse_real_register (input_line_pointer, &end);
12565 if (r)
12566 {
12567 e->X_op = O_register;
12568 e->X_add_number = r - i386_regtab;
12569 input_line_pointer = end;
12570 }
12571 break;
12572
12573 case '[':
12574 gas_assert (intel_syntax);
12575 end = input_line_pointer++;
12576 expression (e);
12577 if (*input_line_pointer == ']')
12578 {
12579 ++input_line_pointer;
12580 e->X_op_symbol = make_expr_symbol (e);
12581 e->X_add_symbol = NULL;
12582 e->X_add_number = 0;
12583 e->X_op = O_index;
12584 }
12585 else
12586 {
12587 e->X_op = O_absent;
12588 input_line_pointer = end;
12589 }
12590 break;
12591 }
12592 }
12593
12594 \f
12595 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12596 const char *md_shortopts = "kVQ:sqnO::";
12597 #else
12598 const char *md_shortopts = "qnO::";
12599 #endif
12600
12601 #define OPTION_32 (OPTION_MD_BASE + 0)
12602 #define OPTION_64 (OPTION_MD_BASE + 1)
12603 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12604 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12605 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12606 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12607 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12608 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12609 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12610 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12611 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12612 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12613 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12614 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12615 #define OPTION_X32 (OPTION_MD_BASE + 14)
12616 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12617 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12618 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12619 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12620 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12621 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12622 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12623 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12624 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12625 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12626 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12627 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12628 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12629 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12630 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12631 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12632 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12633 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12634 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12635
12636 struct option md_longopts[] =
12637 {
12638 {"32", no_argument, NULL, OPTION_32},
12639 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12640 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12641 {"64", no_argument, NULL, OPTION_64},
12642 #endif
12643 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12644 {"x32", no_argument, NULL, OPTION_X32},
12645 {"mshared", no_argument, NULL, OPTION_MSHARED},
12646 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12647 #endif
12648 {"divide", no_argument, NULL, OPTION_DIVIDE},
12649 {"march", required_argument, NULL, OPTION_MARCH},
12650 {"mtune", required_argument, NULL, OPTION_MTUNE},
12651 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12652 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12653 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12654 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12655 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12656 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12657 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12658 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12659 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12660 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12661 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12662 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12663 # if defined (TE_PE) || defined (TE_PEP)
12664 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12665 #endif
12666 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12667 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12668 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12669 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12670 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12671 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12672 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12673 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12674 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12675 {"mlfence-before-indirect-branch", required_argument, NULL,
12676 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12677 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12678 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12679 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12680 {NULL, no_argument, NULL, 0}
12681 };
12682 size_t md_longopts_size = sizeof (md_longopts);
12683
12684 int
12685 md_parse_option (int c, const char *arg)
12686 {
12687 unsigned int j;
12688 char *arch, *next, *saved, *type;
12689
12690 switch (c)
12691 {
12692 case 'n':
12693 optimize_align_code = 0;
12694 break;
12695
12696 case 'q':
12697 quiet_warnings = 1;
12698 break;
12699
12700 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12701 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12702 should be emitted or not. FIXME: Not implemented. */
12703 case 'Q':
12704 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12705 return 0;
12706 break;
12707
12708 /* -V: SVR4 argument to print version ID. */
12709 case 'V':
12710 print_version_id ();
12711 break;
12712
12713 /* -k: Ignore for FreeBSD compatibility. */
12714 case 'k':
12715 break;
12716
12717 case 's':
12718 /* -s: On i386 Solaris, this tells the native assembler to use
12719 .stab instead of .stab.excl. We always use .stab anyhow. */
12720 break;
12721
12722 case OPTION_MSHARED:
12723 shared = 1;
12724 break;
12725
12726 case OPTION_X86_USED_NOTE:
12727 if (strcasecmp (arg, "yes") == 0)
12728 x86_used_note = 1;
12729 else if (strcasecmp (arg, "no") == 0)
12730 x86_used_note = 0;
12731 else
12732 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12733 break;
12734
12736 #endif
12737 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12738 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12739 case OPTION_64:
12740 {
12741 const char **list, **l;
12742
12743 list = bfd_target_list ();
12744 for (l = list; *l != NULL; l++)
12745 if (CONST_STRNEQ (*l, "elf64-x86-64")
12746 || strcmp (*l, "coff-x86-64") == 0
12747 || strcmp (*l, "pe-x86-64") == 0
12748 || strcmp (*l, "pei-x86-64") == 0
12749 || strcmp (*l, "mach-o-x86-64") == 0)
12750 {
12751 default_arch = "x86_64";
12752 break;
12753 }
12754 if (*l == NULL)
12755 as_fatal (_("no compiled in support for x86_64"));
12756 free (list);
12757 }
12758 break;
12759 #endif
12760
12761 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12762 case OPTION_X32:
12763 if (IS_ELF)
12764 {
12765 const char **list, **l;
12766
12767 list = bfd_target_list ();
12768 for (l = list; *l != NULL; l++)
12769 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12770 {
12771 default_arch = "x86_64:32";
12772 break;
12773 }
12774 if (*l == NULL)
12775 as_fatal (_("no compiled in support for 32bit x86_64"));
12776 free (list);
12777 }
12778 else
12779 as_fatal (_("32bit x86_64 is only supported for ELF"));
12780 break;
12781 #endif
12782
12783 case OPTION_32:
12784 default_arch = "i386";
12785 break;
12786
12787 case OPTION_DIVIDE:
12788 #ifdef SVR4_COMMENT_CHARS
12789 {
12790 char *n, *t;
12791 const char *s;
12792
12793 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12794 t = n;
12795 for (s = i386_comment_chars; *s != '\0'; s++)
12796 if (*s != '/')
12797 *t++ = *s;
12798 *t = '\0';
12799 i386_comment_chars = n;
12800 }
12801 #endif
12802 break;
12803
12804 case OPTION_MARCH:
12805 saved = xstrdup (arg);
12806 arch = saved;
12807 /* Allow -march=+nosse. */
12808 if (*arch == '+')
12809 arch++;
12810 do
12811 {
12812 if (*arch == '.')
12813 as_fatal (_("invalid -march= option: `%s'"), arg);
12814 next = strchr (arch, '+');
12815 if (next)
12816 *next++ = '\0';
12817 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12818 {
12819 if (strcmp (arch, cpu_arch [j].name) == 0)
12820 {
12821 /* Processor. */
12822 if (! cpu_arch[j].flags.bitfield.cpui386)
12823 continue;
12824
12825 cpu_arch_name = cpu_arch[j].name;
12826 cpu_sub_arch_name = NULL;
12827 cpu_arch_flags = cpu_arch[j].flags;
12828 cpu_arch_isa = cpu_arch[j].type;
12829 cpu_arch_isa_flags = cpu_arch[j].flags;
12830 if (!cpu_arch_tune_set)
12831 {
12832 cpu_arch_tune = cpu_arch_isa;
12833 cpu_arch_tune_flags = cpu_arch_isa_flags;
12834 }
12835 break;
12836 }
12837 else if (*cpu_arch [j].name == '.'
12838 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12839 {
12840 /* ISA extension. */
12841 i386_cpu_flags flags;
12842
12843 flags = cpu_flags_or (cpu_arch_flags,
12844 cpu_arch[j].flags);
12845
12846 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12847 {
12848 if (cpu_sub_arch_name)
12849 {
12850 char *name = cpu_sub_arch_name;
12851 cpu_sub_arch_name = concat (name,
12852 cpu_arch[j].name,
12853 (const char *) NULL);
12854 free (name);
12855 }
12856 else
12857 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12858 cpu_arch_flags = flags;
12859 cpu_arch_isa_flags = flags;
12860 }
12861 else
12862 cpu_arch_isa_flags
12863 = cpu_flags_or (cpu_arch_isa_flags,
12864 cpu_arch[j].flags);
12865 break;
12866 }
12867 }
12868
12869 if (j >= ARRAY_SIZE (cpu_arch))
12870 {
12871 /* Disable an ISA extension. */
12872 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12873 if (strcmp (arch, cpu_noarch [j].name) == 0)
12874 {
12875 i386_cpu_flags flags;
12876
12877 flags = cpu_flags_and_not (cpu_arch_flags,
12878 cpu_noarch[j].flags);
12879 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12880 {
12881 if (cpu_sub_arch_name)
12882 {
12883 char *name = cpu_sub_arch_name;
12884 cpu_sub_arch_name = concat (name, arch,
12885 (const char *) NULL);
12886 free (name);
12887 }
12888 else
12889 cpu_sub_arch_name = xstrdup (arch);
12890 cpu_arch_flags = flags;
12891 cpu_arch_isa_flags = flags;
12892 }
12893 break;
12894 }
12895
12896 if (j >= ARRAY_SIZE (cpu_noarch))
12897 j = ARRAY_SIZE (cpu_arch);
12898 }
12899
12900 if (j >= ARRAY_SIZE (cpu_arch))
12901 as_fatal (_("invalid -march= option: `%s'"), arg);
12902
12903 arch = next;
12904 }
12905 while (next != NULL);
12906 free (saved);
12907 break;
12908
12909 case OPTION_MTUNE:
12910 if (*arg == '.')
12911 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12912 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12913 {
12914 if (strcmp (arg, cpu_arch [j].name) == 0)
12915 {
12916 cpu_arch_tune_set = 1;
12917 cpu_arch_tune = cpu_arch [j].type;
12918 cpu_arch_tune_flags = cpu_arch[j].flags;
12919 break;
12920 }
12921 }
12922 if (j >= ARRAY_SIZE (cpu_arch))
12923 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12924 break;
12925
12926 case OPTION_MMNEMONIC:
12927 if (strcasecmp (arg, "att") == 0)
12928 intel_mnemonic = 0;
12929 else if (strcasecmp (arg, "intel") == 0)
12930 intel_mnemonic = 1;
12931 else
12932 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12933 break;
12934
12935 case OPTION_MSYNTAX:
12936 if (strcasecmp (arg, "att") == 0)
12937 intel_syntax = 0;
12938 else if (strcasecmp (arg, "intel") == 0)
12939 intel_syntax = 1;
12940 else
12941 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12942 break;
12943
12944 case OPTION_MINDEX_REG:
12945 allow_index_reg = 1;
12946 break;
12947
12948 case OPTION_MNAKED_REG:
12949 allow_naked_reg = 1;
12950 break;
12951
12952 case OPTION_MSSE2AVX:
12953 sse2avx = 1;
12954 break;
12955
12956 case OPTION_MSSE_CHECK:
12957 if (strcasecmp (arg, "error") == 0)
12958 sse_check = check_error;
12959 else if (strcasecmp (arg, "warning") == 0)
12960 sse_check = check_warning;
12961 else if (strcasecmp (arg, "none") == 0)
12962 sse_check = check_none;
12963 else
12964 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12965 break;
12966
12967 case OPTION_MOPERAND_CHECK:
12968 if (strcasecmp (arg, "error") == 0)
12969 operand_check = check_error;
12970 else if (strcasecmp (arg, "warning") == 0)
12971 operand_check = check_warning;
12972 else if (strcasecmp (arg, "none") == 0)
12973 operand_check = check_none;
12974 else
12975 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12976 break;
12977
12978 case OPTION_MAVXSCALAR:
12979 if (strcasecmp (arg, "128") == 0)
12980 avxscalar = vex128;
12981 else if (strcasecmp (arg, "256") == 0)
12982 avxscalar = vex256;
12983 else
12984 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12985 break;
12986
12987 case OPTION_MVEXWIG:
12988 if (strcmp (arg, "0") == 0)
12989 vexwig = vexw0;
12990 else if (strcmp (arg, "1") == 0)
12991 vexwig = vexw1;
12992 else
12993 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12994 break;
12995
12996 case OPTION_MADD_BND_PREFIX:
12997 add_bnd_prefix = 1;
12998 break;
12999
13000 case OPTION_MEVEXLIG:
13001 if (strcmp (arg, "128") == 0)
13002 evexlig = evexl128;
13003 else if (strcmp (arg, "256") == 0)
13004 evexlig = evexl256;
13005 else if (strcmp (arg, "512") == 0)
13006 evexlig = evexl512;
13007 else
13008 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13009 break;
13010
13011 case OPTION_MEVEXRCIG:
13012 if (strcmp (arg, "rne") == 0)
13013 evexrcig = rne;
13014 else if (strcmp (arg, "rd") == 0)
13015 evexrcig = rd;
13016 else if (strcmp (arg, "ru") == 0)
13017 evexrcig = ru;
13018 else if (strcmp (arg, "rz") == 0)
13019 evexrcig = rz;
13020 else
13021 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13022 break;
13023
13024 case OPTION_MEVEXWIG:
13025 if (strcmp (arg, "0") == 0)
13026 evexwig = evexw0;
13027 else if (strcmp (arg, "1") == 0)
13028 evexwig = evexw1;
13029 else
13030 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13031 break;
13032
13033 # if defined (TE_PE) || defined (TE_PEP)
13034 case OPTION_MBIG_OBJ:
13035 use_big_obj = 1;
13036 break;
13037 #endif
13038
13039 case OPTION_MOMIT_LOCK_PREFIX:
13040 if (strcasecmp (arg, "yes") == 0)
13041 omit_lock_prefix = 1;
13042 else if (strcasecmp (arg, "no") == 0)
13043 omit_lock_prefix = 0;
13044 else
13045 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13046 break;
13047
13048 case OPTION_MFENCE_AS_LOCK_ADD:
13049 if (strcasecmp (arg, "yes") == 0)
13050 avoid_fence = 1;
13051 else if (strcasecmp (arg, "no") == 0)
13052 avoid_fence = 0;
13053 else
13054 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13055 break;
13056
13057 case OPTION_MLFENCE_AFTER_LOAD:
13058 if (strcasecmp (arg, "yes") == 0)
13059 lfence_after_load = 1;
13060 else if (strcasecmp (arg, "no") == 0)
13061 lfence_after_load = 0;
13062 else
13063 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13064 break;
13065
13066 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13067 if (strcasecmp (arg, "all") == 0)
13068 {
13069 lfence_before_indirect_branch = lfence_branch_all;
13070 if (lfence_before_ret == lfence_before_ret_none)
13071 lfence_before_ret = lfence_before_ret_shl;
13072 }
13073 else if (strcasecmp (arg, "memory") == 0)
13074 lfence_before_indirect_branch = lfence_branch_memory;
13075 else if (strcasecmp (arg, "register") == 0)
13076 lfence_before_indirect_branch = lfence_branch_register;
13077 else if (strcasecmp (arg, "none") == 0)
13078 lfence_before_indirect_branch = lfence_branch_none;
13079 else
13080 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13081 arg);
13082 break;
13083
13084 case OPTION_MLFENCE_BEFORE_RET:
13085 if (strcasecmp (arg, "or") == 0)
13086 lfence_before_ret = lfence_before_ret_or;
13087 else if (strcasecmp (arg, "not") == 0)
13088 lfence_before_ret = lfence_before_ret_not;
13089 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13090 lfence_before_ret = lfence_before_ret_shl;
13091 else if (strcasecmp (arg, "none") == 0)
13092 lfence_before_ret = lfence_before_ret_none;
13093 else
13094 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13095 arg);
13096 break;
13097
13098 case OPTION_MRELAX_RELOCATIONS:
13099 if (strcasecmp (arg, "yes") == 0)
13100 generate_relax_relocations = 1;
13101 else if (strcasecmp (arg, "no") == 0)
13102 generate_relax_relocations = 0;
13103 else
13104 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13105 break;
13106
13107 case OPTION_MALIGN_BRANCH_BOUNDARY:
13108 {
13109 char *end;
13110 long int align = strtoul (arg, &end, 0);
13111 if (*end == '\0')
13112 {
13113 if (align == 0)
13114 {
13115 align_branch_power = 0;
13116 break;
13117 }
13118 else if (align >= 16)
13119 {
13120 int align_power;
13121 for (align_power = 0;
13122 (align & 1) == 0;
13123 align >>= 1, align_power++)
13124 continue;
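/* Worked example: "32" halves as 32 -> 16 -> 8 -> 4 -> 2 -> 1,
   giving align_power == 5; a value such as 48 stops at
   align == 3 and is rejected below.  */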
13125 /* Limit alignment power to 31. */
13126 if (align == 1 && align_power < 32)
13127 {
13128 align_branch_power = align_power;
13129 break;
13130 }
13131 }
13132 }
13133 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13134 }
13135 break;
13136
13137 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13138 {
13139 char *end;
13140 int align = strtoul (arg, &end, 0);
13141 /* Some processors only support 5 prefixes. */
13142 if (*end == '\0' && align >= 0 && align < 6)
13143 {
13144 align_branch_prefix_size = align;
13145 break;
13146 }
13147 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13148 arg);
13149 }
13150 break;
13151
13152 case OPTION_MALIGN_BRANCH:
13153 align_branch = 0;
13154 saved = xstrdup (arg);
13155 type = saved;
13156 do
13157 {
13158 next = strchr (type, '+');
13159 if (next)
13160 *next++ = '\0';
13161 if (strcasecmp (type, "jcc") == 0)
13162 align_branch |= align_branch_jcc_bit;
13163 else if (strcasecmp (type, "fused") == 0)
13164 align_branch |= align_branch_fused_bit;
13165 else if (strcasecmp (type, "jmp") == 0)
13166 align_branch |= align_branch_jmp_bit;
13167 else if (strcasecmp (type, "call") == 0)
13168 align_branch |= align_branch_call_bit;
13169 else if (strcasecmp (type, "ret") == 0)
13170 align_branch |= align_branch_ret_bit;
13171 else if (strcasecmp (type, "indirect") == 0)
13172 align_branch |= align_branch_indirect_bit;
13173 else
13174 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13175 type = next;
13176 }
13177 while (next != NULL);
13178 free (saved);
13179 break;
13180
13181 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13182 align_branch_power = 5;
13183 align_branch_prefix_size = 5;
13184 align_branch = (align_branch_jcc_bit
13185 | align_branch_fused_bit
13186 | align_branch_jmp_bit);
13187 break;
13188
13189 case OPTION_MAMD64:
13190 isa64 = amd64;
13191 break;
13192
13193 case OPTION_MINTEL64:
13194 isa64 = intel64;
13195 break;
13196
13197 case 'O':
13198 if (arg == NULL)
13199 {
13200 optimize = 1;
13201 /* Turn off -Os. */
13202 optimize_for_space = 0;
13203 }
13204 else if (*arg == 's')
13205 {
13206 optimize_for_space = 1;
13207 /* Turn on all encoding optimizations. */
13208 optimize = INT_MAX;
13209 }
13210 else
13211 {
13212 optimize = atoi (arg);
13213 /* Turn off -Os. */
13214 optimize_for_space = 0;
13215 }
13216 break;
13217
13218 default:
13219 return 0;
13220 }
13221 return 1;
13222 }
13223
13224 #define MESSAGE_TEMPLATE \
13225 " "
13226
13227 static char *
13228 output_message (FILE *stream, char *p, char *message, char *start,
13229 int *left_p, const char *name, int len)
13230 {
13231 int size = sizeof (MESSAGE_TEMPLATE);
13232 int left = *left_p;
13233
13234 /* Reserve 2 spaces for ", " or ",\0" */
13235 left -= len + 2;
13236
13237 /* Check if there is any room. */
13238 if (left >= 0)
13239 {
13240 if (p != start)
13241 {
13242 *p++ = ',';
13243 *p++ = ' ';
13244 }
13245 p = mempcpy (p, name, len);
13246 }
13247 else
13248 {
13249 /* Output the current message now and start a new one. */
13250 *p++ = ',';
13251 *p = '\0';
13252 fprintf (stream, "%s\n", message);
13253 p = start;
13254 left = size - (start - message) - len - 2;
13255
13256 gas_assert (left >= 0);
13257
13258 p = mempcpy (p, name, len);
13259 }
13260
13261 *left_p = left;
13262 return p;
13263 }
13264
13265 static void
13266 show_arch (FILE *stream, int ext, int check)
13267 {
13268 static char message[] = MESSAGE_TEMPLATE;
13269 char *start = message + 27;
13270 char *p;
13271 int size = sizeof (MESSAGE_TEMPLATE);
13272 int left;
13273 const char *name;
13274 int len;
13275 unsigned int j;
13276
13277 p = start;
13278 left = size - (start - message);
13279 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13280 {
13281 /* Should it be skipped? */
13282 if (cpu_arch [j].skip)
13283 continue;
13284
13285 name = cpu_arch [j].name;
13286 len = cpu_arch [j].len;
13287 if (*name == '.')
13288 {
13289 /* It is an extension. Skip if we aren't asked to show it. */
13290 if (ext)
13291 {
13292 name++;
13293 len--;
13294 }
13295 else
13296 continue;
13297 }
13298 else if (ext)
13299 {
13300 /* It is a processor.  Skip if we only show extensions.  */
13301 continue;
13302 }
13303 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13304 {
13305 /* It is an impossible processor - skip. */
13306 continue;
13307 }
13308
13309 p = output_message (stream, p, message, start, &left, name, len);
13310 }
13311
13312 /* Display disabled extensions. */
13313 if (ext)
13314 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13315 {
13316 name = cpu_noarch [j].name;
13317 len = cpu_noarch [j].len;
13318 p = output_message (stream, p, message, start, &left, name,
13319 len);
13320 }
13321
13322 *p = '\0';
13323 fprintf (stream, "%s\n", message);
13324 }
13325
13326 void
13327 md_show_usage (FILE *stream)
13328 {
13329 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13330 fprintf (stream, _("\
13331 -Qy, -Qn ignored\n\
13332 -V print assembler version number\n\
13333 -k ignored\n"));
13334 #endif
13335 fprintf (stream, _("\
13336 -n Do not optimize code alignment\n\
13337 -q quieten some warnings\n"));
13338 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13339 fprintf (stream, _("\
13340 -s ignored\n"));
13341 #endif
13342 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13343 || defined (TE_PE) || defined (TE_PEP))
13344 fprintf (stream, _("\
13345 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13346 #endif
13347 #ifdef SVR4_COMMENT_CHARS
13348 fprintf (stream, _("\
13349 --divide do not treat `/' as a comment character\n"));
13350 #else
13351 fprintf (stream, _("\
13352 --divide ignored\n"));
13353 #endif
13354 fprintf (stream, _("\
13355 -march=CPU[,+EXTENSION...]\n\
13356 generate code for CPU and EXTENSION, CPU is one of:\n"));
13357 show_arch (stream, 0, 1);
13358 fprintf (stream, _("\
13359 EXTENSION is combination of:\n"));
13360 show_arch (stream, 1, 0);
13361 fprintf (stream, _("\
13362 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13363 show_arch (stream, 0, 0);
13364 fprintf (stream, _("\
13365 -msse2avx encode SSE instructions with VEX prefix\n"));
13366 fprintf (stream, _("\
13367 -msse-check=[none|error|warning] (default: warning)\n\
13368 check SSE instructions\n"));
13369 fprintf (stream, _("\
13370 -moperand-check=[none|error|warning] (default: warning)\n\
13371 check operand combinations for validity\n"));
13372 fprintf (stream, _("\
13373 -mavxscalar=[128|256] (default: 128)\n\
13374 encode scalar AVX instructions with specific vector\n\
13375 length\n"));
13376 fprintf (stream, _("\
13377 -mvexwig=[0|1] (default: 0)\n\
13378 encode VEX instructions with specific VEX.W value\n\
13379 for VEX.W bit ignored instructions\n"));
13380 fprintf (stream, _("\
13381 -mevexlig=[128|256|512] (default: 128)\n\
13382 encode scalar EVEX instructions with specific vector\n\
13383 length\n"));
13384 fprintf (stream, _("\
13385 -mevexwig=[0|1] (default: 0)\n\
13386 encode EVEX instructions with specific EVEX.W value\n\
13387 for EVEX.W bit ignored instructions\n"));
13388 fprintf (stream, _("\
13389 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13390 encode EVEX instructions with specific EVEX.RC value\n\
13391 for SAE-only ignored instructions\n"));
13392 fprintf (stream, _("\
13393 -mmnemonic=[att|intel] "));
13394 if (SYSV386_COMPAT)
13395 fprintf (stream, _("(default: att)\n"));
13396 else
13397 fprintf (stream, _("(default: intel)\n"));
13398 fprintf (stream, _("\
13399 use AT&T/Intel mnemonic\n"));
13400 fprintf (stream, _("\
13401 -msyntax=[att|intel] (default: att)\n\
13402 use AT&T/Intel syntax\n"));
13403 fprintf (stream, _("\
13404 -mindex-reg support pseudo index registers\n"));
13405 fprintf (stream, _("\
13406 -mnaked-reg don't require `%%' prefix for registers\n"));
13407 fprintf (stream, _("\
13408 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13409 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13410 fprintf (stream, _("\
13411 -mshared disable branch optimization for shared code\n"));
13412 fprintf (stream, _("\
13413 -mx86-used-note=[no|yes] "));
13414 if (DEFAULT_X86_USED_NOTE)
13415 fprintf (stream, _("(default: yes)\n"));
13416 else
13417 fprintf (stream, _("(default: no)\n"));
13418 fprintf (stream, _("\
13419 generate x86 used ISA and feature properties\n"));
13420 #endif
13421 #if defined (TE_PE) || defined (TE_PEP)
13422 fprintf (stream, _("\
13423 -mbig-obj generate big object files\n"));
13424 #endif
13425 fprintf (stream, _("\
13426 -momit-lock-prefix=[no|yes] (default: no)\n\
13427 strip all lock prefixes\n"));
13428 fprintf (stream, _("\
13429 -mfence-as-lock-add=[no|yes] (default: no)\n\
13430 encode lfence, mfence and sfence as\n\
13431 lock addl $0x0, (%%{re}sp)\n"));
13432 fprintf (stream, _("\
13433 -mrelax-relocations=[no|yes] "));
13434 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13435 fprintf (stream, _("(default: yes)\n"));
13436 else
13437 fprintf (stream, _("(default: no)\n"));
13438 fprintf (stream, _("\
13439 generate relax relocations\n"));
13440 fprintf (stream, _("\
13441 -malign-branch-boundary=NUM (default: 0)\n\
13442 align branches within NUM byte boundary\n"));
13443 fprintf (stream, _("\
13444 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13445 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13446 indirect\n\
13447 specify types of branches to align\n"));
13448 fprintf (stream, _("\
13449 -malign-branch-prefix-size=NUM (default: 5)\n\
13450 align branches with NUM prefixes per instruction\n"));
13451 fprintf (stream, _("\
13452 -mbranches-within-32B-boundaries\n\
13453 align branches within 32 byte boundary\n"));
13454 fprintf (stream, _("\
13455 -mlfence-after-load=[no|yes] (default: no)\n\
13456 generate lfence after load\n"));
13457 fprintf (stream, _("\
13458 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13459 generate lfence before indirect near branch\n"));
13460 fprintf (stream, _("\
13461 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13462 generate lfence before ret\n"));
13463 fprintf (stream, _("\
13464 -mamd64 accept only AMD64 ISA [default]\n"));
13465 fprintf (stream, _("\
13466 -mintel64 accept only Intel64 ISA\n"));
13467 }
13468
13469 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13470 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13471 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13472
13473 /* Pick the target format to use. */
13474
13475 const char *
13476 i386_target_format (void)
13477 {
13478 if (!strncmp (default_arch, "x86_64", 6))
13479 {
13480 update_code_flag (CODE_64BIT, 1);
13481 if (default_arch[6] == '\0')
13482 x86_elf_abi = X86_64_ABI;
13483 else
13484 x86_elf_abi = X86_64_X32_ABI;
13485 }
13486 else if (!strcmp (default_arch, "i386"))
13487 update_code_flag (CODE_32BIT, 1);
13488 else if (!strcmp (default_arch, "iamcu"))
13489 {
13490 update_code_flag (CODE_32BIT, 1);
13491 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13492 {
13493 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13494 cpu_arch_name = "iamcu";
13495 cpu_sub_arch_name = NULL;
13496 cpu_arch_flags = iamcu_flags;
13497 cpu_arch_isa = PROCESSOR_IAMCU;
13498 cpu_arch_isa_flags = iamcu_flags;
13499 if (!cpu_arch_tune_set)
13500 {
13501 cpu_arch_tune = cpu_arch_isa;
13502 cpu_arch_tune_flags = cpu_arch_isa_flags;
13503 }
13504 }
13505 else if (cpu_arch_isa != PROCESSOR_IAMCU)
13506 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13507 cpu_arch_name);
13508 }
13509 else
13510 as_fatal (_("unknown architecture"));
13511
13512 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13513 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13514 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13515 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13516
13517 switch (OUTPUT_FLAVOR)
13518 {
13519 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13520 case bfd_target_aout_flavour:
13521 return AOUT_TARGET_FORMAT;
13522 #endif
13523 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13524 # if defined (TE_PE) || defined (TE_PEP)
13525 case bfd_target_coff_flavour:
13526 if (flag_code == CODE_64BIT)
13527 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13528 else
13529 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13530 # elif defined (TE_GO32)
13531 case bfd_target_coff_flavour:
13532 return "coff-go32";
13533 # else
13534 case bfd_target_coff_flavour:
13535 return "coff-i386";
13536 # endif
13537 #endif
13538 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13539 case bfd_target_elf_flavour:
13540 {
13541 const char *format;
13542
13543 switch (x86_elf_abi)
13544 {
13545 default:
13546 format = ELF_TARGET_FORMAT;
13547 #ifndef TE_SOLARIS
13548 tls_get_addr = "___tls_get_addr";
13549 #endif
13550 break;
13551 case X86_64_ABI:
13552 use_rela_relocations = 1;
13553 object_64bit = 1;
13554 #ifndef TE_SOLARIS
13555 tls_get_addr = "__tls_get_addr";
13556 #endif
13557 format = ELF_TARGET_FORMAT64;
13558 break;
13559 case X86_64_X32_ABI:
13560 use_rela_relocations = 1;
13561 object_64bit = 1;
13562 #ifndef TE_SOLARIS
13563 tls_get_addr = "__tls_get_addr";
13564 #endif
13565 disallow_64bit_reloc = 1;
13566 format = ELF_TARGET_FORMAT32;
13567 break;
13568 }
13569 if (cpu_arch_isa == PROCESSOR_L1OM)
13570 {
13571 if (x86_elf_abi != X86_64_ABI)
13572 as_fatal (_("Intel L1OM is 64-bit only"));
13573 return ELF_TARGET_L1OM_FORMAT;
13574 }
13575 else if (cpu_arch_isa == PROCESSOR_K1OM)
13576 {
13577 if (x86_elf_abi != X86_64_ABI)
13578 as_fatal (_("Intel K1OM is 64-bit only"));
13579 return ELF_TARGET_K1OM_FORMAT;
13580 }
13581 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13582 {
13583 if (x86_elf_abi != I386_ABI)
13584 as_fatal (_("Intel MCU is 32-bit only"));
13585 return ELF_TARGET_IAMCU_FORMAT;
13586 }
13587 else
13588 return format;
13589 }
13590 #endif
13591 #if defined (OBJ_MACH_O)
13592 case bfd_target_mach_o_flavour:
13593 if (flag_code == CODE_64BIT)
13594 {
13595 use_rela_relocations = 1;
13596 object_64bit = 1;
13597 return "mach-o-x86-64";
13598 }
13599 else
13600 return "mach-o-i386";
13601 #endif
13602 default:
13603 abort ();
13604 return NULL;
13605 }
13606 }
13607
13608 #endif /* OBJ_MAYBE_ more than one */
13609 \f
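/* Lazily create the GOT symbol on first reference.  The only name
   handled here is GLOBAL_OFFSET_TABLE_NAME (typically
   "_GLOBAL_OFFSET_TABLE_"); everything else is left to the generic
   assembler code.  */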
13610 symbolS *
13611 md_undefined_symbol (char *name)
13612 {
13613 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13614 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13615 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13616 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13617 {
13618 if (!GOT_symbol)
13619 {
13620 if (symbol_find (name))
13621 as_bad (_("GOT already in symbol table"));
13622 GOT_symbol = symbol_new (name, undefined_section,
13623 (valueT) 0, &zero_address_frag);
13624 }
13625 return GOT_symbol;
13626 }
13627 return NULL;
13628 }
13629
13630 /* Round up a section size to the appropriate boundary. */
13631
13632 valueT
13633 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13634 {
13635 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13636 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13637 {
13638 /* For a.out, force the section size to be aligned. If we don't do
13639 this, BFD will align it for us, but it will not write out the
13640 final bytes of the section. This may be a bug in BFD, but it is
13641 easier to fix it here since that is how the other a.out targets
13642 work. */
13643 int align;
13644
13645 align = bfd_section_alignment (segment);
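      /* E.g. (illustrative) with align == 4 this rounds a size of
	 0x123 up to 0x130.  */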
13646 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13647 }
13648 #endif
13649
13650 return size;
13651 }
13652
13653 /* On the i386, PC-relative offsets are relative to the start of the
13654 next instruction. That is, the address of the offset, plus its
13655 size, since the offset is always the last part of the insn. */
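/* E.g. (illustrative): a 5-byte "call rel32" whose frag starts at
   address 0x100 has fx_where == 1 and fx_size == 4, so the result is
   0x100 + 1 + 4 == 0x105, the address of the next instruction.  */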
13656
13657 long
13658 md_pcrel_from (fixS *fixP)
13659 {
13660 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13661 }
13662
13663 #ifndef I386COFF
13664
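/* Handle the .bss pseudo-op: switch output to the requested
   subsection of the bss section.  */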
13665 static void
13666 s_bss (int ignore ATTRIBUTE_UNUSED)
13667 {
13668 int temp;
13669
13670 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13671 if (IS_ELF)
13672 obj_elf_section_change_hook ();
13673 #endif
13674 temp = get_absolute_expression ();
13675 subseg_set (bss_section, (subsegT) temp);
13676 demand_empty_rest_of_line ();
13677 }
13678
13679 #endif
13680
13681 /* Remember a constant directive emitted in a code section; warn when -mlfence-* checking would skip over it.  */
13682
13683 void
13684 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13685 {
13686 if (last_insn.kind != last_insn_directive
13687 && (bfd_section_flags (now_seg) & SEC_CODE))
13688 {
13689 last_insn.seg = now_seg;
13690 last_insn.kind = last_insn_directive;
13691 last_insn.name = "constant directive";
13692 last_insn.file = as_where (&last_insn.line);
13693 if (lfence_before_ret != lfence_before_ret_none)
13694 {
13695 if (lfence_before_indirect_branch != lfence_branch_none)
13696 as_warn (_("constant directive skips -mlfence-before-ret "
13697 "and -mlfence-before-indirect-branch"));
13698 else
13699 as_warn (_("constant directive skips -mlfence-before-ret"));
13700 }
13701 else if (lfence_before_indirect_branch != lfence_branch_none)
13702 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13703 }
13704 }
13705
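/* Massage a fixup before relocations are generated: differences
   against the GOT symbol become GOT-relative relocation types, and
   (for 32-bit ELF) relaxable GOT32 fixups are upgraded to GOT32X.  */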
13706 void
13707 i386_validate_fix (fixS *fixp)
13708 {
13709 if (fixp->fx_subsy)
13710 {
13711 if (fixp->fx_subsy == GOT_symbol)
13712 {
13713 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13714 {
13715 if (!object_64bit)
13716 abort ();
13717 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13718 if (fixp->fx_tcbit2)
13719 fixp->fx_r_type = (fixp->fx_tcbit
13720 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13721 : BFD_RELOC_X86_64_GOTPCRELX);
13722 else
13723 #endif
13724 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13725 }
13726 else
13727 {
13728 if (!object_64bit)
13729 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13730 else
13731 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13732 }
13733 fixp->fx_subsy = 0;
13734 }
13735 }
13736 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13737 else if (!object_64bit)
13738 {
13739 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13740 && fixp->fx_tcbit2)
13741 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13742 }
13743 #endif
13744 }
13745
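/* Translate an internal fixS into a BFD arelent, deriving a
   BFD_RELOC_* code from the fixup's type, size and pc-relativity.  */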
13746 arelent *
13747 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13748 {
13749 arelent *rel;
13750 bfd_reloc_code_real_type code;
13751
13752 switch (fixp->fx_r_type)
13753 {
13754 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13755 case BFD_RELOC_SIZE32:
13756 case BFD_RELOC_SIZE64:
13757 if (S_IS_DEFINED (fixp->fx_addsy)
13758 && !S_IS_EXTERNAL (fixp->fx_addsy))
13759 {
13760 /* Resolve size relocation against local symbol to size of
13761 the symbol plus addend. */
13762 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13763 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13764 && !fits_in_unsigned_long (value))
13765 as_bad_where (fixp->fx_file, fixp->fx_line,
13766 _("symbol size computation overflow"));
13767 fixp->fx_addsy = NULL;
13768 fixp->fx_subsy = NULL;
13769 md_apply_fix (fixp, (valueT *) &value, NULL);
13770 return NULL;
13771 }
13772 #endif
13773 /* Fall through. */
13774
13775 case BFD_RELOC_X86_64_PLT32:
13776 case BFD_RELOC_X86_64_GOT32:
13777 case BFD_RELOC_X86_64_GOTPCREL:
13778 case BFD_RELOC_X86_64_GOTPCRELX:
13779 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13780 case BFD_RELOC_386_PLT32:
13781 case BFD_RELOC_386_GOT32:
13782 case BFD_RELOC_386_GOT32X:
13783 case BFD_RELOC_386_GOTOFF:
13784 case BFD_RELOC_386_GOTPC:
13785 case BFD_RELOC_386_TLS_GD:
13786 case BFD_RELOC_386_TLS_LDM:
13787 case BFD_RELOC_386_TLS_LDO_32:
13788 case BFD_RELOC_386_TLS_IE_32:
13789 case BFD_RELOC_386_TLS_IE:
13790 case BFD_RELOC_386_TLS_GOTIE:
13791 case BFD_RELOC_386_TLS_LE_32:
13792 case BFD_RELOC_386_TLS_LE:
13793 case BFD_RELOC_386_TLS_GOTDESC:
13794 case BFD_RELOC_386_TLS_DESC_CALL:
13795 case BFD_RELOC_X86_64_TLSGD:
13796 case BFD_RELOC_X86_64_TLSLD:
13797 case BFD_RELOC_X86_64_DTPOFF32:
13798 case BFD_RELOC_X86_64_DTPOFF64:
13799 case BFD_RELOC_X86_64_GOTTPOFF:
13800 case BFD_RELOC_X86_64_TPOFF32:
13801 case BFD_RELOC_X86_64_TPOFF64:
13802 case BFD_RELOC_X86_64_GOTOFF64:
13803 case BFD_RELOC_X86_64_GOTPC32:
13804 case BFD_RELOC_X86_64_GOT64:
13805 case BFD_RELOC_X86_64_GOTPCREL64:
13806 case BFD_RELOC_X86_64_GOTPC64:
13807 case BFD_RELOC_X86_64_GOTPLT64:
13808 case BFD_RELOC_X86_64_PLTOFF64:
13809 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13810 case BFD_RELOC_X86_64_TLSDESC_CALL:
13811 case BFD_RELOC_RVA:
13812 case BFD_RELOC_VTABLE_ENTRY:
13813 case BFD_RELOC_VTABLE_INHERIT:
13814 #ifdef TE_PE
13815 case BFD_RELOC_32_SECREL:
13816 #endif
13817 code = fixp->fx_r_type;
13818 break;
13819 case BFD_RELOC_X86_64_32S:
13820 if (!fixp->fx_pcrel)
13821 {
13822 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13823 code = fixp->fx_r_type;
13824 break;
13825 }
13826 /* Fall through. */
13827 default:
13828 if (fixp->fx_pcrel)
13829 {
13830 switch (fixp->fx_size)
13831 {
13832 default:
13833 as_bad_where (fixp->fx_file, fixp->fx_line,
13834 _("can not do %d byte pc-relative relocation"),
13835 fixp->fx_size);
13836 code = BFD_RELOC_32_PCREL;
13837 break;
13838 case 1: code = BFD_RELOC_8_PCREL; break;
13839 case 2: code = BFD_RELOC_16_PCREL; break;
13840 case 4: code = BFD_RELOC_32_PCREL; break;
13841 #ifdef BFD64
13842 case 8: code = BFD_RELOC_64_PCREL; break;
13843 #endif
13844 }
13845 }
13846 else
13847 {
13848 switch (fixp->fx_size)
13849 {
13850 default:
13851 as_bad_where (fixp->fx_file, fixp->fx_line,
13852 _("can not do %d byte relocation"),
13853 fixp->fx_size);
13854 code = BFD_RELOC_32;
13855 break;
13856 case 1: code = BFD_RELOC_8; break;
13857 case 2: code = BFD_RELOC_16; break;
13858 case 4: code = BFD_RELOC_32; break;
13859 #ifdef BFD64
13860 case 8: code = BFD_RELOC_64; break;
13861 #endif
13862 }
13863 }
13864 break;
13865 }
13866
13867 if ((code == BFD_RELOC_32
13868 || code == BFD_RELOC_32_PCREL
13869 || code == BFD_RELOC_X86_64_32S)
13870 && GOT_symbol
13871 && fixp->fx_addsy == GOT_symbol)
13872 {
13873 if (!object_64bit)
13874 code = BFD_RELOC_386_GOTPC;
13875 else
13876 code = BFD_RELOC_X86_64_GOTPC32;
13877 }
13878 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13879 && GOT_symbol
13880 && fixp->fx_addsy == GOT_symbol)
13881 {
13882 code = BFD_RELOC_X86_64_GOTPC64;
13883 }
13884
13885 rel = XNEW (arelent);
13886 rel->sym_ptr_ptr = XNEW (asymbol *);
13887 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13888
13889 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13890
13891 if (!use_rela_relocations)
13892 {
13893 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13894 vtable entry to be used in the relocation's section offset. */
13895 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13896 rel->address = fixp->fx_offset;
13897 #if defined (OBJ_COFF) && defined (TE_PE)
13898 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13899 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13900 else
13901 #endif
13902 rel->addend = 0;
13903 }
13904 /* Use RELA relocations in 64-bit mode. */
13905 else
13906 {
13907 if (disallow_64bit_reloc)
13908 switch (code)
13909 {
13910 case BFD_RELOC_X86_64_DTPOFF64:
13911 case BFD_RELOC_X86_64_TPOFF64:
13912 case BFD_RELOC_64_PCREL:
13913 case BFD_RELOC_X86_64_GOTOFF64:
13914 case BFD_RELOC_X86_64_GOT64:
13915 case BFD_RELOC_X86_64_GOTPCREL64:
13916 case BFD_RELOC_X86_64_GOTPC64:
13917 case BFD_RELOC_X86_64_GOTPLT64:
13918 case BFD_RELOC_X86_64_PLTOFF64:
13919 as_bad_where (fixp->fx_file, fixp->fx_line,
13920 _("cannot represent relocation type %s in x32 mode"),
13921 bfd_get_reloc_code_name (code));
13922 break;
13923 default:
13924 break;
13925 }
13926
13927 if (!fixp->fx_pcrel)
13928 rel->addend = fixp->fx_offset;
13929 else
13930 switch (code)
13931 {
13932 case BFD_RELOC_X86_64_PLT32:
13933 case BFD_RELOC_X86_64_GOT32:
13934 case BFD_RELOC_X86_64_GOTPCREL:
13935 case BFD_RELOC_X86_64_GOTPCRELX:
13936 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13937 case BFD_RELOC_X86_64_TLSGD:
13938 case BFD_RELOC_X86_64_TLSLD:
13939 case BFD_RELOC_X86_64_GOTTPOFF:
13940 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13941 case BFD_RELOC_X86_64_TLSDESC_CALL:
13942 rel->addend = fixp->fx_offset - fixp->fx_size;
13943 break;
13944 default:
13945 rel->addend = (section->vma
13946 - fixp->fx_size
13947 + fixp->fx_addnumber
13948 + md_pcrel_from (fixp));
13949 break;
13950 }
13951 }
13952
13953 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13954 if (rel->howto == NULL)
13955 {
13956 as_bad_where (fixp->fx_file, fixp->fx_line,
13957 _("cannot represent relocation type %s"),
13958 bfd_get_reloc_code_name (code));
13959 /* Set howto to a garbage value so that we can keep going. */
13960 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13961 gas_assert (rel->howto != NULL);
13962 }
13963
13964 return rel;
13965 }
13966
13967 #include "tc-i386-intel.c"
13968
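/* Parse a register name in a .cfi_* directive and convert it to a
   DWARF register number.  Naked (no '%' prefix) and pseudo registers
   are temporarily allowed while parsing.  */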
13969 void
13970 tc_x86_parse_to_dw2regnum (expressionS *exp)
13971 {
13972 int saved_naked_reg;
13973 char saved_register_dot;
13974
13975 saved_naked_reg = allow_naked_reg;
13976 allow_naked_reg = 1;
13977 saved_register_dot = register_chars['.'];
13978 register_chars['.'] = '.';
13979 allow_pseudo_reg = 1;
13980 expression_and_evaluate (exp);
13981 allow_pseudo_reg = 0;
13982 register_chars['.'] = saved_register_dot;
13983 allow_naked_reg = saved_naked_reg;
13984
13985 if (exp->X_op == O_register && exp->X_add_number >= 0)
13986 {
13987 if ((addressT) exp->X_add_number < i386_regtab_size)
13988 {
13989 exp->X_op = O_constant;
13990 exp->X_add_number = i386_regtab[exp->X_add_number]
13991 .dw2_regnum[flag_code >> 1];
13992 }
13993 else
13994 exp->X_op = O_illegal;
13995 }
13996 }
13997
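/* Emit the initial CFI state at function entry: the CFA is the stack
   pointer (esp or rsp, depending on the code size) plus the address
   size, with the return address stored relative to the CFA.  */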
13998 void
13999 tc_x86_frame_initial_instructions (void)
14000 {
14001 static unsigned int sp_regno[2];
14002
14003 if (!sp_regno[flag_code >> 1])
14004 {
14005 char *saved_input = input_line_pointer;
14006 char sp[][4] = {"esp", "rsp"};
14007 expressionS exp;
14008
14009 input_line_pointer = sp[flag_code >> 1];
14010 tc_x86_parse_to_dw2regnum (&exp);
14011 gas_assert (exp.X_op == O_constant);
14012 sp_regno[flag_code >> 1] = exp.X_add_number;
14013 input_line_pointer = saved_input;
14014 }
14015
14016 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14017 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14018 }
14019
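/* Address size to use in DWARF: x32 uses 4-byte addresses even though
   the architecture is 64-bit; otherwise derive it from the target.  */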
14020 int
14021 x86_dwarf2_addr_size (void)
14022 {
14023 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14024 if (x86_elf_abi == X86_64_X32_ABI)
14025 return 4;
14026 #endif
14027 return bfd_arch_bits_per_address (stdoutput) / 8;
14028 }
14029
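/* Map a .section type string to an ELF section type: in 64-bit mode
   "unwind" (as in .section xxx,"a",@unwind) selects
   SHT_X86_64_UNWIND.  */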
14030 int
14031 i386_elf_section_type (const char *str, size_t len)
14032 {
14033 if (flag_code == CODE_64BIT
14034 && len == sizeof ("unwind") - 1
14035 && strncmp (str, "unwind", 6) == 0)
14036 return SHT_X86_64_UNWIND;
14037
14038 return -1;
14039 }
14040
14041 #ifdef TE_SOLARIS
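/* On Solaris, .eh_frame gets the SHT_X86_64_UNWIND section type in
   64-bit mode.  */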
14042 void
14043 i386_solaris_fix_up_eh_frame (segT sec)
14044 {
14045 if (flag_code == CODE_64BIT)
14046 elf_section_type (sec) = SHT_X86_64_UNWIND;
14047 }
14048 #endif
14049
14050 #ifdef TE_PE
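/* Emit a SIZE-byte section-relative (secrel) offset to SYMBOL, as PE
   debug information expects.  */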
14051 void
14052 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14053 {
14054 expressionS exp;
14055
14056 exp.X_op = O_secrel;
14057 exp.X_add_symbol = symbol;
14058 exp.X_add_number = 0;
14059 emit_expr (&exp, size);
14060 }
14061 #endif
14062
14063 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14064 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
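/* E.g. (illustrative): .section .ldata,"awl",@progbits requests
   SHF_X86_64_LARGE via the 'l' flag letter handled below.  */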
14065
14066 bfd_vma
14067 x86_64_section_letter (int letter, const char **ptr_msg)
14068 {
14069 if (flag_code == CODE_64BIT)
14070 {
14071 if (letter == 'l')
14072 return SHF_X86_64_LARGE;
14073
14074 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14075 }
14076 else
14077 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14078 return -1;
14079 }
14080
14081 bfd_vma
14082 x86_64_section_word (char *str, size_t len)
14083 {
14084 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
14085 return SHF_X86_64_LARGE;
14086
14087 return -1;
14088 }
14089
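/* Implement the .largecomm pseudo-op: like .comm, but in 64-bit mode
   the symbol is allocated in the large common section (locals go into
   .lbss).  */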
14090 static void
14091 handle_large_common (int small ATTRIBUTE_UNUSED)
14092 {
14093 if (flag_code != CODE_64BIT)
14094 {
14095 s_comm_internal (0, elf_common_parse);
14096 as_warn (_(".largecomm supported only in 64-bit mode, producing .comm"));
14097 }
14098 else
14099 {
14100 static segT lbss_section;
14101 asection *saved_com_section_ptr = elf_com_section_ptr;
14102 asection *saved_bss_section = bss_section;
14103
14104 if (lbss_section == NULL)
14105 {
14106 flagword applicable;
14107 segT seg = now_seg;
14108 subsegT subseg = now_subseg;
14109
14110 /* The .lbss section is for local .largecomm symbols. */
14111 lbss_section = subseg_new (".lbss", 0);
14112 applicable = bfd_applicable_section_flags (stdoutput);
14113 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14114 seg_info (lbss_section)->bss = 1;
14115
14116 subseg_set (seg, subseg);
14117 }
14118
14119 elf_com_section_ptr = &_bfd_elf_large_com_section;
14120 bss_section = lbss_section;
14121
14122 s_comm_internal (0, elf_common_parse);
14123
14124 elf_com_section_ptr = saved_com_section_ptr;
14125 bss_section = saved_bss_section;
14126 }
14127 }
14128 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */