x86: simplify check_byte_reg()
deliverable/binutils-gdb.git: gas/config/tc-i386.c
/* tc-i386.c -- Assemble code for the Intel 80386
   Copyright (C) 1989-2020 Free Software Foundation, Inc.

   This file is part of GAS, the GNU Assembler.

   GAS is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   GAS is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with GAS; see the file COPYING.  If not, write to the Free
   Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
   02110-1301, USA.  */

/* Intel 80386 machine specific gas.
   Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
   x86_64 support by Jan Hubicka (jh@suse.cz)
   VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
   Bugs & suggestions are completely welcome.  This is free software.
   Please help us make it better.  */

#include "as.h"
#include "safe-ctype.h"
#include "subsegs.h"
#include "dwarf2dbg.h"
#include "dw2gencfi.h"
#include "elf/x86-64.h"
#include "opcodes/i386-init.h"

#ifdef HAVE_LIMITS_H
#include <limits.h>
#else
#ifdef HAVE_SYS_PARAM_H
#include <sys/param.h>
#endif
#ifndef INT_MAX
#define INT_MAX (int) (((unsigned) (-1)) >> 1)
#endif
#endif

#ifndef INFER_ADDR_PREFIX
#define INFER_ADDR_PREFIX 1
#endif

#ifndef DEFAULT_ARCH
#define DEFAULT_ARCH "i386"
#endif

#ifndef INLINE
#if __GNUC__ >= 2
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

/* Prefixes will be emitted in the order defined below.
   WAIT_PREFIX must be the first prefix since FWAIT is really an
   instruction, and so must come before any prefixes.
   The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
   REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
#define WAIT_PREFIX	0
#define SEG_PREFIX	1
#define ADDR_PREFIX	2
#define DATA_PREFIX	3
#define REP_PREFIX	4
#define HLE_PREFIX	REP_PREFIX
#define BND_PREFIX	REP_PREFIX
#define LOCK_PREFIX	5
#define REX_PREFIX	6	/* must come last.  */
#define MAX_PREFIXES	7	/* max prefixes per opcode */
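
/* A hedged, illustrative example (not from the original source): for
   "lock addw %ax, %fs:(%eax)" assembled in 32-bit mode, i.prefix[]
   would be filled roughly as
     i.prefix[SEG_PREFIX]  = 0x64   (%fs segment override)
     i.prefix[DATA_PREFIX] = 0x66   (16-bit operand size)
     i.prefix[LOCK_PREFIX] = 0xf0
   and the prefixes are then emitted in ascending slot order:
   0x64 0x66 0xf0, followed by the opcode.  */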

/* we define the syntax here (modulo base,index,scale syntax) */
#define REGISTER_PREFIX '%'
#define IMMEDIATE_PREFIX '$'
#define ABSOLUTE_PREFIX '*'

/* these are the instruction mnemonic suffixes in AT&T syntax or
   memory operand size in Intel syntax.  */
#define WORD_MNEM_SUFFIX  'w'
#define BYTE_MNEM_SUFFIX  'b'
#define SHORT_MNEM_SUFFIX 's'
#define LONG_MNEM_SUFFIX  'l'
#define QWORD_MNEM_SUFFIX 'q'
/* Intel Syntax.  Use a non-ASCII letter since it never appears
   in instructions.  */
#define LONG_DOUBLE_MNEM_SUFFIX '\1'

#define END_OF_INSN '\0'

/* This matches the C -> StaticRounding alias in the opcode table.  */
#define commutative staticrounding

/*
  'templates' is for grouping together 'template' structures for opcodes
  of the same name.  This is only used for storing the insns in the grand
  ole hash table of insns.
  The templates themselves start at START and range up to (but not including)
  END.
  */
typedef struct
{
  const insn_template *start;
  const insn_template *end;
}
templates;

/* 386 operand encoding bytes:  see 386 book for details of this.  */
typedef struct
{
  unsigned int regmem;	/* codes register or memory operand */
  unsigned int reg;	/* codes register operand (or extended opcode) */
  unsigned int mode;	/* how to interpret regmem & reg */
}
modrm_byte;

/* x86-64 extension prefix.  */
typedef int rex_byte;

/* 386 opcode byte to code indirect addressing.  */
typedef struct
{
  unsigned base;
  unsigned index;
  unsigned scale;
}
sib_byte;

/* x86 arch names, types and features */
typedef struct
{
  const char *name;		/* arch name */
  unsigned int len;		/* arch string length */
  enum processor_type type;	/* arch type */
  i386_cpu_flags flags;		/* cpu feature flags */
  unsigned int skip;		/* show_arch should skip this. */
}
arch_entry;

/* Used to turn off indicated flags.  */
typedef struct
{
  const char *name;		/* arch name */
  unsigned int len;		/* arch string length */
  i386_cpu_flags flags;		/* cpu feature flags */
}
noarch_entry;

static void update_code_flag (int, int);
static void set_code_flag (int);
static void set_16bit_gcc_code_flag (int);
static void set_intel_syntax (int);
static void set_intel_mnemonic (int);
static void set_allow_index_reg (int);
static void set_check (int);
static void set_cpu_arch (int);
#ifdef TE_PE
static void pe_directive_secrel (int);
#endif
static void signed_cons (int);
static char *output_invalid (int c);
static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
				    const char *);
static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
				       const char *);
static int i386_att_operand (char *);
static int i386_intel_operand (char *, int);
static int i386_intel_simplify (expressionS *);
static int i386_intel_parse_name (const char *, expressionS *);
static const reg_entry *parse_register (char *, char **);
static char *parse_insn (char *, char *);
static char *parse_operands (char *, const char *);
static void swap_operands (void);
static void swap_2_operands (int, int);
static enum flag_code i386_addressing_mode (void);
static void optimize_imm (void);
static void optimize_disp (void);
static const insn_template *match_template (char);
static int check_string (void);
static int process_suffix (void);
static int check_byte_reg (void);
static int check_long_reg (void);
static int check_qword_reg (void);
static int check_word_reg (void);
static int finalize_imm (void);
static int process_operands (void);
static const seg_entry *build_modrm_byte (void);
static void output_insn (void);
static void output_imm (fragS *, offsetT);
static void output_disp (fragS *, offsetT);
#ifndef I386COFF
static void s_bss (int);
#endif
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
static void handle_large_common (int small ATTRIBUTE_UNUSED);

/* GNU_PROPERTY_X86_ISA_1_USED.  */
static unsigned int x86_isa_1_used;
/* GNU_PROPERTY_X86_FEATURE_2_USED.  */
static unsigned int x86_feature_2_used;
/* Generate x86 used ISA and feature properties.  */
static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
#endif

static const char *default_arch = DEFAULT_ARCH;

/* parse_register() returns this when a register alias cannot be used.  */
static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
				   { Dw2Inval, Dw2Inval } };

/* This struct describes rounding control and SAE in the instruction.  */
struct RC_Operation
{
  enum rc_type
    {
      rne = 0,
      rd,
      ru,
      rz,
      saeonly
    } type;
  int operand;
};

static struct RC_Operation rc_op;

/* The struct describes masking, applied to OPERAND in the instruction.
   MASK is a pointer to the corresponding mask register.  ZEROING tells
   whether merging or zeroing mask is used.  */
struct Mask_Operation
{
  const reg_entry *mask;
  unsigned int zeroing;
  /* The operand this operation is associated with.  */
  int operand;
};

static struct Mask_Operation mask_op;
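
/* A hedged example of the syntax this struct captures; e.g. for
     vmovaps %zmm1, %zmm2{%k3}      (merging: MASK = %k3, ZEROING = 0)
     vmovaps %zmm1, %zmm2{%k3}{z}   (zeroing: MASK = %k3, ZEROING = 1)
   OPERAND records which operand the {%k3} annotation was parsed on.  */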

/* The struct describes broadcasting, applied to OPERAND.  TYPE is the
   broadcast factor.  */
struct Broadcast_Operation
{
  /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
  int type;

  /* Index of broadcasted operand.  */
  int operand;

  /* Number of bytes to broadcast.  */
  int bytes;
};

static struct Broadcast_Operation broadcast_op;
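
/* Illustrative example (field values are an assumption for
   illustration): for
     vaddps (%rax){1to16}, %zmm1, %zmm2
   the parser would record TYPE = 16 (from {1to16}), OPERAND = the index
   of the memory operand, and BYTES = 4 (one single-precision element).  */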

/* VEX prefix.  */
typedef struct
{
  /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
  unsigned char bytes[4];
  unsigned int length;
  /* Destination or source register specifier.  */
  const reg_entry *register_specifier;
} vex_prefix;

/* 'md_assemble ()' gathers together information and puts it into a
   i386_insn.  */

union i386_op
{
  expressionS *disps;
  expressionS *imms;
  const reg_entry *regs;
};

enum i386_error
  {
    operand_size_mismatch,
    operand_type_mismatch,
    register_type_mismatch,
    number_of_operands_mismatch,
    invalid_instruction_suffix,
    bad_imm4,
    unsupported_with_intel_mnemonic,
    unsupported_syntax,
    unsupported,
    invalid_vsib_address,
    invalid_vector_register_set,
    unsupported_vector_index_register,
    unsupported_broadcast,
    broadcast_needed,
    unsupported_masking,
    mask_not_on_destination,
    no_default_mask,
    unsupported_rc_sae,
    rc_sae_operand_not_last_imm,
    invalid_register_operand,
  };

struct _i386_insn
  {
    /* TM holds the template for the insn we're currently assembling.  */
    insn_template tm;

    /* SUFFIX holds the instruction size suffix for byte, word, dword
       or qword, if given.  */
    char suffix;

    /* OPERANDS gives the number of given operands.  */
    unsigned int operands;

    /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
       of given register, displacement, memory operands and immediate
       operands.  */
    unsigned int reg_operands, disp_operands, mem_operands, imm_operands;

    /* TYPES [i] is the type (see above #defines) which tells us how to
       use OP[i] for the corresponding operand.  */
    i386_operand_type types[MAX_OPERANDS];

    /* Displacement expression, immediate expression, or register for each
       operand.  */
    union i386_op op[MAX_OPERANDS];

    /* Flags for operands.  */
    unsigned int flags[MAX_OPERANDS];
#define Operand_PCrel 1
#define Operand_Mem   2

    /* Relocation type for operand */
    enum bfd_reloc_code_real reloc[MAX_OPERANDS];

    /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
       the base index byte below.  */
    const reg_entry *base_reg;
    const reg_entry *index_reg;
    unsigned int log2_scale_factor;

    /* SEG gives the seg_entries of this insn.  They are zero unless
       explicit segment overrides are given.  */
    const seg_entry *seg[2];

    /* Copied first memory operand string, for re-checking.  */
    char *memop1_string;

    /* PREFIX holds all the given prefix opcodes (usually null).
       PREFIXES is the number of prefix opcodes.  */
    unsigned int prefixes;
    unsigned char prefix[MAX_PREFIXES];

    /* Register is in low 3 bits of opcode.  */
    bfd_boolean short_form;

    /* The operand to a branch insn indicates an absolute branch.  */
    bfd_boolean jumpabsolute;

    /* Has MMX register operands.  */
    bfd_boolean has_regmmx;

    /* Has XMM register operands.  */
    bfd_boolean has_regxmm;

    /* Has YMM register operands.  */
    bfd_boolean has_regymm;

    /* Has ZMM register operands.  */
    bfd_boolean has_regzmm;

    /* Has GOTPC or TLS relocation.  */
    bfd_boolean has_gotpc_tls_reloc;

    /* RM and SIB are the modrm byte and the sib byte where the
       addressing modes of this insn are encoded.  */
    modrm_byte rm;
    rex_byte rex;
    rex_byte vrex;
    sib_byte sib;
    vex_prefix vex;

    /* Masking attributes.  */
    struct Mask_Operation *mask;

    /* Rounding control and SAE attributes.  */
    struct RC_Operation *rounding;

    /* Broadcasting attributes.  */
    struct Broadcast_Operation *broadcast;

    /* Compressed disp8*N attribute.  */
    unsigned int memshift;

    /* Prefer load or store in encoding.  */
    enum
      {
	dir_encoding_default = 0,
	dir_encoding_load,
	dir_encoding_store,
	dir_encoding_swap
      } dir_encoding;

    /* Prefer 8bit or 32bit displacement in encoding.  */
    enum
      {
	disp_encoding_default = 0,
	disp_encoding_8bit,
	disp_encoding_32bit
      } disp_encoding;

    /* Prefer the REX byte in encoding.  */
    bfd_boolean rex_encoding;

    /* Disable instruction size optimization.  */
    bfd_boolean no_optimize;

    /* How to encode vector instructions.  */
    enum
      {
	vex_encoding_default = 0,
	vex_encoding_vex,
	vex_encoding_vex3,
	vex_encoding_evex
      } vec_encoding;

    /* REP prefix.  */
    const char *rep_prefix;

    /* HLE prefix.  */
    const char *hle_prefix;

    /* Have BND prefix.  */
    const char *bnd_prefix;

    /* Have NOTRACK prefix.  */
    const char *notrack_prefix;

    /* Error message.  */
    enum i386_error error;
  };

typedef struct _i386_insn i386_insn;

/* Link RC type with corresponding string, that'll be looked for in
   asm.  */
struct RC_name
{
  enum rc_type type;
  const char *name;
  unsigned int len;
};

static const struct RC_name RC_NamesTable[] =
{
  { rne, STRING_COMMA_LEN ("rn-sae") },
  { rd, STRING_COMMA_LEN ("rd-sae") },
  { ru, STRING_COMMA_LEN ("ru-sae") },
  { rz, STRING_COMMA_LEN ("rz-sae") },
  { saeonly, STRING_COMMA_LEN ("sae") },
};
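
/* These strings show up in AT&T syntax roughly as follows (illustrative):
     vaddps {rn-sae}, %zmm1, %zmm2, %zmm3   round-to-nearest plus SAE
     vucomiss {sae}, %xmm1, %xmm2           suppress-all-exceptions only  */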

/* List of chars besides those in app.c:symbol_chars that can start an
   operand.  Used to prevent the scrubber eating vital white-space.  */
const char extra_symbol_chars[] = "*%-([{}"
#ifdef LEX_AT
	"@"
#endif
#ifdef LEX_QM
	"?"
#endif
	;

#if (defined (TE_I386AIX)				\
     || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))	\
	 && !defined (TE_GNU)				\
	 && !defined (TE_LINUX)				\
	 && !defined (TE_NACL)				\
	 && !defined (TE_FreeBSD)			\
	 && !defined (TE_DragonFly)			\
	 && !defined (TE_NetBSD)))
/* This array holds the chars that always start a comment.  If the
   pre-processor is disabled, these aren't very useful.  The option
   --divide will remove '/' from this list.  */
const char *i386_comment_chars = "#/";
#define SVR4_COMMENT_CHARS 1
#define PREFIX_SEPARATOR '\\'

#else
const char *i386_comment_chars = "#";
#define PREFIX_SEPARATOR '/'
#endif

/* This array holds the chars that only start a comment at the beginning of
   a line.  If the line seems to have the form '# 123 filename'
   .line and .file directives will appear in the pre-processed output.
   Note that input_file.c hand checks for '#' at the beginning of the
   first line of the input file.  This is because the compiler outputs
   #NO_APP at the beginning of its output.
   Also note that comments started like this one will always work if
   '/' isn't otherwise defined.  */
const char line_comment_chars[] = "#/";

const char line_separator_chars[] = ";";

/* Chars that can be used to separate mant from exp in floating point
   nums.  */
const char EXP_CHARS[] = "eE";

/* Chars that mean this number is a floating point constant
   As in 0f12.456
   or 0d1.2345e12.  */
const char FLT_CHARS[] = "fFdDxX";

/* Tables for lexical analysis.  */
static char mnemonic_chars[256];
static char register_chars[256];
static char operand_chars[256];
static char identifier_chars[256];
static char digit_chars[256];

/* Lexical macros.  */
#define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
#define is_operand_char(x) (operand_chars[(unsigned char) x])
#define is_register_char(x) (register_chars[(unsigned char) x])
#define is_space_char(x) ((x) == ' ')
#define is_identifier_char(x) (identifier_chars[(unsigned char) x])
#define is_digit_char(x) (digit_chars[(unsigned char) x])

/* All non-digit non-letter characters that may occur in an operand.  */
static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";

/* md_assemble() always leaves the strings it's passed unaltered.  To
   effect this we maintain a stack of saved characters that we've smashed
   with '\0's (indicating end of strings for various sub-fields of the
   assembler instruction).  */
static char save_stack[32];
static char *save_stack_p;
#define END_STRING_AND_SAVE(s) \
	do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
#define RESTORE_END_STRING(s) \
	do { *(s) = *--save_stack_p; } while (0)
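
/* Typical (illustrative) usage while carving up an operand string:
     char *end = strchr (operand_start, ',');
     END_STRING_AND_SAVE (end);     (NUL-terminate the first operand)
     ... parse operand_start in place ...
     RESTORE_END_STRING (end);      (put the ',' back)
   Saves nest LIFO on save_stack, so restores must mirror the saves.  */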

/* The instruction we're assembling.  */
static i386_insn i;

/* Possible templates for current insn.  */
static const templates *current_templates;

/* Per instruction expressionS buffers: max displacements & immediates.  */
static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];

/* Current operand we are working on.  */
static int this_operand = -1;

/* We support three different modes.  FLAG_CODE variable is used to
   distinguish these.  */

enum flag_code {
	CODE_32BIT,
	CODE_16BIT,
	CODE_64BIT };

static enum flag_code flag_code;
static unsigned int object_64bit;
static unsigned int disallow_64bit_reloc;
static int use_rela_relocations = 0;
/* __tls_get_addr/___tls_get_addr symbol for TLS.  */
static const char *tls_get_addr;

#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
     || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
     || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))

/* The ELF ABI to use.  */
enum x86_elf_abi
{
  I386_ABI,
  X86_64_ABI,
  X86_64_X32_ABI
};

static enum x86_elf_abi x86_elf_abi = I386_ABI;
#endif

#if defined (TE_PE) || defined (TE_PEP)
/* Use big object file format.  */
static int use_big_obj = 0;
#endif

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* 1 if generating code for a shared library.  */
static int shared = 0;
#endif

/* 1 for intel syntax,
   0 if att syntax.  */
static int intel_syntax = 0;

static enum x86_64_isa
{
  amd64 = 1,	/* AMD64 ISA.  */
  intel64	/* Intel64 ISA.  */
} isa64;

/* 1 for intel mnemonic,
   0 if att mnemonic.  */
static int intel_mnemonic = !SYSV386_COMPAT;

/* 1 if pseudo registers are permitted.  */
static int allow_pseudo_reg = 0;

/* 1 if register prefix % not required.  */
static int allow_naked_reg = 0;

/* 1 if the assembler should add BND prefix for all control-transferring
   instructions supporting it, even if this prefix wasn't specified
   explicitly.  */
static int add_bnd_prefix = 0;
/* 1 if pseudo index register, eiz/riz, is allowed.  */
static int allow_index_reg = 0;

/* 1 if the assembler should ignore LOCK prefix, even if it was
   specified explicitly.  */
static int omit_lock_prefix = 0;

/* 1 if the assembler should encode lfence, mfence, and sfence as
   "lock addl $0, (%{re}sp)".  */
static int avoid_fence = 0;

/* 1 if lfence should be inserted after every load.  */
static int lfence_after_load = 0;

/* Non-zero if lfence should be inserted before indirect branch.  */
static enum lfence_before_indirect_branch_kind
  {
    lfence_branch_none = 0,
    lfence_branch_register,
    lfence_branch_memory,
    lfence_branch_all
  }
lfence_before_indirect_branch;

/* Non-zero if lfence should be inserted before ret.  */
static enum lfence_before_ret_kind
  {
    lfence_before_ret_none = 0,
    lfence_before_ret_not,
    lfence_before_ret_or,
    lfence_before_ret_shl
  }
lfence_before_ret;

/* Tracks the previous instruction, and whether it was a directive
   (e.g. .byte) or a prefix.  */
static struct
  {
    segT seg;
    const char *file;
    const char *name;
    unsigned int line;
    enum last_insn_kind
      {
	last_insn_other = 0,
	last_insn_directive,
	last_insn_prefix
      } kind;
  } last_insn;

/* 1 if the assembler should generate relax relocations.  */

static int generate_relax_relocations
  = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;

static enum check_kind
  {
    check_none = 0,
    check_warning,
    check_error
  }
sse_check, operand_check = check_warning;

/* Non-zero if branches should be aligned within power of 2 boundary.  */
static int align_branch_power = 0;

/* Types of branches to align.  */
enum align_branch_kind
  {
    align_branch_none = 0,
    align_branch_jcc = 1,
    align_branch_fused = 2,
    align_branch_jmp = 3,
    align_branch_call = 4,
    align_branch_indirect = 5,
    align_branch_ret = 6
  };

/* Type bits of branches to align.  */
enum align_branch_bit
  {
    align_branch_jcc_bit = 1 << align_branch_jcc,
    align_branch_fused_bit = 1 << align_branch_fused,
    align_branch_jmp_bit = 1 << align_branch_jmp,
    align_branch_call_bit = 1 << align_branch_call,
    align_branch_indirect_bit = 1 << align_branch_indirect,
    align_branch_ret_bit = 1 << align_branch_ret
  };

static unsigned int align_branch = (align_branch_jcc_bit
				    | align_branch_fused_bit
				    | align_branch_jmp_bit);

/* Types of condition jump used by macro-fusion.  */
enum mf_jcc_kind
  {
    mf_jcc_jo = 0,  /* base opcode 0x70  */
    mf_jcc_jc,      /* base opcode 0x72  */
    mf_jcc_je,      /* base opcode 0x74  */
    mf_jcc_jna,     /* base opcode 0x76  */
    mf_jcc_js,      /* base opcode 0x78  */
    mf_jcc_jp,      /* base opcode 0x7a  */
    mf_jcc_jl,      /* base opcode 0x7c  */
    mf_jcc_jle,     /* base opcode 0x7e  */
  };

/* Types of compare flag-modifying instructions used by macro-fusion.  */
enum mf_cmp_kind
  {
    mf_cmp_test_and, /* test/cmp */
    mf_cmp_alu_cmp,  /* add/sub/cmp */
    mf_cmp_incdec    /* inc/dec */
  };

/* The maximum padding size for fused jcc.  A CMP-like instruction can
   be 9 bytes and a jcc can be 6 bytes.  Leave room just in case for
   prefixes.  */
#define MAX_FUSED_JCC_PADDING_SIZE 20

/* The maximum number of prefixes added for an instruction.  */
static unsigned int align_branch_prefix_size = 5;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
 */
static int optimize = 0;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
   3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
      "testb $imm7,%r8".
 */
static int optimize_for_space = 0;

/* Register prefix used for error message.  */
static const char *register_prefix = "%";

/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
   leave, push, and pop instructions so that gcc has the same stack
   frame as in 32 bit mode.  */
static char stackop_size = '\0';

/* Non-zero to optimize code alignment.  */
int optimize_align_code = 1;

/* Non-zero to quieten some warnings.  */
static int quiet_warnings = 0;

/* CPU name.  */
static const char *cpu_arch_name = NULL;
static char *cpu_sub_arch_name = NULL;

/* CPU feature flags.  */
static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;

/* If we have selected a cpu we are generating instructions for.  */
static int cpu_arch_tune_set = 0;

/* Cpu we are generating instructions for.  */
enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;

/* CPU feature flags of cpu we are generating instructions for.  */
static i386_cpu_flags cpu_arch_tune_flags;

/* CPU instruction set architecture used.  */
enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;

/* CPU feature flags of instruction set architecture used.  */
i386_cpu_flags cpu_arch_isa_flags;

/* If set, conditional jumps are not automatically promoted to handle
   larger than a byte offset.  */
static unsigned int no_cond_jump_promotion = 0;

/* Encode SSE instructions with VEX prefix.  */
static unsigned int sse2avx;

/* Encode scalar AVX instructions with specific vector length.  */
static enum
  {
    vex128 = 0,
    vex256
  } avxscalar;

/* Encode VEX WIG instructions with specific vex.w.  */
static enum
  {
    vexw0 = 0,
    vexw1
  } vexwig;

/* Encode scalar EVEX LIG instructions with specific vector length.  */
static enum
  {
    evexl128 = 0,
    evexl256,
    evexl512
  } evexlig;

/* Encode EVEX WIG instructions with specific evex.w.  */
static enum
  {
    evexw0 = 0,
    evexw1
  } evexwig;

/* Value to encode in EVEX RC bits, for SAE-only instructions.  */
static enum rc_type evexrcig = rne;

/* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
static symbolS *GOT_symbol;

/* The dwarf2 return column, adjusted for 32 or 64 bit.  */
unsigned int x86_dwarf2_return_column;

/* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
int x86_cie_data_alignment;

/* Interface to relax_segment.
   There are 3 major relax states for 386 jump insns because the
   different types of jumps add different sizes to frags when we're
   figuring out what sort of jump to choose to reach a given label.

   BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
   branches which are handled by md_estimate_size_before_relax() and
   i386_generic_table_relax_frag().  */

/* Types.  */
#define UNCOND_JUMP 0
#define COND_JUMP 1
#define COND_JUMP86 2
#define BRANCH_PADDING 3
#define BRANCH_PREFIX 4
#define FUSED_JCC_PADDING 5

/* Sizes.  */
#define CODE16	1
#define SMALL	0
#define SMALL16 (SMALL | CODE16)
#define BIG	2
#define BIG16	(BIG | CODE16)

#ifndef INLINE
#ifdef __GNUC__
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

#define ENCODE_RELAX_STATE(type, size) \
  ((relax_substateT) (((type) << 2) | (size)))
#define TYPE_FROM_RELAX_STATE(s) \
  ((s) >> 2)
#define DISP_SIZE_FROM_RELAX_STATE(s) \
    ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
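
/* Worked example (the values follow directly from the macros above):
     ENCODE_RELAX_STATE (COND_JUMP, BIG) == (1 << 2) | 2 == 6
     TYPE_FROM_RELAX_STATE (6)           == COND_JUMP
     DISP_SIZE_FROM_RELAX_STATE (6)      == 4  (32-bit displacement)  */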

/* This table is used by relax_frag to promote short jumps to long
   ones where necessary.  SMALL (short) jumps may be promoted to BIG
   (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
   don't allow a short jump in a 32 bit code segment to be promoted to
   a 16 bit offset jump because it's slower (requires data size
   prefix), and doesn't work, unless the destination is in the bottom
   64k of the code segment (The top 16 bits of eip are zeroed).  */

const relax_typeS md_relax_table[] =
{
  /* The fields are:
     1) most positive reach of this state,
     2) most negative reach of this state,
     3) how many bytes this mode will have in the variable part of the frag
     4) which index into the table to try if we can't fit into this one.  */

  /* UNCOND_JUMP states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
  /* dword jmp adds 4 bytes to frag:
     0 extra opcode bytes, 4 displacement bytes.  */
  {0, 0, 4, 0},
  /* word jmp adds 2 bytes to frag:
     0 extra opcode bytes, 2 displacement bytes.  */
  {0, 0, 2, 0},

  /* COND_JUMP states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
  /* dword conditionals add 5 bytes to frag:
     1 extra opcode byte, 4 displacement bytes.  */
  {0, 0, 5, 0},
  /* word conditionals add 3 bytes to frag:
     1 extra opcode byte, 2 displacement bytes.  */
  {0, 0, 3, 0},

  /* COND_JUMP86 states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
  /* dword conditionals add 5 bytes to frag:
     1 extra opcode byte, 4 displacement bytes.  */
  {0, 0, 5, 0},
  /* word conditionals add 4 bytes to frag:
     1 displacement byte and a 3 byte long branch insn.  */
  {0, 0, 4, 0}
};

static const arch_entry cpu_arch[] =
{
  /* Do not replace the first two entries - i386_target_format()
     relies on them being there in this order.  */
  { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
    CPU_GENERIC32_FLAGS, 0 },
  { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
    CPU_GENERIC64_FLAGS, 0 },
  { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
    CPU_NONE_FLAGS, 0 },
  { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
    CPU_I186_FLAGS, 0 },
  { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
    CPU_I286_FLAGS, 0 },
  { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
    CPU_I386_FLAGS, 0 },
  { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
    CPU_I486_FLAGS, 0 },
  { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
    CPU_I586_FLAGS, 0 },
  { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
    CPU_I686_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
    CPU_I586_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
    CPU_PENTIUMPRO_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
    CPU_P2_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentiumiii"), PROCESSOR_PENTIUMPRO,
    CPU_P3_FLAGS, 0 },
  { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
    CPU_P4_FLAGS, 0 },
  { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
    CPU_CORE_FLAGS, 0 },
  { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
    CPU_NOCONA_FLAGS, 0 },
  { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
    CPU_CORE_FLAGS, 1 },
  { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
    CPU_CORE_FLAGS, 0 },
  { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
    CPU_CORE2_FLAGS, 1 },
  { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
    CPU_CORE2_FLAGS, 0 },
  { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
    CPU_COREI7_FLAGS, 0 },
  { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
    CPU_L1OM_FLAGS, 0 },
  { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
    CPU_K1OM_FLAGS, 0 },
  { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
    CPU_IAMCU_FLAGS, 0 },
  { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
    CPU_K6_FLAGS, 0 },
  { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
    CPU_K6_2_FLAGS, 0 },
  { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
    CPU_ATHLON_FLAGS, 0 },
  { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
    CPU_K8_FLAGS, 1 },
  { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
    CPU_K8_FLAGS, 0 },
  { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
    CPU_K8_FLAGS, 0 },
  { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
    CPU_AMDFAM10_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
    CPU_BDVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
    CPU_BDVER2_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
    CPU_BDVER3_FLAGS, 0 },
  { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
    CPU_BDVER4_FLAGS, 0 },
  { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
    CPU_ZNVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
    CPU_ZNVER2_FLAGS, 0 },
  { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
    CPU_BTVER1_FLAGS, 0 },
  { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
    CPU_BTVER2_FLAGS, 0 },
  { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
    CPU_8087_FLAGS, 0 },
  { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
    CPU_287_FLAGS, 0 },
  { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
    CPU_387_FLAGS, 0 },
  { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
    CPU_687_FLAGS, 0 },
  { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
    CPU_CMOV_FLAGS, 0 },
  { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
    CPU_FXSR_FLAGS, 0 },
  { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
    CPU_MMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
    CPU_SSE_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
    CPU_SSE2_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
    CPU_SSE3_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
    CPU_SSE4A_FLAGS, 0 },
  { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
    CPU_SSSE3_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
    CPU_SSE4_1_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
    CPU_SSE4_2_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
    CPU_SSE4_2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
    CPU_AVX_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
    CPU_AVX2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
    CPU_AVX512F_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
    CPU_AVX512CD_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
    CPU_AVX512ER_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
    CPU_AVX512PF_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
    CPU_AVX512DQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
    CPU_AVX512BW_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
    CPU_AVX512VL_FLAGS, 0 },
  { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
    CPU_VMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
    CPU_VMFUNC_FLAGS, 0 },
  { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
    CPU_SMX_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
    CPU_XSAVE_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
    CPU_XSAVEOPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
    CPU_XSAVEC_FLAGS, 0 },
  { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
    CPU_XSAVES_FLAGS, 0 },
  { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
    CPU_AES_FLAGS, 0 },
  { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
    CPU_PCLMUL_FLAGS, 0 },
  { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
    CPU_PCLMUL_FLAGS, 1 },
  { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
    CPU_FSGSBASE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
    CPU_RDRND_FLAGS, 0 },
  { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
    CPU_F16C_FLAGS, 0 },
  { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
    CPU_BMI2_FLAGS, 0 },
  { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
    CPU_FMA_FLAGS, 0 },
  { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
    CPU_FMA4_FLAGS, 0 },
  { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
    CPU_XOP_FLAGS, 0 },
  { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
    CPU_LWP_FLAGS, 0 },
  { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
    CPU_MOVBE_FLAGS, 0 },
  { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
    CPU_CX16_FLAGS, 0 },
  { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
    CPU_EPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
    CPU_LZCNT_FLAGS, 0 },
  { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
    CPU_POPCNT_FLAGS, 0 },
  { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
    CPU_HLE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
    CPU_RTM_FLAGS, 0 },
  { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
    CPU_INVPCID_FLAGS, 0 },
  { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
    CPU_CLFLUSH_FLAGS, 0 },
  { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
    CPU_NOP_FLAGS, 0 },
  { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
    CPU_SYSCALL_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
    CPU_RDTSCP_FLAGS, 0 },
  { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
    CPU_3DNOW_FLAGS, 0 },
  { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
    CPU_3DNOWA_FLAGS, 0 },
  { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
    CPU_PADLOCK_FLAGS, 0 },
  { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
    CPU_SVME_FLAGS, 1 },
  { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
    CPU_SVME_FLAGS, 0 },
  { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
    CPU_SSE4A_FLAGS, 0 },
  { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
    CPU_ABM_FLAGS, 0 },
  { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
    CPU_BMI_FLAGS, 0 },
  { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
    CPU_TBM_FLAGS, 0 },
  { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
    CPU_ADX_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
    CPU_RDSEED_FLAGS, 0 },
  { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
    CPU_PRFCHW_FLAGS, 0 },
  { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
    CPU_SMAP_FLAGS, 0 },
  { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
    CPU_MPX_FLAGS, 0 },
  { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
    CPU_SHA_FLAGS, 0 },
  { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
    CPU_CLFLUSHOPT_FLAGS, 0 },
  { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
    CPU_PREFETCHWT1_FLAGS, 0 },
  { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
    CPU_SE1_FLAGS, 0 },
  { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
    CPU_CLWB_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
    CPU_AVX512IFMA_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
    CPU_AVX512VBMI_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
    CPU_AVX512_4FMAPS_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
    CPU_AVX512_4VNNIW_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VBMI2_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VNNI_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
    CPU_AVX512_BITALG_FLAGS, 0 },
  { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
    CPU_CLZERO_FLAGS, 0 },
  { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
    CPU_MWAITX_FLAGS, 0 },
  { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
    CPU_OSPKE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
    CPU_RDPID_FLAGS, 0 },
  { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
    CPU_PTWRITE_FLAGS, 0 },
  { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
    CPU_IBT_FLAGS, 0 },
  { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
    CPU_SHSTK_FLAGS, 0 },
  { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
    CPU_GFNI_FLAGS, 0 },
  { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
    CPU_VAES_FLAGS, 0 },
  { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
    CPU_VPCLMULQDQ_FLAGS, 0 },
  { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
    CPU_WBNOINVD_FLAGS, 0 },
  { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
    CPU_PCONFIG_FLAGS, 0 },
  { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
    CPU_WAITPKG_FLAGS, 0 },
  { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
    CPU_CLDEMOTE_FLAGS, 0 },
  { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
    CPU_MOVDIRI_FLAGS, 0 },
  { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
    CPU_MOVDIR64B_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
    CPU_AVX512_BF16_FLAGS, 0 },
  { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
    CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
  { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
    CPU_ENQCMD_FLAGS, 0 },
  { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
    CPU_SERIALIZE_FLAGS, 0 },
  { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
    CPU_RDPRU_FLAGS, 0 },
  { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
    CPU_MCOMMIT_FLAGS, 0 },
  { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
    CPU_SEV_ES_FLAGS, 0 },
  { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
    CPU_TSXLDTRK_FLAGS, 0 },
};
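
/* This table backs the .arch directive (and -march=); e.g. (illustrative):
     .arch i686       selects a base architecture entry
     .arch .sse4.2    a leading-dot entry enables one extra feature
   on top of the current base architecture.  */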

static const noarch_entry cpu_noarch[] =
{
  { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
  { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
  { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
  { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
  { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
  { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
  { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
  { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
  { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
  { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
  { STRING_COMMA_LEN ("nosse4a"),  CPU_ANY_SSE4A_FLAGS },
  { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
  { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
  { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
  { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_1_FLAGS },
  { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
  { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
  { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
  { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
  { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
  { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
  { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
  { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
  { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
  { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
  { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
  { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
  { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
  { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
  { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
  { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
  { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
  { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
  { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
  { STRING_COMMA_LEN ("noavx512_vp2intersect"),
    CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
  { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
  { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
  { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
};

#ifdef I386COFF
/* Like s_lcomm_internal in gas/read.c but the alignment string
   is allowed to be optional.  */

static symbolS *
pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
{
  addressT align = 0;

  SKIP_WHITESPACE ();

  if (needs_align
      && *input_line_pointer == ',')
    {
      align = parse_align (needs_align - 1);

      if (align == (addressT) -1)
	return NULL;
    }
  else
    {
      if (size >= 8)
	align = 3;
      else if (size >= 4)
	align = 2;
      else if (size >= 2)
	align = 1;
      else
	align = 0;
    }

  bss_alloc (symbolP, size, align);
  return symbolP;
}

static void
pe_lcomm (int needs_align)
{
  s_comm_internal (needs_align * 2, pe_lcomm_internal);
}
#endif

const pseudo_typeS md_pseudo_table[] =
{
#if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
  {"align", s_align_bytes, 0},
#else
  {"align", s_align_ptwo, 0},
#endif
  {"arch", set_cpu_arch, 0},
#ifndef I386COFF
  {"bss", s_bss, 0},
#else
  {"lcomm", pe_lcomm, 1},
#endif
  {"ffloat", float_cons, 'f'},
  {"dfloat", float_cons, 'd'},
  {"tfloat", float_cons, 'x'},
  {"value", cons, 2},
  {"slong", signed_cons, 4},
  {"noopt", s_ignore, 0},
  {"optim", s_ignore, 0},
  {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
  {"code16", set_code_flag, CODE_16BIT},
  {"code32", set_code_flag, CODE_32BIT},
#ifdef BFD64
  {"code64", set_code_flag, CODE_64BIT},
#endif
  {"intel_syntax", set_intel_syntax, 1},
  {"att_syntax", set_intel_syntax, 0},
  {"intel_mnemonic", set_intel_mnemonic, 1},
  {"att_mnemonic", set_intel_mnemonic, 0},
  {"allow_index_reg", set_allow_index_reg, 1},
  {"disallow_index_reg", set_allow_index_reg, 0},
  {"sse_check", set_check, 0},
  {"operand_check", set_check, 1},
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  {"largecomm", handle_large_common, 0},
#else
  {"file", dwarf2_directive_file, 0},
  {"loc", dwarf2_directive_loc, 0},
  {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
#endif
#ifdef TE_PE
  {"secrel32", pe_directive_secrel, 0},
#endif
  {0, 0, 0}
};

/* For interface with expression ().  */
extern char *input_line_pointer;

/* Hash table for instruction mnemonic lookup.  */
static struct hash_control *op_hash;

/* Hash table for register lookup.  */
static struct hash_control *reg_hash;
\f
/* Various efficient no-op patterns for aligning code labels.
   Note: Don't try to assemble the instructions in the comments.
   0L and 0w are not legal.  */
static const unsigned char f32_1[] =
  {0x90};				/* nop			*/
static const unsigned char f32_2[] =
  {0x66,0x90};				/* xchg %ax,%ax		*/
static const unsigned char f32_3[] =
  {0x8d,0x76,0x00};			/* leal 0(%esi),%esi	*/
static const unsigned char f32_4[] =
  {0x8d,0x74,0x26,0x00};		/* leal 0(%esi,1),%esi	*/
static const unsigned char f32_6[] =
  {0x8d,0xb6,0x00,0x00,0x00,0x00};	/* leal 0L(%esi),%esi	*/
static const unsigned char f32_7[] =
  {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00};	/* leal 0L(%esi,1),%esi */
static const unsigned char f16_3[] =
  {0x8d,0x74,0x00};			/* lea 0(%si),%si	*/
static const unsigned char f16_4[] =
  {0x8d,0xb4,0x00,0x00};		/* lea 0W(%si),%si	*/
static const unsigned char jump_disp8[] =
  {0xeb};				/* jmp disp8	       */
static const unsigned char jump32_disp32[] =
  {0xe9};				/* jmp disp32	       */
static const unsigned char jump16_disp32[] =
  {0x66,0xe9};				/* jmp disp32	       */
/* 32-bit NOP patterns.  */
static const unsigned char *const f32_patt[] = {
  f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
};
/* 16-bit NOP patterns.  */
static const unsigned char *const f16_patt[] = {
  f32_1, f32_2, f16_3, f16_4
};
/* nopl (%[re]ax) */
static const unsigned char alt_3[] =
  {0x0f,0x1f,0x00};
/* nopl 0(%[re]ax) */
static const unsigned char alt_4[] =
  {0x0f,0x1f,0x40,0x00};
/* nopl 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_5[] =
  {0x0f,0x1f,0x44,0x00,0x00};
/* nopw 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_6[] =
  {0x66,0x0f,0x1f,0x44,0x00,0x00};
/* nopl 0L(%[re]ax) */
static const unsigned char alt_7[] =
  {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
/* nopl 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_8[] =
  {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* nopw 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_9[] =
  {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_10[] =
  {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* data16 nopw %cs:0L(%eax,%eax,1) */
static const unsigned char alt_11[] =
  {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* 32-bit and 64-bit NOP patterns.  */
static const unsigned char *const alt_patt[] = {
  f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
  alt_9, alt_10, alt_11
};

/* Generate COUNT bytes of NOPs to WHERE from PATT with the maximum
   size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */

static void
i386_output_nops (char *where, const unsigned char *const *patt,
		  int count, int max_single_nop_size)

{
  /* Place the longer NOP first.  */
  int last;
  int offset;
  const unsigned char *nops;

  if (max_single_nop_size < 1)
    {
      as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
		max_single_nop_size);
      return;
    }

  nops = patt[max_single_nop_size - 1];

  /* Use the smaller one if the requested one isn't available.  */
  if (nops == NULL)
    {
      max_single_nop_size--;
      nops = patt[max_single_nop_size - 1];
    }

  last = count % max_single_nop_size;

  count -= last;
  for (offset = 0; offset < count; offset += max_single_nop_size)
    memcpy (where + offset, nops, max_single_nop_size);

  if (last)
    {
      nops = patt[last - 1];
      if (nops == NULL)
	{
	  /* Use the smaller one plus one-byte NOP if the needed one
	     isn't available.  */
	  last--;
	  nops = patt[last - 1];
	  memcpy (where + offset, nops, last);
	  where[offset + last] = *patt[0];
	}
      else
	memcpy (where + offset, nops, last);
    }
}
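
/* Illustrative behavior: i386_output_nops (p, alt_patt, 11, 11) emits
   the 11-byte alt_11 pattern once, while a COUNT of 14 with the same
   limit emits alt_11 followed by the 3-byte alt_3 (14 % 11 == 3).  */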

static INLINE int
fits_in_imm7 (offsetT num)
{
  return (num & 0x7f) == num;
}

static INLINE int
fits_in_imm31 (offsetT num)
{
  return (num & 0x7fffffff) == num;
}
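
/* Note these helpers reject negative values as well as too-wide ones,
   since masking changes such values; e.g. fits_in_imm7 (127) is non-zero
   while fits_in_imm7 (128) and fits_in_imm7 (-1) are both zero.  */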

/* Generate COUNT bytes of NOPs to WHERE with the maximum size of a
   single NOP instruction LIMIT.  */

void
i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
{
  const unsigned char *const *patt = NULL;
  int max_single_nop_size;
  /* Maximum number of NOPs before switching to jump over NOPs.  */
  int max_number_of_nops;

  switch (fragP->fr_type)
    {
    case rs_fill_nop:
    case rs_align_code:
      break;
    case rs_machine_dependent:
      /* Allow NOP padding for jumps and calls.  */
      if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
	  || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
	break;
      /* Fall through.  */
    default:
      return;
    }

  /* We need to decide which NOP sequence to use for 32bit and
     64bit. When -mtune= is used:

     1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
     PROCESSOR_GENERIC32, f32_patt will be used.
     2. For the rest, alt_patt will be used.

     When -mtune= isn't used, alt_patt will be used if
     cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
     be used.

     When -march= or .arch is used, we can't use anything beyond
     cpu_arch_isa_flags.   */

  if (flag_code == CODE_16BIT)
    {
      patt = f16_patt;
      max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
      /* Limit number of NOPs to 2 in 16-bit mode.  */
      max_number_of_nops = 2;
    }
  else
    {
      if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
	{
	  /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
	  switch (cpu_arch_tune)
	    {
	    case PROCESSOR_UNKNOWN:
	      /* We use cpu_arch_isa_flags to check if we SHOULD
		 optimize with nops.  */
	      if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
		patt = alt_patt;
	      else
		patt = f32_patt;
	      break;
	    case PROCESSOR_PENTIUM4:
	    case PROCESSOR_NOCONA:
	    case PROCESSOR_CORE:
	    case PROCESSOR_CORE2:
	    case PROCESSOR_COREI7:
	    case PROCESSOR_L1OM:
	    case PROCESSOR_K1OM:
	    case PROCESSOR_GENERIC64:
	    case PROCESSOR_K6:
	    case PROCESSOR_ATHLON:
	    case PROCESSOR_K8:
	    case PROCESSOR_AMDFAM10:
	    case PROCESSOR_BD:
	    case PROCESSOR_ZNVER:
	    case PROCESSOR_BT:
	      patt = alt_patt;
	      break;
	    case PROCESSOR_I386:
	    case PROCESSOR_I486:
	    case PROCESSOR_PENTIUM:
	    case PROCESSOR_PENTIUMPRO:
	    case PROCESSOR_IAMCU:
	    case PROCESSOR_GENERIC32:
	      patt = f32_patt;
	      break;
	    }
	}
      else
	{
	  switch (fragP->tc_frag_data.tune)
	    {
	    case PROCESSOR_UNKNOWN:
	      /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
		 PROCESSOR_UNKNOWN.  */
	      abort ();
	      break;

	    case PROCESSOR_I386:
	    case PROCESSOR_I486:
	    case PROCESSOR_PENTIUM:
	    case PROCESSOR_IAMCU:
	    case PROCESSOR_K6:
	    case PROCESSOR_ATHLON:
	    case PROCESSOR_K8:
	    case PROCESSOR_AMDFAM10:
	    case PROCESSOR_BD:
	    case PROCESSOR_ZNVER:
	    case PROCESSOR_BT:
	    case PROCESSOR_GENERIC32:
	      /* We use cpu_arch_isa_flags to check if we CAN optimize
		 with nops.  */
	      if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
		patt = alt_patt;
	      else
		patt = f32_patt;
	      break;
	    case PROCESSOR_PENTIUMPRO:
	    case PROCESSOR_PENTIUM4:
	    case PROCESSOR_NOCONA:
	    case PROCESSOR_CORE:
	    case PROCESSOR_CORE2:
	    case PROCESSOR_COREI7:
	    case PROCESSOR_L1OM:
	    case PROCESSOR_K1OM:
	      if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
		patt = alt_patt;
	      else
		patt = f32_patt;
	      break;
	    case PROCESSOR_GENERIC64:
	      patt = alt_patt;
	      break;
	    }
	}

      if (patt == f32_patt)
	{
	  max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
	  /* Limit number of NOPs to 2 for older processors.  */
	  max_number_of_nops = 2;
	}
      else
	{
	  max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
	  /* Limit number of NOPs to 7 for newer processors.  */
	  max_number_of_nops = 7;
	}
    }

  if (limit == 0)
    limit = max_single_nop_size;

  if (fragP->fr_type == rs_fill_nop)
    {
      /* Output NOPs for .nop directive.  */
      if (limit > max_single_nop_size)
	{
	  as_bad_where (fragP->fr_file, fragP->fr_line,
			_("invalid single nop size: %d "
			  "(expect within [0, %d])"),
			limit, max_single_nop_size);
	  return;
	}
    }
  else if (fragP->fr_type != rs_machine_dependent)
    fragP->fr_var = count;

  if ((count / max_single_nop_size) > max_number_of_nops)
    {
      /* Generate jump over NOPs.  */
      offsetT disp = count - 2;
      if (fits_in_imm7 (disp))
	{
	  /* Use "jmp disp8" if possible.  */
	  count = disp;
	  where[0] = jump_disp8[0];
	  where[1] = count;
	  where += 2;
	}
      else
	{
	  unsigned int size_of_jump;

	  if (flag_code == CODE_16BIT)
	    {
	      where[0] = jump16_disp32[0];
	      where[1] = jump16_disp32[1];
	      size_of_jump = 2;
	    }
	  else
	    {
	      where[0] = jump32_disp32[0];
	      size_of_jump = 1;
	    }

	  count -= size_of_jump + 4;
	  if (!fits_in_imm31 (count))
	    {
	      as_bad_where (fragP->fr_file, fragP->fr_line,
			    _("jump over nop padding out of range"));
	      return;
	    }

	  md_number_to_chars (where + size_of_jump, count, 4);
	  where += size_of_jump + 4;
	}
    }

  /* Generate multiple NOPs.  */
  i386_output_nops (where, patt, count, limit);
}

static INLINE int
operand_type_all_zero (const union i386_operand_type *x)
{
  switch (ARRAY_SIZE(x->array))
    {
    case 3:
      if (x->array[2])
	return 0;
      /* Fall through.  */
    case 2:
      if (x->array[1])
	return 0;
      /* Fall through.  */
    case 1:
      return !x->array[0];
    default:
      abort ();
    }
}
1732
1733 static INLINE void
1734 operand_type_set (union i386_operand_type *x, unsigned int v)
1735 {
1736 switch (ARRAY_SIZE(x->array))
1737 {
1738 case 3:
1739 x->array[2] = v;
1740 /* Fall through. */
1741 case 2:
1742 x->array[1] = v;
1743 /* Fall through. */
1744 case 1:
1745 x->array[0] = v;
1746 /* Fall through. */
1747 break;
1748 default:
1749 abort ();
1750 }
1751
1752 x->bitfield.class = ClassNone;
1753 x->bitfield.instance = InstanceNone;
1754 }
1755
1756 static INLINE int
1757 operand_type_equal (const union i386_operand_type *x,
1758 const union i386_operand_type *y)
1759 {
1760 switch (ARRAY_SIZE(x->array))
1761 {
1762 case 3:
1763 if (x->array[2] != y->array[2])
1764 return 0;
1765 /* Fall through. */
1766 case 2:
1767 if (x->array[1] != y->array[1])
1768 return 0;
1769 /* Fall through. */
1770 case 1:
1771 return x->array[0] == y->array[0];
1773 default:
1774 abort ();
1775 }
1776 }
1777
1778 static INLINE int
1779 cpu_flags_all_zero (const union i386_cpu_flags *x)
1780 {
1781 switch (ARRAY_SIZE (x->array))
1782 {
1783 case 4:
1784 if (x->array[3])
1785 return 0;
1786 /* Fall through. */
1787 case 3:
1788 if (x->array[2])
1789 return 0;
1790 /* Fall through. */
1791 case 2:
1792 if (x->array[1])
1793 return 0;
1794 /* Fall through. */
1795 case 1:
1796 return !x->array[0];
1797 default:
1798 abort ();
1799 }
1800 }
1801
1802 static INLINE int
1803 cpu_flags_equal (const union i386_cpu_flags *x,
1804 const union i386_cpu_flags *y)
1805 {
1806 switch (ARRAY_SIZE (x->array))
1807 {
1808 case 4:
1809 if (x->array[3] != y->array[3])
1810 return 0;
1811 /* Fall through. */
1812 case 3:
1813 if (x->array[2] != y->array[2])
1814 return 0;
1815 /* Fall through. */
1816 case 2:
1817 if (x->array[1] != y->array[1])
1818 return 0;
1819 /* Fall through. */
1820 case 1:
1821 return x->array[0] == y->array[0];
1823 default:
1824 abort ();
1825 }
1826 }
1827
1828 static INLINE int
1829 cpu_flags_check_cpu64 (i386_cpu_flags f)
1830 {
1831 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1832 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1833 }
1834
1835 static INLINE i386_cpu_flags
1836 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1837 {
1838 switch (ARRAY_SIZE (x.array))
1839 {
1840 case 4:
1841 x.array [3] &= y.array [3];
1842 /* Fall through. */
1843 case 3:
1844 x.array [2] &= y.array [2];
1845 /* Fall through. */
1846 case 2:
1847 x.array [1] &= y.array [1];
1848 /* Fall through. */
1849 case 1:
1850 x.array [0] &= y.array [0];
1851 break;
1852 default:
1853 abort ();
1854 }
1855 return x;
1856 }
1857
1858 static INLINE i386_cpu_flags
1859 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1860 {
1861 switch (ARRAY_SIZE (x.array))
1862 {
1863 case 4:
1864 x.array [3] |= y.array [3];
1865 /* Fall through. */
1866 case 3:
1867 x.array [2] |= y.array [2];
1868 /* Fall through. */
1869 case 2:
1870 x.array [1] |= y.array [1];
1871 /* Fall through. */
1872 case 1:
1873 x.array [0] |= y.array [0];
1874 break;
1875 default:
1876 abort ();
1877 }
1878 return x;
1879 }
1880
1881 static INLINE i386_cpu_flags
1882 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1883 {
1884 switch (ARRAY_SIZE (x.array))
1885 {
1886 case 4:
1887 x.array [3] &= ~y.array [3];
1888 /* Fall through. */
1889 case 3:
1890 x.array [2] &= ~y.array [2];
1891 /* Fall through. */
1892 case 2:
1893 x.array [1] &= ~y.array [1];
1894 /* Fall through. */
1895 case 1:
1896 x.array [0] &= ~y.array [0];
1897 break;
1898 default:
1899 abort ();
1900 }
1901 return x;
1902 }
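
/* cpu_flags_and_not () is what the ".arch .no<ext>" handling in
   set_cpu_arch () below uses to strip an extension's feature bits
   from cpu_arch_flags. */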
1903
1904 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1905
1906 #define CPU_FLAGS_ARCH_MATCH 0x1
1907 #define CPU_FLAGS_64BIT_MATCH 0x2
1908
1909 #define CPU_FLAGS_PERFECT_MATCH \
1910 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1911
1912 /* Return CPU flags match bits. */
1913
1914 static int
1915 cpu_flags_match (const insn_template *t)
1916 {
1917 i386_cpu_flags x = t->cpu_flags;
1918 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1919
1920 x.bitfield.cpu64 = 0;
1921 x.bitfield.cpuno64 = 0;
1922
1923 if (cpu_flags_all_zero (&x))
1924 {
1925 /* This instruction is available on all archs. */
1926 match |= CPU_FLAGS_ARCH_MATCH;
1927 }
1928 else
1929 {
1930 /* This instruction is available only on some archs. */
1931 i386_cpu_flags cpu = cpu_arch_flags;
1932
1933 /* AVX512VL is not a standalone feature - match it and then strip it. */
1934 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1935 return match;
1936 x.bitfield.cpuavx512vl = 0;
1937
1938 cpu = cpu_flags_and (x, cpu);
1939 if (!cpu_flags_all_zero (&cpu))
1940 {
1941 if (x.bitfield.cpuavx)
1942 {
1943 /* We need to check a few extra flags with AVX. */
1944 if (cpu.bitfield.cpuavx
1945 && (!t->opcode_modifier.sse2avx || sse2avx)
1946 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1947 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1948 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1949 match |= CPU_FLAGS_ARCH_MATCH;
1950 }
1951 else if (x.bitfield.cpuavx512f)
1952 {
1953 /* We need to check a few extra flags with AVX512F. */
1954 if (cpu.bitfield.cpuavx512f
1955 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1956 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1957 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1958 match |= CPU_FLAGS_ARCH_MATCH;
1959 }
1960 else
1961 match |= CPU_FLAGS_ARCH_MATCH;
1962 }
1963 }
1964 return match;
1965 }
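
/* For example, a template carrying only CpuAVX2 gains
   CPU_FLAGS_ARCH_MATCH once cpu_arch_flags has cpuavx2 set, since
   cpu_flags_and () then yields a non-empty intersection.  The AVX
   and AVX512F special cases keep, e.g., VEX-encoded AES templates
   (CpuAVX|CpuAES) from matching when AVX is enabled but AES is not. */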
1966
1967 static INLINE i386_operand_type
1968 operand_type_and (i386_operand_type x, i386_operand_type y)
1969 {
1970 if (x.bitfield.class != y.bitfield.class)
1971 x.bitfield.class = ClassNone;
1972 if (x.bitfield.instance != y.bitfield.instance)
1973 x.bitfield.instance = InstanceNone;
1974
1975 switch (ARRAY_SIZE (x.array))
1976 {
1977 case 3:
1978 x.array [2] &= y.array [2];
1979 /* Fall through. */
1980 case 2:
1981 x.array [1] &= y.array [1];
1982 /* Fall through. */
1983 case 1:
1984 x.array [0] &= y.array [0];
1985 break;
1986 default:
1987 abort ();
1988 }
1989 return x;
1990 }
1991
1992 static INLINE i386_operand_type
1993 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1994 {
1995 gas_assert (y.bitfield.class == ClassNone);
1996 gas_assert (y.bitfield.instance == InstanceNone);
1997
1998 switch (ARRAY_SIZE (x.array))
1999 {
2000 case 3:
2001 x.array [2] &= ~y.array [2];
2002 /* Fall through. */
2003 case 2:
2004 x.array [1] &= ~y.array [1];
2005 /* Fall through. */
2006 case 1:
2007 x.array [0] &= ~y.array [0];
2008 break;
2009 default:
2010 abort ();
2011 }
2012 return x;
2013 }
2014
2015 static INLINE i386_operand_type
2016 operand_type_or (i386_operand_type x, i386_operand_type y)
2017 {
2018 gas_assert (x.bitfield.class == ClassNone ||
2019 y.bitfield.class == ClassNone ||
2020 x.bitfield.class == y.bitfield.class);
2021 gas_assert (x.bitfield.instance == InstanceNone ||
2022 y.bitfield.instance == InstanceNone ||
2023 x.bitfield.instance == y.bitfield.instance);
2024
2025 switch (ARRAY_SIZE (x.array))
2026 {
2027 case 3:
2028 x.array [2] |= y.array [2];
2029 /* Fall through. */
2030 case 2:
2031 x.array [1] |= y.array [1];
2032 /* Fall through. */
2033 case 1:
2034 x.array [0] |= y.array [0];
2035 break;
2036 default:
2037 abort ();
2038 }
2039 return x;
2040 }
2041
2042 static INLINE i386_operand_type
2043 operand_type_xor (i386_operand_type x, i386_operand_type y)
2044 {
2045 gas_assert (y.bitfield.class == ClassNone);
2046 gas_assert (y.bitfield.instance == InstanceNone);
2047
2048 switch (ARRAY_SIZE (x.array))
2049 {
2050 case 3:
2051 x.array [2] ^= y.array [2];
2052 /* Fall through. */
2053 case 2:
2054 x.array [1] ^= y.array [1];
2055 /* Fall through. */
2056 case 1:
2057 x.array [0] ^= y.array [0];
2058 break;
2059 default:
2060 abort ();
2061 }
2062 return x;
2063 }
2064
2065 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2066 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2067 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2068 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2069 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2070 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2071 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2072 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2073 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2074 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2075 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2076 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2077 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2078 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2079 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2080 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2081 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2082
2083 enum operand_type
2084 {
2085 reg,
2086 imm,
2087 disp,
2088 anymem
2089 };
2090
2091 static INLINE int
2092 operand_type_check (i386_operand_type t, enum operand_type c)
2093 {
2094 switch (c)
2095 {
2096 case reg:
2097 return t.bitfield.class == Reg;
2098
2099 case imm:
2100 return (t.bitfield.imm8
2101 || t.bitfield.imm8s
2102 || t.bitfield.imm16
2103 || t.bitfield.imm32
2104 || t.bitfield.imm32s
2105 || t.bitfield.imm64);
2106
2107 case disp:
2108 return (t.bitfield.disp8
2109 || t.bitfield.disp16
2110 || t.bitfield.disp32
2111 || t.bitfield.disp32s
2112 || t.bitfield.disp64);
2113
2114 case anymem:
2115 return (t.bitfield.disp8
2116 || t.bitfield.disp16
2117 || t.bitfield.disp32
2118 || t.bitfield.disp32s
2119 || t.bitfield.disp64
2120 || t.bitfield.baseindex);
2121
2122 default:
2123 abort ();
2124 }
2125
2126 return 0;
2127 }
2128
2129 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2130 between operand GIVEN and operand WANTED for instruction template T. */
2131
2132 static INLINE int
2133 match_operand_size (const insn_template *t, unsigned int wanted,
2134 unsigned int given)
2135 {
2136 return !((i.types[given].bitfield.byte
2137 && !t->operand_types[wanted].bitfield.byte)
2138 || (i.types[given].bitfield.word
2139 && !t->operand_types[wanted].bitfield.word)
2140 || (i.types[given].bitfield.dword
2141 && !t->operand_types[wanted].bitfield.dword)
2142 || (i.types[given].bitfield.qword
2143 && !t->operand_types[wanted].bitfield.qword)
2144 || (i.types[given].bitfield.tbyte
2145 && !t->operand_types[wanted].bitfield.tbyte));
2146 }
2147
2148 /* Return 1 if there is no conflict in SIMD register between operand
2149 GIVEN and operand WANTED for instruction template T. */
2150
2151 static INLINE int
2152 match_simd_size (const insn_template *t, unsigned int wanted,
2153 unsigned int given)
2154 {
2155 return !((i.types[given].bitfield.xmmword
2156 && !t->operand_types[wanted].bitfield.xmmword)
2157 || (i.types[given].bitfield.ymmword
2158 && !t->operand_types[wanted].bitfield.ymmword)
2159 || (i.types[given].bitfield.zmmword
2160 && !t->operand_types[wanted].bitfield.zmmword));
2161 }
2162
2163 /* Return 1 if there is no conflict in any size between operand GIVEN
2164 and operand WANTED for instruction template T. */
2165
2166 static INLINE int
2167 match_mem_size (const insn_template *t, unsigned int wanted,
2168 unsigned int given)
2169 {
2170 return (match_operand_size (t, wanted, given)
2171 && !((i.types[given].bitfield.unspecified
2172 && !i.broadcast
2173 && !t->operand_types[wanted].bitfield.unspecified)
2174 || (i.types[given].bitfield.fword
2175 && !t->operand_types[wanted].bitfield.fword)
2176 /* For scalar opcode templates to allow register and memory
2177 operands at the same time, some special casing is needed
2178 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2179 down-conversion vpmov*. */
2180 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2181 && t->operand_types[wanted].bitfield.byte
2182 + t->operand_types[wanted].bitfield.word
2183 + t->operand_types[wanted].bitfield.dword
2184 + t->operand_types[wanted].bitfield.qword
2185 > !!t->opcode_modifier.broadcast)
2186 ? (i.types[given].bitfield.xmmword
2187 || i.types[given].bitfield.ymmword
2188 || i.types[given].bitfield.zmmword)
2189 : !match_simd_size (t, wanted, given))));
2190 }
2191
2192 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2193 operands for instruction template T, and it has MATCH_REVERSE set if there
2194 is no size conflict on any operands for the template with operands reversed
2195 (and the template allows for reversing in the first place). */
2196
2197 #define MATCH_STRAIGHT 1
2198 #define MATCH_REVERSE 2
2199
2200 static INLINE unsigned int
2201 operand_size_match (const insn_template *t)
2202 {
2203 unsigned int j, match = MATCH_STRAIGHT;
2204
2205 /* Don't check non-absolute jump instructions. */
2206 if (t->opcode_modifier.jump
2207 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2208 return match;
2209
2210 /* Check memory and accumulator operand size. */
2211 for (j = 0; j < i.operands; j++)
2212 {
2213 if (i.types[j].bitfield.class != Reg
2214 && i.types[j].bitfield.class != RegSIMD
2215 && t->opcode_modifier.anysize)
2216 continue;
2217
2218 if (t->operand_types[j].bitfield.class == Reg
2219 && !match_operand_size (t, j, j))
2220 {
2221 match = 0;
2222 break;
2223 }
2224
2225 if (t->operand_types[j].bitfield.class == RegSIMD
2226 && !match_simd_size (t, j, j))
2227 {
2228 match = 0;
2229 break;
2230 }
2231
2232 if (t->operand_types[j].bitfield.instance == Accum
2233 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2234 {
2235 match = 0;
2236 break;
2237 }
2238
2239 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2240 {
2241 match = 0;
2242 break;
2243 }
2244 }
2245
2246 if (!t->opcode_modifier.d)
2247 {
2248 mismatch:
2249 if (!match)
2250 i.error = operand_size_mismatch;
2251 return match;
2252 }
2253
2254 /* Check reverse. */
2255 gas_assert (i.operands >= 2 && i.operands <= 3);
2256
2257 for (j = 0; j < i.operands; j++)
2258 {
2259 unsigned int given = i.operands - j - 1;
2260
2261 if (t->operand_types[j].bitfield.class == Reg
2262 && !match_operand_size (t, j, given))
2263 goto mismatch;
2264
2265 if (t->operand_types[j].bitfield.class == RegSIMD
2266 && !match_simd_size (t, j, given))
2267 goto mismatch;
2268
2269 if (t->operand_types[j].bitfield.instance == Accum
2270 && (!match_operand_size (t, j, given)
2271 || !match_simd_size (t, j, given)))
2272 goto mismatch;
2273
2274 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2275 goto mismatch;
2276 }
2277
2278 return match | MATCH_REVERSE;
2279 }
2280
2281 static INLINE int
2282 operand_type_match (i386_operand_type overlap,
2283 i386_operand_type given)
2284 {
2285 i386_operand_type temp = overlap;
2286
2287 temp.bitfield.unspecified = 0;
2288 temp.bitfield.byte = 0;
2289 temp.bitfield.word = 0;
2290 temp.bitfield.dword = 0;
2291 temp.bitfield.fword = 0;
2292 temp.bitfield.qword = 0;
2293 temp.bitfield.tbyte = 0;
2294 temp.bitfield.xmmword = 0;
2295 temp.bitfield.ymmword = 0;
2296 temp.bitfield.zmmword = 0;
2297 if (operand_type_all_zero (&temp))
2298 goto mismatch;
2299
2300 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2301 return 1;
2302
2303 mismatch:
2304 i.error = operand_type_mismatch;
2305 return 0;
2306 }
2307
2308 /* If the given types g0 and g1 are registers, they must be of the
2309 same type unless the expected operand type register overlap is null.
2310 Some Intel syntax memory operand size checking also happens here. */
2311
2312 static INLINE int
2313 operand_type_register_match (i386_operand_type g0,
2314 i386_operand_type t0,
2315 i386_operand_type g1,
2316 i386_operand_type t1)
2317 {
2318 if (g0.bitfield.class != Reg
2319 && g0.bitfield.class != RegSIMD
2320 && (!operand_type_check (g0, anymem)
2321 || g0.bitfield.unspecified
2322 || (t0.bitfield.class != Reg
2323 && t0.bitfield.class != RegSIMD)))
2324 return 1;
2325
2326 if (g1.bitfield.class != Reg
2327 && g1.bitfield.class != RegSIMD
2328 && (!operand_type_check (g1, anymem)
2329 || g1.bitfield.unspecified
2330 || (t1.bitfield.class != Reg
2331 && t1.bitfield.class != RegSIMD)))
2332 return 1;
2333
2334 if (g0.bitfield.byte == g1.bitfield.byte
2335 && g0.bitfield.word == g1.bitfield.word
2336 && g0.bitfield.dword == g1.bitfield.dword
2337 && g0.bitfield.qword == g1.bitfield.qword
2338 && g0.bitfield.xmmword == g1.bitfield.xmmword
2339 && g0.bitfield.ymmword == g1.bitfield.ymmword
2340 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2341 return 1;
2342
2343 if (!(t0.bitfield.byte & t1.bitfield.byte)
2344 && !(t0.bitfield.word & t1.bitfield.word)
2345 && !(t0.bitfield.dword & t1.bitfield.dword)
2346 && !(t0.bitfield.qword & t1.bitfield.qword)
2347 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2348 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2349 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2350 return 1;
2351
2352 i.error = register_type_mismatch;
2353
2354 return 0;
2355 }
2356
2357 static INLINE unsigned int
2358 register_number (const reg_entry *r)
2359 {
2360 unsigned int nr = r->reg_num;
2361
2362 if (r->reg_flags & RegRex)
2363 nr += 8;
2364
2365 if (r->reg_flags & RegVRex)
2366 nr += 16;
2367
2368 return nr;
2369 }
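
/* E.g. %r12 is reg_num 4 with RegRex set, giving 12; %xmm29 is
   reg_num 5 with both RegRex and RegVRex set, giving 5 + 8 + 16
   = 29 (the extra bits end up in REX/EVEX prefix fields). */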
2370
2371 static INLINE unsigned int
2372 mode_from_disp_size (i386_operand_type t)
2373 {
2374 if (t.bitfield.disp8)
2375 return 1;
2376 else if (t.bitfield.disp16
2377 || t.bitfield.disp32
2378 || t.bitfield.disp32s)
2379 return 2;
2380 else
2381 return 0;
2382 }
2383
2384 static INLINE int
2385 fits_in_signed_byte (addressT num)
2386 {
2387 return num + 0x80 <= 0xff;
2388 }
2389
2390 static INLINE int
2391 fits_in_unsigned_byte (addressT num)
2392 {
2393 return num <= 0xff;
2394 }
2395
2396 static INLINE int
2397 fits_in_unsigned_word (addressT num)
2398 {
2399 return num <= 0xffff;
2400 }
2401
2402 static INLINE int
2403 fits_in_signed_word (addressT num)
2404 {
2405 return num + 0x8000 <= 0xffff;
2406 }
2407
2408 static INLINE int
2409 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2410 {
2411 #ifndef BFD64
2412 return 1;
2413 #else
2414 return num + 0x80000000 <= 0xffffffff;
2415 #endif
2416 } /* fits_in_signed_long() */
2417
2418 static INLINE int
2419 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2420 {
2421 #ifndef BFD64
2422 return 1;
2423 #else
2424 return num <= 0xffffffff;
2425 #endif
2426 } /* fits_in_unsigned_long() */
2427
2428 static INLINE int
2429 fits_in_disp8 (offsetT num)
2430 {
2431 int shift = i.memshift;
2432 unsigned int mask;
2433
2434 if (shift == -1)
2435 abort ();
2436
2437 mask = (1 << shift) - 1;
2438
2439 /* Return 0 if NUM isn't properly aligned. */
2440 if ((num & mask))
2441 return 0;
2442
2443 /* Check if NUM will fit in 8bit after shift. */
2444 return fits_in_signed_byte (num >> shift);
2445 }
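
/* This is the EVEX disp8*N compressed displacement check: with
   i.memshift == 6 (a full 64-byte vector memory operand) a
   displacement of 0x100 is representable as the disp8 value 4
   (0x100 >> 6), while 0x90 is not 64-byte aligned and has to be
   emitted as disp32. */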
2446
2447 static INLINE int
2448 fits_in_imm4 (offsetT num)
2449 {
2450 return (num & 0xf) == num;
2451 }
2452
2453 static i386_operand_type
2454 smallest_imm_type (offsetT num)
2455 {
2456 i386_operand_type t;
2457
2458 operand_type_set (&t, 0);
2459 t.bitfield.imm64 = 1;
2460
2461 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2462 {
2463 /* This code is disabled on the 486 because all the Imm1 forms
2464 in the opcode table are slower on the i486. They're the
2465 versions with the implicitly specified single-position
2466 displacement, which has another syntax if you really want to
2467 use that form. */
2468 t.bitfield.imm1 = 1;
2469 t.bitfield.imm8 = 1;
2470 t.bitfield.imm8s = 1;
2471 t.bitfield.imm16 = 1;
2472 t.bitfield.imm32 = 1;
2473 t.bitfield.imm32s = 1;
2474 }
2475 else if (fits_in_signed_byte (num))
2476 {
2477 t.bitfield.imm8 = 1;
2478 t.bitfield.imm8s = 1;
2479 t.bitfield.imm16 = 1;
2480 t.bitfield.imm32 = 1;
2481 t.bitfield.imm32s = 1;
2482 }
2483 else if (fits_in_unsigned_byte (num))
2484 {
2485 t.bitfield.imm8 = 1;
2486 t.bitfield.imm16 = 1;
2487 t.bitfield.imm32 = 1;
2488 t.bitfield.imm32s = 1;
2489 }
2490 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2491 {
2492 t.bitfield.imm16 = 1;
2493 t.bitfield.imm32 = 1;
2494 t.bitfield.imm32s = 1;
2495 }
2496 else if (fits_in_signed_long (num))
2497 {
2498 t.bitfield.imm32 = 1;
2499 t.bitfield.imm32s = 1;
2500 }
2501 else if (fits_in_unsigned_long (num))
2502 t.bitfield.imm32 = 1;
2503
2504 return t;
2505 }
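
/* E.g. -1 fits in a signed byte and gets imm8, imm8s, imm16, imm32
   and imm32s; 0x1234 starts at imm16; 0x12345678 allows only
   imm32/imm32s (imm64 is always set above). */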
2506
2507 static offsetT
2508 offset_in_range (offsetT val, int size)
2509 {
2510 addressT mask;
2511
2512 switch (size)
2513 {
2514 case 1: mask = ((addressT) 1 << 8) - 1; break;
2515 case 2: mask = ((addressT) 1 << 16) - 1; break;
2516 case 4: mask = ((addressT) 2 << 31) - 1; break;
2517 #ifdef BFD64
2518 case 8: mask = ((addressT) 2 << 63) - 1; break;
2519 #endif
2520 default: abort ();
2521 }
2522
2523 #ifdef BFD64
2524 /* If BFD64, sign extend val for 32bit address mode. */
2525 if (flag_code != CODE_64BIT
2526 || i.prefix[ADDR_PREFIX])
2527 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2528 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2529 #endif
2530
2531 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2532 {
2533 char buf1[40], buf2[40];
2534
2535 sprint_value (buf1, val);
2536 sprint_value (buf2, val & mask);
2537 as_warn (_("%s shortened to %s"), buf1, buf2);
2538 }
2539 return val & mask;
2540 }
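
/* E.g. offset_in_range (0x123456, 2) warns that the value was
   shortened and returns 0x3456, since significant bits fall outside
   the 16-bit field. */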
2541
2542 enum PREFIX_GROUP
2543 {
2544 PREFIX_EXIST = 0,
2545 PREFIX_LOCK,
2546 PREFIX_REP,
2547 PREFIX_DS,
2548 PREFIX_OTHER
2549 };
2550
2551 /* Returns
2552 a. PREFIX_EXIST if attempting to add a prefix where one from the
2553 same class already exists.
2554 b. PREFIX_LOCK if lock prefix is added.
2555 c. PREFIX_REP if rep/repne prefix is added.
2556 d. PREFIX_DS if ds prefix is added.
2557 e. PREFIX_OTHER if other prefix is added.
2558 */
2559
2560 static enum PREFIX_GROUP
2561 add_prefix (unsigned int prefix)
2562 {
2563 enum PREFIX_GROUP ret = PREFIX_OTHER;
2564 unsigned int q;
2565
2566 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2567 && flag_code == CODE_64BIT)
2568 {
2569 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2570 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2571 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2572 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2573 ret = PREFIX_EXIST;
2574 q = REX_PREFIX;
2575 }
2576 else
2577 {
2578 switch (prefix)
2579 {
2580 default:
2581 abort ();
2582
2583 case DS_PREFIX_OPCODE:
2584 ret = PREFIX_DS;
2585 /* Fall through. */
2586 case CS_PREFIX_OPCODE:
2587 case ES_PREFIX_OPCODE:
2588 case FS_PREFIX_OPCODE:
2589 case GS_PREFIX_OPCODE:
2590 case SS_PREFIX_OPCODE:
2591 q = SEG_PREFIX;
2592 break;
2593
2594 case REPNE_PREFIX_OPCODE:
2595 case REPE_PREFIX_OPCODE:
2596 q = REP_PREFIX;
2597 ret = PREFIX_REP;
2598 break;
2599
2600 case LOCK_PREFIX_OPCODE:
2601 q = LOCK_PREFIX;
2602 ret = PREFIX_LOCK;
2603 break;
2604
2605 case FWAIT_OPCODE:
2606 q = WAIT_PREFIX;
2607 break;
2608
2609 case ADDR_PREFIX_OPCODE:
2610 q = ADDR_PREFIX;
2611 break;
2612
2613 case DATA_PREFIX_OPCODE:
2614 q = DATA_PREFIX;
2615 break;
2616 }
2617 if (i.prefix[q] != 0)
2618 ret = PREFIX_EXIST;
2619 }
2620
2621 if (ret)
2622 {
2623 if (!i.prefix[q])
2624 ++i.prefixes;
2625 i.prefix[q] |= prefix;
2626 }
2627 else
2628 as_bad (_("same type of prefix used twice"));
2629
2630 return ret;
2631 }
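
/* E.g. a second 0x66 (DATA_PREFIX_OPCODE) on the same insn yields
   PREFIX_EXIST and the "same type of prefix used twice" diagnostic,
   while REX prefixes in 64-bit mode are OR-ed together and only
   collide when an individual REX bit is set twice. */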
2632
2633 static void
2634 update_code_flag (int value, int check)
2635 {
2636 PRINTF_LIKE ((*as_error));
2637
2638 flag_code = (enum flag_code) value;
2639 if (flag_code == CODE_64BIT)
2640 {
2641 cpu_arch_flags.bitfield.cpu64 = 1;
2642 cpu_arch_flags.bitfield.cpuno64 = 0;
2643 }
2644 else
2645 {
2646 cpu_arch_flags.bitfield.cpu64 = 0;
2647 cpu_arch_flags.bitfield.cpuno64 = 1;
2648 }
2649 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2650 {
2651 if (check)
2652 as_error = as_fatal;
2653 else
2654 as_error = as_bad;
2655 (*as_error) (_("64bit mode not supported on `%s'."),
2656 cpu_arch_name ? cpu_arch_name : default_arch);
2657 }
2658 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2659 {
2660 if (check)
2661 as_error = as_fatal;
2662 else
2663 as_error = as_bad;
2664 (*as_error) (_("32bit mode not supported on `%s'."),
2665 cpu_arch_name ? cpu_arch_name : default_arch);
2666 }
2667 stackop_size = '\0';
2668 }
2669
2670 static void
2671 set_code_flag (int value)
2672 {
2673 update_code_flag (value, 0);
2674 }
2675
2676 static void
2677 set_16bit_gcc_code_flag (int new_code_flag)
2678 {
2679 flag_code = (enum flag_code) new_code_flag;
2680 if (flag_code != CODE_16BIT)
2681 abort ();
2682 cpu_arch_flags.bitfield.cpu64 = 0;
2683 cpu_arch_flags.bitfield.cpuno64 = 1;
2684 stackop_size = LONG_MNEM_SUFFIX;
2685 }
2686
2687 static void
2688 set_intel_syntax (int syntax_flag)
2689 {
2690 /* Find out if register prefixing is specified. */
2691 int ask_naked_reg = 0;
2692
2693 SKIP_WHITESPACE ();
2694 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2695 {
2696 char *string;
2697 int e = get_symbol_name (&string);
2698
2699 if (strcmp (string, "prefix") == 0)
2700 ask_naked_reg = 1;
2701 else if (strcmp (string, "noprefix") == 0)
2702 ask_naked_reg = -1;
2703 else
2704 as_bad (_("bad argument to syntax directive."));
2705 (void) restore_line_pointer (e);
2706 }
2707 demand_empty_rest_of_line ();
2708
2709 intel_syntax = syntax_flag;
2710
2711 if (ask_naked_reg == 0)
2712 allow_naked_reg = (intel_syntax
2713 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2714 else
2715 allow_naked_reg = (ask_naked_reg < 0);
2716
2717 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2718
2719 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2720 identifier_chars['$'] = intel_syntax ? '$' : 0;
2721 register_prefix = allow_naked_reg ? "" : "%";
2722 }
2723
2724 static void
2725 set_intel_mnemonic (int mnemonic_flag)
2726 {
2727 intel_mnemonic = mnemonic_flag;
2728 }
2729
2730 static void
2731 set_allow_index_reg (int flag)
2732 {
2733 allow_index_reg = flag;
2734 }
2735
2736 static void
2737 set_check (int what)
2738 {
2739 enum check_kind *kind;
2740 const char *str;
2741
2742 if (what)
2743 {
2744 kind = &operand_check;
2745 str = "operand";
2746 }
2747 else
2748 {
2749 kind = &sse_check;
2750 str = "sse";
2751 }
2752
2753 SKIP_WHITESPACE ();
2754
2755 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2756 {
2757 char *string;
2758 int e = get_symbol_name (&string);
2759
2760 if (strcmp (string, "none") == 0)
2761 *kind = check_none;
2762 else if (strcmp (string, "warning") == 0)
2763 *kind = check_warning;
2764 else if (strcmp (string, "error") == 0)
2765 *kind = check_error;
2766 else
2767 as_bad (_("bad argument to %s_check directive."), str);
2768 (void) restore_line_pointer (e);
2769 }
2770 else
2771 as_bad (_("missing argument for %s_check directive"), str);
2772
2773 demand_empty_rest_of_line ();
2774 }
2775
2776 static void
2777 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2778 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2779 {
2780 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2781 static const char *arch;
2782
2783 /* Intel MCU, L1OM and K1OM are only supported on ELF. */
2784 if (!IS_ELF)
2785 return;
2786
2787 if (!arch)
2788 {
2789 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2790 use default_arch. */
2791 arch = cpu_arch_name;
2792 if (!arch)
2793 arch = default_arch;
2794 }
2795
2796 /* If we are targeting Intel MCU, we must enable it. */
2797 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2798 || new_flag.bitfield.cpuiamcu)
2799 return;
2800
2801 /* If we are targeting Intel L1OM, we must enable it. */
2802 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2803 || new_flag.bitfield.cpul1om)
2804 return;
2805
2806 /* If we are targeting Intel K1OM, we must enable it. */
2807 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2808 || new_flag.bitfield.cpuk1om)
2809 return;
2810
2811 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2812 #endif
2813 }
2814
2815 static void
2816 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2817 {
2818 SKIP_WHITESPACE ();
2819
2820 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2821 {
2822 char *string;
2823 int e = get_symbol_name (&string);
2824 unsigned int j;
2825 i386_cpu_flags flags;
2826
2827 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2828 {
2829 if (strcmp (string, cpu_arch[j].name) == 0)
2830 {
2831 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2832
2833 if (*string != '.')
2834 {
2835 cpu_arch_name = cpu_arch[j].name;
2836 cpu_sub_arch_name = NULL;
2837 cpu_arch_flags = cpu_arch[j].flags;
2838 if (flag_code == CODE_64BIT)
2839 {
2840 cpu_arch_flags.bitfield.cpu64 = 1;
2841 cpu_arch_flags.bitfield.cpuno64 = 0;
2842 }
2843 else
2844 {
2845 cpu_arch_flags.bitfield.cpu64 = 0;
2846 cpu_arch_flags.bitfield.cpuno64 = 1;
2847 }
2848 cpu_arch_isa = cpu_arch[j].type;
2849 cpu_arch_isa_flags = cpu_arch[j].flags;
2850 if (!cpu_arch_tune_set)
2851 {
2852 cpu_arch_tune = cpu_arch_isa;
2853 cpu_arch_tune_flags = cpu_arch_isa_flags;
2854 }
2855 break;
2856 }
2857
2858 flags = cpu_flags_or (cpu_arch_flags,
2859 cpu_arch[j].flags);
2860
2861 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2862 {
2863 if (cpu_sub_arch_name)
2864 {
2865 char *name = cpu_sub_arch_name;
2866 cpu_sub_arch_name = concat (name,
2867 cpu_arch[j].name,
2868 (const char *) NULL);
2869 free (name);
2870 }
2871 else
2872 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2873 cpu_arch_flags = flags;
2874 cpu_arch_isa_flags = flags;
2875 }
2876 else
2877 cpu_arch_isa_flags
2878 = cpu_flags_or (cpu_arch_isa_flags,
2879 cpu_arch[j].flags);
2880 (void) restore_line_pointer (e);
2881 demand_empty_rest_of_line ();
2882 return;
2883 }
2884 }
2885
2886 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2887 {
2888 /* Disable an ISA extension. */
2889 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2890 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2891 {
2892 flags = cpu_flags_and_not (cpu_arch_flags,
2893 cpu_noarch[j].flags);
2894 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2895 {
2896 if (cpu_sub_arch_name)
2897 {
2898 char *name = cpu_sub_arch_name;
2899 cpu_sub_arch_name = concat (name, string,
2900 (const char *) NULL);
2901 free (name);
2902 }
2903 else
2904 cpu_sub_arch_name = xstrdup (string);
2905 cpu_arch_flags = flags;
2906 cpu_arch_isa_flags = flags;
2907 }
2908 (void) restore_line_pointer (e);
2909 demand_empty_rest_of_line ();
2910 return;
2911 }
2912
2913 j = ARRAY_SIZE (cpu_arch);
2914 }
2915
2916 if (j >= ARRAY_SIZE (cpu_arch))
2917 as_bad (_("no such architecture: `%s'"), string);
2918
2919 *input_line_pointer = e;
2920 }
2921 else
2922 as_bad (_("missing cpu architecture"));
2923
2924 no_cond_jump_promotion = 0;
2925 if (*input_line_pointer == ','
2926 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2927 {
2928 char *string;
2929 char e;
2930
2931 ++input_line_pointer;
2932 e = get_symbol_name (&string);
2933
2934 if (strcmp (string, "nojumps") == 0)
2935 no_cond_jump_promotion = 1;
2936 else if (strcmp (string, "jumps") == 0)
2937 ;
2938 else
2939 as_bad (_("no such architecture modifier: `%s'"), string);
2940
2941 (void) restore_line_pointer (e);
2942 }
2943
2944 demand_empty_rest_of_line ();
2945 }
2946
2947 enum bfd_architecture
2948 i386_arch (void)
2949 {
2950 if (cpu_arch_isa == PROCESSOR_L1OM)
2951 {
2952 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2953 || flag_code != CODE_64BIT)
2954 as_fatal (_("Intel L1OM is 64bit ELF only"));
2955 return bfd_arch_l1om;
2956 }
2957 else if (cpu_arch_isa == PROCESSOR_K1OM)
2958 {
2959 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2960 || flag_code != CODE_64BIT)
2961 as_fatal (_("Intel K1OM is 64bit ELF only"));
2962 return bfd_arch_k1om;
2963 }
2964 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2965 {
2966 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2967 || flag_code == CODE_64BIT)
2968 as_fatal (_("Intel MCU is 32bit ELF only"));
2969 return bfd_arch_iamcu;
2970 }
2971 else
2972 return bfd_arch_i386;
2973 }
2974
2975 unsigned long
2976 i386_mach (void)
2977 {
2978 if (!strncmp (default_arch, "x86_64", 6))
2979 {
2980 if (cpu_arch_isa == PROCESSOR_L1OM)
2981 {
2982 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2983 || default_arch[6] != '\0')
2984 as_fatal (_("Intel L1OM is 64bit ELF only"));
2985 return bfd_mach_l1om;
2986 }
2987 else if (cpu_arch_isa == PROCESSOR_K1OM)
2988 {
2989 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2990 || default_arch[6] != '\0')
2991 as_fatal (_("Intel K1OM is 64bit ELF only"));
2992 return bfd_mach_k1om;
2993 }
2994 else if (default_arch[6] == '\0')
2995 return bfd_mach_x86_64;
2996 else
2997 return bfd_mach_x64_32;
2998 }
2999 else if (!strcmp (default_arch, "i386")
3000 || !strcmp (default_arch, "iamcu"))
3001 {
3002 if (cpu_arch_isa == PROCESSOR_IAMCU)
3003 {
3004 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3005 as_fatal (_("Intel MCU is 32bit ELF only"));
3006 return bfd_mach_i386_iamcu;
3007 }
3008 else
3009 return bfd_mach_i386_i386;
3010 }
3011 else
3012 as_fatal (_("unknown architecture"));
3013 }
3014 \f
3015 void
3016 md_begin (void)
3017 {
3018 const char *hash_err;
3019
3020 /* Support pseudo prefixes like {disp32}. */
3021 lex_type ['{'] = LEX_BEGIN_NAME;
3022
3023 /* Initialize op_hash hash table. */
3024 op_hash = hash_new ();
3025
3026 {
3027 const insn_template *optab;
3028 templates *core_optab;
3029
3030 /* Setup for loop. */
3031 optab = i386_optab;
3032 core_optab = XNEW (templates);
3033 core_optab->start = optab;
3034
3035 while (1)
3036 {
3037 ++optab;
3038 if (optab->name == NULL
3039 || strcmp (optab->name, (optab - 1)->name) != 0)
3040 {
3041 /* different name --> ship out current template list;
3042 add to hash table; & begin anew. */
3043 core_optab->end = optab;
3044 hash_err = hash_insert (op_hash,
3045 (optab - 1)->name,
3046 (void *) core_optab);
3047 if (hash_err)
3048 {
3049 as_fatal (_("can't hash %s: %s"),
3050 (optab - 1)->name,
3051 hash_err);
3052 }
3053 if (optab->name == NULL)
3054 break;
3055 core_optab = XNEW (templates);
3056 core_optab->start = optab;
3057 }
3058 }
3059 }
3060
3061 /* Initialize reg_hash hash table. */
3062 reg_hash = hash_new ();
3063 {
3064 const reg_entry *regtab;
3065 unsigned int regtab_size = i386_regtab_size;
3066
3067 for (regtab = i386_regtab; regtab_size--; regtab++)
3068 {
3069 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3070 if (hash_err)
3071 as_fatal (_("can't hash %s: %s"),
3072 regtab->reg_name,
3073 hash_err);
3074 }
3075 }
3076
3077 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3078 {
3079 int c;
3080 char *p;
3081
3082 for (c = 0; c < 256; c++)
3083 {
3084 if (ISDIGIT (c))
3085 {
3086 digit_chars[c] = c;
3087 mnemonic_chars[c] = c;
3088 register_chars[c] = c;
3089 operand_chars[c] = c;
3090 }
3091 else if (ISLOWER (c))
3092 {
3093 mnemonic_chars[c] = c;
3094 register_chars[c] = c;
3095 operand_chars[c] = c;
3096 }
3097 else if (ISUPPER (c))
3098 {
3099 mnemonic_chars[c] = TOLOWER (c);
3100 register_chars[c] = mnemonic_chars[c];
3101 operand_chars[c] = c;
3102 }
3103 else if (c == '{' || c == '}')
3104 {
3105 mnemonic_chars[c] = c;
3106 operand_chars[c] = c;
3107 }
3108
3109 if (ISALPHA (c) || ISDIGIT (c))
3110 identifier_chars[c] = c;
3111 else if (c >= 128)
3112 {
3113 identifier_chars[c] = c;
3114 operand_chars[c] = c;
3115 }
3116 }
3117
3118 #ifdef LEX_AT
3119 identifier_chars['@'] = '@';
3120 #endif
3121 #ifdef LEX_QM
3122 identifier_chars['?'] = '?';
3123 operand_chars['?'] = '?';
3124 #endif
3125 digit_chars['-'] = '-';
3126 mnemonic_chars['_'] = '_';
3127 mnemonic_chars['-'] = '-';
3128 mnemonic_chars['.'] = '.';
3129 identifier_chars['_'] = '_';
3130 identifier_chars['.'] = '.';
3131
3132 for (p = operand_special_chars; *p != '\0'; p++)
3133 operand_chars[(unsigned char) *p] = *p;
3134 }
3135
3136 if (flag_code == CODE_64BIT)
3137 {
3138 #if defined (OBJ_COFF) && defined (TE_PE)
3139 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3140 ? 32 : 16);
3141 #else
3142 x86_dwarf2_return_column = 16;
3143 #endif
3144 x86_cie_data_alignment = -8;
3145 }
3146 else
3147 {
3148 x86_dwarf2_return_column = 8;
3149 x86_cie_data_alignment = -4;
3150 }
3151
3152 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3153 can be turned into BRANCH_PREFIX frag. */
3154 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3155 abort ();
3156 }
3157
3158 void
3159 i386_print_statistics (FILE *file)
3160 {
3161 hash_print_statistics (file, "i386 opcode", op_hash);
3162 hash_print_statistics (file, "i386 register", reg_hash);
3163 }
3164 \f
3165 #ifdef DEBUG386
3166
3167 /* Debugging routines for md_assemble. */
3168 static void pte (insn_template *);
3169 static void pt (i386_operand_type);
3170 static void pe (expressionS *);
3171 static void ps (symbolS *);
3172
3173 static void
3174 pi (const char *line, i386_insn *x)
3175 {
3176 unsigned int j;
3177
3178 fprintf (stdout, "%s: template ", line);
3179 pte (&x->tm);
3180 fprintf (stdout, " address: base %s index %s scale %x\n",
3181 x->base_reg ? x->base_reg->reg_name : "none",
3182 x->index_reg ? x->index_reg->reg_name : "none",
3183 x->log2_scale_factor);
3184 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3185 x->rm.mode, x->rm.reg, x->rm.regmem);
3186 fprintf (stdout, " sib: base %x index %x scale %x\n",
3187 x->sib.base, x->sib.index, x->sib.scale);
3188 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3189 (x->rex & REX_W) != 0,
3190 (x->rex & REX_R) != 0,
3191 (x->rex & REX_X) != 0,
3192 (x->rex & REX_B) != 0);
3193 for (j = 0; j < x->operands; j++)
3194 {
3195 fprintf (stdout, " #%d: ", j + 1);
3196 pt (x->types[j]);
3197 fprintf (stdout, "\n");
3198 if (x->types[j].bitfield.class == Reg
3199 || x->types[j].bitfield.class == RegMMX
3200 || x->types[j].bitfield.class == RegSIMD
3201 || x->types[j].bitfield.class == SReg
3202 || x->types[j].bitfield.class == RegCR
3203 || x->types[j].bitfield.class == RegDR
3204 || x->types[j].bitfield.class == RegTR)
3205 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3206 if (operand_type_check (x->types[j], imm))
3207 pe (x->op[j].imms);
3208 if (operand_type_check (x->types[j], disp))
3209 pe (x->op[j].disps);
3210 }
3211 }
3212
3213 static void
3214 pte (insn_template *t)
3215 {
3216 unsigned int j;
3217 fprintf (stdout, " %d operands ", t->operands);
3218 fprintf (stdout, "opcode %x ", t->base_opcode);
3219 if (t->extension_opcode != None)
3220 fprintf (stdout, "ext %x ", t->extension_opcode);
3221 if (t->opcode_modifier.d)
3222 fprintf (stdout, "D");
3223 if (t->opcode_modifier.w)
3224 fprintf (stdout, "W");
3225 fprintf (stdout, "\n");
3226 for (j = 0; j < t->operands; j++)
3227 {
3228 fprintf (stdout, " #%d type ", j + 1);
3229 pt (t->operand_types[j]);
3230 fprintf (stdout, "\n");
3231 }
3232 }
3233
3234 static void
3235 pe (expressionS *e)
3236 {
3237 fprintf (stdout, " operation %d\n", e->X_op);
3238 fprintf (stdout, " add_number %ld (%lx)\n",
3239 (long) e->X_add_number, (long) e->X_add_number);
3240 if (e->X_add_symbol)
3241 {
3242 fprintf (stdout, " add_symbol ");
3243 ps (e->X_add_symbol);
3244 fprintf (stdout, "\n");
3245 }
3246 if (e->X_op_symbol)
3247 {
3248 fprintf (stdout, " op_symbol ");
3249 ps (e->X_op_symbol);
3250 fprintf (stdout, "\n");
3251 }
3252 }
3253
3254 static void
3255 ps (symbolS *s)
3256 {
3257 fprintf (stdout, "%s type %s%s",
3258 S_GET_NAME (s),
3259 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3260 segment_name (S_GET_SEGMENT (s)));
3261 }
3262
3263 static struct type_name
3264 {
3265 i386_operand_type mask;
3266 const char *name;
3267 }
3268 const type_names[] =
3269 {
3270 { OPERAND_TYPE_REG8, "r8" },
3271 { OPERAND_TYPE_REG16, "r16" },
3272 { OPERAND_TYPE_REG32, "r32" },
3273 { OPERAND_TYPE_REG64, "r64" },
3274 { OPERAND_TYPE_ACC8, "acc8" },
3275 { OPERAND_TYPE_ACC16, "acc16" },
3276 { OPERAND_TYPE_ACC32, "acc32" },
3277 { OPERAND_TYPE_ACC64, "acc64" },
3278 { OPERAND_TYPE_IMM8, "i8" },
3279 { OPERAND_TYPE_IMM8, "i8s" },
3280 { OPERAND_TYPE_IMM16, "i16" },
3281 { OPERAND_TYPE_IMM32, "i32" },
3282 { OPERAND_TYPE_IMM32S, "i32s" },
3283 { OPERAND_TYPE_IMM64, "i64" },
3284 { OPERAND_TYPE_IMM1, "i1" },
3285 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3286 { OPERAND_TYPE_DISP8, "d8" },
3287 { OPERAND_TYPE_DISP16, "d16" },
3288 { OPERAND_TYPE_DISP32, "d32" },
3289 { OPERAND_TYPE_DISP32S, "d32s" },
3290 { OPERAND_TYPE_DISP64, "d64" },
3291 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3292 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3293 { OPERAND_TYPE_CONTROL, "control reg" },
3294 { OPERAND_TYPE_TEST, "test reg" },
3295 { OPERAND_TYPE_DEBUG, "debug reg" },
3296 { OPERAND_TYPE_FLOATREG, "FReg" },
3297 { OPERAND_TYPE_FLOATACC, "FAcc" },
3298 { OPERAND_TYPE_SREG, "SReg" },
3299 { OPERAND_TYPE_REGMMX, "rMMX" },
3300 { OPERAND_TYPE_REGXMM, "rXMM" },
3301 { OPERAND_TYPE_REGYMM, "rYMM" },
3302 { OPERAND_TYPE_REGZMM, "rZMM" },
3303 { OPERAND_TYPE_REGMASK, "Mask reg" },
3304 };
3305
3306 static void
3307 pt (i386_operand_type t)
3308 {
3309 unsigned int j;
3310 i386_operand_type a;
3311
3312 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3313 {
3314 a = operand_type_and (t, type_names[j].mask);
3315 if (operand_type_equal (&a, &type_names[j].mask))
3316 fprintf (stdout, "%s, ", type_names[j].name);
3317 }
3318 fflush (stdout);
3319 }
3320
3321 #endif /* DEBUG386 */
3322 \f
3323 static bfd_reloc_code_real_type
3324 reloc (unsigned int size,
3325 int pcrel,
3326 int sign,
3327 bfd_reloc_code_real_type other)
3328 {
3329 if (other != NO_RELOC)
3330 {
3331 reloc_howto_type *rel;
3332
3333 if (size == 8)
3334 switch (other)
3335 {
3336 case BFD_RELOC_X86_64_GOT32:
3337 return BFD_RELOC_X86_64_GOT64;
3339 case BFD_RELOC_X86_64_GOTPLT64:
3340 return BFD_RELOC_X86_64_GOTPLT64;
3342 case BFD_RELOC_X86_64_PLTOFF64:
3343 return BFD_RELOC_X86_64_PLTOFF64;
3345 case BFD_RELOC_X86_64_GOTPC32:
3346 other = BFD_RELOC_X86_64_GOTPC64;
3347 break;
3348 case BFD_RELOC_X86_64_GOTPCREL:
3349 other = BFD_RELOC_X86_64_GOTPCREL64;
3350 break;
3351 case BFD_RELOC_X86_64_TPOFF32:
3352 other = BFD_RELOC_X86_64_TPOFF64;
3353 break;
3354 case BFD_RELOC_X86_64_DTPOFF32:
3355 other = BFD_RELOC_X86_64_DTPOFF64;
3356 break;
3357 default:
3358 break;
3359 }
3360
3361 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3362 if (other == BFD_RELOC_SIZE32)
3363 {
3364 if (size == 8)
3365 other = BFD_RELOC_SIZE64;
3366 if (pcrel)
3367 {
3368 as_bad (_("there are no pc-relative size relocations"));
3369 return NO_RELOC;
3370 }
3371 }
3372 #endif
3373
3374 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3375 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3376 sign = -1;
3377
3378 rel = bfd_reloc_type_lookup (stdoutput, other);
3379 if (!rel)
3380 as_bad (_("unknown relocation (%u)"), other);
3381 else if (size != bfd_get_reloc_size (rel))
3382 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3383 bfd_get_reloc_size (rel),
3384 size);
3385 else if (pcrel && !rel->pc_relative)
3386 as_bad (_("non-pc-relative relocation for pc-relative field"));
3387 else if ((rel->complain_on_overflow == complain_overflow_signed
3388 && !sign)
3389 || (rel->complain_on_overflow == complain_overflow_unsigned
3390 && sign > 0))
3391 as_bad (_("relocated field and relocation type differ in signedness"));
3392 else
3393 return other;
3394 return NO_RELOC;
3395 }
3396
3397 if (pcrel)
3398 {
3399 if (!sign)
3400 as_bad (_("there are no unsigned pc-relative relocations"));
3401 switch (size)
3402 {
3403 case 1: return BFD_RELOC_8_PCREL;
3404 case 2: return BFD_RELOC_16_PCREL;
3405 case 4: return BFD_RELOC_32_PCREL;
3406 case 8: return BFD_RELOC_64_PCREL;
3407 }
3408 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3409 }
3410 else
3411 {
3412 if (sign > 0)
3413 switch (size)
3414 {
3415 case 4: return BFD_RELOC_X86_64_32S;
3416 }
3417 else
3418 switch (size)
3419 {
3420 case 1: return BFD_RELOC_8;
3421 case 2: return BFD_RELOC_16;
3422 case 4: return BFD_RELOC_32;
3423 case 8: return BFD_RELOC_64;
3424 }
3425 as_bad (_("cannot do %s %u byte relocation"),
3426 sign > 0 ? "signed" : "unsigned", size);
3427 }
3428
3429 return NO_RELOC;
3430 }
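
/* With no override the choice is purely size/sign based, e.g.
   reloc (4, 1, 1, NO_RELOC) gives BFD_RELOC_32_PCREL and
   reloc (4, 0, 1, NO_RELOC) gives BFD_RELOC_X86_64_32S; an explicit
   @gotpcrel etc. arrives in OTHER and is widened to its 64-bit
   counterpart for 8-byte fields. */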
3431
3432 /* Here we decide which fixups can be adjusted to make them relative to
3433 the beginning of the section instead of the symbol. Basically we need
3434 to make sure that the dynamic relocations are done correctly, so in
3435 some cases we force the original symbol to be used. */
3436
3437 int
3438 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3439 {
3440 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3441 if (!IS_ELF)
3442 return 1;
3443
3444 /* Don't adjust pc-relative references to merge sections in 64-bit
3445 mode. */
3446 if (use_rela_relocations
3447 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3448 && fixP->fx_pcrel)
3449 return 0;
3450
3451 /* The x86_64 GOTPCREL relocations are represented as 32bit PCrel relocations
3452 and changed later by validate_fix. */
3453 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3454 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3455 return 0;
3456
3457 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3458 for size relocations. */
3459 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3460 || fixP->fx_r_type == BFD_RELOC_SIZE64
3461 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3462 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3463 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3464 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3465 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3466 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3467 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3468 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3469 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3470 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3471 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3472 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3473 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3474 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3475 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3476 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3477 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3478 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3479 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3480 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3481 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3482 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3483 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3484 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3485 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3486 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3487 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3488 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3489 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3490 return 0;
3491 #endif
3492 return 1;
3493 }
3494
3495 static int
3496 intel_float_operand (const char *mnemonic)
3497 {
3498 /* Note that the value returned is meaningful only for opcodes with (memory)
3499 operands, hence the code here is free to improperly handle opcodes that
3500 have no operands (for better performance and smaller code). */
3501
3502 if (mnemonic[0] != 'f')
3503 return 0; /* non-math */
3504
3505 switch (mnemonic[1])
3506 {
3507 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3508 the fs segment override prefix are not currently handled, because
3509 no call path can make opcodes without operands get here. */
3510 case 'i':
3511 return 2 /* integer op */;
3512 case 'l':
3513 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3514 return 3; /* fldcw/fldenv */
3515 break;
3516 case 'n':
3517 if (mnemonic[2] != 'o' /* fnop */)
3518 return 3; /* non-waiting control op */
3519 break;
3520 case 'r':
3521 if (mnemonic[2] == 's')
3522 return 3; /* frstor/frstpm */
3523 break;
3524 case 's':
3525 if (mnemonic[2] == 'a')
3526 return 3; /* fsave */
3527 if (mnemonic[2] == 't')
3528 {
3529 switch (mnemonic[3])
3530 {
3531 case 'c': /* fstcw */
3532 case 'd': /* fstdw */
3533 case 'e': /* fstenv */
3534 case 's': /* fsts[gw] */
3535 return 3;
3536 }
3537 }
3538 break;
3539 case 'x':
3540 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3541 return 0; /* fxsave/fxrstor are not really math ops */
3542 break;
3543 }
3544
3545 return 1;
3546 }
3547
3548 /* Build the VEX prefix. */
3549
3550 static void
3551 build_vex_prefix (const insn_template *t)
3552 {
3553 unsigned int register_specifier;
3554 unsigned int implied_prefix;
3555 unsigned int vector_length;
3556 unsigned int w;
3557
3558 /* Check register specifier. */
3559 if (i.vex.register_specifier)
3560 {
3561 register_specifier =
3562 ~register_number (i.vex.register_specifier) & 0xf;
3563 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3564 }
3565 else
3566 register_specifier = 0xf;
3567
3568 /* Use 2-byte VEX prefix by swapping destination and source operand
3569 if there is more than one register operand. */
3570 if (i.reg_operands > 1
3571 && i.vec_encoding != vex_encoding_vex3
3572 && i.dir_encoding == dir_encoding_default
3573 && i.operands == i.reg_operands
3574 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3575 && i.tm.opcode_modifier.vexopcode == VEX0F
3576 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3577 && i.rex == REX_B)
3578 {
3579 unsigned int xchg = i.operands - 1;
3580 union i386_op temp_op;
3581 i386_operand_type temp_type;
3582
3583 temp_type = i.types[xchg];
3584 i.types[xchg] = i.types[0];
3585 i.types[0] = temp_type;
3586 temp_op = i.op[xchg];
3587 i.op[xchg] = i.op[0];
3588 i.op[0] = temp_op;
3589
3590 gas_assert (i.rm.mode == 3);
3591
3592 i.rex = REX_R;
3593 xchg = i.rm.regmem;
3594 i.rm.regmem = i.rm.reg;
3595 i.rm.reg = xchg;
3596
3597 if (i.tm.opcode_modifier.d)
3598 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3599 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3600 else /* Use the next insn. */
3601 i.tm = t[1];
3602 }
3603
3604 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3605 are no memory operands and at least 3 register ones. */
3606 if (i.reg_operands >= 3
3607 && i.vec_encoding != vex_encoding_vex3
3608 && i.reg_operands == i.operands - i.imm_operands
3609 && i.tm.opcode_modifier.vex
3610 && i.tm.opcode_modifier.commutative
3611 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3612 && i.rex == REX_B
3613 && i.vex.register_specifier
3614 && !(i.vex.register_specifier->reg_flags & RegRex))
3615 {
3616 unsigned int xchg = i.operands - i.reg_operands;
3617 union i386_op temp_op;
3618 i386_operand_type temp_type;
3619
3620 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3621 gas_assert (!i.tm.opcode_modifier.sae);
3622 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3623 &i.types[i.operands - 3]));
3624 gas_assert (i.rm.mode == 3);
3625
3626 temp_type = i.types[xchg];
3627 i.types[xchg] = i.types[xchg + 1];
3628 i.types[xchg + 1] = temp_type;
3629 temp_op = i.op[xchg];
3630 i.op[xchg] = i.op[xchg + 1];
3631 i.op[xchg + 1] = temp_op;
3632
3633 i.rex = 0;
3634 xchg = i.rm.regmem | 8;
3635 i.rm.regmem = ~register_specifier & 0xf;
3636 gas_assert (!(i.rm.regmem & 8));
3637 i.vex.register_specifier += xchg - i.rm.regmem;
3638 register_specifier = ~xchg & 0xf;
3639 }
3640
3641 if (i.tm.opcode_modifier.vex == VEXScalar)
3642 vector_length = avxscalar;
3643 else if (i.tm.opcode_modifier.vex == VEX256)
3644 vector_length = 1;
3645 else
3646 {
3647 unsigned int op;
3648
3649 /* Determine vector length from the last multi-length vector
3650 operand. */
3651 vector_length = 0;
3652 for (op = t->operands; op--;)
3653 if (t->operand_types[op].bitfield.xmmword
3654 && t->operand_types[op].bitfield.ymmword
3655 && i.types[op].bitfield.ymmword)
3656 {
3657 vector_length = 1;
3658 break;
3659 }
3660 }
3661
3662 switch ((i.tm.base_opcode >> 8) & 0xff)
3663 {
3664 case 0:
3665 implied_prefix = 0;
3666 break;
3667 case DATA_PREFIX_OPCODE:
3668 implied_prefix = 1;
3669 break;
3670 case REPE_PREFIX_OPCODE:
3671 implied_prefix = 2;
3672 break;
3673 case REPNE_PREFIX_OPCODE:
3674 implied_prefix = 3;
3675 break;
3676 default:
3677 abort ();
3678 }
3679
3680 /* Check the REX.W bit and VEXW. */
3681 if (i.tm.opcode_modifier.vexw == VEXWIG)
3682 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3683 else if (i.tm.opcode_modifier.vexw)
3684 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3685 else
3686 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3687
3688 /* Use 2-byte VEX prefix if possible. */
3689 if (w == 0
3690 && i.vec_encoding != vex_encoding_vex3
3691 && i.tm.opcode_modifier.vexopcode == VEX0F
3692 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3693 {
3694 /* 2-byte VEX prefix. */
3695 unsigned int r;
3696
3697 i.vex.length = 2;
3698 i.vex.bytes[0] = 0xc5;
3699
3700 /* Check the REX.R bit. */
3701 r = (i.rex & REX_R) ? 0 : 1;
3702 i.vex.bytes[1] = (r << 7
3703 | register_specifier << 3
3704 | vector_length << 2
3705 | implied_prefix);
3706 }
3707 else
3708 {
3709 /* 3-byte VEX prefix. */
3710 unsigned int m;
3711
3712 i.vex.length = 3;
3713
3714 switch (i.tm.opcode_modifier.vexopcode)
3715 {
3716 case VEX0F:
3717 m = 0x1;
3718 i.vex.bytes[0] = 0xc4;
3719 break;
3720 case VEX0F38:
3721 m = 0x2;
3722 i.vex.bytes[0] = 0xc4;
3723 break;
3724 case VEX0F3A:
3725 m = 0x3;
3726 i.vex.bytes[0] = 0xc4;
3727 break;
3728 case XOP08:
3729 m = 0x8;
3730 i.vex.bytes[0] = 0x8f;
3731 break;
3732 case XOP09:
3733 m = 0x9;
3734 i.vex.bytes[0] = 0x8f;
3735 break;
3736 case XOP0A:
3737 m = 0xa;
3738 i.vex.bytes[0] = 0x8f;
3739 break;
3740 default:
3741 abort ();
3742 }
3743
3744 /* The high 3 bits of the second VEX byte are 1's complement
3745 of RXB bits from REX. */
3746 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3747
3748 i.vex.bytes[2] = (w << 7
3749 | register_specifier << 3
3750 | vector_length << 2
3751 | implied_prefix);
3752 }
3753 }
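
/* The resulting prefix layouts (vvvv, R, X and B stored inverted):

     2-byte: 0xc5 | R vvvv L pp |
     3-byte: 0xc4/0x8f | R X B m-mmmm | W vvvv L pp |

   pp encodes the implied 66/f3/f2 prefix, m-mmmm the 0f/0f38/0f3a
   (or XOP) opcode map, and L selects 128- vs 256-bit vectors. */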
3754
3755 static INLINE bfd_boolean
3756 is_evex_encoding (const insn_template *t)
3757 {
3758 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3759 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3760 || t->opcode_modifier.sae;
3761 }
3762
3763 static INLINE bfd_boolean
3764 is_any_vex_encoding (const insn_template *t)
3765 {
3766 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3767 || is_evex_encoding (t);
3768 }
3769
3770 /* Build the EVEX prefix. */
3771
3772 static void
3773 build_evex_prefix (void)
3774 {
3775 unsigned int register_specifier;
3776 unsigned int implied_prefix;
3777 unsigned int m, w;
3778 rex_byte vrex_used = 0;
3779
3780 /* Check register specifier. */
3781 if (i.vex.register_specifier)
3782 {
3783 gas_assert ((i.vrex & REX_X) == 0);
3784
3785 register_specifier = i.vex.register_specifier->reg_num;
3786 if ((i.vex.register_specifier->reg_flags & RegRex))
3787 register_specifier += 8;
3788 /* The upper 16 registers are encoded in the fourth byte of the
3789 EVEX prefix. */
3790 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3791 i.vex.bytes[3] = 0x8;
3792 register_specifier = ~register_specifier & 0xf;
3793 }
3794 else
3795 {
3796 register_specifier = 0xf;
3797
3798 /* Encode upper 16 vector index register in the fourth byte of
3799 the EVEX prefix. */
3800 if (!(i.vrex & REX_X))
3801 i.vex.bytes[3] = 0x8;
3802 else
3803 vrex_used |= REX_X;
3804 }
3805
3806 switch ((i.tm.base_opcode >> 8) & 0xff)
3807 {
3808 case 0:
3809 implied_prefix = 0;
3810 break;
3811 case DATA_PREFIX_OPCODE:
3812 implied_prefix = 1;
3813 break;
3814 case REPE_PREFIX_OPCODE:
3815 implied_prefix = 2;
3816 break;
3817 case REPNE_PREFIX_OPCODE:
3818 implied_prefix = 3;
3819 break;
3820 default:
3821 abort ();
3822 }
3823
3824 /* 4 byte EVEX prefix. */
3825 i.vex.length = 4;
3826 i.vex.bytes[0] = 0x62;
3827
3828 /* mmmm bits. */
3829 switch (i.tm.opcode_modifier.vexopcode)
3830 {
3831 case VEX0F:
3832 m = 1;
3833 break;
3834 case VEX0F38:
3835 m = 2;
3836 break;
3837 case VEX0F3A:
3838 m = 3;
3839 break;
3840 default:
3841 abort ();
3843 }
3844
3845 /* The high 3 bits of the second EVEX byte are 1's complement of RXB
3846 bits from REX. */
3847 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3848
3849 /* The fifth bit of the second EVEX byte is 1's complement of the
3850 REX_R bit in VREX. */
3851 if (!(i.vrex & REX_R))
3852 i.vex.bytes[1] |= 0x10;
3853 else
3854 vrex_used |= REX_R;
3855
3856 if ((i.reg_operands + i.imm_operands) == i.operands)
3857 {
3858 /* When all operands are registers, the REX_X bit in REX is not
3859 used. We reuse it to encode the upper 16 registers, which is
3860 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3861 as 1's complement. */
3862 if ((i.vrex & REX_B))
3863 {
3864 vrex_used |= REX_B;
3865 i.vex.bytes[1] &= ~0x40;
3866 }
3867 }
3868
3869 /* EVEX instructions shouldn't need the REX prefix. */
3870 i.vrex &= ~vrex_used;
3871 gas_assert (i.vrex == 0);
3872
3873 /* Check the REX.W bit and VEXW. */
3874 if (i.tm.opcode_modifier.vexw == VEXWIG)
3875 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3876 else if (i.tm.opcode_modifier.vexw)
3877 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3878 else
3879 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3880
3881 /* Encode the U bit. */
3882 implied_prefix |= 0x4;
3883
3884 /* The third byte of the EVEX prefix. */
3885 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3886
3887 /* The fourth byte of the EVEX prefix. */
3888 /* The zeroing-masking bit. */
3889 if (i.mask && i.mask->zeroing)
3890 i.vex.bytes[3] |= 0x80;
3891
3892 /* With no RC, encode the vector length and broadcast bit; with RC, these bits hold the rounding mode instead. */
3893 if (!i.rounding)
3894 {
3895 /* Encode the vector length. */
3896 unsigned int vec_length;
3897
3898 if (!i.tm.opcode_modifier.evex
3899 || i.tm.opcode_modifier.evex == EVEXDYN)
3900 {
3901 unsigned int op;
3902
3903 /* Determine vector length from the last multi-length vector
3904 operand. */
3905 vec_length = 0;
3906 for (op = i.operands; op--;)
3907 if (i.tm.operand_types[op].bitfield.xmmword
3908 + i.tm.operand_types[op].bitfield.ymmword
3909 + i.tm.operand_types[op].bitfield.zmmword > 1)
3910 {
3911 if (i.types[op].bitfield.zmmword)
3912 {
3913 i.tm.opcode_modifier.evex = EVEX512;
3914 break;
3915 }
3916 else if (i.types[op].bitfield.ymmword)
3917 {
3918 i.tm.opcode_modifier.evex = EVEX256;
3919 break;
3920 }
3921 else if (i.types[op].bitfield.xmmword)
3922 {
3923 i.tm.opcode_modifier.evex = EVEX128;
3924 break;
3925 }
3926 else if (i.broadcast && (int) op == i.broadcast->operand)
3927 {
3928 switch (i.broadcast->bytes)
3929 {
3930 case 64:
3931 i.tm.opcode_modifier.evex = EVEX512;
3932 break;
3933 case 32:
3934 i.tm.opcode_modifier.evex = EVEX256;
3935 break;
3936 case 16:
3937 i.tm.opcode_modifier.evex = EVEX128;
3938 break;
3939 default:
3940 abort ();
3941 }
3942 break;
3943 }
3944 }
3945
3946 if (op >= MAX_OPERANDS)
3947 abort ();
3948 }
3949
3950 switch (i.tm.opcode_modifier.evex)
3951 {
3952 case EVEXLIG: /* LL' is ignored */
3953 vec_length = evexlig << 5;
3954 break;
3955 case EVEX128:
3956 vec_length = 0 << 5;
3957 break;
3958 case EVEX256:
3959 vec_length = 1 << 5;
3960 break;
3961 case EVEX512:
3962 vec_length = 2 << 5;
3963 break;
3964 default:
3965 abort ();
3966 break;
3967 }
3968 i.vex.bytes[3] |= vec_length;
3969 /* Encode the broadcast bit. */
3970 if (i.broadcast)
3971 i.vex.bytes[3] |= 0x10;
3972 }
3973 else
3974 {
3975 if (i.rounding->type != saeonly)
3976 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3977 else
3978 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3979 }
3980
3981 if (i.mask && i.mask->mask)
3982 i.vex.bytes[3] |= i.mask->mask->reg_num;
3983 }
3984
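/* For reference, a sketch of the 4-byte EVEX prefix assembled above
   (see the Intel SDM for the authoritative layout; register-select
   bits are stored inverted):

     byte 0:  0x62
     byte 1:  ~R ~X ~B ~R' m m m m    REX bits and opcode map
     byte 2:  W ~v ~v ~v ~v U p p     vvvv register specifier, U bit,
				      and the implied 66/F3/F2 prefix
     byte 3:  z L' L b ~V' a a a      zeroing, vector length, broadcast
				      or RC, vvvv high bit, mask reg  */
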
3985 static void
3986 process_immext (void)
3987 {
3988 expressionS *exp;
3989
3990 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3991 which is coded in the same place as an 8-bit immediate field
3992 would be. Here we fake an 8-bit immediate operand from the
3993 opcode suffix stored in tm.extension_opcode.
3994
3995      AVX instructions also use this encoding for some
3996      3-argument instructions.  */
3997
3998 gas_assert (i.imm_operands <= 1
3999 && (i.operands <= 2
4000 || (is_any_vex_encoding (&i.tm)
4001 && i.operands <= 4)));
4002
4003 exp = &im_expressions[i.imm_operands++];
4004 i.op[i.operands].imms = exp;
4005 i.types[i.operands] = imm8;
4006 i.operands++;
4007 exp->X_op = O_constant;
4008 exp->X_add_number = i.tm.extension_opcode;
4009 i.tm.extension_opcode = None;
4010 }
4011
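/* E.g. AMD 3DNow! "pfadd %mm1, %mm0" assembles to 0f 0f c1 9e,
   assuming PFADD's opcode suffix byte is 0x9e: the suffix travels
   through process_immext above as a fake imm8 operand (illustration;
   the real suffix values come from the opcode table).  */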
4012
4013 static int
4014 check_hle (void)
4015 {
4016 switch (i.tm.opcode_modifier.hleprefixok)
4017 {
4018 default:
4019 abort ();
4020 case HLEPrefixNone:
4021 as_bad (_("invalid instruction `%s' after `%s'"),
4022 i.tm.name, i.hle_prefix);
4023 return 0;
4024 case HLEPrefixLock:
4025 if (i.prefix[LOCK_PREFIX])
4026 return 1;
4027 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4028 return 0;
4029 case HLEPrefixAny:
4030 return 1;
4031 case HLEPrefixRelease:
4032 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4033 {
4034 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4035 i.tm.name);
4036 return 0;
4037 }
4038 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4039 {
4040 as_bad (_("memory destination needed for instruction `%s'"
4041 " after `xrelease'"), i.tm.name);
4042 return 0;
4043 }
4044 return 1;
4045 }
4046 }
4047
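/* E.g. "xacquire lock incl (%rax)" satisfies the HLEPrefixLock check
   above, while "xrelease movl $0, %eax" is rejected for lacking a
   memory destination (illustrative examples).  */
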
4048 /* Try the shortest encoding by shortening operand size. */
4049
4050 static void
4051 optimize_encoding (void)
4052 {
4053 unsigned int j;
4054
4055 if (optimize_for_space
4056 && !is_any_vex_encoding (&i.tm)
4057 && i.reg_operands == 1
4058 && i.imm_operands == 1
4059 && !i.types[1].bitfield.byte
4060 && i.op[0].imms->X_op == O_constant
4061 && fits_in_imm7 (i.op[0].imms->X_add_number)
4062 && (i.tm.base_opcode == 0xa8
4063 || (i.tm.base_opcode == 0xf6
4064 && i.tm.extension_opcode == 0x0)))
4065 {
4066 /* Optimize: -Os:
4067 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4068 */
4069 unsigned int base_regnum = i.op[1].regs->reg_num;
4070 if (flag_code == CODE_64BIT || base_regnum < 4)
4071 {
4072 i.types[1].bitfield.byte = 1;
4073 /* Ignore the suffix. */
4074 i.suffix = 0;
4075 /* Convert to byte registers. */
4076 if (i.types[1].bitfield.word)
4077 j = 16;
4078 else if (i.types[1].bitfield.dword)
4079 j = 32;
4080 else
4081 j = 48;
4082 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4083 j += 8;
4084 i.op[1].regs -= j;
4085 }
4086 }
4087 else if (flag_code == CODE_64BIT
4088 && !is_any_vex_encoding (&i.tm)
4089 && ((i.types[1].bitfield.qword
4090 && i.reg_operands == 1
4091 && i.imm_operands == 1
4092 && i.op[0].imms->X_op == O_constant
4093 && ((i.tm.base_opcode == 0xb8
4094 && i.tm.extension_opcode == None
4095 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4096 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4097 && ((i.tm.base_opcode == 0x24
4098 || i.tm.base_opcode == 0xa8)
4099 || (i.tm.base_opcode == 0x80
4100 && i.tm.extension_opcode == 0x4)
4101 || ((i.tm.base_opcode == 0xf6
4102 || (i.tm.base_opcode | 1) == 0xc7)
4103 && i.tm.extension_opcode == 0x0)))
4104 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4105 && i.tm.base_opcode == 0x83
4106 && i.tm.extension_opcode == 0x4)))
4107 || (i.types[0].bitfield.qword
4108 && ((i.reg_operands == 2
4109 && i.op[0].regs == i.op[1].regs
4110 && (i.tm.base_opcode == 0x30
4111 || i.tm.base_opcode == 0x28))
4112 || (i.reg_operands == 1
4113 && i.operands == 1
4114 && i.tm.base_opcode == 0x30)))))
4115 {
4116 /* Optimize: -O:
4117 andq $imm31, %r64 -> andl $imm31, %r32
4118 andq $imm7, %r64 -> andl $imm7, %r32
4119 testq $imm31, %r64 -> testl $imm31, %r32
4120 xorq %r64, %r64 -> xorl %r32, %r32
4121 subq %r64, %r64 -> subl %r32, %r32
4122 movq $imm31, %r64 -> movl $imm31, %r32
4123 movq $imm32, %r64 -> movl $imm32, %r32
4124 */
4125 i.tm.opcode_modifier.norex64 = 1;
4126 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4127 {
4128 /* Handle
4129 movq $imm31, %r64 -> movl $imm31, %r32
4130 movq $imm32, %r64 -> movl $imm32, %r32
4131 */
4132 i.tm.operand_types[0].bitfield.imm32 = 1;
4133 i.tm.operand_types[0].bitfield.imm32s = 0;
4134 i.tm.operand_types[0].bitfield.imm64 = 0;
4135 i.types[0].bitfield.imm32 = 1;
4136 i.types[0].bitfield.imm32s = 0;
4137 i.types[0].bitfield.imm64 = 0;
4138 i.types[1].bitfield.dword = 1;
4139 i.types[1].bitfield.qword = 0;
4140 if ((i.tm.base_opcode | 1) == 0xc7)
4141 {
4142 /* Handle
4143 movq $imm31, %r64 -> movl $imm31, %r32
4144 */
4145 i.tm.base_opcode = 0xb8;
4146 i.tm.extension_opcode = None;
4147 i.tm.opcode_modifier.w = 0;
4148 i.tm.opcode_modifier.modrm = 0;
4149 }
4150 }
4151 }
4152 else if (optimize > 1
4153 && !optimize_for_space
4154 && !is_any_vex_encoding (&i.tm)
4155 && i.reg_operands == 2
4156 && i.op[0].regs == i.op[1].regs
4157 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4158 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4159 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4160 {
4161 /* Optimize: -O2:
4162 andb %rN, %rN -> testb %rN, %rN
4163 andw %rN, %rN -> testw %rN, %rN
4164 andq %rN, %rN -> testq %rN, %rN
4165 orb %rN, %rN -> testb %rN, %rN
4166 orw %rN, %rN -> testw %rN, %rN
4167 orq %rN, %rN -> testq %rN, %rN
4168
4169 and outside of 64-bit mode
4170
4171 andl %rN, %rN -> testl %rN, %rN
4172 orl %rN, %rN -> testl %rN, %rN
4173 */
4174 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4175 }
4176 else if (i.reg_operands == 3
4177 && i.op[0].regs == i.op[1].regs
4178 && !i.types[2].bitfield.xmmword
4179 && (i.tm.opcode_modifier.vex
4180 || ((!i.mask || i.mask->zeroing)
4181 && !i.rounding
4182 && is_evex_encoding (&i.tm)
4183 && (i.vec_encoding != vex_encoding_evex
4184 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4185 || i.tm.cpu_flags.bitfield.cpuavx512vl
4186 || (i.tm.operand_types[2].bitfield.zmmword
4187 && i.types[2].bitfield.ymmword))))
4188 && ((i.tm.base_opcode == 0x55
4189 || i.tm.base_opcode == 0x6655
4190 || i.tm.base_opcode == 0x66df
4191 || i.tm.base_opcode == 0x57
4192 || i.tm.base_opcode == 0x6657
4193 || i.tm.base_opcode == 0x66ef
4194 || i.tm.base_opcode == 0x66f8
4195 || i.tm.base_opcode == 0x66f9
4196 || i.tm.base_opcode == 0x66fa
4197 || i.tm.base_opcode == 0x66fb
4198 || i.tm.base_opcode == 0x42
4199 || i.tm.base_opcode == 0x6642
4200 || i.tm.base_opcode == 0x47
4201 || i.tm.base_opcode == 0x6647)
4202 && i.tm.extension_opcode == None))
4203 {
4204 /* Optimize: -O1:
4205 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4206 vpsubq and vpsubw:
4207 EVEX VOP %zmmM, %zmmM, %zmmN
4208 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4209 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4210 EVEX VOP %ymmM, %ymmM, %ymmN
4211 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4212 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4213 VEX VOP %ymmM, %ymmM, %ymmN
4214 -> VEX VOP %xmmM, %xmmM, %xmmN
4215 VOP, one of vpandn and vpxor:
4216 VEX VOP %ymmM, %ymmM, %ymmN
4217 -> VEX VOP %xmmM, %xmmM, %xmmN
4218 VOP, one of vpandnd and vpandnq:
4219 EVEX VOP %zmmM, %zmmM, %zmmN
4220 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4221 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4222 EVEX VOP %ymmM, %ymmM, %ymmN
4223 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4224 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4225 VOP, one of vpxord and vpxorq:
4226 EVEX VOP %zmmM, %zmmM, %zmmN
4227 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4228 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4229 EVEX VOP %ymmM, %ymmM, %ymmN
4230 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4231 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4232 VOP, one of kxord and kxorq:
4233 VEX VOP %kM, %kM, %kN
4234 -> VEX kxorw %kM, %kM, %kN
4235 VOP, one of kandnd and kandnq:
4236 VEX VOP %kM, %kM, %kN
4237 -> VEX kandnw %kM, %kM, %kN
4238 */
4239 if (is_evex_encoding (&i.tm))
4240 {
4241 if (i.vec_encoding != vex_encoding_evex)
4242 {
4243 i.tm.opcode_modifier.vex = VEX128;
4244 i.tm.opcode_modifier.vexw = VEXW0;
4245 i.tm.opcode_modifier.evex = 0;
4246 }
4247 else if (optimize > 1)
4248 i.tm.opcode_modifier.evex = EVEX128;
4249 else
4250 return;
4251 }
4252 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4253 {
4254 i.tm.base_opcode &= 0xff;
4255 i.tm.opcode_modifier.vexw = VEXW0;
4256 }
4257 else
4258 i.tm.opcode_modifier.vex = VEX128;
4259
4260 if (i.tm.opcode_modifier.vex)
4261 for (j = 0; j < 3; j++)
4262 {
4263 i.types[j].bitfield.xmmword = 1;
4264 i.types[j].bitfield.ymmword = 0;
4265 }
4266 }
4267 else if (i.vec_encoding != vex_encoding_evex
4268 && !i.types[0].bitfield.zmmword
4269 && !i.types[1].bitfield.zmmword
4270 && !i.mask
4271 && !i.broadcast
4272 && is_evex_encoding (&i.tm)
4273 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4274 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4275 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4276 || (i.tm.base_opcode & ~4) == 0x66db
4277 || (i.tm.base_opcode & ~4) == 0x66eb)
4278 && i.tm.extension_opcode == None)
4279 {
4280 /* Optimize: -O1:
4281 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4282 vmovdqu32 and vmovdqu64:
4283 EVEX VOP %xmmM, %xmmN
4284 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4285 EVEX VOP %ymmM, %ymmN
4286 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4287 EVEX VOP %xmmM, mem
4288 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4289 EVEX VOP %ymmM, mem
4290 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4291 EVEX VOP mem, %xmmN
4292 	  -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4293 EVEX VOP mem, %ymmN
4294 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4295 VOP, one of vpand, vpandn, vpor, vpxor:
4296 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4297 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4298 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4299 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4300 EVEX VOP{d,q} mem, %xmmM, %xmmN
4301 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4302 EVEX VOP{d,q} mem, %ymmM, %ymmN
4303 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4304 */
4305 for (j = 0; j < i.operands; j++)
4306 if (operand_type_check (i.types[j], disp)
4307 && i.op[j].disps->X_op == O_constant)
4308 {
4309 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4310 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4311 bytes, we choose EVEX Disp8 over VEX Disp32. */
4312 int evex_disp8, vex_disp8;
4313 unsigned int memshift = i.memshift;
4314 offsetT n = i.op[j].disps->X_add_number;
4315
4316 evex_disp8 = fits_in_disp8 (n);
4317 i.memshift = 0;
4318 vex_disp8 = fits_in_disp8 (n);
4319 if (evex_disp8 != vex_disp8)
4320 {
4321 i.memshift = memshift;
4322 return;
4323 }
4324
4325 i.types[j].bitfield.disp8 = vex_disp8;
4326 break;
4327 }
4328 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4329 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4330 i.tm.opcode_modifier.vex
4331 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4332 i.tm.opcode_modifier.vexw = VEXW0;
4333 /* VPAND, VPOR, and VPXOR are commutative. */
4334 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4335 i.tm.opcode_modifier.commutative = 1;
4336 i.tm.opcode_modifier.evex = 0;
4337 i.tm.opcode_modifier.masking = 0;
4338 i.tm.opcode_modifier.broadcast = 0;
4339 i.tm.opcode_modifier.disp8memshift = 0;
4340 i.memshift = 0;
4341 if (j < i.operands)
4342 i.types[j].bitfield.disp8
4343 = fits_in_disp8 (i.op[j].disps->X_add_number);
4344 }
4345 }
4346
4347 /* Return non-zero for load instruction. */
4348
4349 static int
4350 load_insn_p (void)
4351 {
4352 unsigned int dest;
4353 int any_vex_p = is_any_vex_encoding (&i.tm);
4354 unsigned int base_opcode = i.tm.base_opcode | 1;
4355
4356 if (!any_vex_p)
4357 {
4358 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4359 	 prefetcht1, prefetcht2, prefetchw, bndmk, bndcl, bndcu, bndcn,
4360 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4361 if (i.tm.opcode_modifier.anysize)
4362 return 0;
4363
4364 /* pop, popf, popa. */
4365 if (strcmp (i.tm.name, "pop") == 0
4366 || i.tm.base_opcode == 0x9d
4367 || i.tm.base_opcode == 0x61)
4368 return 1;
4369
4370 /* movs, cmps, lods, scas. */
4371 if ((i.tm.base_opcode | 0xb) == 0xaf)
4372 return 1;
4373
4374 /* outs, xlatb. */
4375 if (base_opcode == 0x6f
4376 || i.tm.base_opcode == 0xd7)
4377 return 1;
4378       /* NB: AMD-specific insns with implicit memory operands are
4379 	 intentionally not covered here.  */
4380 }
4381
4382 /* No memory operand. */
4383 if (!i.mem_operands)
4384 return 0;
4385
4386 if (any_vex_p)
4387 {
4388 /* vldmxcsr. */
4389 if (i.tm.base_opcode == 0xae
4390 && i.tm.opcode_modifier.vex
4391 && i.tm.opcode_modifier.vexopcode == VEX0F
4392 && i.tm.extension_opcode == 2)
4393 return 1;
4394 }
4395 else
4396 {
4397 /* test, not, neg, mul, imul, div, idiv. */
4398 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4399 && i.tm.extension_opcode != 1)
4400 return 1;
4401
4402 /* inc, dec. */
4403 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4404 return 1;
4405
4406 /* add, or, adc, sbb, and, sub, xor, cmp. */
4407 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4408 return 1;
4409
4410 /* bt, bts, btr, btc. */
4411 if (i.tm.base_opcode == 0xfba
4412 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4413 return 1;
4414
4415 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4416 if ((base_opcode == 0xc1
4417 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4418 && i.tm.extension_opcode != 6)
4419 return 1;
4420
4421 /* cmpxchg8b, cmpxchg16b, xrstors. */
4422 if (i.tm.base_opcode == 0xfc7
4423 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4424 return 1;
4425
4426 /* fxrstor, ldmxcsr, xrstor. */
4427 if (i.tm.base_opcode == 0xfae
4428 && (i.tm.extension_opcode == 1
4429 || i.tm.extension_opcode == 2
4430 || i.tm.extension_opcode == 5))
4431 return 1;
4432
4433 /* lgdt, lidt, lmsw. */
4434 if (i.tm.base_opcode == 0xf01
4435 && (i.tm.extension_opcode == 2
4436 || i.tm.extension_opcode == 3
4437 || i.tm.extension_opcode == 6))
4438 return 1;
4439
4440 /* vmptrld */
4441 if (i.tm.base_opcode == 0xfc7
4442 && i.tm.extension_opcode == 6)
4443 return 1;
4444
4445 /* Check for x87 instructions. */
4446 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4447 {
4448 /* Skip fst, fstp, fstenv, fstcw. */
4449 if (i.tm.base_opcode == 0xd9
4450 && (i.tm.extension_opcode == 2
4451 || i.tm.extension_opcode == 3
4452 || i.tm.extension_opcode == 6
4453 || i.tm.extension_opcode == 7))
4454 return 0;
4455
4456 /* Skip fisttp, fist, fistp, fstp. */
4457 if (i.tm.base_opcode == 0xdb
4458 && (i.tm.extension_opcode == 1
4459 || i.tm.extension_opcode == 2
4460 || i.tm.extension_opcode == 3
4461 || i.tm.extension_opcode == 7))
4462 return 0;
4463
4464 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4465 if (i.tm.base_opcode == 0xdd
4466 && (i.tm.extension_opcode == 1
4467 || i.tm.extension_opcode == 2
4468 || i.tm.extension_opcode == 3
4469 || i.tm.extension_opcode == 6
4470 || i.tm.extension_opcode == 7))
4471 return 0;
4472
4473 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4474 if (i.tm.base_opcode == 0xdf
4475 && (i.tm.extension_opcode == 1
4476 || i.tm.extension_opcode == 2
4477 || i.tm.extension_opcode == 3
4478 || i.tm.extension_opcode == 6
4479 || i.tm.extension_opcode == 7))
4480 return 0;
4481
4482 return 1;
4483 }
4484 }
4485
4486 dest = i.operands - 1;
4487
4488 /* Check fake imm8 operand and 3 source operands. */
4489 if ((i.tm.opcode_modifier.immext
4490 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4491 && i.types[dest].bitfield.imm8)
4492 dest--;
4493
4494 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4495 if (!any_vex_p
4496 && (base_opcode == 0x1
4497 || base_opcode == 0x9
4498 || base_opcode == 0x11
4499 || base_opcode == 0x19
4500 || base_opcode == 0x21
4501 || base_opcode == 0x29
4502 || base_opcode == 0x31
4503 || base_opcode == 0x39
4504 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4505 || base_opcode == 0xfc1))
4506 return 1;
4507
4508 /* Check for load instruction. */
4509 return (i.types[dest].bitfield.class != ClassNone
4510 || i.types[dest].bitfield.instance == Accum);
4511 }
4512
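/* E.g. "movq (%rax), %rbx" is treated as a load (register class
   destination), "movq %rbx, (%rax)" is not, and RMW forms such as
   "addl $1, (%rax)" are caught by the opcode checks above
   (illustrative examples).  */
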
4513 /* Output lfence, 0xfaee8, after instruction. */
4514
4515 static void
4516 insert_lfence_after (void)
4517 {
4518 if (lfence_after_load && load_insn_p ())
4519 {
4520 /* There are also two REP string instructions that require
4521 special treatment. Specifically, the compare string (CMPS)
4522 and scan string (SCAS) instructions set EFLAGS in a manner
4523 that depends on the data being compared/scanned. When used
4524 with a REP prefix, the number of iterations may therefore
4525 vary depending on this data. If the data is a program secret
4526 chosen by the adversary using an LVI method,
4527 then this data-dependent behavior may leak some aspect
4528 of the secret. */
4529 if (((i.tm.base_opcode | 0x1) == 0xa7
4530 || (i.tm.base_opcode | 0x1) == 0xaf)
4531 && i.prefix[REP_PREFIX])
4532 {
4533 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4534 i.tm.name);
4535 }
4536 char *p = frag_more (3);
4537 *p++ = 0xf;
4538 *p++ = 0xae;
4539 *p = 0xe8;
4540 }
4541 }
4542
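/* E.g. with -mlfence-after-load=yes, "movq (%rax), %rbx" is followed
   by an lfence (0f ae e8) in the output (illustration).  */
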
4543 /* Output lfence, 0xfaee8, before instruction. */
4544
4545 static void
4546 insert_lfence_before (void)
4547 {
4548 char *p;
4549
4550 if (is_any_vex_encoding (&i.tm))
4551 return;
4552
4553 if (i.tm.base_opcode == 0xff
4554 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4555 {
4556 /* Insert lfence before indirect branch if needed. */
4557
4558 if (lfence_before_indirect_branch == lfence_branch_none)
4559 return;
4560
4561 if (i.operands != 1)
4562 abort ();
4563
4564 if (i.reg_operands == 1)
4565 {
4566 /* Indirect branch via register. Don't insert lfence with
4567 -mlfence-after-load=yes. */
4568 if (lfence_after_load
4569 || lfence_before_indirect_branch == lfence_branch_memory)
4570 return;
4571 }
4572 else if (i.mem_operands == 1
4573 && lfence_before_indirect_branch != lfence_branch_register)
4574 {
4575 as_warn (_("indirect `%s` with memory operand should be avoided"),
4576 i.tm.name);
4577 return;
4578 }
4579 else
4580 return;
4581
4582 if (last_insn.kind != last_insn_other
4583 && last_insn.seg == now_seg)
4584 {
4585 as_warn_where (last_insn.file, last_insn.line,
4586 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4587 last_insn.name, i.tm.name);
4588 return;
4589 }
4590
4591 p = frag_more (3);
4592 *p++ = 0xf;
4593 *p++ = 0xae;
4594 *p = 0xe8;
4595 return;
4596 }
4597
4598 /* Output or/not/shl and lfence before near ret. */
4599 if (lfence_before_ret != lfence_before_ret_none
4600 && (i.tm.base_opcode == 0xc2
4601 || i.tm.base_opcode == 0xc3))
4602 {
4603 if (last_insn.kind != last_insn_other
4604 && last_insn.seg == now_seg)
4605 {
4606 as_warn_where (last_insn.file, last_insn.line,
4607 _("`%s` skips -mlfence-before-ret on `%s`"),
4608 last_insn.name, i.tm.name);
4609 return;
4610 }
4611
4612       /* A near ret ignores the operand size override in 64-bit mode.  */
4613 char prefix = flag_code == CODE_64BIT
4614 ? 0x48
4615 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4616
4617 if (lfence_before_ret == lfence_before_ret_not)
4618 {
4619 /* not: 0xf71424, may add prefix
4620 for operand size override or 64-bit code. */
4621 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4622 if (prefix)
4623 *p++ = prefix;
4624 *p++ = 0xf7;
4625 *p++ = 0x14;
4626 *p++ = 0x24;
4627 if (prefix)
4628 *p++ = prefix;
4629 *p++ = 0xf7;
4630 *p++ = 0x14;
4631 *p++ = 0x24;
4632 }
4633 else
4634 {
4635 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4636 if (prefix)
4637 *p++ = prefix;
4638 if (lfence_before_ret == lfence_before_ret_or)
4639 {
4640 /* or: 0x830c2400, may add prefix
4641 for operand size override or 64-bit code. */
4642 *p++ = 0x83;
4643 *p++ = 0x0c;
4644 }
4645 else
4646 {
4647 /* shl: 0xc1242400, may add prefix
4648 for operand size override or 64-bit code. */
4649 *p++ = 0xc1;
4650 *p++ = 0x24;
4651 }
4652
4653 *p++ = 0x24;
4654 *p++ = 0x0;
4655 }
4656
4657 *p++ = 0xf;
4658 *p++ = 0xae;
4659 *p = 0xe8;
4660 }
4661 }
4662
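/* E.g. with -mlfence-before-ret=or in 64-bit code, a plain "ret" is
   preceded by "orq $0x0, (%rsp)" (48 83 0c 24 00) and an lfence
   (0f ae e8); a sketch of one case, not an exhaustive list.  */
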
4663 /* This is the guts of the machine-dependent assembler. LINE points to a
4664 machine dependent instruction. This function is supposed to emit
4665 the frags/bytes it assembles to. */
4666
4667 void
4668 md_assemble (char *line)
4669 {
4670 unsigned int j;
4671 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4672 const insn_template *t;
4673
4674 /* Initialize globals. */
4675 memset (&i, '\0', sizeof (i));
4676 for (j = 0; j < MAX_OPERANDS; j++)
4677 i.reloc[j] = NO_RELOC;
4678 memset (disp_expressions, '\0', sizeof (disp_expressions));
4679 memset (im_expressions, '\0', sizeof (im_expressions));
4680 save_stack_p = save_stack;
4681
4682 /* First parse an instruction mnemonic & call i386_operand for the operands.
4683 We assume that the scrubber has arranged it so that line[0] is the valid
4684 start of a (possibly prefixed) mnemonic. */
4685
4686 line = parse_insn (line, mnemonic);
4687 if (line == NULL)
4688 return;
4689 mnem_suffix = i.suffix;
4690
4691 line = parse_operands (line, mnemonic);
4692 this_operand = -1;
4693 xfree (i.memop1_string);
4694 i.memop1_string = NULL;
4695 if (line == NULL)
4696 return;
4697
4698 /* Now we've parsed the mnemonic into a set of templates, and have the
4699 operands at hand. */
4700
4701   /* All Intel opcodes have reversed operands except for "bound", "enter",
4702      "invlpga", "monitor*", "mwait*", "tpause", and "umwait".  We also don't
4703 intersegment "jmp" and "call" instructions with 2 immediate operands so
4704 that the immediate segment precedes the offset, as it does when in AT&T
4705 mode. */
4706 if (intel_syntax
4707 && i.operands > 1
4708 && (strcmp (mnemonic, "bound") != 0)
4709 && (strcmp (mnemonic, "invlpga") != 0)
4710 && (strncmp (mnemonic, "monitor", 7) != 0)
4711 && (strncmp (mnemonic, "mwait", 5) != 0)
4712 && (strcmp (mnemonic, "tpause") != 0)
4713 && (strcmp (mnemonic, "umwait") != 0)
4714 && !(operand_type_check (i.types[0], imm)
4715 && operand_type_check (i.types[1], imm)))
4716 swap_operands ();
4717
4718 /* The order of the immediates should be reversed
4719 for 2 immediates extrq and insertq instructions */
4720 if (i.imm_operands == 2
4721 && (strcmp (mnemonic, "extrq") == 0
4722 || strcmp (mnemonic, "insertq") == 0))
4723 swap_2_operands (0, 1);
4724
4725 if (i.imm_operands)
4726 optimize_imm ();
4727
4728 /* Don't optimize displacement for movabs since it only takes 64bit
4729 displacement. */
4730 if (i.disp_operands
4731 && i.disp_encoding != disp_encoding_32bit
4732 && (flag_code != CODE_64BIT
4733 || strcmp (mnemonic, "movabs") != 0))
4734 optimize_disp ();
4735
4736 /* Next, we find a template that matches the given insn,
4737 making sure the overlap of the given operands types is consistent
4738 with the template operand types. */
4739
4740 if (!(t = match_template (mnem_suffix)))
4741 return;
4742
4743 if (sse_check != check_none
4744 && !i.tm.opcode_modifier.noavx
4745 && !i.tm.cpu_flags.bitfield.cpuavx
4746 && !i.tm.cpu_flags.bitfield.cpuavx512f
4747 && (i.tm.cpu_flags.bitfield.cpusse
4748 || i.tm.cpu_flags.bitfield.cpusse2
4749 || i.tm.cpu_flags.bitfield.cpusse3
4750 || i.tm.cpu_flags.bitfield.cpussse3
4751 || i.tm.cpu_flags.bitfield.cpusse4_1
4752 || i.tm.cpu_flags.bitfield.cpusse4_2
4753 || i.tm.cpu_flags.bitfield.cpusse4a
4754 || i.tm.cpu_flags.bitfield.cpupclmul
4755 || i.tm.cpu_flags.bitfield.cpuaes
4756 || i.tm.cpu_flags.bitfield.cpusha
4757 || i.tm.cpu_flags.bitfield.cpugfni))
4758 {
4759 (sse_check == check_warning
4760 ? as_warn
4761 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4762 }
4763
4764 if (i.tm.opcode_modifier.fwait)
4765 if (!add_prefix (FWAIT_OPCODE))
4766 return;
4767
4768 /* Check if REP prefix is OK. */
4769 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4770 {
4771 as_bad (_("invalid instruction `%s' after `%s'"),
4772 i.tm.name, i.rep_prefix);
4773 return;
4774 }
4775
4776 /* Check for lock without a lockable instruction. Destination operand
4777 must be memory unless it is xchg (0x86). */
4778 if (i.prefix[LOCK_PREFIX]
4779 && (!i.tm.opcode_modifier.islockable
4780 || i.mem_operands == 0
4781 || (i.tm.base_opcode != 0x86
4782 && !(i.flags[i.operands - 1] & Operand_Mem))))
4783 {
4784 as_bad (_("expecting lockable instruction after `lock'"));
4785 return;
4786 }
4787
4788 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4789 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4790 {
4791 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4792 return;
4793 }
4794
4795 /* Check if HLE prefix is OK. */
4796 if (i.hle_prefix && !check_hle ())
4797 return;
4798
4799 /* Check BND prefix. */
4800 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4801 as_bad (_("expecting valid branch instruction after `bnd'"));
4802
4803 /* Check NOTRACK prefix. */
4804 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4805 as_bad (_("expecting indirect branch instruction after `notrack'"));
4806
4807 if (i.tm.cpu_flags.bitfield.cpumpx)
4808 {
4809 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4810 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4811 else if (flag_code != CODE_16BIT
4812 ? i.prefix[ADDR_PREFIX]
4813 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4814 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4815 }
4816
4817 /* Insert BND prefix. */
4818 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4819 {
4820 if (!i.prefix[BND_PREFIX])
4821 add_prefix (BND_PREFIX_OPCODE);
4822 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4823 {
4824 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4825 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4826 }
4827 }
4828
4829 /* Check string instruction segment overrides. */
4830 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4831 {
4832 gas_assert (i.mem_operands);
4833 if (!check_string ())
4834 return;
4835 i.disp_operands = 0;
4836 }
4837
4838 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4839 optimize_encoding ();
4840
4841 if (!process_suffix ())
4842 return;
4843
4844 /* Update operand types. */
4845 for (j = 0; j < i.operands; j++)
4846 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4847
4848 /* Make still unresolved immediate matches conform to size of immediate
4849 given in i.suffix. */
4850 if (!finalize_imm ())
4851 return;
4852
4853 if (i.types[0].bitfield.imm1)
4854 i.imm_operands = 0; /* kludge for shift insns. */
4855
4856 /* We only need to check those implicit registers for instructions
4857      with 3 operands or fewer.  */
4858 if (i.operands <= 3)
4859 for (j = 0; j < i.operands; j++)
4860 if (i.types[j].bitfield.instance != InstanceNone
4861 && !i.types[j].bitfield.xmmword)
4862 i.reg_operands--;
4863
4864 /* ImmExt should be processed after SSE2AVX. */
4865 if (!i.tm.opcode_modifier.sse2avx
4866 && i.tm.opcode_modifier.immext)
4867 process_immext ();
4868
4869 /* For insns with operands there are more diddles to do to the opcode. */
4870 if (i.operands)
4871 {
4872 if (!process_operands ())
4873 return;
4874 }
4875 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4876 {
4877 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4878 as_warn (_("translating to `%sp'"), i.tm.name);
4879 }
4880
4881 if (is_any_vex_encoding (&i.tm))
4882 {
4883 if (!cpu_arch_flags.bitfield.cpui286)
4884 {
4885 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4886 i.tm.name);
4887 return;
4888 }
4889
4890 if (i.tm.opcode_modifier.vex)
4891 build_vex_prefix (t);
4892 else
4893 build_evex_prefix ();
4894 }
4895
4896 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4897 instructions may define INT_OPCODE as well, so avoid this corner
4898 case for those instructions that use MODRM. */
4899 if (i.tm.base_opcode == INT_OPCODE
4900 && !i.tm.opcode_modifier.modrm
4901 && i.op[0].imms->X_add_number == 3)
4902 {
4903 i.tm.base_opcode = INT3_OPCODE;
4904 i.imm_operands = 0;
4905 }
4906
4907 if ((i.tm.opcode_modifier.jump == JUMP
4908 || i.tm.opcode_modifier.jump == JUMP_BYTE
4909 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4910 && i.op[0].disps->X_op == O_constant)
4911 {
4912 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4913 the absolute address given by the constant. Since ix86 jumps and
4914 calls are pc relative, we need to generate a reloc. */
4915 i.op[0].disps->X_add_symbol = &abs_symbol;
4916 i.op[0].disps->X_op = O_symbol;
4917 }
4918
4919   /* For 8 bit registers we need an empty rex prefix.  Also if the
4920      instruction already has a REX prefix, we need to convert old
4921      registers to new ones.  */
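  /* E.g. "movb %sil, %al" must be encoded 40 88 f0: without the empty
     REX prefix, ModRM byte 0xf0 would name %dh rather than %sil
     (illustration).  */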
4922
4923 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4924 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4925 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4926 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4927 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4928 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4929 && i.rex != 0))
4930 {
4931 int x;
4932
4933 i.rex |= REX_OPCODE;
4934 for (x = 0; x < 2; x++)
4935 {
4936 /* Look for 8 bit operand that uses old registers. */
4937 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4938 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4939 {
4940 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4941 	      /* If it is a "hi" byte register, it can't be encoded with REX; give up.  */
4942 if (i.op[x].regs->reg_num > 3)
4943 as_bad (_("can't encode register '%s%s' in an "
4944 "instruction requiring REX prefix."),
4945 register_prefix, i.op[x].regs->reg_name);
4946
4947 /* Otherwise it is equivalent to the extended register.
4948 		 Since the encoding doesn't change, this is merely
4949 cosmetic cleanup for debug output. */
4950
4951 i.op[x].regs = i.op[x].regs + 8;
4952 }
4953 }
4954 }
4955
4956 if (i.rex == 0 && i.rex_encoding)
4957 {
4958 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4959 that uses legacy register. If it is "hi" register, don't add
4960 the REX_OPCODE byte. */
4961 int x;
4962 for (x = 0; x < 2; x++)
4963 if (i.types[x].bitfield.class == Reg
4964 && i.types[x].bitfield.byte
4965 && (i.op[x].regs->reg_flags & RegRex64) == 0
4966 && i.op[x].regs->reg_num > 3)
4967 {
4968 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4969 i.rex_encoding = FALSE;
4970 break;
4971 }
4972
4973 if (i.rex_encoding)
4974 i.rex = REX_OPCODE;
4975 }
4976
4977 if (i.rex != 0)
4978 add_prefix (REX_OPCODE | i.rex);
4979
4980 insert_lfence_before ();
4981
4982 /* We are ready to output the insn. */
4983 output_insn ();
4984
4985 insert_lfence_after ();
4986
4987 last_insn.seg = now_seg;
4988
4989 if (i.tm.opcode_modifier.isprefix)
4990 {
4991 last_insn.kind = last_insn_prefix;
4992 last_insn.name = i.tm.name;
4993 last_insn.file = as_where (&last_insn.line);
4994 }
4995 else
4996 last_insn.kind = last_insn_other;
4997 }
4998
4999 static char *
5000 parse_insn (char *line, char *mnemonic)
5001 {
5002 char *l = line;
5003 char *token_start = l;
5004 char *mnem_p;
5005 int supported;
5006 const insn_template *t;
5007 char *dot_p = NULL;
5008
5009 while (1)
5010 {
5011 mnem_p = mnemonic;
5012 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5013 {
5014 if (*mnem_p == '.')
5015 dot_p = mnem_p;
5016 mnem_p++;
5017 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5018 {
5019 as_bad (_("no such instruction: `%s'"), token_start);
5020 return NULL;
5021 }
5022 l++;
5023 }
5024 if (!is_space_char (*l)
5025 && *l != END_OF_INSN
5026 && (intel_syntax
5027 || (*l != PREFIX_SEPARATOR
5028 && *l != ',')))
5029 {
5030 as_bad (_("invalid character %s in mnemonic"),
5031 output_invalid (*l));
5032 return NULL;
5033 }
5034 if (token_start == l)
5035 {
5036 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5037 as_bad (_("expecting prefix; got nothing"));
5038 else
5039 as_bad (_("expecting mnemonic; got nothing"));
5040 return NULL;
5041 }
5042
5043 /* Look up instruction (or prefix) via hash table. */
5044 current_templates = (const templates *) hash_find (op_hash, mnemonic);
5045
5046 if (*l != END_OF_INSN
5047 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5048 && current_templates
5049 && current_templates->start->opcode_modifier.isprefix)
5050 {
5051 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5052 {
5053 as_bad ((flag_code != CODE_64BIT
5054 ? _("`%s' is only supported in 64-bit mode")
5055 : _("`%s' is not supported in 64-bit mode")),
5056 current_templates->start->name);
5057 return NULL;
5058 }
5059 /* If we are in 16-bit mode, do not allow addr16 or data16.
5060 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5061 if ((current_templates->start->opcode_modifier.size == SIZE16
5062 || current_templates->start->opcode_modifier.size == SIZE32)
5063 && flag_code != CODE_64BIT
5064 && ((current_templates->start->opcode_modifier.size == SIZE32)
5065 ^ (flag_code == CODE_16BIT)))
5066 {
5067 as_bad (_("redundant %s prefix"),
5068 current_templates->start->name);
5069 return NULL;
5070 }
5071 if (current_templates->start->opcode_length == 0)
5072 {
5073 /* Handle pseudo prefixes. */
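	      /* E.g. "{evex} vaddps %xmm1, %xmm2, %xmm3" records the
		 requested encoding here; the real mnemonic is parsed
		 on the next iteration of the loop (illustration).  */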
5074 switch (current_templates->start->base_opcode)
5075 {
5076 case 0x0:
5077 /* {disp8} */
5078 i.disp_encoding = disp_encoding_8bit;
5079 break;
5080 case 0x1:
5081 /* {disp32} */
5082 i.disp_encoding = disp_encoding_32bit;
5083 break;
5084 case 0x2:
5085 /* {load} */
5086 i.dir_encoding = dir_encoding_load;
5087 break;
5088 case 0x3:
5089 /* {store} */
5090 i.dir_encoding = dir_encoding_store;
5091 break;
5092 case 0x4:
5093 /* {vex} */
5094 i.vec_encoding = vex_encoding_vex;
5095 break;
5096 case 0x5:
5097 /* {vex3} */
5098 i.vec_encoding = vex_encoding_vex3;
5099 break;
5100 case 0x6:
5101 /* {evex} */
5102 i.vec_encoding = vex_encoding_evex;
5103 break;
5104 case 0x7:
5105 /* {rex} */
5106 i.rex_encoding = TRUE;
5107 break;
5108 case 0x8:
5109 /* {nooptimize} */
5110 i.no_optimize = TRUE;
5111 break;
5112 default:
5113 abort ();
5114 }
5115 }
5116 else
5117 {
5118 /* Add prefix, checking for repeated prefixes. */
5119 switch (add_prefix (current_templates->start->base_opcode))
5120 {
5121 case PREFIX_EXIST:
5122 return NULL;
5123 case PREFIX_DS:
5124 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5125 i.notrack_prefix = current_templates->start->name;
5126 break;
5127 case PREFIX_REP:
5128 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5129 i.hle_prefix = current_templates->start->name;
5130 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5131 i.bnd_prefix = current_templates->start->name;
5132 else
5133 i.rep_prefix = current_templates->start->name;
5134 break;
5135 default:
5136 break;
5137 }
5138 }
5139 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5140 token_start = ++l;
5141 }
5142 else
5143 break;
5144 }
5145
5146 if (!current_templates)
5147 {
5148 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5149 	 Check whether we should swap operands or force a 32-bit
5150 	 displacement in the encoding.  */
5151 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5152 i.dir_encoding = dir_encoding_swap;
5153 else if (mnem_p - 3 == dot_p
5154 && dot_p[1] == 'd'
5155 && dot_p[2] == '8')
5156 i.disp_encoding = disp_encoding_8bit;
5157 else if (mnem_p - 4 == dot_p
5158 && dot_p[1] == 'd'
5159 && dot_p[2] == '3'
5160 && dot_p[3] == '2')
5161 i.disp_encoding = disp_encoding_32bit;
5162 else
5163 goto check_suffix;
5164 mnem_p = dot_p;
5165 *dot_p = '\0';
5166 current_templates = (const templates *) hash_find (op_hash, mnemonic);
5167 }
5168
5169 if (!current_templates)
5170 {
5171 check_suffix:
5172 if (mnem_p > mnemonic)
5173 {
5174 /* See if we can get a match by trimming off a suffix. */
5175 switch (mnem_p[-1])
5176 {
5177 case WORD_MNEM_SUFFIX:
5178 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5179 i.suffix = SHORT_MNEM_SUFFIX;
5180 else
5181 /* Fall through. */
5182 case BYTE_MNEM_SUFFIX:
5183 case QWORD_MNEM_SUFFIX:
5184 i.suffix = mnem_p[-1];
5185 mnem_p[-1] = '\0';
5186 current_templates = (const templates *) hash_find (op_hash,
5187 mnemonic);
5188 break;
5189 case SHORT_MNEM_SUFFIX:
5190 case LONG_MNEM_SUFFIX:
5191 if (!intel_syntax)
5192 {
5193 i.suffix = mnem_p[-1];
5194 mnem_p[-1] = '\0';
5195 current_templates = (const templates *) hash_find (op_hash,
5196 mnemonic);
5197 }
5198 break;
5199
5200 /* Intel Syntax. */
5201 case 'd':
5202 if (intel_syntax)
5203 {
5204 if (intel_float_operand (mnemonic) == 1)
5205 i.suffix = SHORT_MNEM_SUFFIX;
5206 else
5207 i.suffix = LONG_MNEM_SUFFIX;
5208 mnem_p[-1] = '\0';
5209 current_templates = (const templates *) hash_find (op_hash,
5210 mnemonic);
5211 }
5212 break;
5213 }
5214 }
5215
5216 if (!current_templates)
5217 {
5218 as_bad (_("no such instruction: `%s'"), token_start);
5219 return NULL;
5220 }
5221 }
5222
5223 if (current_templates->start->opcode_modifier.jump == JUMP
5224 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5225 {
5226 /* Check for a branch hint. We allow ",pt" and ",pn" for
5227 predict taken and predict not taken respectively.
5228 I'm not sure that branch hints actually do anything on loop
5229 and jcxz insns (JumpByte) for current Pentium4 chips. They
5230 may work in the future and it doesn't hurt to accept them
5231 now. */
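      /* E.g. "jne,pt target" adds a DS segment prefix byte (0x3e) in
	 front of the branch (an illustration of the hints above).  */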
5232 if (l[0] == ',' && l[1] == 'p')
5233 {
5234 if (l[2] == 't')
5235 {
5236 if (!add_prefix (DS_PREFIX_OPCODE))
5237 return NULL;
5238 l += 3;
5239 }
5240 else if (l[2] == 'n')
5241 {
5242 if (!add_prefix (CS_PREFIX_OPCODE))
5243 return NULL;
5244 l += 3;
5245 }
5246 }
5247 }
5248 /* Any other comma loses. */
5249 if (*l == ',')
5250 {
5251 as_bad (_("invalid character %s in mnemonic"),
5252 output_invalid (*l));
5253 return NULL;
5254 }
5255
5256 /* Check if instruction is supported on specified architecture. */
5257 supported = 0;
5258 for (t = current_templates->start; t < current_templates->end; ++t)
5259 {
5260 supported |= cpu_flags_match (t);
5261 if (supported == CPU_FLAGS_PERFECT_MATCH)
5262 {
5263 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5264 as_warn (_("use .code16 to ensure correct addressing mode"));
5265
5266 return l;
5267 }
5268 }
5269
5270 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5271 as_bad (flag_code == CODE_64BIT
5272 ? _("`%s' is not supported in 64-bit mode")
5273 : _("`%s' is only supported in 64-bit mode"),
5274 current_templates->start->name);
5275 else
5276 as_bad (_("`%s' is not supported on `%s%s'"),
5277 current_templates->start->name,
5278 cpu_arch_name ? cpu_arch_name : default_arch,
5279 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5280
5281 return NULL;
5282 }
5283
5284 static char *
5285 parse_operands (char *l, const char *mnemonic)
5286 {
5287 char *token_start;
5288
5289 /* 1 if operand is pending after ','. */
5290 unsigned int expecting_operand = 0;
5291
5292 /* Non-zero if operand parens not balanced. */
5293 unsigned int paren_not_balanced;
5294
5295 while (*l != END_OF_INSN)
5296 {
5297 /* Skip optional white space before operand. */
5298 if (is_space_char (*l))
5299 ++l;
5300 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5301 {
5302 as_bad (_("invalid character %s before operand %d"),
5303 output_invalid (*l),
5304 i.operands + 1);
5305 return NULL;
5306 }
5307 token_start = l; /* After white space. */
5308 paren_not_balanced = 0;
5309 while (paren_not_balanced || *l != ',')
5310 {
5311 if (*l == END_OF_INSN)
5312 {
5313 if (paren_not_balanced)
5314 {
5315 if (!intel_syntax)
5316 as_bad (_("unbalanced parenthesis in operand %d."),
5317 i.operands + 1);
5318 else
5319 as_bad (_("unbalanced brackets in operand %d."),
5320 i.operands + 1);
5321 return NULL;
5322 }
5323 else
5324 break; /* we are done */
5325 }
5326 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5327 {
5328 as_bad (_("invalid character %s in operand %d"),
5329 output_invalid (*l),
5330 i.operands + 1);
5331 return NULL;
5332 }
5333 if (!intel_syntax)
5334 {
5335 if (*l == '(')
5336 ++paren_not_balanced;
5337 if (*l == ')')
5338 --paren_not_balanced;
5339 }
5340 else
5341 {
5342 if (*l == '[')
5343 ++paren_not_balanced;
5344 if (*l == ']')
5345 --paren_not_balanced;
5346 }
5347 l++;
5348 }
5349 if (l != token_start)
5350 { /* Yes, we've read in another operand. */
5351 unsigned int operand_ok;
5352 this_operand = i.operands++;
5353 if (i.operands > MAX_OPERANDS)
5354 {
5355 as_bad (_("spurious operands; (%d operands/instruction max)"),
5356 MAX_OPERANDS);
5357 return NULL;
5358 }
5359 i.types[this_operand].bitfield.unspecified = 1;
5360 /* Now parse operand adding info to 'i' as we go along. */
5361 END_STRING_AND_SAVE (l);
5362
5363 if (i.mem_operands > 1)
5364 {
5365 as_bad (_("too many memory references for `%s'"),
5366 mnemonic);
5367 return 0;
5368 }
5369
5370 if (intel_syntax)
5371 operand_ok =
5372 i386_intel_operand (token_start,
5373 intel_float_operand (mnemonic));
5374 else
5375 operand_ok = i386_att_operand (token_start);
5376
5377 RESTORE_END_STRING (l);
5378 if (!operand_ok)
5379 return NULL;
5380 }
5381 else
5382 {
5383 if (expecting_operand)
5384 {
5385 expecting_operand_after_comma:
5386 as_bad (_("expecting operand after ','; got nothing"));
5387 return NULL;
5388 }
5389 if (*l == ',')
5390 {
5391 as_bad (_("expecting operand before ','; got nothing"));
5392 return NULL;
5393 }
5394 }
5395
5396 /* Now *l must be either ',' or END_OF_INSN. */
5397 if (*l == ',')
5398 {
5399 if (*++l == END_OF_INSN)
5400 {
5401 	      /* Just skip it; if it's \n, complain.  */
5402 goto expecting_operand_after_comma;
5403 }
5404 expecting_operand = 1;
5405 }
5406 }
5407 return l;
5408 }
5409
5410 static void
5411 swap_2_operands (int xchg1, int xchg2)
5412 {
5413 union i386_op temp_op;
5414 i386_operand_type temp_type;
5415 unsigned int temp_flags;
5416 enum bfd_reloc_code_real temp_reloc;
5417
5418 temp_type = i.types[xchg2];
5419 i.types[xchg2] = i.types[xchg1];
5420 i.types[xchg1] = temp_type;
5421
5422 temp_flags = i.flags[xchg2];
5423 i.flags[xchg2] = i.flags[xchg1];
5424 i.flags[xchg1] = temp_flags;
5425
5426 temp_op = i.op[xchg2];
5427 i.op[xchg2] = i.op[xchg1];
5428 i.op[xchg1] = temp_op;
5429
5430 temp_reloc = i.reloc[xchg2];
5431 i.reloc[xchg2] = i.reloc[xchg1];
5432 i.reloc[xchg1] = temp_reloc;
5433
5434 if (i.mask)
5435 {
5436 if (i.mask->operand == xchg1)
5437 i.mask->operand = xchg2;
5438 else if (i.mask->operand == xchg2)
5439 i.mask->operand = xchg1;
5440 }
5441 if (i.broadcast)
5442 {
5443 if (i.broadcast->operand == xchg1)
5444 i.broadcast->operand = xchg2;
5445 else if (i.broadcast->operand == xchg2)
5446 i.broadcast->operand = xchg1;
5447 }
5448 if (i.rounding)
5449 {
5450 if (i.rounding->operand == xchg1)
5451 i.rounding->operand = xchg2;
5452 else if (i.rounding->operand == xchg2)
5453 i.rounding->operand = xchg1;
5454 }
5455 }
5456
5457 static void
5458 swap_operands (void)
5459 {
5460 switch (i.operands)
5461 {
5462 case 5:
5463 case 4:
5464 swap_2_operands (1, i.operands - 2);
5465 /* Fall through. */
5466 case 3:
5467 case 2:
5468 swap_2_operands (0, i.operands - 1);
5469 break;
5470 default:
5471 abort ();
5472 }
5473
5474 if (i.mem_operands == 2)
5475 {
5476 const seg_entry *temp_seg;
5477 temp_seg = i.seg[0];
5478 i.seg[0] = i.seg[1];
5479 i.seg[1] = temp_seg;
5480 }
5481 }
5482
5483 /* Try to ensure constant immediates are represented in the smallest
5484 opcode possible. */
5485 static void
5486 optimize_imm (void)
5487 {
5488 char guess_suffix = 0;
5489 int op;
5490
5491 if (i.suffix)
5492 guess_suffix = i.suffix;
5493 else if (i.reg_operands)
5494 {
5495 /* Figure out a suffix from the last register operand specified.
5496 We can't do this properly yet, i.e. excluding special register
5497 instances, but the following works for instructions with
5498 immediates. In any case, we can't set i.suffix yet. */
5499 for (op = i.operands; --op >= 0;)
5500 if (i.types[op].bitfield.class != Reg)
5501 continue;
5502 else if (i.types[op].bitfield.byte)
5503 {
5504 guess_suffix = BYTE_MNEM_SUFFIX;
5505 break;
5506 }
5507 else if (i.types[op].bitfield.word)
5508 {
5509 guess_suffix = WORD_MNEM_SUFFIX;
5510 break;
5511 }
5512 else if (i.types[op].bitfield.dword)
5513 {
5514 guess_suffix = LONG_MNEM_SUFFIX;
5515 break;
5516 }
5517 else if (i.types[op].bitfield.qword)
5518 {
5519 guess_suffix = QWORD_MNEM_SUFFIX;
5520 break;
5521 }
5522 }
5523 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5524 guess_suffix = WORD_MNEM_SUFFIX;
5525
5526 for (op = i.operands; --op >= 0;)
5527 if (operand_type_check (i.types[op], imm))
5528 {
5529 switch (i.op[op].imms->X_op)
5530 {
5531 case O_constant:
5532 /* If a suffix is given, this operand may be shortened. */
5533 switch (guess_suffix)
5534 {
5535 case LONG_MNEM_SUFFIX:
5536 i.types[op].bitfield.imm32 = 1;
5537 i.types[op].bitfield.imm64 = 1;
5538 break;
5539 case WORD_MNEM_SUFFIX:
5540 i.types[op].bitfield.imm16 = 1;
5541 i.types[op].bitfield.imm32 = 1;
5542 i.types[op].bitfield.imm32s = 1;
5543 i.types[op].bitfield.imm64 = 1;
5544 break;
5545 case BYTE_MNEM_SUFFIX:
5546 i.types[op].bitfield.imm8 = 1;
5547 i.types[op].bitfield.imm8s = 1;
5548 i.types[op].bitfield.imm16 = 1;
5549 i.types[op].bitfield.imm32 = 1;
5550 i.types[op].bitfield.imm32s = 1;
5551 i.types[op].bitfield.imm64 = 1;
5552 break;
5553 }
5554
5555 /* If this operand is at most 16 bits, convert it
5556 to a signed 16 bit number before trying to see
5557 whether it will fit in an even smaller size.
5558 This allows a 16-bit operand such as $0xffe0 to
5559 be recognised as within Imm8S range. */
5560 if ((i.types[op].bitfield.imm16)
5561 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5562 {
5563 i.op[op].imms->X_add_number =
5564 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5565 }
5566 #ifdef BFD64
5567 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5568 if ((i.types[op].bitfield.imm32)
5569 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5570 == 0))
5571 {
5572 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5573 ^ ((offsetT) 1 << 31))
5574 - ((offsetT) 1 << 31));
5575 }
5576 #endif
5577 i.types[op]
5578 = operand_type_or (i.types[op],
5579 smallest_imm_type (i.op[op].imms->X_add_number));
5580
5581 	  /* We must avoid matching Imm32 templates when only a 64-bit
5582 	     immediate is available.  */
5583 if (guess_suffix == QWORD_MNEM_SUFFIX)
5584 i.types[op].bitfield.imm32 = 0;
5585 break;
5586
5587 case O_absent:
5588 case O_register:
5589 abort ();
5590
5591 /* Symbols and expressions. */
5592 default:
5593 /* Convert symbolic operand to proper sizes for matching, but don't
5594 prevent matching a set of insns that only supports sizes other
5595 than those matching the insn suffix. */
5596 {
5597 i386_operand_type mask, allowed;
5598 const insn_template *t;
5599
5600 operand_type_set (&mask, 0);
5601 operand_type_set (&allowed, 0);
5602
5603 for (t = current_templates->start;
5604 t < current_templates->end;
5605 ++t)
5606 {
5607 allowed = operand_type_or (allowed, t->operand_types[op]);
5608 allowed = operand_type_and (allowed, anyimm);
5609 }
5610 switch (guess_suffix)
5611 {
5612 case QWORD_MNEM_SUFFIX:
5613 mask.bitfield.imm64 = 1;
5614 mask.bitfield.imm32s = 1;
5615 break;
5616 case LONG_MNEM_SUFFIX:
5617 mask.bitfield.imm32 = 1;
5618 break;
5619 case WORD_MNEM_SUFFIX:
5620 mask.bitfield.imm16 = 1;
5621 break;
5622 case BYTE_MNEM_SUFFIX:
5623 mask.bitfield.imm8 = 1;
5624 break;
5625 default:
5626 break;
5627 }
5628 allowed = operand_type_and (mask, allowed);
5629 if (!operand_type_all_zero (&allowed))
5630 i.types[op] = operand_type_and (i.types[op], mask);
5631 }
5632 break;
5633 }
5634 }
5635 }
5636
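/* E.g. "addw $0xffe0, %ax": the constant is first narrowed to the
   signed 16-bit value -32, which also qualifies as Imm8S, making the
   short 0x83 /0 imm8 form available at template match time
   (illustration).  */
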
5637 /* Try to use the smallest displacement type too. */
5638 static void
5639 optimize_disp (void)
5640 {
5641 int op;
5642
5643 for (op = i.operands; --op >= 0;)
5644 if (operand_type_check (i.types[op], disp))
5645 {
5646 if (i.op[op].disps->X_op == O_constant)
5647 {
5648 offsetT op_disp = i.op[op].disps->X_add_number;
5649
5650 if (i.types[op].bitfield.disp16
5651 && (op_disp & ~(offsetT) 0xffff) == 0)
5652 {
5653 /* If this operand is at most 16 bits, convert
5654 to a signed 16 bit number and don't use 64bit
5655 displacement. */
5656 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5657 i.types[op].bitfield.disp64 = 0;
5658 }
5659 #ifdef BFD64
5660 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5661 if (i.types[op].bitfield.disp32
5662 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5663 {
5664 /* If this operand is at most 32 bits, convert
5665 to a signed 32 bit number and don't use 64bit
5666 displacement. */
5667 op_disp &= (((offsetT) 2 << 31) - 1);
5668 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5669 i.types[op].bitfield.disp64 = 0;
5670 }
5671 #endif
5672 if (!op_disp && i.types[op].bitfield.baseindex)
5673 {
5674 i.types[op].bitfield.disp8 = 0;
5675 i.types[op].bitfield.disp16 = 0;
5676 i.types[op].bitfield.disp32 = 0;
5677 i.types[op].bitfield.disp32s = 0;
5678 i.types[op].bitfield.disp64 = 0;
5679 i.op[op].disps = 0;
5680 i.disp_operands--;
5681 }
5682 else if (flag_code == CODE_64BIT)
5683 {
5684 if (fits_in_signed_long (op_disp))
5685 {
5686 i.types[op].bitfield.disp64 = 0;
5687 i.types[op].bitfield.disp32s = 1;
5688 }
5689 if (i.prefix[ADDR_PREFIX]
5690 && fits_in_unsigned_long (op_disp))
5691 i.types[op].bitfield.disp32 = 1;
5692 }
5693 if ((i.types[op].bitfield.disp32
5694 || i.types[op].bitfield.disp32s
5695 || i.types[op].bitfield.disp16)
5696 && fits_in_disp8 (op_disp))
5697 i.types[op].bitfield.disp8 = 1;
5698 }
5699 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5700 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5701 {
5702 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5703 i.op[op].disps, 0, i.reloc[op]);
5704 i.types[op].bitfield.disp8 = 0;
5705 i.types[op].bitfield.disp16 = 0;
5706 i.types[op].bitfield.disp32 = 0;
5707 i.types[op].bitfield.disp32s = 0;
5708 i.types[op].bitfield.disp64 = 0;
5709 }
5710 else
5711 /* We only support 64bit displacement on constants. */
5712 i.types[op].bitfield.disp64 = 0;
5713 }
5714 }
5715
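/* E.g. "movl 127(%rbp), %eax" retains a 1-byte displacement after
   this pass, while a displacement of 0x12345678 still needs 4 bytes
   (illustration).  */
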
5716 /* Return 1 if there is a match in broadcast bytes between operand
5717 GIVEN and instruction template T. */
5718
5719 static INLINE int
5720 match_broadcast_size (const insn_template *t, unsigned int given)
5721 {
5722 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5723 && i.types[given].bitfield.byte)
5724 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5725 && i.types[given].bitfield.word)
5726 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5727 && i.types[given].bitfield.dword)
5728 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5729 && i.types[given].bitfield.qword));
5730 }
5731
5732 /* Check if operands are valid for the instruction. */
5733
5734 static int
5735 check_VecOperands (const insn_template *t)
5736 {
5737 unsigned int op;
5738 i386_cpu_flags cpu;
5739
5740 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5741      any one operand implicitly require AVX512VL support if the actual
5742 operand size is YMMword or XMMword. Since this function runs after
5743 template matching, there's no need to check for YMMword/XMMword in
5744 the template. */
5745 cpu = cpu_flags_and (t->cpu_flags, avx512);
5746 if (!cpu_flags_all_zero (&cpu)
5747 && !t->cpu_flags.bitfield.cpuavx512vl
5748 && !cpu_arch_flags.bitfield.cpuavx512vl)
5749 {
5750 for (op = 0; op < t->operands; ++op)
5751 {
5752 if (t->operand_types[op].bitfield.zmmword
5753 && (i.types[op].bitfield.ymmword
5754 || i.types[op].bitfield.xmmword))
5755 {
5756 i.error = unsupported;
5757 return 1;
5758 }
5759 }
5760 }
5761
5762 /* Without VSIB byte, we can't have a vector register for index. */
5763 if (!t->opcode_modifier.vecsib
5764 && i.index_reg
5765 && (i.index_reg->reg_type.bitfield.xmmword
5766 || i.index_reg->reg_type.bitfield.ymmword
5767 || i.index_reg->reg_type.bitfield.zmmword))
5768 {
5769 i.error = unsupported_vector_index_register;
5770 return 1;
5771 }
5772
5773 /* Check if default mask is allowed. */
5774 if (t->opcode_modifier.nodefmask
5775 && (!i.mask || i.mask->mask->reg_num == 0))
5776 {
5777 i.error = no_default_mask;
5778 return 1;
5779 }
5780
5781 /* For VSIB byte, we need a vector register for index, and all vector
5782 registers must be distinct. */
5783 if (t->opcode_modifier.vecsib)
5784 {
5785 if (!i.index_reg
5786 || !((t->opcode_modifier.vecsib == VecSIB128
5787 && i.index_reg->reg_type.bitfield.xmmword)
5788 || (t->opcode_modifier.vecsib == VecSIB256
5789 && i.index_reg->reg_type.bitfield.ymmword)
5790 || (t->opcode_modifier.vecsib == VecSIB512
5791 && i.index_reg->reg_type.bitfield.zmmword)))
5792 {
5793 i.error = invalid_vsib_address;
5794 return 1;
5795 }
5796
5797 gas_assert (i.reg_operands == 2 || i.mask);
5798 if (i.reg_operands == 2 && !i.mask)
5799 {
5800 gas_assert (i.types[0].bitfield.class == RegSIMD);
5801 gas_assert (i.types[0].bitfield.xmmword
5802 || i.types[0].bitfield.ymmword);
5803 gas_assert (i.types[2].bitfield.class == RegSIMD);
5804 gas_assert (i.types[2].bitfield.xmmword
5805 || i.types[2].bitfield.ymmword);
5806 if (operand_check == check_none)
5807 return 0;
5808 if (register_number (i.op[0].regs)
5809 != register_number (i.index_reg)
5810 && register_number (i.op[2].regs)
5811 != register_number (i.index_reg)
5812 && register_number (i.op[0].regs)
5813 != register_number (i.op[2].regs))
5814 return 0;
5815 if (operand_check == check_error)
5816 {
5817 i.error = invalid_vector_register_set;
5818 return 1;
5819 }
5820 as_warn (_("mask, index, and destination registers should be distinct"));
5821 }
5822 else if (i.reg_operands == 1 && i.mask)
5823 {
5824 if (i.types[1].bitfield.class == RegSIMD
5825 && (i.types[1].bitfield.xmmword
5826 || i.types[1].bitfield.ymmword
5827 || i.types[1].bitfield.zmmword)
5828 && (register_number (i.op[1].regs)
5829 == register_number (i.index_reg)))
5830 {
5831 if (operand_check == check_error)
5832 {
5833 i.error = invalid_vector_register_set;
5834 return 1;
5835 }
5836 if (operand_check != check_none)
5837 as_warn (_("index and destination registers should be distinct"));
5838 }
5839 }
5840 }
5841
5842 /* Check if broadcast is supported by the instruction and is applied
5843 to the memory operand. */
5844 if (i.broadcast)
5845 {
5846 i386_operand_type type, overlap;
5847
5848 /* Check if specified broadcast is supported in this instruction,
5849 and its broadcast bytes match the memory operand. */
5850 op = i.broadcast->operand;
5851 if (!t->opcode_modifier.broadcast
5852 || !(i.flags[op] & Operand_Mem)
5853 || (!i.types[op].bitfield.unspecified
5854 && !match_broadcast_size (t, op)))
5855 {
5856 bad_broadcast:
5857 i.error = unsupported_broadcast;
5858 return 1;
5859 }
5860
5861 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5862 * i.broadcast->type);
5863 operand_type_set (&type, 0);
5864 switch (i.broadcast->bytes)
5865 {
5866 case 2:
5867 type.bitfield.word = 1;
5868 break;
5869 case 4:
5870 type.bitfield.dword = 1;
5871 break;
5872 case 8:
5873 type.bitfield.qword = 1;
5874 break;
5875 case 16:
5876 type.bitfield.xmmword = 1;
5877 break;
5878 case 32:
5879 type.bitfield.ymmword = 1;
5880 break;
5881 case 64:
5882 type.bitfield.zmmword = 1;
5883 break;
5884 default:
5885 goto bad_broadcast;
5886 }
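      /* Worked example (illustrative): for
	 "vaddps 8(%rax){1to16}, %zmm1, %zmm2" the template records a
	 4-byte (dword) broadcast element, so with i.broadcast->type
	 being 16 the computation above yields 64 bytes and TYPE gets
	 its zmmword bit set.  */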
5887
5888 overlap = operand_type_and (type, t->operand_types[op]);
5889 if (t->operand_types[op].bitfield.class == RegSIMD
5890 && t->operand_types[op].bitfield.byte
5891 + t->operand_types[op].bitfield.word
5892 + t->operand_types[op].bitfield.dword
5893 + t->operand_types[op].bitfield.qword > 1)
5894 {
5895 overlap.bitfield.xmmword = 0;
5896 overlap.bitfield.ymmword = 0;
5897 overlap.bitfield.zmmword = 0;
5898 }
5899 if (operand_type_all_zero (&overlap))
5900 goto bad_broadcast;
5901
5902 if (t->opcode_modifier.checkregsize)
5903 {
5904 unsigned int j;
5905
5906 type.bitfield.baseindex = 1;
5907 for (j = 0; j < i.operands; ++j)
5908 {
5909 if (j != op
5910 && !operand_type_register_match(i.types[j],
5911 t->operand_types[j],
5912 type,
5913 t->operand_types[op]))
5914 goto bad_broadcast;
5915 }
5916 }
5917 }
5918 /* If broadcast is supported by this instruction, we need to check
5919 that an operand of one-element size isn't specified without it. */
5920 else if (t->opcode_modifier.broadcast && i.mem_operands)
5921 {
5922 /* Find memory operand. */
5923 for (op = 0; op < i.operands; op++)
5924 if (i.flags[op] & Operand_Mem)
5925 break;
5926 gas_assert (op < i.operands);
5927 /* Check size of the memory operand. */
5928 if (match_broadcast_size (t, op))
5929 {
5930 i.error = broadcast_needed;
5931 return 1;
5932 }
5933 }
5934 else
5935 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5936
5937 /* Check if requested masking is supported. */
5938 if (i.mask)
5939 {
5940 switch (t->opcode_modifier.masking)
5941 {
5942 case BOTH_MASKING:
5943 break;
5944 case MERGING_MASKING:
5945 if (i.mask->zeroing)
5946 {
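	    /* The nested `case 0' is deliberate: templates without any
	       masking support (opcode_modifier.masking == 0) jump
	       straight here and share the error path with zeroing
	       masking on a merging-only insn.  */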
5947 case 0:
5948 i.error = unsupported_masking;
5949 return 1;
5950 }
5951 break;
5952 case DYNAMIC_MASKING:
5953 /* Memory destinations allow only merging masking. */
5954 if (i.mask->zeroing && i.mem_operands)
5955 {
5956 /* Find memory operand. */
5957 for (op = 0; op < i.operands; op++)
5958 if (i.flags[op] & Operand_Mem)
5959 break;
5960 gas_assert (op < i.operands);
5961 if (op == i.operands - 1)
5962 {
5963 i.error = unsupported_masking;
5964 return 1;
5965 }
5966 }
5967 break;
5968 default:
5969 abort ();
5970 }
5971 }
5972
5973 /* Check if masking is applied to dest operand. */
5974 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5975 {
5976 i.error = mask_not_on_destination;
5977 return 1;
5978 }
5979
5980 /* Check RC/SAE. */
5981 if (i.rounding)
5982 {
5983 if (!t->opcode_modifier.sae
5984 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5985 {
5986 i.error = unsupported_rc_sae;
5987 return 1;
5988 }
5989 /* If the instruction has several immediate operands and one of
5990 them is rounding, the rounding operand should be the last
5991 immediate operand. */
5992 if (i.imm_operands > 1
5993 && i.rounding->operand != (int) (i.imm_operands - 1))
5994 {
5995 i.error = rc_sae_operand_not_last_imm;
5996 return 1;
5997 }
5998 }
5999
6000 /* Check vector Disp8 operand. */
6001 if (t->opcode_modifier.disp8memshift
6002 && i.disp_encoding != disp_encoding_32bit)
6003 {
6004 if (i.broadcast)
6005 i.memshift = t->opcode_modifier.broadcast - 1;
6006 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6007 i.memshift = t->opcode_modifier.disp8memshift;
6008 else
6009 {
6010 const i386_operand_type *type = NULL;
6011
6012 i.memshift = 0;
6013 for (op = 0; op < i.operands; op++)
6014 if (i.flags[op] & Operand_Mem)
6015 {
6016 if (t->opcode_modifier.evex == EVEXLIG)
6017 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6018 else if (t->operand_types[op].bitfield.xmmword
6019 + t->operand_types[op].bitfield.ymmword
6020 + t->operand_types[op].bitfield.zmmword <= 1)
6021 type = &t->operand_types[op];
6022 else if (!i.types[op].bitfield.unspecified)
6023 type = &i.types[op];
6024 }
6025 else if (i.types[op].bitfield.class == RegSIMD
6026 && t->opcode_modifier.evex != EVEXLIG)
6027 {
6028 if (i.types[op].bitfield.zmmword)
6029 i.memshift = 6;
6030 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6031 i.memshift = 5;
6032 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6033 i.memshift = 4;
6034 }
6035
6036 if (type)
6037 {
6038 if (type->bitfield.zmmword)
6039 i.memshift = 6;
6040 else if (type->bitfield.ymmword)
6041 i.memshift = 5;
6042 else if (type->bitfield.xmmword)
6043 i.memshift = 4;
6044 }
6045
6046 /* For the check in fits_in_disp8(). */
6047 if (i.memshift == 0)
6048 i.memshift = -1;
6049 }
6050
6051 for (op = 0; op < i.operands; op++)
6052 if (operand_type_check (i.types[op], disp)
6053 && i.op[op].disps->X_op == O_constant)
6054 {
6055 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6056 {
6057 i.types[op].bitfield.disp8 = 1;
6058 return 0;
6059 }
6060 i.types[op].bitfield.disp8 = 0;
6061 }
6062 }
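  /* A minimal sketch of the disp8 * N test applied above (assumption:
     this mirrors fits_in_disp8() combined with i.memshift; the helper
     name is hypothetical and the block is intentionally not compiled):  */
#if 0
static INLINE int
example_scaled_disp8 (offsetT disp, unsigned int shift)
{
  /* With EVEX compressed displacements, an 8-bit displacement is stored
     pre-scaled by 1 << shift; e.g. 0x80 with shift 6 (a ZMM memory
     operand) is encoded as 2.  The value must be an exact multiple of
     the scaling factor and fit in a signed byte once scaled.  */
  if (disp & (((offsetT) 1 << shift) - 1))
    return 0;
  return fits_in_signed_byte (disp >> shift);
}
#endif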
6063
6064 i.memshift = 0;
6065
6066 return 0;
6067 }
6068
6069 /* Check if operands are valid for the instruction. Update VEX
6070 operand types. */
6071
6072 static int
6073 VEX_check_operands (const insn_template *t)
6074 {
6075 if (i.vec_encoding == vex_encoding_evex)
6076 {
6077 /* This instruction must be encoded with EVEX prefix. */
6078 if (!is_evex_encoding (t))
6079 {
6080 i.error = unsupported;
6081 return 1;
6082 }
6083 return 0;
6084 }
6085
6086 if (!t->opcode_modifier.vex)
6087 {
6088 /* This instruction template doesn't have VEX prefix. */
6089 if (i.vec_encoding != vex_encoding_default)
6090 {
6091 i.error = unsupported;
6092 return 1;
6093 }
6094 return 0;
6095 }
6096
6097 /* Check the special Imm4 cases; must be the first operand. */
6098 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6099 {
6100 if (i.op[0].imms->X_op != O_constant
6101 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6102 {
6103 i.error = bad_imm4;
6104 return 1;
6105 }
6106
6107 /* Turn off Imm<N> so that update_imm won't complain. */
6108 operand_type_set (&i.types[0], 0);
6109 }
6110
6111 return 0;
6112 }
6113
6114 static const insn_template *
6115 match_template (char mnem_suffix)
6116 {
6117 /* Points to template once we've found it. */
6118 const insn_template *t;
6119 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6120 i386_operand_type overlap4;
6121 unsigned int found_reverse_match;
6122 i386_opcode_modifier suffix_check;
6123 i386_operand_type operand_types [MAX_OPERANDS];
6124 int addr_prefix_disp;
6125 unsigned int j, size_match, check_register;
6126 enum i386_error specific_error = 0;
6127
6128 #if MAX_OPERANDS != 5
6129 # error "MAX_OPERANDS must be 5."
6130 #endif
6131
6132 found_reverse_match = 0;
6133 addr_prefix_disp = -1;
6134
6135 /* Prepare for mnemonic suffix check. */
6136 memset (&suffix_check, 0, sizeof (suffix_check));
6137 switch (mnem_suffix)
6138 {
6139 case BYTE_MNEM_SUFFIX:
6140 suffix_check.no_bsuf = 1;
6141 break;
6142 case WORD_MNEM_SUFFIX:
6143 suffix_check.no_wsuf = 1;
6144 break;
6145 case SHORT_MNEM_SUFFIX:
6146 suffix_check.no_ssuf = 1;
6147 break;
6148 case LONG_MNEM_SUFFIX:
6149 suffix_check.no_lsuf = 1;
6150 break;
6151 case QWORD_MNEM_SUFFIX:
6152 suffix_check.no_qsuf = 1;
6153 break;
6154 default:
6155 /* NB: In Intel syntax, normally we can check for memory operand
6156 size when there is no mnemonic suffix. But jmp and call have
6157 2 different encodings with Dword memory operand size, one with
6158 No_ldSuf and the other without. i.suffix is set to
6159 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6160 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6161 suffix_check.no_ldsuf = 1;
6162 }
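  /* Illustration (hedged): for "addl $1, %eax" MNEM_SUFFIX is 'l', so
     suffix_check.no_lsuf is set and any template carrying No_lSuf is
     skipped by the suffix test in the loop below.  */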
6163
6164 /* Must have right number of operands. */
6165 i.error = number_of_operands_mismatch;
6166
6167 for (t = current_templates->start; t < current_templates->end; t++)
6168 {
6169 addr_prefix_disp = -1;
6170 found_reverse_match = 0;
6171
6172 if (i.operands != t->operands)
6173 continue;
6174
6175 /* Check processor support. */
6176 i.error = unsupported;
6177 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6178 continue;
6179
6180 /* Check AT&T mnemonic. */
6181 i.error = unsupported_with_intel_mnemonic;
6182 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6183 continue;
6184
6185 /* Check AT&T/Intel syntax. */
6186 i.error = unsupported_syntax;
6187 if ((intel_syntax && t->opcode_modifier.attsyntax)
6188 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6189 continue;
6190
6191 /* Check Intel64/AMD64 ISA. */
6192 switch (isa64)
6193 {
6194 default:
6195 /* Default: Don't accept Intel64. */
6196 if (t->opcode_modifier.isa64 == INTEL64)
6197 continue;
6198 break;
6199 case amd64:
6200 /* -mamd64: Don't accept Intel64 or Intel64-only templates. */
6201 if (t->opcode_modifier.isa64 >= INTEL64)
6202 continue;
6203 break;
6204 case intel64:
6205 /* -mintel64: Don't accept AMD64. */
6206 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6207 continue;
6208 break;
6209 }
6210
6211 /* Check the suffix. */
6212 i.error = invalid_instruction_suffix;
6213 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6214 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6215 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6216 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6217 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6218 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6219 continue;
6220
6221 size_match = operand_size_match (t);
6222 if (!size_match)
6223 continue;
6224
6225 /* This is intentionally not
6226
6227 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6228
6229 as the case of a missing * on the operand is accepted (perhaps with
6230 a warning, issued further down). */
6231 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6232 {
6233 i.error = operand_type_mismatch;
6234 continue;
6235 }
6236
6237 for (j = 0; j < MAX_OPERANDS; j++)
6238 operand_types[j] = t->operand_types[j];
6239
6240 /* In general, don't allow
6241 - 64-bit operands outside of 64-bit mode,
6242 - 32-bit operands on pre-386. */
6243 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6244 if (((i.suffix == QWORD_MNEM_SUFFIX
6245 && flag_code != CODE_64BIT
6246 && (t->base_opcode != 0x0fc7
6247 || t->extension_opcode != 1 /* cmpxchg8b */))
6248 || (i.suffix == LONG_MNEM_SUFFIX
6249 && !cpu_arch_flags.bitfield.cpui386))
6250 && (intel_syntax
6251 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6252 && !intel_float_operand (t->name))
6253 : intel_float_operand (t->name) != 2)
6254 && (t->operands == i.imm_operands
6255 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6256 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6257 && operand_types[i.imm_operands].bitfield.class != RegMask)
6258 || (operand_types[j].bitfield.class != RegMMX
6259 && operand_types[j].bitfield.class != RegSIMD
6260 && operand_types[j].bitfield.class != RegMask))
6261 && !t->opcode_modifier.vecsib)
6262 continue;
6263
6264 /* Do not verify operands when there are none. */
6265 if (!t->operands)
6266 /* We've found a match; break out of loop. */
6267 break;
6268
6269 if (!t->opcode_modifier.jump
6270 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6271 {
6272 /* There should be only one Disp operand. */
6273 for (j = 0; j < MAX_OPERANDS; j++)
6274 if (operand_type_check (operand_types[j], disp))
6275 break;
6276 if (j < MAX_OPERANDS)
6277 {
6278 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6279
6280 addr_prefix_disp = j;
6281
6282 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6283 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6284 switch (flag_code)
6285 {
6286 case CODE_16BIT:
6287 override = !override;
6288 /* Fall through. */
6289 case CODE_32BIT:
6290 if (operand_types[j].bitfield.disp32
6291 && operand_types[j].bitfield.disp16)
6292 {
6293 operand_types[j].bitfield.disp16 = override;
6294 operand_types[j].bitfield.disp32 = !override;
6295 }
6296 operand_types[j].bitfield.disp32s = 0;
6297 operand_types[j].bitfield.disp64 = 0;
6298 break;
6299
6300 case CODE_64BIT:
6301 if (operand_types[j].bitfield.disp32s
6302 || operand_types[j].bitfield.disp64)
6303 {
6304 operand_types[j].bitfield.disp64 &= !override;
6305 operand_types[j].bitfield.disp32s &= !override;
6306 operand_types[j].bitfield.disp32 = override;
6307 }
6308 operand_types[j].bitfield.disp16 = 0;
6309 break;
6310 }
6311 }
6312 }
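	  /* Illustration (hedged): in 64-bit mode an explicit address
	     size prefix thus demotes a Disp64/Disp32S template operand
	     to plain Disp32, while in 16-bit mode the same prefix
	     promotes Disp16 to Disp32.  */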
6313
6314 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6315 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6316 continue;
6317
6318 /* We check register size if needed. */
6319 if (t->opcode_modifier.checkregsize)
6320 {
6321 check_register = (1 << t->operands) - 1;
6322 if (i.broadcast)
6323 check_register &= ~(1 << i.broadcast->operand);
6324 }
6325 else
6326 check_register = 0;
6327
6328 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6329 switch (t->operands)
6330 {
6331 case 1:
6332 if (!operand_type_match (overlap0, i.types[0]))
6333 continue;
6334 break;
6335 case 2:
6336 /* xchg %eax, %eax is a special case. It is an alias for nop
6337 only in 32bit mode and we can use opcode 0x90. In 64bit
6338 mode, we can't use 0x90 for xchg %eax, %eax since it should
6339 zero-extend %eax to %rax. */
6340 if (flag_code == CODE_64BIT
6341 && t->base_opcode == 0x90
6342 && i.types[0].bitfield.instance == Accum
6343 && i.types[0].bitfield.dword
6344 && i.types[1].bitfield.instance == Accum
6345 && i.types[1].bitfield.dword)
6346 continue;
6347 /* xrelease mov %eax, <disp> is another special case. It must not
6348 match the accumulator-only encoding of mov. */
6349 if (flag_code != CODE_64BIT
6350 && i.hle_prefix
6351 && t->base_opcode == 0xa0
6352 && i.types[0].bitfield.instance == Accum
6353 && (i.flags[1] & Operand_Mem))
6354 continue;
6355 /* Fall through. */
6356
6357 case 3:
6358 if (!(size_match & MATCH_STRAIGHT))
6359 goto check_reverse;
6360 /* Reverse direction of operands if swapping is possible in the first
6361 place (operands need to be symmetric) and
6362 - the load form is requested, and the template is a store form,
6363 - the store form is requested, and the template is a load form,
6364 - the non-default (swapped) form is requested. */
6365 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6366 if (t->opcode_modifier.d && i.reg_operands == i.operands
6367 && !operand_type_all_zero (&overlap1))
6368 switch (i.dir_encoding)
6369 {
6370 case dir_encoding_load:
6371 if (operand_type_check (operand_types[i.operands - 1], anymem)
6372 || t->opcode_modifier.regmem)
6373 goto check_reverse;
6374 break;
6375
6376 case dir_encoding_store:
6377 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6378 && !t->opcode_modifier.regmem)
6379 goto check_reverse;
6380 break;
6381
6382 case dir_encoding_swap:
6383 goto check_reverse;
6384
6385 case dir_encoding_default:
6386 break;
6387 }
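	  /* Illustration (hedged): for a swappable reg-reg insn such as
	     movaps, the "{load}" and "{store}" pseudo prefixes set
	     i.dir_encoding and steer matching through check_reverse, so
	     either the load (0x0f28) or the store (0x0f29) opcode can be
	     forced explicitly.  */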
6388 /* If we want store form, we skip the current load. */
6389 if ((i.dir_encoding == dir_encoding_store
6390 || i.dir_encoding == dir_encoding_swap)
6391 && i.mem_operands == 0
6392 && t->opcode_modifier.load)
6393 continue;
6394 /* Fall through. */
6395 case 4:
6396 case 5:
6397 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6398 if (!operand_type_match (overlap0, i.types[0])
6399 || !operand_type_match (overlap1, i.types[1])
6400 || ((check_register & 3) == 3
6401 && !operand_type_register_match (i.types[0],
6402 operand_types[0],
6403 i.types[1],
6404 operand_types[1])))
6405 {
6406 /* Check if other direction is valid ... */
6407 if (!t->opcode_modifier.d)
6408 continue;
6409
6410 check_reverse:
6411 if (!(size_match & MATCH_REVERSE))
6412 continue;
6413 /* Try reversing direction of operands. */
6414 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6415 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6416 if (!operand_type_match (overlap0, i.types[0])
6417 || !operand_type_match (overlap1, i.types[i.operands - 1])
6418 || (check_register
6419 && !operand_type_register_match (i.types[0],
6420 operand_types[i.operands - 1],
6421 i.types[i.operands - 1],
6422 operand_types[0])))
6423 {
6424 /* Does not match either direction. */
6425 continue;
6426 }
6427 /* found_reverse_match holds which of D or FloatR
6428 we've found. */
6429 if (!t->opcode_modifier.d)
6430 found_reverse_match = 0;
6431 else if (operand_types[0].bitfield.tbyte)
6432 found_reverse_match = Opcode_FloatD;
6433 else if (operand_types[0].bitfield.xmmword
6434 || operand_types[i.operands - 1].bitfield.xmmword
6435 || operand_types[0].bitfield.class == RegMMX
6436 || operand_types[i.operands - 1].bitfield.class == RegMMX
6437 || is_any_vex_encoding(t))
6438 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6439 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6440 else
6441 found_reverse_match = Opcode_D;
6442 if (t->opcode_modifier.floatr)
6443 found_reverse_match |= Opcode_FloatR;
6444 }
6445 else
6446 {
6447 /* Found a forward 2 operand match here. */
6448 switch (t->operands)
6449 {
6450 case 5:
6451 overlap4 = operand_type_and (i.types[4],
6452 operand_types[4]);
6453 /* Fall through. */
6454 case 4:
6455 overlap3 = operand_type_and (i.types[3],
6456 operand_types[3]);
6457 /* Fall through. */
6458 case 3:
6459 overlap2 = operand_type_and (i.types[2],
6460 operand_types[2]);
6461 break;
6462 }
6463
6464 switch (t->operands)
6465 {
6466 case 5:
6467 if (!operand_type_match (overlap4, i.types[4])
6468 || !operand_type_register_match (i.types[3],
6469 operand_types[3],
6470 i.types[4],
6471 operand_types[4]))
6472 continue;
6473 /* Fall through. */
6474 case 4:
6475 if (!operand_type_match (overlap3, i.types[3])
6476 || ((check_register & 0xa) == 0xa
6477 && !operand_type_register_match (i.types[1],
6478 operand_types[1],
6479 i.types[3],
6480 operand_types[3]))
6481 || ((check_register & 0xc) == 0xc
6482 && !operand_type_register_match (i.types[2],
6483 operand_types[2],
6484 i.types[3],
6485 operand_types[3])))
6486 continue;
6487 /* Fall through. */
6488 case 3:
6489 /* Here we make use of the fact that there are no
6490 reverse match 3 operand instructions. */
6491 if (!operand_type_match (overlap2, i.types[2])
6492 || ((check_register & 5) == 5
6493 && !operand_type_register_match (i.types[0],
6494 operand_types[0],
6495 i.types[2],
6496 operand_types[2]))
6497 || ((check_register & 6) == 6
6498 && !operand_type_register_match (i.types[1],
6499 operand_types[1],
6500 i.types[2],
6501 operand_types[2])))
6502 continue;
6503 break;
6504 }
6505 }
6506 /* Found either forward/reverse 2, 3 or 4 operand match here:
6507 slip through to break. */
6508 }
6509
6510 /* Check if vector and VEX operands are valid. */
6511 if (check_VecOperands (t) || VEX_check_operands (t))
6512 {
6513 specific_error = i.error;
6514 continue;
6515 }
6516
6517 /* We've found a match; break out of loop. */
6518 break;
6519 }
6520
6521 if (t == current_templates->end)
6522 {
6523 /* We found no match. */
6524 const char *err_msg;
6525 switch (specific_error ? specific_error : i.error)
6526 {
6527 default:
6528 abort ();
6529 case operand_size_mismatch:
6530 err_msg = _("operand size mismatch");
6531 break;
6532 case operand_type_mismatch:
6533 err_msg = _("operand type mismatch");
6534 break;
6535 case register_type_mismatch:
6536 err_msg = _("register type mismatch");
6537 break;
6538 case number_of_operands_mismatch:
6539 err_msg = _("number of operands mismatch");
6540 break;
6541 case invalid_instruction_suffix:
6542 err_msg = _("invalid instruction suffix");
6543 break;
6544 case bad_imm4:
6545 err_msg = _("constant doesn't fit in 4 bits");
6546 break;
6547 case unsupported_with_intel_mnemonic:
6548 err_msg = _("unsupported with Intel mnemonic");
6549 break;
6550 case unsupported_syntax:
6551 err_msg = _("unsupported syntax");
6552 break;
6553 case unsupported:
6554 as_bad (_("unsupported instruction `%s'"),
6555 current_templates->start->name);
6556 return NULL;
6557 case invalid_vsib_address:
6558 err_msg = _("invalid VSIB address");
6559 break;
6560 case invalid_vector_register_set:
6561 err_msg = _("mask, index, and destination registers must be distinct");
6562 break;
6563 case unsupported_vector_index_register:
6564 err_msg = _("unsupported vector index register");
6565 break;
6566 case unsupported_broadcast:
6567 err_msg = _("unsupported broadcast");
6568 break;
6569 case broadcast_needed:
6570 err_msg = _("broadcast is needed for operand of such type");
6571 break;
6572 case unsupported_masking:
6573 err_msg = _("unsupported masking");
6574 break;
6575 case mask_not_on_destination:
6576 err_msg = _("mask not on destination operand");
6577 break;
6578 case no_default_mask:
6579 err_msg = _("default mask isn't allowed");
6580 break;
6581 case unsupported_rc_sae:
6582 err_msg = _("unsupported static rounding/sae");
6583 break;
6584 case rc_sae_operand_not_last_imm:
6585 if (intel_syntax)
6586 err_msg = _("RC/SAE operand must precede immediate operands");
6587 else
6588 err_msg = _("RC/SAE operand must follow immediate operands");
6589 break;
6590 case invalid_register_operand:
6591 err_msg = _("invalid register operand");
6592 break;
6593 }
6594 as_bad (_("%s for `%s'"), err_msg,
6595 current_templates->start->name);
6596 return NULL;
6597 }
6598
6599 if (!quiet_warnings)
6600 {
6601 if (!intel_syntax
6602 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6603 as_warn (_("indirect %s without `*'"), t->name);
6604
6605 if (t->opcode_modifier.isprefix
6606 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6607 {
6608 /* Warn them that a data or address size prefix doesn't
6609 affect assembly of the next line of code. */
6610 as_warn (_("stand-alone `%s' prefix"), t->name);
6611 }
6612 }
6613
6614 /* Copy the template we found. */
6615 i.tm = *t;
6616
6617 if (addr_prefix_disp != -1)
6618 i.tm.operand_types[addr_prefix_disp]
6619 = operand_types[addr_prefix_disp];
6620
6621 if (found_reverse_match)
6622 {
6623 /* If we found a reverse match we must alter the opcode direction
6624 bit and clear/flip the regmem modifier one. found_reverse_match
6625 holds bits to change (different for int & float insns). */
6626
6627 i.tm.base_opcode ^= found_reverse_match;
6628
6629 i.tm.operand_types[0] = operand_types[i.operands - 1];
6630 i.tm.operand_types[i.operands - 1] = operand_types[0];
6631
6632 /* Certain SIMD insns have their load forms specified in the opcode
6633 table, and hence we need to _set_ RegMem instead of clearing it.
6634 We need to avoid setting the bit though on insns like KMOVW. */
6635 i.tm.opcode_modifier.regmem
6636 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6637 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6638 && !i.tm.opcode_modifier.regmem;
6639 }
6640
6641 return t;
6642 }
6643
6644 static int
6645 check_string (void)
6646 {
6647 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6648 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6649
6650 if (i.seg[op] != NULL && i.seg[op] != &es)
6651 {
6652 as_bad (_("`%s' operand %u must use `%ses' segment"),
6653 i.tm.name,
6654 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6655 register_prefix);
6656 return 0;
6657 }
6658
6659 /* There's only ever one segment override allowed per instruction.
6660 This instruction possibly has a legal segment override on the
6661 second operand, so copy the segment to where non-string
6662 instructions store it, allowing common code. */
6663 i.seg[op] = i.seg[1];
6664
6665 return 1;
6666 }
6667
6668 static int
6669 process_suffix (void)
6670 {
6671 /* If matched instruction specifies an explicit instruction mnemonic
6672 suffix, use it. */
6673 if (i.tm.opcode_modifier.size == SIZE16)
6674 i.suffix = WORD_MNEM_SUFFIX;
6675 else if (i.tm.opcode_modifier.size == SIZE32)
6676 i.suffix = LONG_MNEM_SUFFIX;
6677 else if (i.tm.opcode_modifier.size == SIZE64)
6678 i.suffix = QWORD_MNEM_SUFFIX;
6679 else if (i.reg_operands
6680 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6681 && !i.tm.opcode_modifier.addrprefixopreg)
6682 {
6683 unsigned int numop = i.operands;
6684
6685 /* movsx/movzx want only their source operand considered here, for the
6686 ambiguity checking below. The suffix will be replaced afterwards
6687 to represent the destination (register). */
6688 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6689 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6690 --i.operands;
6691
6692 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6693 if (i.tm.base_opcode == 0xf20f38f0
6694 && i.tm.operand_types[1].bitfield.qword)
6695 i.rex |= REX_W;
6696
6697 /* If there's no instruction mnemonic suffix we try to invent one
6698 based on GPR operands. */
6699 if (!i.suffix)
6700 {
6701 /* We take i.suffix from the last register operand specified.
6702 The destination register type is more significant than the
6703 source register type. crc32 in SSE4.2 prefers the source
6704 register type. */
6705 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6706
6707 while (op--)
6708 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6709 || i.tm.operand_types[op].bitfield.instance == Accum)
6710 {
6711 if (i.types[op].bitfield.class != Reg)
6712 continue;
6713 if (i.types[op].bitfield.byte)
6714 i.suffix = BYTE_MNEM_SUFFIX;
6715 else if (i.types[op].bitfield.word)
6716 i.suffix = WORD_MNEM_SUFFIX;
6717 else if (i.types[op].bitfield.dword)
6718 i.suffix = LONG_MNEM_SUFFIX;
6719 else if (i.types[op].bitfield.qword)
6720 i.suffix = QWORD_MNEM_SUFFIX;
6721 else
6722 continue;
6723 break;
6724 }
6725
6726 /* As an exception, movsx/movzx silently default to a byte source
6727 in AT&T mode. */
6728 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6729 && !i.suffix && !intel_syntax)
6730 i.suffix = BYTE_MNEM_SUFFIX;
6731 }
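	  /* E.g. (illustrative): "mov %ax, %bx" carries no suffix, and
	     the destination being a 16-bit register yields
	     WORD_MNEM_SUFFIX here; bare AT&T movsx/movzx fall back to a
	     byte source as noted above.  */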
6732 else if (i.suffix == BYTE_MNEM_SUFFIX)
6733 {
6734 if (intel_syntax
6735 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6736 && i.tm.opcode_modifier.no_bsuf)
6737 i.suffix = 0;
6738 else if (!check_byte_reg ())
6739 return 0;
6740 }
6741 else if (i.suffix == LONG_MNEM_SUFFIX)
6742 {
6743 if (intel_syntax
6744 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6745 && i.tm.opcode_modifier.no_lsuf
6746 && !i.tm.opcode_modifier.todword
6747 && !i.tm.opcode_modifier.toqword)
6748 i.suffix = 0;
6749 else if (!check_long_reg ())
6750 return 0;
6751 }
6752 else if (i.suffix == QWORD_MNEM_SUFFIX)
6753 {
6754 if (intel_syntax
6755 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6756 && i.tm.opcode_modifier.no_qsuf
6757 && !i.tm.opcode_modifier.todword
6758 && !i.tm.opcode_modifier.toqword)
6759 i.suffix = 0;
6760 else if (!check_qword_reg ())
6761 return 0;
6762 }
6763 else if (i.suffix == WORD_MNEM_SUFFIX)
6764 {
6765 if (intel_syntax
6766 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6767 && i.tm.opcode_modifier.no_wsuf)
6768 i.suffix = 0;
6769 else if (!check_word_reg ())
6770 return 0;
6771 }
6772 else if (intel_syntax
6773 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6774 /* Do nothing if the instruction is going to ignore the prefix. */
6775 ;
6776 else
6777 abort ();
6778
6779 /* Undo the movsx/movzx change done above. */
6780 i.operands = numop;
6781 }
6782 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6783 && !i.suffix)
6784 {
6785 i.suffix = stackop_size;
6786 if (stackop_size == LONG_MNEM_SUFFIX)
6787 {
6788 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6789 .code16gcc directive to support 16-bit mode with
6790 32-bit address. For IRET without a suffix, generate
6791 16-bit IRET (opcode 0xcf) to return from an interrupt
6792 handler. */
6793 if (i.tm.base_opcode == 0xcf)
6794 {
6795 i.suffix = WORD_MNEM_SUFFIX;
6796 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6797 }
6798 /* Warn about changed behavior for segment register push/pop. */
6799 else if ((i.tm.base_opcode | 1) == 0x07)
6800 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6801 i.tm.name);
6802 }
6803 }
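  /* Illustration (hedged): under ".code16gcc", a bare "iret" is thus
     kept 16-bit with a warning, while a suffix-less segment register
     push/pop now defaults to the 32-bit form, again with a warning.  */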
6804 else if (!i.suffix
6805 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6806 || i.tm.opcode_modifier.jump == JUMP_BYTE
6807 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6808 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6809 && i.tm.extension_opcode <= 3)))
6810 {
6811 switch (flag_code)
6812 {
6813 case CODE_64BIT:
6814 if (!i.tm.opcode_modifier.no_qsuf)
6815 {
6816 i.suffix = QWORD_MNEM_SUFFIX;
6817 break;
6818 }
6819 /* Fall through. */
6820 case CODE_32BIT:
6821 if (!i.tm.opcode_modifier.no_lsuf)
6822 i.suffix = LONG_MNEM_SUFFIX;
6823 break;
6824 case CODE_16BIT:
6825 if (!i.tm.opcode_modifier.no_wsuf)
6826 i.suffix = WORD_MNEM_SUFFIX;
6827 break;
6828 }
6829 }
6830
6831 if (!i.suffix
6832 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6833 /* Also cover lret/retf/iret in 64-bit mode. */
6834 || (flag_code == CODE_64BIT
6835 && !i.tm.opcode_modifier.no_lsuf
6836 && !i.tm.opcode_modifier.no_qsuf))
6837 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6838 /* Accept FLDENV et al without suffix. */
6839 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6840 {
6841 unsigned int suffixes, evex = 0;
6842
6843 suffixes = !i.tm.opcode_modifier.no_bsuf;
6844 if (!i.tm.opcode_modifier.no_wsuf)
6845 suffixes |= 1 << 1;
6846 if (!i.tm.opcode_modifier.no_lsuf)
6847 suffixes |= 1 << 2;
6848 if (!i.tm.opcode_modifier.no_ldsuf)
6849 suffixes |= 1 << 3;
6850 if (!i.tm.opcode_modifier.no_ssuf)
6851 suffixes |= 1 << 4;
6852 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6853 suffixes |= 1 << 5;
6854
6855 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6856 also suitable for AT&T syntax mode, it was requested that this be
6857 restricted to just Intel syntax. */
6858 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6859 {
6860 unsigned int op;
6861
6862 for (op = 0; op < i.tm.operands; ++op)
6863 {
6864 if (is_evex_encoding (&i.tm)
6865 && !cpu_arch_flags.bitfield.cpuavx512vl)
6866 {
6867 if (i.tm.operand_types[op].bitfield.ymmword)
6868 i.tm.operand_types[op].bitfield.xmmword = 0;
6869 if (i.tm.operand_types[op].bitfield.zmmword)
6870 i.tm.operand_types[op].bitfield.ymmword = 0;
6871 if (!i.tm.opcode_modifier.evex
6872 || i.tm.opcode_modifier.evex == EVEXDYN)
6873 i.tm.opcode_modifier.evex = EVEX512;
6874 }
6875
6876 if (i.tm.operand_types[op].bitfield.xmmword
6877 + i.tm.operand_types[op].bitfield.ymmword
6878 + i.tm.operand_types[op].bitfield.zmmword < 2)
6879 continue;
6880
6881 /* Any properly sized operand disambiguates the insn. */
6882 if (i.types[op].bitfield.xmmword
6883 || i.types[op].bitfield.ymmword
6884 || i.types[op].bitfield.zmmword)
6885 {
6886 suffixes &= ~(7 << 6);
6887 evex = 0;
6888 break;
6889 }
6890
6891 if ((i.flags[op] & Operand_Mem)
6892 && i.tm.operand_types[op].bitfield.unspecified)
6893 {
6894 if (i.tm.operand_types[op].bitfield.xmmword)
6895 suffixes |= 1 << 6;
6896 if (i.tm.operand_types[op].bitfield.ymmword)
6897 suffixes |= 1 << 7;
6898 if (i.tm.operand_types[op].bitfield.zmmword)
6899 suffixes |= 1 << 8;
6900 if (is_evex_encoding (&i.tm))
6901 evex = EVEX512;
6902 }
6903 }
6904 }
6905
6906 /* Are multiple suffixes / operand sizes allowed? */
6907 if (suffixes & (suffixes - 1))
6908 {
6909 if (intel_syntax
6910 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6911 || operand_check == check_error))
6912 {
6913 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6914 return 0;
6915 }
6916 if (operand_check == check_error)
6917 {
6918 as_bad (_("no instruction mnemonic suffix given and "
6919 "no register operands; can't size `%s'"), i.tm.name);
6920 return 0;
6921 }
6922 if (operand_check == check_warning)
6923 as_warn (_("%s; using default for `%s'"),
6924 intel_syntax
6925 ? _("ambiguous operand size")
6926 : _("no instruction mnemonic suffix given and "
6927 "no register operands"),
6928 i.tm.name);
6929
6930 if (i.tm.opcode_modifier.floatmf)
6931 i.suffix = SHORT_MNEM_SUFFIX;
6932 else if ((i.tm.base_opcode | 8) == 0xfbe
6933 || (i.tm.base_opcode == 0x63
6934 && i.tm.cpu_flags.bitfield.cpu64))
6935 /* handled below */;
6936 else if (evex)
6937 i.tm.opcode_modifier.evex = evex;
6938 else if (flag_code == CODE_16BIT)
6939 i.suffix = WORD_MNEM_SUFFIX;
6940 else if (!i.tm.opcode_modifier.no_lsuf)
6941 i.suffix = LONG_MNEM_SUFFIX;
6942 else
6943 i.suffix = QWORD_MNEM_SUFFIX;
6944 }
6945 }
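  /* E.g. (illustrative): AT&T "fldenv (%eax)" permits both the 's' and
     'l' layouts, so SUFFIXES has two bits set; per the FloatMF branch
     above the 's' (SHORT_MNEM_SUFFIX) default is then chosen, possibly
     after a diagnostic depending on operand_check.  */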
6946
6947 if ((i.tm.base_opcode | 8) == 0xfbe
6948 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6949 {
6950 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
6951 In AT&T syntax, if there is no suffix (warned about above), the default
6952 will be byte extension. */
6953 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
6954 i.tm.base_opcode |= 1;
6955
6956 /* For further processing, the suffix should represent the destination
6957 (register). This is already the case when one was used with
6958 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
6959 no suffix to begin with. */
6960 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
6961 {
6962 if (i.types[1].bitfield.word)
6963 i.suffix = WORD_MNEM_SUFFIX;
6964 else if (i.types[1].bitfield.qword)
6965 i.suffix = QWORD_MNEM_SUFFIX;
6966 else
6967 i.suffix = LONG_MNEM_SUFFIX;
6968
6969 i.tm.opcode_modifier.w = 0;
6970 }
6971 }
6972
6973 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
6974 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
6975 != (i.tm.operand_types[1].bitfield.class == Reg);
6976
6977 /* Change the opcode based on the operand size given by i.suffix. */
6978 switch (i.suffix)
6979 {
6980 /* Size floating point instruction. */
6981 case LONG_MNEM_SUFFIX:
6982 if (i.tm.opcode_modifier.floatmf)
6983 {
6984 i.tm.base_opcode ^= 4;
6985 break;
6986 }
6987 /* fall through */
6988 case WORD_MNEM_SUFFIX:
6989 case QWORD_MNEM_SUFFIX:
6990 /* It's not a byte, select word/dword operation. */
6991 if (i.tm.opcode_modifier.w)
6992 {
6993 if (i.short_form)
6994 i.tm.base_opcode |= 8;
6995 else
6996 i.tm.base_opcode |= 1;
6997 }
6998 /* fall through */
6999 case SHORT_MNEM_SUFFIX:
7000 /* Now select between word & dword operations via the operand
7001 size prefix, except for instructions that will ignore this
7002 prefix anyway. */
7003 if (i.suffix != QWORD_MNEM_SUFFIX
7004 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7005 && !i.tm.opcode_modifier.floatmf
7006 && !is_any_vex_encoding (&i.tm)
7007 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7008 || (flag_code == CODE_64BIT
7009 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7010 {
7011 unsigned int prefix = DATA_PREFIX_OPCODE;
7012
7013 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7014 prefix = ADDR_PREFIX_OPCODE;
7015
7016 if (!add_prefix (prefix))
7017 return 0;
7018 }
7019
7020 /* Set mode64 for an operand. */
7021 if (i.suffix == QWORD_MNEM_SUFFIX
7022 && flag_code == CODE_64BIT
7023 && !i.tm.opcode_modifier.norex64
7024 && !i.tm.opcode_modifier.vexw
7025 /* Special case for xchg %rax,%rax. It is a NOP and doesn't
7026 need rex64. */
7027 && ! (i.operands == 2
7028 && i.tm.base_opcode == 0x90
7029 && i.tm.extension_opcode == None
7030 && i.types[0].bitfield.instance == Accum
7031 && i.types[0].bitfield.qword
7032 && i.types[1].bitfield.instance == Accum
7033 && i.types[1].bitfield.qword))
7034 i.rex |= REX_W;
7035
7036 break;
7037 }
7038
7039 if (i.tm.opcode_modifier.addrprefixopreg)
7040 {
7041 gas_assert (!i.suffix);
7042 gas_assert (i.reg_operands);
7043
7044 if (i.tm.operand_types[0].bitfield.instance == Accum
7045 || i.operands == 1)
7046 {
7047 /* The address size override prefix changes the size of the
7048 first operand. */
7049 if (flag_code == CODE_64BIT
7050 && i.op[0].regs->reg_type.bitfield.word)
7051 {
7052 as_bad (_("16-bit addressing unavailable for `%s'"),
7053 i.tm.name);
7054 return 0;
7055 }
7056
7057 if ((flag_code == CODE_32BIT
7058 ? i.op[0].regs->reg_type.bitfield.word
7059 : i.op[0].regs->reg_type.bitfield.dword)
7060 && !add_prefix (ADDR_PREFIX_OPCODE))
7061 return 0;
7062 }
7063 else
7064 {
7065 /* Check invalid register operand when the address size override
7066 prefix changes the size of register operands. */
7067 unsigned int op;
7068 enum { need_word, need_dword, need_qword } need;
7069
7070 if (flag_code == CODE_32BIT)
7071 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7072 else if (i.prefix[ADDR_PREFIX])
7073 need = need_dword;
7074 else
7075 need = flag_code == CODE_64BIT ? need_qword : need_word;
7076
7077 for (op = 0; op < i.operands; op++)
7078 {
7079 if (i.types[op].bitfield.class != Reg)
7080 continue;
7081
7082 switch (need)
7083 {
7084 case need_word:
7085 if (i.op[op].regs->reg_type.bitfield.word)
7086 continue;
7087 break;
7088 case need_dword:
7089 if (i.op[op].regs->reg_type.bitfield.dword)
7090 continue;
7091 break;
7092 case need_qword:
7093 if (i.op[op].regs->reg_type.bitfield.qword)
7094 continue;
7095 break;
7096 }
7097
7098 as_bad (_("invalid register operand size for `%s'"),
7099 i.tm.name);
7100 return 0;
7101 }
7102 }
7103 }
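  /* Illustration (an assumption about the opcode table: clzero is one
     such AddrPrefixOpReg template): in 64-bit mode "clzero %eax" would
     get a 0x67 address size prefix via the Accum path above, while a
     16-bit register operand is rejected outright.  */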
7104
7105 return 1;
7106 }
7107
7108 static int
7109 check_byte_reg (void)
7110 {
7111 int op;
7112
7113 for (op = i.operands; --op >= 0;)
7114 {
7115 /* Skip non-register operands. */
7116 if (i.types[op].bitfield.class != Reg)
7117 continue;
7118
7119 /* If this is an eight bit register, it's OK. Wider general
7120 registers are rejected below, apart from the special cases
7121 (I/O port and crc32 source operands) that follow. */
7122 if (i.types[op].bitfield.byte)
7123 continue;
7124
7125 /* I/O port address operands are OK too. */
7126 if (i.tm.operand_types[op].bitfield.instance == RegD
7127 && i.tm.operand_types[op].bitfield.word)
7128 continue;
7129
7130 /* crc32 only wants its source operand checked here. */
7131 if (i.tm.base_opcode == 0xf20f38f0 && op)
7132 continue;
7133
7134 /* Any other register is bad. */
7135 as_bad (_("`%s%s' not allowed with `%s%c'"),
7136 register_prefix, i.op[op].regs->reg_name,
7137 i.tm.name, i.suffix);
7138 return 0;
7139 }
7140 return 1;
7141 }
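/* Illustration of the checks above (hedged): "addb %al, (%rsi)" passes;
   "inb %dx, %al" passes via the RegD/word port special case; crc32 only
   has its source operand vetted; anything else, e.g. "addb %eax, (%rsi)",
   is diagnosed.  */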
7142
7143 static int
7144 check_long_reg (void)
7145 {
7146 int op;
7147
7148 for (op = i.operands; --op >= 0;)
7149 /* Skip non-register operands. */
7150 if (i.types[op].bitfield.class != Reg)
7151 continue;
7152 /* Reject eight bit registers, except where the template requires
7153 them (e.g. movzb). */
7154 else if (i.types[op].bitfield.byte
7155 && (i.tm.operand_types[op].bitfield.class == Reg
7156 || i.tm.operand_types[op].bitfield.instance == Accum)
7157 && (i.tm.operand_types[op].bitfield.word
7158 || i.tm.operand_types[op].bitfield.dword))
7159 {
7160 as_bad (_("`%s%s' not allowed with `%s%c'"),
7161 register_prefix,
7162 i.op[op].regs->reg_name,
7163 i.tm.name,
7164 i.suffix);
7165 return 0;
7166 }
7167 /* Error if the e prefix on a general reg is missing. */
7168 else if (i.types[op].bitfield.word
7169 && (i.tm.operand_types[op].bitfield.class == Reg
7170 || i.tm.operand_types[op].bitfield.instance == Accum)
7171 && i.tm.operand_types[op].bitfield.dword)
7172 {
7173 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7174 register_prefix, i.op[op].regs->reg_name,
7175 i.suffix);
7176 return 0;
7177 }
7178 /* Warn if the r prefix on a general reg is present. */
7179 else if (i.types[op].bitfield.qword
7180 && (i.tm.operand_types[op].bitfield.class == Reg
7181 || i.tm.operand_types[op].bitfield.instance == Accum)
7182 && i.tm.operand_types[op].bitfield.dword)
7183 {
7184 if (intel_syntax
7185 && i.tm.opcode_modifier.toqword
7186 && i.types[0].bitfield.class != RegSIMD)
7187 {
7188 /* Convert to QWORD. We want REX byte. */
7189 i.suffix = QWORD_MNEM_SUFFIX;
7190 }
7191 else
7192 {
7193 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7194 register_prefix, i.op[op].regs->reg_name,
7195 i.suffix);
7196 return 0;
7197 }
7198 }
7199 return 1;
7200 }
7201
7202 static int
7203 check_qword_reg (void)
7204 {
7205 int op;
7206
7207 for (op = i.operands; --op >= 0; )
7208 /* Skip non-register operands. */
7209 if (i.types[op].bitfield.class != Reg)
7210 continue;
7211 /* Reject eight bit registers, except where the template requires
7212 them (e.g. movzb). */
7213 else if (i.types[op].bitfield.byte
7214 && (i.tm.operand_types[op].bitfield.class == Reg
7215 || i.tm.operand_types[op].bitfield.instance == Accum)
7216 && (i.tm.operand_types[op].bitfield.word
7217 || i.tm.operand_types[op].bitfield.dword))
7218 {
7219 as_bad (_("`%s%s' not allowed with `%s%c'"),
7220 register_prefix,
7221 i.op[op].regs->reg_name,
7222 i.tm.name,
7223 i.suffix);
7224 return 0;
7225 }
7226 /* Warn if the r prefix on a general reg is missing. */
7227 else if ((i.types[op].bitfield.word
7228 || i.types[op].bitfield.dword)
7229 && (i.tm.operand_types[op].bitfield.class == Reg
7230 || i.tm.operand_types[op].bitfield.instance == Accum)
7231 && i.tm.operand_types[op].bitfield.qword)
7232 {
7233 /* Prohibit these changes in 64-bit mode, since the lowering
7234 is more complicated. */
7235 if (intel_syntax
7236 && i.tm.opcode_modifier.todword
7237 && i.types[0].bitfield.class != RegSIMD)
7238 {
7239 /* Convert to DWORD. We don't want REX byte. */
7240 i.suffix = LONG_MNEM_SUFFIX;
7241 }
7242 else
7243 {
7244 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7245 register_prefix, i.op[op].regs->reg_name,
7246 i.suffix);
7247 return 0;
7248 }
7249 }
7250 return 1;
7251 }
7252
7253 static int
7254 check_word_reg (void)
7255 {
7256 int op;
7257 for (op = i.operands; --op >= 0;)
7258 /* Skip non-register operands. */
7259 if (i.types[op].bitfield.class != Reg)
7260 continue;
7261 /* Reject eight bit registers, except where the template requires
7262 them (e.g. movzb). */
7263 else if (i.types[op].bitfield.byte
7264 && (i.tm.operand_types[op].bitfield.class == Reg
7265 || i.tm.operand_types[op].bitfield.instance == Accum)
7266 && (i.tm.operand_types[op].bitfield.word
7267 || i.tm.operand_types[op].bitfield.dword))
7268 {
7269 as_bad (_("`%s%s' not allowed with `%s%c'"),
7270 register_prefix,
7271 i.op[op].regs->reg_name,
7272 i.tm.name,
7273 i.suffix);
7274 return 0;
7275 }
7276 /* Error if the e or r prefix on a general reg is present. */
7277 else if ((i.types[op].bitfield.dword
7278 || i.types[op].bitfield.qword)
7279 && (i.tm.operand_types[op].bitfield.class == Reg
7280 || i.tm.operand_types[op].bitfield.instance == Accum)
7281 && i.tm.operand_types[op].bitfield.word)
7282 {
7283 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7284 register_prefix, i.op[op].regs->reg_name,
7285 i.suffix);
7286 return 0;
7287 }
7288 return 1;
7289 }
7290
7291 static int
7292 update_imm (unsigned int j)
7293 {
7294 i386_operand_type overlap = i.types[j];
7295 if ((overlap.bitfield.imm8
7296 || overlap.bitfield.imm8s
7297 || overlap.bitfield.imm16
7298 || overlap.bitfield.imm32
7299 || overlap.bitfield.imm32s
7300 || overlap.bitfield.imm64)
7301 && !operand_type_equal (&overlap, &imm8)
7302 && !operand_type_equal (&overlap, &imm8s)
7303 && !operand_type_equal (&overlap, &imm16)
7304 && !operand_type_equal (&overlap, &imm32)
7305 && !operand_type_equal (&overlap, &imm32s)
7306 && !operand_type_equal (&overlap, &imm64))
7307 {
7308 if (i.suffix)
7309 {
7310 i386_operand_type temp;
7311
7312 operand_type_set (&temp, 0);
7313 if (i.suffix == BYTE_MNEM_SUFFIX)
7314 {
7315 temp.bitfield.imm8 = overlap.bitfield.imm8;
7316 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7317 }
7318 else if (i.suffix == WORD_MNEM_SUFFIX)
7319 temp.bitfield.imm16 = overlap.bitfield.imm16;
7320 else if (i.suffix == QWORD_MNEM_SUFFIX)
7321 {
7322 temp.bitfield.imm64 = overlap.bitfield.imm64;
7323 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7324 }
7325 else
7326 temp.bitfield.imm32 = overlap.bitfield.imm32;
7327 overlap = temp;
7328 }
7329 else if (operand_type_equal (&overlap, &imm16_32_32s)
7330 || operand_type_equal (&overlap, &imm16_32)
7331 || operand_type_equal (&overlap, &imm16_32s))
7332 {
7333 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7334 overlap = imm16;
7335 else
7336 overlap = imm32s;
7337 }
7338 if (!operand_type_equal (&overlap, &imm8)
7339 && !operand_type_equal (&overlap, &imm8s)
7340 && !operand_type_equal (&overlap, &imm16)
7341 && !operand_type_equal (&overlap, &imm32)
7342 && !operand_type_equal (&overlap, &imm32s)
7343 && !operand_type_equal (&overlap, &imm64))
7344 {
7345 as_bad (_("no instruction mnemonic suffix given; "
7346 "can't determine immediate size"));
7347 return 0;
7348 }
7349 }
7350 i.types[j] = overlap;
7351
7352 return 1;
7353 }
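/* E.g. (illustrative): "addw $0x1234, %ax" reaches update_imm with
   several ImmN bits still set and the 'w' suffix narrows the overlap to
   Imm16; without a suffix, a leftover Imm16|Imm32|Imm32S overlap
   collapses to Imm16 or Imm32S depending on mode and data prefix, as
   coded above.  */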
7354
7355 static int
7356 finalize_imm (void)
7357 {
7358 unsigned int j, n;
7359
7360 /* Update the first 2 immediate operands. */
7361 n = i.operands > 2 ? 2 : i.operands;
7362 if (n)
7363 {
7364 for (j = 0; j < n; j++)
7365 if (update_imm (j) == 0)
7366 return 0;
7367
7368 /* The 3rd operand can't be an immediate operand. */
7369 gas_assert (operand_type_check (i.types[2], imm) == 0);
7370 }
7371
7372 return 1;
7373 }
7374
7375 static int
7376 process_operands (void)
7377 {
7378 /* Default segment register this instruction will use for memory
7379 accesses. 0 means unknown. This is only for optimizing out
7380 unnecessary segment overrides. */
7381 const seg_entry *default_seg = 0;
7382
7383 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7384 {
7385 unsigned int dupl = i.operands;
7386 unsigned int dest = dupl - 1;
7387 unsigned int j;
7388
7389 /* The destination must be an xmm register. */
7390 gas_assert (i.reg_operands
7391 && MAX_OPERANDS > dupl
7392 && operand_type_equal (&i.types[dest], &regxmm));
7393
7394 if (i.tm.operand_types[0].bitfield.instance == Accum
7395 && i.tm.operand_types[0].bitfield.xmmword)
7396 {
7397 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7398 {
7399 /* Keep xmm0 for instructions with VEX prefix and 3
7400 sources. */
7401 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7402 i.tm.operand_types[0].bitfield.class = RegSIMD;
7403 goto duplicate;
7404 }
7405 else
7406 {
7407 /* We remove the first xmm0 and keep the number of
7408 operands unchanged, which in fact duplicates the
7409 destination. */
7410 for (j = 1; j < i.operands; j++)
7411 {
7412 i.op[j - 1] = i.op[j];
7413 i.types[j - 1] = i.types[j];
7414 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7415 i.flags[j - 1] = i.flags[j];
7416 }
7417 }
7418 }
7419 else if (i.tm.opcode_modifier.implicit1stxmm0)
7420 {
7421 gas_assert ((MAX_OPERANDS - 1) > dupl
7422 && (i.tm.opcode_modifier.vexsources
7423 == VEX3SOURCES));
7424
7425 /* Add the implicit xmm0 for instructions with VEX prefix
7426 and 3 sources. */
7427 for (j = i.operands; j > 0; j--)
7428 {
7429 i.op[j] = i.op[j - 1];
7430 i.types[j] = i.types[j - 1];
7431 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7432 i.flags[j] = i.flags[j - 1];
7433 }
7434 i.op[0].regs
7435 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7436 i.types[0] = regxmm;
7437 i.tm.operand_types[0] = regxmm;
7438
7439 i.operands += 2;
7440 i.reg_operands += 2;
7441 i.tm.operands += 2;
7442
7443 dupl++;
7444 dest++;
7445 i.op[dupl] = i.op[dest];
7446 i.types[dupl] = i.types[dest];
7447 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7448 i.flags[dupl] = i.flags[dest];
7449 }
7450 else
7451 {
7452 duplicate:
7453 i.operands++;
7454 i.reg_operands++;
7455 i.tm.operands++;
7456
7457 i.op[dupl] = i.op[dest];
7458 i.types[dupl] = i.types[dest];
7459 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7460 i.flags[dupl] = i.flags[dest];
7461 }
7462
7463 if (i.tm.opcode_modifier.immext)
7464 process_immext ();
7465 }
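  /* Illustration (hedged): with -msse2avx, SSE4.1 "blendvps %xmm1, %xmm2"
     takes the VEX3SOURCES path above - the implicit %xmm0 mask is kept
     as an explicit operand and the destination is duplicated, as if
     "vblendvps %xmm0, %xmm1, %xmm2, %xmm2" had been written.  */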
7466 else if (i.tm.operand_types[0].bitfield.instance == Accum
7467 && i.tm.operand_types[0].bitfield.xmmword)
7468 {
7469 unsigned int j;
7470
7471 for (j = 1; j < i.operands; j++)
7472 {
7473 i.op[j - 1] = i.op[j];
7474 i.types[j - 1] = i.types[j];
7475
7476 /* We need to adjust fields in i.tm since they are used by
7477 build_modrm_byte. */
7478 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7479
7480 i.flags[j - 1] = i.flags[j];
7481 }
7482
7483 i.operands--;
7484 i.reg_operands--;
7485 i.tm.operands--;
7486 }
7487 else if (i.tm.opcode_modifier.implicitquadgroup)
7488 {
7489 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7490
7491 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7492 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7493 regnum = register_number (i.op[1].regs);
7494 first_reg_in_group = regnum & ~3;
7495 last_reg_in_group = first_reg_in_group + 3;
7496 if (regnum != first_reg_in_group)
7497 as_warn (_("source register `%s%s' implicitly denotes"
7498 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7499 register_prefix, i.op[1].regs->reg_name,
7500 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7501 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7502 i.tm.name);
7503 }
7504 else if (i.tm.opcode_modifier.regkludge)
7505 {
7506 /* The imul $imm, %reg instruction is converted into
7507 imul $imm, %reg, %reg, and the clr %reg instruction
7508 is converted into xor %reg, %reg. */
7509
7510 unsigned int first_reg_op;
7511
7512 if (operand_type_check (i.types[0], reg))
7513 first_reg_op = 0;
7514 else
7515 first_reg_op = 1;
7516 /* Pretend we saw the extra register operand. */
7517 gas_assert (i.reg_operands == 1
7518 && i.op[first_reg_op + 1].regs == 0);
7519 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7520 i.types[first_reg_op + 1] = i.types[first_reg_op];
7521 i.operands++;
7522 i.reg_operands++;
7523 }
7524
7525 if (i.tm.opcode_modifier.modrm)
7526 {
7527 /* The opcode is completed (modulo i.tm.extension_opcode which
7528 must be put into the modrm byte). Now, we make the modrm and
7529 index base bytes based on all the info we've collected. */
7530
7531 default_seg = build_modrm_byte ();
7532 }
7533 else if (i.types[0].bitfield.class == SReg)
7534 {
7535 if (flag_code != CODE_64BIT
7536 ? i.tm.base_opcode == POP_SEG_SHORT
7537 && i.op[0].regs->reg_num == 1
7538 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7539 && i.op[0].regs->reg_num < 4)
7540 {
7541 as_bad (_("you can't `%s %s%s'"),
7542 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7543 return 0;
7544 }
7545 if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7546 {
7547 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7548 i.tm.opcode_length = 2;
7549 }
7550 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7551 }
7552 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7553 {
7554 default_seg = &ds;
7555 }
7556 else if (i.tm.opcode_modifier.isstring)
7557 {
7558 /* For the string instructions that allow a segment override
7559 on one of their operands, the default segment is ds. */
7560 default_seg = &ds;
7561 }
7562 else if (i.short_form)
7563 {
7564 /* The register or float register operand is in operand
7565 0 or 1. */
7566 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7567
7568 /* Register goes in low 3 bits of opcode. */
7569 i.tm.base_opcode |= i.op[op].regs->reg_num;
7570 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7571 i.rex |= REX_B;
7572 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7573 {
7574 /* Warn about some common errors, but press on regardless.
7575 The first case can be generated by gcc (<= 2.8.1). */
7576 if (i.operands == 2)
7577 {
7578 /* Reversed arguments on faddp, fsubp, etc. */
7579 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7580 register_prefix, i.op[!intel_syntax].regs->reg_name,
7581 register_prefix, i.op[intel_syntax].regs->reg_name);
7582 }
7583 else
7584 {
7585 /* Extraneous `l' suffix on fp insn. */
7586 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7587 register_prefix, i.op[0].regs->reg_name);
7588 }
7589 }
7590 }
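  /* E.g. (illustrative): "push %rbp" takes this short form, OR-ing the
     register number into the opcode (0x50 | 5 == 0x55); "push %r12"
     additionally sets REX.B via the RegRex check above.  */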
7591
7592 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7593 && i.tm.base_opcode == 0x8d /* lea */
7594 && !is_any_vex_encoding(&i.tm))
7595 {
7596 if (!quiet_warnings)
7597 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7598 if (optimize)
7599 {
7600 i.seg[0] = NULL;
7601 i.prefix[SEG_PREFIX] = 0;
7602 }
7603 }
7604
7605 /* If a segment was explicitly specified, and the specified segment
7606 is neither the default nor the one already recorded from a prefix,
7607 use an opcode prefix to select it. If we never figured out what
7608 the default segment is, then default_seg will be zero at this
7609 point, and the specified segment prefix will always be used. */
7610 if (i.seg[0]
7611 && i.seg[0] != default_seg
7612 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7613 {
7614 if (!add_prefix (i.seg[0]->seg_prefix))
7615 return 0;
7616 }
7617 return 1;
7618 }
7619
7620 static const seg_entry *
7621 build_modrm_byte (void)
7622 {
7623 const seg_entry *default_seg = 0;
7624 unsigned int source, dest;
7625 int vex_3_sources;
7626
7627 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7628 if (vex_3_sources)
7629 {
7630 unsigned int nds, reg_slot;
7631 expressionS *exp;
7632
7633 dest = i.operands - 1;
7634 nds = dest - 1;
7635
7636 /* There are 2 kinds of instructions:
7637 1. 5 operands: 4 register operands or 3 register operands
7638 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7639 VexW0 or VexW1. The destination must be either XMM, YMM or
7640 ZMM register.
7641 2. 4 operands: 4 register operands or 3 register operands
7642 plus 1 memory operand, with VexXDS. */
7643 gas_assert ((i.reg_operands == 4
7644 || (i.reg_operands == 3 && i.mem_operands == 1))
7645 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7646 && i.tm.opcode_modifier.vexw
7647 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7648
7649 /* If VexW1 is set, the first non-immediate operand is the source and
7650 the second non-immediate one is encoded in the immediate operand. */
7651 if (i.tm.opcode_modifier.vexw == VEXW1)
7652 {
7653 source = i.imm_operands;
7654 reg_slot = i.imm_operands + 1;
7655 }
7656 else
7657 {
7658 source = i.imm_operands + 1;
7659 reg_slot = i.imm_operands;
7660 }
7661
7662 if (i.imm_operands == 0)
7663 {
7664 /* When there is no immediate operand, generate an 8bit
7665 immediate operand to encode the register in REG_SLOT. */
7666 exp = &im_expressions[i.imm_operands++];
7667 i.op[i.operands].imms = exp;
7668 i.types[i.operands] = imm8;
7669 i.operands++;
7670
7671 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7672 exp->X_op = O_constant;
7673 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7674 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7675 }
7676 else
7677 {
7678 gas_assert (i.imm_operands == 1);
7679 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7680 gas_assert (!i.tm.opcode_modifier.immext);
7681
7682 /* Turn on Imm8 again so that output_imm will generate it. */
7683 i.types[0].bitfield.imm8 = 1;
7684
7685 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7686 i.op[0].imms->X_add_number
7687 |= register_number (i.op[reg_slot].regs) << 4;
7688 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7689 }
7690
7691 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7692 i.vex.register_specifier = i.op[nds].regs;
7693 }
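  /* Illustration (hedged): for "vblendvps %xmm4, %xmm3, %xmm2, %xmm1"
     (a VEX.W0 insn) REG_SLOT selects %xmm4, whose register number is
     placed in bits 7:4 of the synthesized imm8, matching the is4 byte
     of the encoding.  */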
7694 else
7695 source = dest = 0;
7696
7697 /* i.reg_operands MUST be the number of real register operands;
7698 implicit registers do not count. If there are 3 register
7699 operands, it must be an instruction with VexNDS. For an
7700 instruction with VexNDD, the destination register is encoded
7701 in the VEX prefix. If there are 4 register operands, it must
7702 be an instruction with a VEX prefix and 3 sources. */
7703 if (i.mem_operands == 0
7704 && ((i.reg_operands == 2
7705 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7706 || (i.reg_operands == 3
7707 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7708 || (i.reg_operands == 4 && vex_3_sources)))
7709 {
7710 switch (i.operands)
7711 {
7712 case 2:
7713 source = 0;
7714 break;
7715 case 3:
7716 /* When there are 3 operands, one of them may be an immediate
7717 operand, which may be the first or the last operand. Otherwise,
7718 the first operand must be the shift count register (cl) or it
7719 is an instruction with VexNDS. */
7720 gas_assert (i.imm_operands == 1
7721 || (i.imm_operands == 0
7722 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7723 || (i.types[0].bitfield.instance == RegC
7724 && i.types[0].bitfield.byte))));
7725 if (operand_type_check (i.types[0], imm)
7726 || (i.types[0].bitfield.instance == RegC
7727 && i.types[0].bitfield.byte))
7728 source = 1;
7729 else
7730 source = 0;
7731 break;
7732 case 4:
7733 /* When there are 4 operands, the first two must be 8bit
7734 immediate operands. The source operand will be the 3rd
7735 one.
7736
7737 	     For instructions with VexNDS, if the first operand is
7738 	     an imm8, the source operand is the 2nd one.  If the last
7739 operand is imm8, the source operand is the first one. */
7740 gas_assert ((i.imm_operands == 2
7741 && i.types[0].bitfield.imm8
7742 && i.types[1].bitfield.imm8)
7743 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7744 && i.imm_operands == 1
7745 && (i.types[0].bitfield.imm8
7746 || i.types[i.operands - 1].bitfield.imm8
7747 || i.rounding)));
7748 if (i.imm_operands == 2)
7749 source = 2;
7750 else
7751 {
7752 if (i.types[0].bitfield.imm8)
7753 source = 1;
7754 else
7755 source = 0;
7756 }
7757 break;
7758 case 5:
7759 if (is_evex_encoding (&i.tm))
7760 {
7761 /* For EVEX instructions, when there are 5 operands, the
7762 		 first one must be an immediate operand.  If the second one
7763 		 is an immediate operand, the source operand is the 3rd
7764 		 one.  If the last one is an immediate operand, the source
7765 		 operand is the 2nd one.  */
7766 gas_assert (i.imm_operands == 2
7767 && i.tm.opcode_modifier.sae
7768 && operand_type_check (i.types[0], imm));
7769 if (operand_type_check (i.types[1], imm))
7770 source = 2;
7771 else if (operand_type_check (i.types[4], imm))
7772 source = 1;
7773 else
7774 abort ();
7775 }
7776 break;
7777 default:
7778 abort ();
7779 }
7780
7781 if (!vex_3_sources)
7782 {
7783 dest = source + 1;
7784
7785 	  /* The RC/SAE operand could be between DEST and SRC.  That happens
7786 	     when one operand is a GPR and the other one is an XMM/YMM/ZMM
7787 	     register.  */
7788 if (i.rounding && i.rounding->operand == (int) dest)
7789 dest++;
7790
7791 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7792 {
7793 /* For instructions with VexNDS, the register-only source
7794 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7795 register. It is encoded in VEX prefix. */
7796
7797 i386_operand_type op;
7798 unsigned int vvvv;
7799
7800 /* Check register-only source operand when two source
7801 operands are swapped. */
7802 if (!i.tm.operand_types[source].bitfield.baseindex
7803 && i.tm.operand_types[dest].bitfield.baseindex)
7804 {
7805 vvvv = source;
7806 source = dest;
7807 }
7808 else
7809 vvvv = dest;
7810
7811 op = i.tm.operand_types[vvvv];
7812 if ((dest + 1) >= i.operands
7813 || ((op.bitfield.class != Reg
7814 || (!op.bitfield.dword && !op.bitfield.qword))
7815 && op.bitfield.class != RegSIMD
7816 && !operand_type_equal (&op, &regmask)))
7817 abort ();
7818 i.vex.register_specifier = i.op[vvvv].regs;
7819 dest++;
7820 }
7821 }
7822
7823 i.rm.mode = 3;
7824 /* One of the register operands will be encoded in the i.rm.reg
7825 field, the other in the combined i.rm.mode and i.rm.regmem
7826 fields. If no form of this instruction supports a memory
7827 destination operand, then we assume the source operand may
7828 sometimes be a memory operand and so we need to store the
7829 destination in the i.rm.reg field. */
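      /* E.g. for `mov %ebx, %ecx' (opcode 0x89) the destination
	 template does allow a memory operand, so the else branch below
	 applies: reg = %ebx (3), regmem = %ecx (1), mode = 3, giving
	 ModRM byte 0xd9.  */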
7830 if (!i.tm.opcode_modifier.regmem
7831 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7832 {
7833 i.rm.reg = i.op[dest].regs->reg_num;
7834 i.rm.regmem = i.op[source].regs->reg_num;
7835 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7836 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7837 i.has_regmmx = TRUE;
7838 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7839 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7840 {
7841 if (i.types[dest].bitfield.zmmword
7842 || i.types[source].bitfield.zmmword)
7843 i.has_regzmm = TRUE;
7844 else if (i.types[dest].bitfield.ymmword
7845 || i.types[source].bitfield.ymmword)
7846 i.has_regymm = TRUE;
7847 else
7848 i.has_regxmm = TRUE;
7849 }
7850 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7851 i.rex |= REX_R;
7852 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7853 i.vrex |= REX_R;
7854 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7855 i.rex |= REX_B;
7856 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7857 i.vrex |= REX_B;
7858 }
7859 else
7860 {
7861 i.rm.reg = i.op[source].regs->reg_num;
7862 i.rm.regmem = i.op[dest].regs->reg_num;
7863 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7864 i.rex |= REX_B;
7865 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7866 i.vrex |= REX_B;
7867 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7868 i.rex |= REX_R;
7869 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7870 i.vrex |= REX_R;
7871 }
7872 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7873 {
7874 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7875 abort ();
7876 i.rex &= ~REX_R;
7877 add_prefix (LOCK_PREFIX_OPCODE);
7878 }
7879 }
7880 else
7881 { /* If it's not 2 reg operands... */
7882 unsigned int mem;
7883
7884 if (i.mem_operands)
7885 {
7886 unsigned int fake_zero_displacement = 0;
7887 unsigned int op;
7888
7889 for (op = 0; op < i.operands; op++)
7890 if (i.flags[op] & Operand_Mem)
7891 break;
7892 gas_assert (op < i.operands);
7893
7894 if (i.tm.opcode_modifier.vecsib)
7895 {
7896 if (i.index_reg->reg_num == RegIZ)
7897 abort ();
7898
7899 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7900 if (!i.base_reg)
7901 {
7902 i.sib.base = NO_BASE_REGISTER;
7903 i.sib.scale = i.log2_scale_factor;
7904 i.types[op].bitfield.disp8 = 0;
7905 i.types[op].bitfield.disp16 = 0;
7906 i.types[op].bitfield.disp64 = 0;
7907 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7908 {
7909 /* Must be 32 bit */
7910 i.types[op].bitfield.disp32 = 1;
7911 i.types[op].bitfield.disp32s = 0;
7912 }
7913 else
7914 {
7915 i.types[op].bitfield.disp32 = 0;
7916 i.types[op].bitfield.disp32s = 1;
7917 }
7918 }
7919 i.sib.index = i.index_reg->reg_num;
7920 if ((i.index_reg->reg_flags & RegRex) != 0)
7921 i.rex |= REX_X;
7922 if ((i.index_reg->reg_flags & RegVRex) != 0)
7923 i.vrex |= REX_X;
7924 }
7925
7926 default_seg = &ds;
7927
7928 if (i.base_reg == 0)
7929 {
7930 i.rm.mode = 0;
7931 if (!i.disp_operands)
7932 fake_zero_displacement = 1;
7933 if (i.index_reg == 0)
7934 {
7935 i386_operand_type newdisp;
7936
7937 gas_assert (!i.tm.opcode_modifier.vecsib);
7938 /* Operand is just <disp> */
7939 if (flag_code == CODE_64BIT)
7940 {
7941 /* 64bit mode overwrites the 32bit absolute
7942 addressing by RIP relative addressing and
7943 absolute addressing is encoded by one of the
7944 redundant SIB forms. */
7945 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7946 i.sib.base = NO_BASE_REGISTER;
7947 i.sib.index = NO_INDEX_REGISTER;
7948 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7949 }
7950 else if ((flag_code == CODE_16BIT)
7951 ^ (i.prefix[ADDR_PREFIX] != 0))
7952 {
7953 i.rm.regmem = NO_BASE_REGISTER_16;
7954 newdisp = disp16;
7955 }
7956 else
7957 {
7958 i.rm.regmem = NO_BASE_REGISTER;
7959 newdisp = disp32;
7960 }
7961 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7962 i.types[op] = operand_type_or (i.types[op], newdisp);
7963 }
7964 else if (!i.tm.opcode_modifier.vecsib)
7965 {
7966 /* !i.base_reg && i.index_reg */
7967 if (i.index_reg->reg_num == RegIZ)
7968 i.sib.index = NO_INDEX_REGISTER;
7969 else
7970 i.sib.index = i.index_reg->reg_num;
7971 i.sib.base = NO_BASE_REGISTER;
7972 i.sib.scale = i.log2_scale_factor;
7973 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7974 i.types[op].bitfield.disp8 = 0;
7975 i.types[op].bitfield.disp16 = 0;
7976 i.types[op].bitfield.disp64 = 0;
7977 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7978 {
7979 /* Must be 32 bit */
7980 i.types[op].bitfield.disp32 = 1;
7981 i.types[op].bitfield.disp32s = 0;
7982 }
7983 else
7984 {
7985 i.types[op].bitfield.disp32 = 0;
7986 i.types[op].bitfield.disp32s = 1;
7987 }
7988 if ((i.index_reg->reg_flags & RegRex) != 0)
7989 i.rex |= REX_X;
7990 }
7991 }
7992 /* RIP addressing for 64bit mode. */
7993 else if (i.base_reg->reg_num == RegIP)
7994 {
7995 gas_assert (!i.tm.opcode_modifier.vecsib);
7996 i.rm.regmem = NO_BASE_REGISTER;
7997 i.types[op].bitfield.disp8 = 0;
7998 i.types[op].bitfield.disp16 = 0;
7999 i.types[op].bitfield.disp32 = 0;
8000 i.types[op].bitfield.disp32s = 1;
8001 i.types[op].bitfield.disp64 = 0;
8002 i.flags[op] |= Operand_PCrel;
8003 if (! i.disp_operands)
8004 fake_zero_displacement = 1;
8005 }
8006 else if (i.base_reg->reg_type.bitfield.word)
8007 {
8008 gas_assert (!i.tm.opcode_modifier.vecsib);
8009 switch (i.base_reg->reg_num)
8010 {
8011 case 3: /* (%bx) */
8012 if (i.index_reg == 0)
8013 i.rm.regmem = 7;
8014 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8015 i.rm.regmem = i.index_reg->reg_num - 6;
8016 break;
8017 case 5: /* (%bp) */
8018 default_seg = &ss;
8019 if (i.index_reg == 0)
8020 {
8021 i.rm.regmem = 6;
8022 if (operand_type_check (i.types[op], disp) == 0)
8023 {
8024 /* fake (%bp) into 0(%bp) */
8025 i.types[op].bitfield.disp8 = 1;
8026 fake_zero_displacement = 1;
8027 }
8028 }
8029 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8030 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8031 break;
8032 default: /* (%si) -> 4 or (%di) -> 5 */
8033 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8034 }
8035 i.rm.mode = mode_from_disp_size (i.types[op]);
8036 }
8037 else /* i.base_reg and 32/64 bit mode */
8038 {
8039 if (flag_code == CODE_64BIT
8040 && operand_type_check (i.types[op], disp))
8041 {
8042 i.types[op].bitfield.disp16 = 0;
8043 i.types[op].bitfield.disp64 = 0;
8044 if (i.prefix[ADDR_PREFIX] == 0)
8045 {
8046 i.types[op].bitfield.disp32 = 0;
8047 i.types[op].bitfield.disp32s = 1;
8048 }
8049 else
8050 {
8051 i.types[op].bitfield.disp32 = 1;
8052 i.types[op].bitfield.disp32s = 0;
8053 }
8054 }
8055
8056 if (!i.tm.opcode_modifier.vecsib)
8057 i.rm.regmem = i.base_reg->reg_num;
8058 if ((i.base_reg->reg_flags & RegRex) != 0)
8059 i.rex |= REX_B;
8060 i.sib.base = i.base_reg->reg_num;
8061 /* x86-64 ignores REX prefix bit here to avoid decoder
8062 complications. */
8063 if (!(i.base_reg->reg_flags & RegRex)
8064 && (i.base_reg->reg_num == EBP_REG_NUM
8065 || i.base_reg->reg_num == ESP_REG_NUM))
8066 default_seg = &ss;
8067 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8068 {
8069 fake_zero_displacement = 1;
8070 i.types[op].bitfield.disp8 = 1;
8071 }
8072 i.sib.scale = i.log2_scale_factor;
8073 if (i.index_reg == 0)
8074 {
8075 gas_assert (!i.tm.opcode_modifier.vecsib);
8076 /* <disp>(%esp) becomes two byte modrm with no index
8077 register. We've already stored the code for esp
8078 		     in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8079 Any base register besides %esp will not use the
8080 extra modrm byte. */
8081 i.sib.index = NO_INDEX_REGISTER;
8082 }
8083 else if (!i.tm.opcode_modifier.vecsib)
8084 {
8085 if (i.index_reg->reg_num == RegIZ)
8086 i.sib.index = NO_INDEX_REGISTER;
8087 else
8088 i.sib.index = i.index_reg->reg_num;
8089 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8090 if ((i.index_reg->reg_flags & RegRex) != 0)
8091 i.rex |= REX_X;
8092 }
8093
8094 if (i.disp_operands
8095 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8096 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8097 i.rm.mode = 0;
8098 else
8099 {
8100 if (!fake_zero_displacement
8101 && !i.disp_operands
8102 && i.disp_encoding)
8103 {
8104 fake_zero_displacement = 1;
8105 if (i.disp_encoding == disp_encoding_8bit)
8106 i.types[op].bitfield.disp8 = 1;
8107 else
8108 i.types[op].bitfield.disp32 = 1;
8109 }
8110 i.rm.mode = mode_from_disp_size (i.types[op]);
8111 }
8112 }
8113
8114 if (fake_zero_displacement)
8115 {
8116 /* Fakes a zero displacement assuming that i.types[op]
8117 holds the correct displacement size. */
8118 expressionS *exp;
8119
8120 gas_assert (i.op[op].disps == 0);
8121 exp = &disp_expressions[i.disp_operands++];
8122 i.op[op].disps = exp;
8123 exp->X_op = O_constant;
8124 exp->X_add_number = 0;
8125 exp->X_add_symbol = (symbolS *) 0;
8126 exp->X_op_symbol = (symbolS *) 0;
8127 }
8128
8129 mem = op;
8130 }
8131 else
8132 mem = ~0;
8133
8134 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8135 {
8136 if (operand_type_check (i.types[0], imm))
8137 i.vex.register_specifier = NULL;
8138 else
8139 {
8140 /* VEX.vvvv encodes one of the sources when the first
8141 operand is not an immediate. */
8142 if (i.tm.opcode_modifier.vexw == VEXW0)
8143 i.vex.register_specifier = i.op[0].regs;
8144 else
8145 i.vex.register_specifier = i.op[1].regs;
8146 }
8147
8148 /* Destination is a XMM register encoded in the ModRM.reg
8149 and VEX.R bit. */
8150 i.rm.reg = i.op[2].regs->reg_num;
8151 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8152 i.rex |= REX_R;
8153
8154 /* ModRM.rm and VEX.B encodes the other source. */
8155 if (!i.mem_operands)
8156 {
8157 i.rm.mode = 3;
8158
8159 if (i.tm.opcode_modifier.vexw == VEXW0)
8160 i.rm.regmem = i.op[1].regs->reg_num;
8161 else
8162 i.rm.regmem = i.op[0].regs->reg_num;
8163
8164 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8165 i.rex |= REX_B;
8166 }
8167 }
8168 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8169 {
8170 i.vex.register_specifier = i.op[2].regs;
8171 if (!i.mem_operands)
8172 {
8173 i.rm.mode = 3;
8174 i.rm.regmem = i.op[1].regs->reg_num;
8175 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8176 i.rex |= REX_B;
8177 }
8178 }
8179 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8180 (if any) based on i.tm.extension_opcode. Again, we must be
8181 careful to make sure that segment/control/debug/test/MMX
8182 registers are coded into the i.rm.reg field. */
8183 else if (i.reg_operands)
8184 {
8185 unsigned int op;
8186 unsigned int vex_reg = ~0;
8187
8188 for (op = 0; op < i.operands; op++)
8189 {
8190 if (i.types[op].bitfield.class == Reg
8191 || i.types[op].bitfield.class == RegBND
8192 || i.types[op].bitfield.class == RegMask
8193 || i.types[op].bitfield.class == SReg
8194 || i.types[op].bitfield.class == RegCR
8195 || i.types[op].bitfield.class == RegDR
8196 || i.types[op].bitfield.class == RegTR)
8197 break;
8198 if (i.types[op].bitfield.class == RegSIMD)
8199 {
8200 if (i.types[op].bitfield.zmmword)
8201 i.has_regzmm = TRUE;
8202 else if (i.types[op].bitfield.ymmword)
8203 i.has_regymm = TRUE;
8204 else
8205 i.has_regxmm = TRUE;
8206 break;
8207 }
8208 if (i.types[op].bitfield.class == RegMMX)
8209 {
8210 i.has_regmmx = TRUE;
8211 break;
8212 }
8213 }
8214
8215 if (vex_3_sources)
8216 op = dest;
8217 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8218 {
8219 /* For instructions with VexNDS, the register-only
8220 source operand is encoded in VEX prefix. */
8221 gas_assert (mem != (unsigned int) ~0);
8222
8223 if (op > mem)
8224 {
8225 vex_reg = op++;
8226 gas_assert (op < i.operands);
8227 }
8228 else
8229 {
8230 /* Check register-only source operand when two source
8231 operands are swapped. */
8232 if (!i.tm.operand_types[op].bitfield.baseindex
8233 && i.tm.operand_types[op + 1].bitfield.baseindex)
8234 {
8235 vex_reg = op;
8236 op += 2;
8237 gas_assert (mem == (vex_reg + 1)
8238 && op < i.operands);
8239 }
8240 else
8241 {
8242 vex_reg = op + 1;
8243 gas_assert (vex_reg < i.operands);
8244 }
8245 }
8246 }
8247 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8248 {
8249 /* For instructions with VexNDD, the register destination
8250 is encoded in VEX prefix. */
8251 if (i.mem_operands == 0)
8252 {
8253 /* There is no memory operand. */
8254 gas_assert ((op + 2) == i.operands);
8255 vex_reg = op + 1;
8256 }
8257 else
8258 {
8259 /* There are only 2 non-immediate operands. */
8260 gas_assert (op < i.imm_operands + 2
8261 && i.operands == i.imm_operands + 2);
8262 vex_reg = i.imm_operands + 1;
8263 }
8264 }
8265 else
8266 gas_assert (op < i.operands);
8267
8268 if (vex_reg != (unsigned int) ~0)
8269 {
8270 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8271
8272 if ((type->bitfield.class != Reg
8273 || (!type->bitfield.dword && !type->bitfield.qword))
8274 && type->bitfield.class != RegSIMD
8275 && !operand_type_equal (type, &regmask))
8276 abort ();
8277
8278 i.vex.register_specifier = i.op[vex_reg].regs;
8279 }
8280
8281 /* Don't set OP operand twice. */
8282 if (vex_reg != op)
8283 {
8284 /* If there is an extension opcode to put here, the
8285 register number must be put into the regmem field. */
8286 if (i.tm.extension_opcode != None)
8287 {
8288 i.rm.regmem = i.op[op].regs->reg_num;
8289 if ((i.op[op].regs->reg_flags & RegRex) != 0)
8290 i.rex |= REX_B;
8291 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
8292 i.vrex |= REX_B;
8293 }
8294 else
8295 {
8296 i.rm.reg = i.op[op].regs->reg_num;
8297 if ((i.op[op].regs->reg_flags & RegRex) != 0)
8298 i.rex |= REX_R;
8299 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
8300 i.vrex |= REX_R;
8301 }
8302 }
8303
8304 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8305 must set it to 3 to indicate this is a register operand
8306 in the regmem field. */
8307 if (!i.mem_operands)
8308 i.rm.mode = 3;
8309 }
8310
8311 /* Fill in i.rm.reg field with extension opcode (if any). */
8312 if (i.tm.extension_opcode != None)
8313 i.rm.reg = i.tm.extension_opcode;
8314 }
8315 return default_seg;
8316 }
8317
8318 static unsigned int
8319 flip_code16 (unsigned int code16)
8320 {
8321 gas_assert (i.tm.operands == 1);
8322
8323 return !(i.prefix[REX_PREFIX] & REX_W)
8324 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8325 || i.tm.operand_types[0].bitfield.disp32s
8326 : i.tm.operand_types[0].bitfield.disp16)
8327 ? CODE16 : 0;
8328 }
8329
8330 static void
8331 output_branch (void)
8332 {
8333 char *p;
8334 int size;
8335 int code16;
8336 int prefix;
8337 relax_substateT subtype;
8338 symbolS *sym;
8339 offsetT off;
8340
8341 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8342 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8343
8344 prefix = 0;
8345 if (i.prefix[DATA_PREFIX] != 0)
8346 {
8347 prefix = 1;
8348 i.prefixes -= 1;
8349 code16 ^= flip_code16(code16);
8350 }
8351 /* Pentium4 branch hints. */
8352 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8353 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8354 {
8355 prefix++;
8356 i.prefixes--;
8357 }
8358 if (i.prefix[REX_PREFIX] != 0)
8359 {
8360 prefix++;
8361 i.prefixes--;
8362 }
8363
8364 /* BND prefixed jump. */
8365 if (i.prefix[BND_PREFIX] != 0)
8366 {
8367 prefix++;
8368 i.prefixes--;
8369 }
8370
8371 if (i.prefixes != 0)
8372 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8373
8374   /* It's always a symbol; end the frag & set up for relax.
8375 Make sure there is enough room in this frag for the largest
8376 instruction we may generate in md_convert_frag. This is 2
8377 bytes for the opcode and room for the prefix and largest
8378 displacement. */
8379 frag_grow (prefix + 2 + 4);
8380 /* Prefix and 1 opcode byte go in fr_fix. */
8381 p = frag_more (prefix + 1);
8382 if (i.prefix[DATA_PREFIX] != 0)
8383 *p++ = DATA_PREFIX_OPCODE;
8384 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8385 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8386 *p++ = i.prefix[SEG_PREFIX];
8387 if (i.prefix[BND_PREFIX] != 0)
8388 *p++ = BND_PREFIX_OPCODE;
8389 if (i.prefix[REX_PREFIX] != 0)
8390 *p++ = i.prefix[REX_PREFIX];
8391 *p = i.tm.base_opcode;
8392
8393 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8394 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8395 else if (cpu_arch_flags.bitfield.cpui386)
8396 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8397 else
8398 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8399 subtype |= code16;
8400
8401 sym = i.op[0].disps->X_add_symbol;
8402 off = i.op[0].disps->X_add_number;
8403
8404 if (i.op[0].disps->X_op != O_constant
8405 && i.op[0].disps->X_op != O_symbol)
8406 {
8407 /* Handle complex expressions. */
8408 sym = make_expr_symbol (i.op[0].disps);
8409 off = 0;
8410 }
8411
8412 /* 1 possible extra opcode + 4 byte displacement go in var part.
8413 Pass reloc in fr_var. */
8414 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8415 }
8416
8417 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8418 /* Return TRUE iff PLT32 relocation should be used for branching to
8419 symbol S. */
8420
8421 static bfd_boolean
8422 need_plt32_p (symbolS *s)
8423 {
8424 /* PLT32 relocation is ELF only. */
8425 if (!IS_ELF)
8426 return FALSE;
8427
8428 #ifdef TE_SOLARIS
8429 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8430 krtld support it. */
8431 return FALSE;
8432 #endif
8433
8434 /* Since there is no need to prepare for PLT branch on x86-64, we
8435 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8436 be used as a marker for 32-bit PC-relative branches. */
8437 if (!object_64bit)
8438 return FALSE;
8439
8440   /* Weak or undefined symbols need a PLT32 relocation.  */
8441 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8442 return TRUE;
8443
8444   /* A non-global symbol doesn't need a PLT32 relocation.  */
8445 if (! S_IS_EXTERNAL (s))
8446 return FALSE;
8447
8448   /* Other global symbols need a PLT32 relocation.  NB: Symbols with
8449      non-default visibility are treated as normal global symbols
8450      so that the PLT32 relocation can be used as a marker for 32-bit
8451      PC-relative branches.  This is useful for linker relaxation.  */
8452 return TRUE;
8453 }
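/* E.g. a 64-bit `call foo' against an undefined or preemptible foo
   thus gets R_X86_64_PLT32 instead of R_X86_64_PC32, which the linker
   may later relax back to a direct branch when no PLT entry is
   needed.  */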
8454 #endif
8455
8456 static void
8457 output_jump (void)
8458 {
8459 char *p;
8460 int size;
8461 fixS *fixP;
8462 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8463
8464 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8465 {
8466 /* This is a loop or jecxz type instruction. */
8467 size = 1;
8468 if (i.prefix[ADDR_PREFIX] != 0)
8469 {
8470 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8471 i.prefixes -= 1;
8472 }
8473 /* Pentium4 branch hints. */
8474 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8475 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8476 {
8477 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8478 i.prefixes--;
8479 }
8480 }
8481 else
8482 {
8483 int code16;
8484
8485 code16 = 0;
8486 if (flag_code == CODE_16BIT)
8487 code16 = CODE16;
8488
8489 if (i.prefix[DATA_PREFIX] != 0)
8490 {
8491 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8492 i.prefixes -= 1;
8493 code16 ^= flip_code16(code16);
8494 }
8495
8496 size = 4;
8497 if (code16)
8498 size = 2;
8499 }
8500
8501 /* BND prefixed jump. */
8502 if (i.prefix[BND_PREFIX] != 0)
8503 {
8504 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8505 i.prefixes -= 1;
8506 }
8507
8508 if (i.prefix[REX_PREFIX] != 0)
8509 {
8510 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8511 i.prefixes -= 1;
8512 }
8513
8514 if (i.prefixes != 0)
8515 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8516
8517 p = frag_more (i.tm.opcode_length + size);
8518 switch (i.tm.opcode_length)
8519 {
8520 case 2:
8521 *p++ = i.tm.base_opcode >> 8;
8522 /* Fall through. */
8523 case 1:
8524 *p++ = i.tm.base_opcode;
8525 break;
8526 default:
8527 abort ();
8528 }
8529
8530 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8531 if (size == 4
8532 && jump_reloc == NO_RELOC
8533 && need_plt32_p (i.op[0].disps->X_add_symbol))
8534 jump_reloc = BFD_RELOC_X86_64_PLT32;
8535 #endif
8536
8537 jump_reloc = reloc (size, 1, 1, jump_reloc);
8538
8539 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8540 i.op[0].disps, 1, jump_reloc);
8541
8542 /* All jumps handled here are signed, but don't use a signed limit
8543 check for 32 and 16 bit jumps as we want to allow wrap around at
8544 4G and 64k respectively. */
8545 if (size == 1)
8546 fixP->fx_signed = 1;
8547 }
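/* E.g. `jecxz .L1' takes the JUMP_BYTE path above and emits opcode e3
   plus a 1-byte pc-relative fixup, while a direct `call foo' in
   32-bit code takes the other path and emits opcode e8 plus a 4-byte
   fixup.  */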
8548
8549 static void
8550 output_interseg_jump (void)
8551 {
8552 char *p;
8553 int size;
8554 int prefix;
8555 int code16;
8556
8557 code16 = 0;
8558 if (flag_code == CODE_16BIT)
8559 code16 = CODE16;
8560
8561 prefix = 0;
8562 if (i.prefix[DATA_PREFIX] != 0)
8563 {
8564 prefix = 1;
8565 i.prefixes -= 1;
8566 code16 ^= CODE16;
8567 }
8568
8569 gas_assert (!i.prefix[REX_PREFIX]);
8570
8571 size = 4;
8572 if (code16)
8573 size = 2;
8574
8575 if (i.prefixes != 0)
8576 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8577
8578 /* 1 opcode; 2 segment; offset */
8579 p = frag_more (prefix + 1 + 2 + size);
8580
8581 if (i.prefix[DATA_PREFIX] != 0)
8582 *p++ = DATA_PREFIX_OPCODE;
8583
8584 if (i.prefix[REX_PREFIX] != 0)
8585 *p++ = i.prefix[REX_PREFIX];
8586
8587 *p++ = i.tm.base_opcode;
8588 if (i.op[1].imms->X_op == O_constant)
8589 {
8590 offsetT n = i.op[1].imms->X_add_number;
8591
8592 if (size == 2
8593 && !fits_in_unsigned_word (n)
8594 && !fits_in_signed_word (n))
8595 {
8596 as_bad (_("16-bit jump out of range"));
8597 return;
8598 }
8599 md_number_to_chars (p, n, size);
8600 }
8601 else
8602 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8603 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8604 if (i.op[0].imms->X_op != O_constant)
8605 as_bad (_("can't handle non absolute segment in `%s'"),
8606 i.tm.name);
8607 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8608 }
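/* E.g. in 32-bit code `ljmp $0x10, $0x12345678' comes out as
   ea 78 56 34 12 10 00: the opcode, the 4-byte offset, then the
   2-byte segment selector written at p + size above.  */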
8609
8610 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8611 void
8612 x86_cleanup (void)
8613 {
8614 char *p;
8615 asection *seg = now_seg;
8616 subsegT subseg = now_subseg;
8617 asection *sec;
8618 unsigned int alignment, align_size_1;
8619 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8620 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8621 unsigned int padding;
8622
8623 if (!IS_ELF || !x86_used_note)
8624 return;
8625
8626 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8627
8628 /* The .note.gnu.property section layout:
8629
8630 Field Length Contents
8631 ---- ---- ----
8632 n_namsz 4 4
8633 n_descsz 4 The note descriptor size
8634 n_type 4 NT_GNU_PROPERTY_TYPE_0
8635 n_name 4 "GNU"
8636 n_desc n_descsz The program property array
8637 .... .... ....
8638 */
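   /* Worked example of the size computation below for ELFCLASS64:
      each property is 4 + 4 + 4 = 12 bytes raw, padded to 16 for
      8-byte alignment, so descsz is 0x20 and the whole note occupies
      4 * 4 + 0x20 = 0x30 bytes.  */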
8639
8640 /* Create the .note.gnu.property section. */
8641 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8642 bfd_set_section_flags (sec,
8643 (SEC_ALLOC
8644 | SEC_LOAD
8645 | SEC_DATA
8646 | SEC_HAS_CONTENTS
8647 | SEC_READONLY));
8648
8649 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8650 {
8651 align_size_1 = 7;
8652 alignment = 3;
8653 }
8654 else
8655 {
8656 align_size_1 = 3;
8657 alignment = 2;
8658 }
8659
8660 bfd_set_section_alignment (sec, alignment);
8661 elf_section_type (sec) = SHT_NOTE;
8662
8663 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8664 + 4-byte data */
8665 isa_1_descsz_raw = 4 + 4 + 4;
8666 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8667 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8668
8669 feature_2_descsz_raw = isa_1_descsz;
8670 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8671 + 4-byte data */
8672 feature_2_descsz_raw += 4 + 4 + 4;
8673 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8674 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8675 & ~align_size_1);
8676
8677 descsz = feature_2_descsz;
8678 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8679 p = frag_more (4 + 4 + 4 + 4 + descsz);
8680
8681 /* Write n_namsz. */
8682 md_number_to_chars (p, (valueT) 4, 4);
8683
8684 /* Write n_descsz. */
8685 md_number_to_chars (p + 4, (valueT) descsz, 4);
8686
8687 /* Write n_type. */
8688 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8689
8690 /* Write n_name. */
8691 memcpy (p + 4 * 3, "GNU", 4);
8692
8693 /* Write 4-byte type. */
8694 md_number_to_chars (p + 4 * 4,
8695 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8696
8697 /* Write 4-byte data size. */
8698 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8699
8700 /* Write 4-byte data. */
8701 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8702
8703 /* Zero out paddings. */
8704 padding = isa_1_descsz - isa_1_descsz_raw;
8705 if (padding)
8706 memset (p + 4 * 7, 0, padding);
8707
8708 /* Write 4-byte type. */
8709 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8710 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8711
8712 /* Write 4-byte data size. */
8713 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8714
8715 /* Write 4-byte data. */
8716 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8717 (valueT) x86_feature_2_used, 4);
8718
8719 /* Zero out paddings. */
8720 padding = feature_2_descsz - feature_2_descsz_raw;
8721 if (padding)
8722 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8723
8724 /* We probably can't restore the current segment, for there likely
8725 isn't one yet... */
8726 if (seg && subseg)
8727 subseg_set (seg, subseg);
8728 }
8729 #endif
8730
8731 static unsigned int
8732 encoding_length (const fragS *start_frag, offsetT start_off,
8733 const char *frag_now_ptr)
8734 {
8735 unsigned int len = 0;
8736
8737 if (start_frag != frag_now)
8738 {
8739 const fragS *fr = start_frag;
8740
8741 do {
8742 len += fr->fr_fix;
8743 fr = fr->fr_next;
8744 } while (fr && fr != frag_now);
8745 }
8746
8747 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8748 }
8749
8750 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8751 be macro-fused with conditional jumps.
8752    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP-relative address,
8753    or is in one of the following formats:
8754
8755 cmp m, imm
8756 add m, imm
8757 sub m, imm
8758 test m, imm
8759 and m, imm
8760 inc m
8761 dec m
8762
8763    it is unfusable.  */
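/* E.g. `cmp %eax, %ebx' followed by `je .L1' is a fusion candidate,
   whereas `cmpl $1, (%eax)' (cmp m, imm) is not.  */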
8764
8765 static int
8766 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8767 {
8768 /* No RIP address. */
8769 if (i.base_reg && i.base_reg->reg_num == RegIP)
8770 return 0;
8771
8772 /* No VEX/EVEX encoding. */
8773 if (is_any_vex_encoding (&i.tm))
8774 return 0;
8775
8776 /* add, sub without add/sub m, imm. */
8777 if (i.tm.base_opcode <= 5
8778 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8779 || ((i.tm.base_opcode | 3) == 0x83
8780 && (i.tm.extension_opcode == 0x5
8781 || i.tm.extension_opcode == 0x0)))
8782 {
8783 *mf_cmp_p = mf_cmp_alu_cmp;
8784 return !(i.mem_operands && i.imm_operands);
8785 }
8786
8787 /* and without and m, imm. */
8788 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8789 || ((i.tm.base_opcode | 3) == 0x83
8790 && i.tm.extension_opcode == 0x4))
8791 {
8792 *mf_cmp_p = mf_cmp_test_and;
8793 return !(i.mem_operands && i.imm_operands);
8794 }
8795
8796 /* test without test m imm. */
8797 if ((i.tm.base_opcode | 1) == 0x85
8798 || (i.tm.base_opcode | 1) == 0xa9
8799 || ((i.tm.base_opcode | 1) == 0xf7
8800 && i.tm.extension_opcode == 0))
8801 {
8802 *mf_cmp_p = mf_cmp_test_and;
8803 return !(i.mem_operands && i.imm_operands);
8804 }
8805
8806 /* cmp without cmp m, imm. */
8807 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8808 || ((i.tm.base_opcode | 3) == 0x83
8809 && (i.tm.extension_opcode == 0x7)))
8810 {
8811 *mf_cmp_p = mf_cmp_alu_cmp;
8812 return !(i.mem_operands && i.imm_operands);
8813 }
8814
8815 /* inc, dec without inc/dec m. */
8816 if ((i.tm.cpu_flags.bitfield.cpuno64
8817 && (i.tm.base_opcode | 0xf) == 0x4f)
8818 || ((i.tm.base_opcode | 1) == 0xff
8819 && i.tm.extension_opcode <= 0x1))
8820 {
8821 *mf_cmp_p = mf_cmp_incdec;
8822 return !i.mem_operands;
8823 }
8824
8825 return 0;
8826 }
8827
8828 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8829
8830 static int
8831 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
8832 {
8833   /* NB: This doesn't work with COND_JUMP86 without i386.  */
8834 if (!align_branch_power
8835 || now_seg == absolute_section
8836 || !cpu_arch_flags.bitfield.cpui386
8837 || !(align_branch & align_branch_fused_bit))
8838 return 0;
8839
8840 if (maybe_fused_with_jcc_p (mf_cmp_p))
8841 {
8842 if (last_insn.kind == last_insn_other
8843 || last_insn.seg != now_seg)
8844 return 1;
8845 if (flag_debug)
8846 as_warn_where (last_insn.file, last_insn.line,
8847 _("`%s` skips -malign-branch-boundary on `%s`"),
8848 last_insn.name, i.tm.name);
8849 }
8850
8851 return 0;
8852 }
8853
8854 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8855
8856 static int
8857 add_branch_prefix_frag_p (void)
8858 {
8859   /* NB: This doesn't work with COND_JUMP86 without i386.  Don't add a
8860      prefix to PadLock instructions since they include prefixes in their opcode.  */
8861 if (!align_branch_power
8862 || !align_branch_prefix_size
8863 || now_seg == absolute_section
8864 || i.tm.cpu_flags.bitfield.cpupadlock
8865 || !cpu_arch_flags.bitfield.cpui386)
8866 return 0;
8867
8868   /* Don't add a prefix if the insn is itself a prefix, or if it has
8869      no operands, since the segment prefix is special in that case.  */
8870 if (!i.operands || i.tm.opcode_modifier.isprefix)
8871 return 0;
8872
8873 if (last_insn.kind == last_insn_other
8874 || last_insn.seg != now_seg)
8875 return 1;
8876
8877 if (flag_debug)
8878 as_warn_where (last_insn.file, last_insn.line,
8879 _("`%s` skips -malign-branch-boundary on `%s`"),
8880 last_insn.name, i.tm.name);
8881
8882 return 0;
8883 }
8884
8885 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8886
8887 static int
8888 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
8889 enum mf_jcc_kind *mf_jcc_p)
8890 {
8891 int add_padding;
8892
8893   /* NB: This doesn't work with COND_JUMP86 without i386.  */
8894 if (!align_branch_power
8895 || now_seg == absolute_section
8896 || !cpu_arch_flags.bitfield.cpui386)
8897 return 0;
8898
8899 add_padding = 0;
8900
8901 /* Check for jcc and direct jmp. */
8902 if (i.tm.opcode_modifier.jump == JUMP)
8903 {
8904 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8905 {
8906 *branch_p = align_branch_jmp;
8907 add_padding = align_branch & align_branch_jmp_bit;
8908 }
8909 else
8910 {
8911 	  /* Because J<cc> and JN<cc> share the same group in the
8912 	     macro-fusible table, ignore the lowest bit.  */
8913 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
8914 *branch_p = align_branch_jcc;
8915 if ((align_branch & align_branch_jcc_bit))
8916 add_padding = 1;
8917 }
8918 }
8919 else if (is_any_vex_encoding (&i.tm))
8920 return 0;
8921 else if ((i.tm.base_opcode | 1) == 0xc3)
8922 {
8923 /* Near ret. */
8924 *branch_p = align_branch_ret;
8925 if ((align_branch & align_branch_ret_bit))
8926 add_padding = 1;
8927 }
8928 else
8929 {
8930 /* Check for indirect jmp, direct and indirect calls. */
8931 if (i.tm.base_opcode == 0xe8)
8932 {
8933 /* Direct call. */
8934 *branch_p = align_branch_call;
8935 if ((align_branch & align_branch_call_bit))
8936 add_padding = 1;
8937 }
8938 else if (i.tm.base_opcode == 0xff
8939 && (i.tm.extension_opcode == 2
8940 || i.tm.extension_opcode == 4))
8941 {
8942 /* Indirect call and jmp. */
8943 *branch_p = align_branch_indirect;
8944 if ((align_branch & align_branch_indirect_bit))
8945 add_padding = 1;
8946 }
8947
8948 if (add_padding
8949 && i.disp_operands
8950 && tls_get_addr
8951 && (i.op[0].disps->X_op == O_symbol
8952 || (i.op[0].disps->X_op == O_subtract
8953 && i.op[0].disps->X_op_symbol == GOT_symbol)))
8954 {
8955 symbolS *s = i.op[0].disps->X_add_symbol;
8956 	  /* Don't pad a call to a global or undefined tls_get_addr.  */
8957 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8958 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8959 return 0;
8960 }
8961 }
8962
8963 if (add_padding
8964 && last_insn.kind != last_insn_other
8965 && last_insn.seg == now_seg)
8966 {
8967 if (flag_debug)
8968 as_warn_where (last_insn.file, last_insn.line,
8969 _("`%s` skips -malign-branch-boundary on `%s`"),
8970 last_insn.name, i.tm.name);
8971 return 0;
8972 }
8973
8974 return add_padding;
8975 }
8976
8977 static void
8978 output_insn (void)
8979 {
8980 fragS *insn_start_frag;
8981 offsetT insn_start_off;
8982 fragS *fragP = NULL;
8983 enum align_branch_kind branch = align_branch_none;
8984   /* The initializer is arbitrary, just to avoid an uninitialized-use
8985      warning; it is either assigned in add_branch_padding_frag_p
8986      or never used.  */
8987 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
8988
8989 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8990 if (IS_ELF && x86_used_note)
8991 {
8992 if (i.tm.cpu_flags.bitfield.cpucmov)
8993 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8994 if (i.tm.cpu_flags.bitfield.cpusse)
8995 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8996 if (i.tm.cpu_flags.bitfield.cpusse2)
8997 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8998 if (i.tm.cpu_flags.bitfield.cpusse3)
8999 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9000 if (i.tm.cpu_flags.bitfield.cpussse3)
9001 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9002 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9003 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9004 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9005 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9006 if (i.tm.cpu_flags.bitfield.cpuavx)
9007 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9008 if (i.tm.cpu_flags.bitfield.cpuavx2)
9009 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9010 if (i.tm.cpu_flags.bitfield.cpufma)
9011 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9012 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9013 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9014 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9015 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9016 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9017 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9018 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9019 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9020 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9021 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9022 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9023 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9024 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9025 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9026 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9027 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9028 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9029 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9030 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9031 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9032 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9033 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9034 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9035 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9036 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9037 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9038 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9039 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
9040 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9041 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
9042
9043 if (i.tm.cpu_flags.bitfield.cpu8087
9044 || i.tm.cpu_flags.bitfield.cpu287
9045 || i.tm.cpu_flags.bitfield.cpu387
9046 || i.tm.cpu_flags.bitfield.cpu687
9047 || i.tm.cpu_flags.bitfield.cpufisttp)
9048 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9049 if (i.has_regmmx
9050 || i.tm.base_opcode == 0xf77 /* emms */
9051 || i.tm.base_opcode == 0xf0e /* femms */
9052 || i.tm.base_opcode == 0xf2a /* cvtpi2ps */
9053 || i.tm.base_opcode == 0x660f2a /* cvtpi2pd */)
9054 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9055 if (i.has_regxmm)
9056 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9057 if (i.has_regymm)
9058 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9059 if (i.has_regzmm)
9060 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9061 if (i.tm.cpu_flags.bitfield.cpufxsr)
9062 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9063 if (i.tm.cpu_flags.bitfield.cpuxsave)
9064 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9065 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9066 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9067 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9068 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9069 }
9070 #endif
9071
9072 /* Tie dwarf2 debug info to the address at the start of the insn.
9073 We can't do this after the insn has been output as the current
9074 frag may have been closed off. eg. by frag_var. */
9075 dwarf2_emit_insn (0);
9076
9077 insn_start_frag = frag_now;
9078 insn_start_off = frag_now_fix ();
9079
9080 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9081 {
9082 char *p;
9083 /* Branch can be 8 bytes. Leave some room for prefixes. */
9084 unsigned int max_branch_padding_size = 14;
9085
9086 /* Align section to boundary. */
9087 record_alignment (now_seg, align_branch_power);
9088
9089 /* Make room for padding. */
9090 frag_grow (max_branch_padding_size);
9091
9092 /* Start of the padding. */
9093 p = frag_more (0);
9094
9095 fragP = frag_now;
9096
9097 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9098 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9099 NULL, 0, p);
9100
9101 fragP->tc_frag_data.mf_type = mf_jcc;
9102 fragP->tc_frag_data.branch_type = branch;
9103 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9104 }
9105
9106 /* Output jumps. */
9107 if (i.tm.opcode_modifier.jump == JUMP)
9108 output_branch ();
9109 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9110 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9111 output_jump ();
9112 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9113 output_interseg_jump ();
9114 else
9115 {
9116 /* Output normal instructions here. */
9117 char *p;
9118 unsigned char *q;
9119 unsigned int j;
9120 unsigned int prefix;
9121 enum mf_cmp_kind mf_cmp;
9122
9123 if (avoid_fence
9124 && (i.tm.base_opcode == 0xfaee8
9125 || i.tm.base_opcode == 0xfaef0
9126 || i.tm.base_opcode == 0xfaef8))
9127 {
9128 /* Encode lfence, mfence, and sfence as
9129 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
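	  /* I.e. f0 = lock prefix, 83 /0 ib = addl imm8, with ModRM 04
	     plus SIB 24 selecting (%esp) or (%rsp), and imm8 = 00.  */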
9130 offsetT val = 0x240483f0ULL;
9131 p = frag_more (5);
9132 md_number_to_chars (p, val, 5);
9133 return;
9134 }
9135
9136       /* Some processors fail on the LOCK prefix.  This option makes the
9137 	 assembler ignore the LOCK prefix and serves as a workaround.  */
9138 if (omit_lock_prefix)
9139 {
9140 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9141 return;
9142 i.prefix[LOCK_PREFIX] = 0;
9143 }
9144
9145 if (branch)
9146 /* Skip if this is a branch. */
9147 ;
9148 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9149 {
9150 /* Make room for padding. */
9151 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9152 p = frag_more (0);
9153
9154 fragP = frag_now;
9155
9156 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9157 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9158 NULL, 0, p);
9159
9160 fragP->tc_frag_data.mf_type = mf_cmp;
9161 fragP->tc_frag_data.branch_type = align_branch_fused;
9162 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9163 }
9164 else if (add_branch_prefix_frag_p ())
9165 {
9166 unsigned int max_prefix_size = align_branch_prefix_size;
9167
9168 /* Make room for padding. */
9169 frag_grow (max_prefix_size);
9170 p = frag_more (0);
9171
9172 fragP = frag_now;
9173
9174 frag_var (rs_machine_dependent, max_prefix_size, 0,
9175 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9176 NULL, 0, p);
9177
9178 fragP->tc_frag_data.max_bytes = max_prefix_size;
9179 }
9180
9181 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9182 don't need the explicit prefix. */
9183 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9184 {
9185 switch (i.tm.opcode_length)
9186 {
9187 case 3:
9188 if (i.tm.base_opcode & 0xff000000)
9189 {
9190 prefix = (i.tm.base_opcode >> 24) & 0xff;
9191 if (!i.tm.cpu_flags.bitfield.cpupadlock
9192 || prefix != REPE_PREFIX_OPCODE
9193 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9194 add_prefix (prefix);
9195 }
9196 break;
9197 case 2:
9198 if ((i.tm.base_opcode & 0xff0000) != 0)
9199 {
9200 prefix = (i.tm.base_opcode >> 16) & 0xff;
9201 add_prefix (prefix);
9202 }
9203 break;
9204 case 1:
9205 break;
9206 case 0:
9207 /* Check for pseudo prefixes. */
9208 as_bad_where (insn_start_frag->fr_file,
9209 insn_start_frag->fr_line,
9210 _("pseudo prefix without instruction"));
9211 return;
9212 default:
9213 abort ();
9214 }
9215
9216 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9217 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9218 R_X86_64_GOTTPOFF relocation so that linker can safely
9219 perform IE->LE optimization. A dummy REX_OPCODE prefix
9220 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9221 relocation for GDesc -> IE/LE optimization. */
9222 if (x86_elf_abi == X86_64_X32_ABI
9223 && i.operands == 2
9224 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9225 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9226 && i.prefix[REX_PREFIX] == 0)
9227 add_prefix (REX_OPCODE);
9228 #endif
9229
9230 /* The prefix bytes. */
9231 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9232 if (*q)
9233 FRAG_APPEND_1_CHAR (*q);
9234 }
9235 else
9236 {
9237 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9238 if (*q)
9239 switch (j)
9240 {
9241 case REX_PREFIX:
9242 /* REX byte is encoded in VEX prefix. */
9243 break;
9244 case SEG_PREFIX:
9245 case ADDR_PREFIX:
9246 FRAG_APPEND_1_CHAR (*q);
9247 break;
9248 default:
9249 /* There should be no other prefixes for instructions
9250 with VEX prefix. */
9251 abort ();
9252 }
9253
9254 /* For EVEX instructions i.vrex should become 0 after
9255 build_evex_prefix. For VEX instructions upper 16 registers
9256 aren't available, so VREX should be 0. */
9257 if (i.vrex)
9258 abort ();
9259 /* Now the VEX prefix. */
9260 p = frag_more (i.vex.length);
9261 for (j = 0; j < i.vex.length; j++)
9262 p[j] = i.vex.bytes[j];
9263 }
9264
9265 /* Now the opcode; be careful about word order here! */
9266 if (i.tm.opcode_length == 1)
9267 {
9268 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9269 }
9270 else
9271 {
9272 switch (i.tm.opcode_length)
9273 {
9274 case 4:
9275 p = frag_more (4);
9276 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9277 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9278 break;
9279 case 3:
9280 p = frag_more (3);
9281 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9282 break;
9283 case 2:
9284 p = frag_more (2);
9285 break;
9286 default:
9287 abort ();
9288 break;
9289 }
9290
9291 /* Put out high byte first: can't use md_number_to_chars! */
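	  /* E.g. the 3-byte opcode 0x0f38f0 (movbe) comes out as 0f
	     (written in the switch above), then 38, then f0 here.  */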
9292 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9293 *p = i.tm.base_opcode & 0xff;
9294 }
9295
9296 /* Now the modrm byte and sib byte (if present). */
9297 if (i.tm.opcode_modifier.modrm)
9298 {
9299 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
9300 | i.rm.reg << 3
9301 | i.rm.mode << 6));
9302 /* If i.rm.regmem == ESP (4)
9303 && i.rm.mode != (Register mode)
9304 && not 16 bit
9305 ==> need second modrm byte. */
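	  /* E.g. `movl (%eax,%ebx,4), %ecx' assembles to 8b 0c 98:
	     ModRM 0x0c (mode 0, reg = %ecx, rm = 4 escaping to a SIB)
	     followed by SIB 0x98 (scale = 2, index = %ebx, base = %eax).  */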
9306 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9307 && i.rm.mode != 3
9308 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9309 FRAG_APPEND_1_CHAR ((i.sib.base << 0
9310 | i.sib.index << 3
9311 | i.sib.scale << 6));
9312 }
9313
9314 if (i.disp_operands)
9315 output_disp (insn_start_frag, insn_start_off);
9316
9317 if (i.imm_operands)
9318 output_imm (insn_start_frag, insn_start_off);
9319
9320 /*
9321 * frag_now_fix () returning plain abs_section_offset when we're in the
9322 * absolute section, and abs_section_offset not getting updated as data
9323 * gets added to the frag breaks the logic below.
9324 */
9325 if (now_seg != absolute_section)
9326 {
9327 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9328 if (j > 15)
9329 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9330 j);
9331 else if (fragP)
9332 {
9333 /* NB: Don't add prefix with GOTPC relocation since
9334 output_disp() above depends on the fixed encoding
9335 length. Can't add prefix with TLS relocation since
9336 it breaks TLS linker optimization. */
9337 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9338 /* Prefix count on the current instruction. */
9339 unsigned int count = i.vex.length;
9340 unsigned int k;
9341 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9342 /* REX byte is encoded in VEX/EVEX prefix. */
9343 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9344 count++;
9345
9346 /* Count prefixes for extended opcode maps. */
9347 if (!i.vex.length)
9348 switch (i.tm.opcode_length)
9349 {
9350 case 3:
9351 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9352 {
9353 count++;
9354 switch ((i.tm.base_opcode >> 8) & 0xff)
9355 {
9356 case 0x38:
9357 case 0x3a:
9358 count++;
9359 break;
9360 default:
9361 break;
9362 }
9363 }
9364 break;
9365 case 2:
9366 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9367 count++;
9368 break;
9369 case 1:
9370 break;
9371 default:
9372 abort ();
9373 }
9374
9375 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9376 == BRANCH_PREFIX)
9377 {
9378 /* Set the maximum prefix size in BRANCH_PREFIX
9379 frag. */
9380 if (fragP->tc_frag_data.max_bytes > max)
9381 fragP->tc_frag_data.max_bytes = max;
9382 if (fragP->tc_frag_data.max_bytes > count)
9383 fragP->tc_frag_data.max_bytes -= count;
9384 else
9385 fragP->tc_frag_data.max_bytes = 0;
9386 }
9387 else
9388 {
9389 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9390 frag. */
9391 unsigned int max_prefix_size;
9392 if (align_branch_prefix_size > max)
9393 max_prefix_size = max;
9394 else
9395 max_prefix_size = align_branch_prefix_size;
9396 if (max_prefix_size > count)
9397 fragP->tc_frag_data.max_prefix_length
9398 = max_prefix_size - count;
9399 }
9400
9401 /* Use existing segment prefix if possible. Use CS
9402 segment prefix in 64-bit mode. In 32-bit mode, use SS
9403 segment prefix with ESP/EBP base register and use DS
9404 segment prefix without ESP/EBP base register. */
9405 if (i.prefix[SEG_PREFIX])
9406 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9407 else if (flag_code == CODE_64BIT)
9408 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9409 else if (i.base_reg
9410 && (i.base_reg->reg_num == 4
9411 || i.base_reg->reg_num == 5))
9412 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9413 else
9414 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9415 }
9416 }
9417 }
9418
9419   /* NB: This doesn't work with COND_JUMP86 without i386.  */
9420 if (align_branch_power
9421 && now_seg != absolute_section
9422 && cpu_arch_flags.bitfield.cpui386)
9423 {
9424 /* Terminate each frag so that we can add prefix and check for
9425 fused jcc. */
9426 frag_wane (frag_now);
9427 frag_new (0);
9428 }
9429
9430 #ifdef DEBUG386
9431 if (flag_debug)
9432 {
9433 pi ("" /*line*/, &i);
9434 }
9435 #endif /* DEBUG386 */
9436 }
9437
9438 /* Return the size of the displacement operand N. */
9439
9440 static int
9441 disp_size (unsigned int n)
9442 {
9443 int size = 4;
9444
9445 if (i.types[n].bitfield.disp64)
9446 size = 8;
9447 else if (i.types[n].bitfield.disp8)
9448 size = 1;
9449 else if (i.types[n].bitfield.disp16)
9450 size = 2;
9451 return size;
9452 }
9453
9454 /* Return the size of the immediate operand N. */
9455
9456 static int
9457 imm_size (unsigned int n)
9458 {
9459 int size = 4;
9460 if (i.types[n].bitfield.imm64)
9461 size = 8;
9462 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9463 size = 1;
9464 else if (i.types[n].bitfield.imm16)
9465 size = 2;
9466 return size;
9467 }
9468
9469 static void
9470 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9471 {
9472 char *p;
9473 unsigned int n;
9474
9475 for (n = 0; n < i.operands; n++)
9476 {
9477 if (operand_type_check (i.types[n], disp))
9478 {
9479 if (i.op[n].disps->X_op == O_constant)
9480 {
9481 int size = disp_size (n);
9482 offsetT val = i.op[n].disps->X_add_number;
9483
9484 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9485 size);
9486 p = frag_more (size);
9487 md_number_to_chars (p, val, size);
9488 }
9489 else
9490 {
9491 enum bfd_reloc_code_real reloc_type;
9492 int size = disp_size (n);
9493 int sign = i.types[n].bitfield.disp32s;
9494 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9495 fixS *fixP;
9496
9497 /* We can't have 8 bit displacement here. */
9498 gas_assert (!i.types[n].bitfield.disp8);
9499
9500 /* The PC relative address is computed relative
9501 to the instruction boundary, so in case immediate
9502 		 fields follow, we need to adjust the value.  */
9503 if (pcrel && i.imm_operands)
9504 {
9505 unsigned int n1;
9506 int sz = 0;
9507
9508 for (n1 = 0; n1 < i.operands; n1++)
9509 if (operand_type_check (i.types[n1], imm))
9510 {
9511 /* Only one immediate is allowed for PC
9512 relative address. */
9513 gas_assert (sz == 0);
9514 sz = imm_size (n1);
9515 i.op[n].disps->X_add_number -= sz;
9516 }
9517 /* We should find the immediate. */
9518 gas_assert (sz != 0);
9519 }
9520
9521 p = frag_more (size);
9522 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9523 if (GOT_symbol
9524 && GOT_symbol == i.op[n].disps->X_add_symbol
9525 && (((reloc_type == BFD_RELOC_32
9526 || reloc_type == BFD_RELOC_X86_64_32S
9527 || (reloc_type == BFD_RELOC_64
9528 && object_64bit))
9529 && (i.op[n].disps->X_op == O_symbol
9530 || (i.op[n].disps->X_op == O_add
9531 && ((symbol_get_value_expression
9532 (i.op[n].disps->X_op_symbol)->X_op)
9533 == O_subtract))))
9534 || reloc_type == BFD_RELOC_32_PCREL))
9535 {
9536 if (!object_64bit)
9537 {
9538 reloc_type = BFD_RELOC_386_GOTPC;
9539 i.has_gotpc_tls_reloc = TRUE;
9540 i.op[n].imms->X_add_number +=
9541 encoding_length (insn_start_frag, insn_start_off, p);
9542 }
9543 else if (reloc_type == BFD_RELOC_64)
9544 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9545 else
9546 /* Don't do the adjustment for x86-64, as there
9547 the pcrel addressing is relative to the _next_
9548 insn, and that is taken care of in other code. */
9549 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9550 }
9551 else if (align_branch_power)
9552 {
9553 switch (reloc_type)
9554 {
9555 case BFD_RELOC_386_TLS_GD:
9556 case BFD_RELOC_386_TLS_LDM:
9557 case BFD_RELOC_386_TLS_IE:
9558 case BFD_RELOC_386_TLS_IE_32:
9559 case BFD_RELOC_386_TLS_GOTIE:
9560 case BFD_RELOC_386_TLS_GOTDESC:
9561 case BFD_RELOC_386_TLS_DESC_CALL:
9562 case BFD_RELOC_X86_64_TLSGD:
9563 case BFD_RELOC_X86_64_TLSLD:
9564 case BFD_RELOC_X86_64_GOTTPOFF:
9565 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9566 case BFD_RELOC_X86_64_TLSDESC_CALL:
9567 i.has_gotpc_tls_reloc = TRUE;
9568 default:
9569 break;
9570 }
9571 }
9572 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9573 size, i.op[n].disps, pcrel,
9574 reloc_type);
9575 /* Check for "call/jmp *mem", "mov mem, %reg",
9576 "test %reg, mem" and "binop mem, %reg" where binop
9577 is one of adc, add, and, cmp, or, sbb, sub, xor
9578 instructions without data prefix. Always generate
9579 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9580 if (i.prefix[DATA_PREFIX] == 0
9581 && (generate_relax_relocations
9582 || (!object_64bit
9583 && i.rm.mode == 0
9584 && i.rm.regmem == 5))
9585 && (i.rm.mode == 2
9586 || (i.rm.mode == 0 && i.rm.regmem == 5))
9587 && !is_any_vex_encoding(&i.tm)
9588 && ((i.operands == 1
9589 && i.tm.base_opcode == 0xff
9590 && (i.rm.reg == 2 || i.rm.reg == 4))
9591 || (i.operands == 2
9592 && (i.tm.base_opcode == 0x8b
9593 || i.tm.base_opcode == 0x85
9594 || (i.tm.base_opcode & ~0x38) == 0x03))))
9595 {
9596 if (object_64bit)
9597 {
9598 fixP->fx_tcbit = i.rex != 0;
9599 if (i.base_reg
9600 && (i.base_reg->reg_num == RegIP))
9601 fixP->fx_tcbit2 = 1;
9602 }
9603 else
9604 fixP->fx_tcbit2 = 1;
9605 }
9606 }
9607 }
9608 }
9609 }
9610
9611 static void
9612 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9613 {
9614 char *p;
9615 unsigned int n;
9616
9617 for (n = 0; n < i.operands; n++)
9618 {
9619       /* Skip the SAE/RC imm operand in EVEX; it is already handled.  */
9620 if (i.rounding && (int) n == i.rounding->operand)
9621 continue;
9622
9623 if (operand_type_check (i.types[n], imm))
9624 {
9625 if (i.op[n].imms->X_op == O_constant)
9626 {
9627 int size = imm_size (n);
9628 offsetT val;
9629
9630 val = offset_in_range (i.op[n].imms->X_add_number,
9631 size);
9632 p = frag_more (size);
9633 md_number_to_chars (p, val, size);
9634 }
9635 else
9636 {
9637 /* Not absolute_section.
9638 Need a 32-bit fixup (don't support 8bit
9639 non-absolute imms). Try to support other
9640 sizes ... */
9641 enum bfd_reloc_code_real reloc_type;
9642 int size = imm_size (n);
9643 int sign;
9644
9645 if (i.types[n].bitfield.imm32s
9646 && (i.suffix == QWORD_MNEM_SUFFIX
9647 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9648 sign = 1;
9649 else
9650 sign = 0;
9651
9652 p = frag_more (size);
9653 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9654
9655 /* This is tough to explain. We end up with this one if we
9656 * have operands that look like
9657 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9658 * obtain the absolute address of the GOT, and it is strongly
9659 * preferable from a performance point of view to avoid using
9660 * a runtime relocation for this. The actual sequence of
9661 * instructions often look something like:
9662 *
9663 * call .L66
9664 * .L66:
9665 * popl %ebx
9666 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9667 *
9668 * The call and pop essentially return the absolute address
9669 * of the label .L66 and store it in %ebx. The linker itself
9670 * will ultimately change the first operand of the addl so
9671 * that %ebx points to the GOT, but to keep things simple, the
9672 * .o file must have this operand set so that it generates not
9673 * the absolute address of .L66, but the absolute address of
9674 	     * itself.  This allows the linker to simply treat a GOTPC
9675 * relocation as asking for a pcrel offset to the GOT to be
9676 * added in, and the addend of the relocation is stored in the
9677 * operand field for the instruction itself.
9678 *
9679 * Our job here is to fix the operand so that it would add
9680 * the correct offset so that %ebx would point to itself. The
9681 * thing that is tricky is that .-.L66 will point to the
9682 * beginning of the instruction, so we need to further modify
9683 * the operand so that it will point to itself. There are
9684 * other cases where you have something like:
9685 *
9686 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9687 *
9688 * and here no correction would be required. Internally in
9689 * the assembler we treat operands of this form as not being
9690 * pcrel since the '.' is explicitly mentioned, and I wonder
9691 * whether it would simplify matters to do it this way. Who
9692 * knows. In earlier versions of the PIC patches, the
9693 * pcrel_adjust field was used to store the correction, but
9694 * since the expression is not pcrel, I felt it would be
9695 * confusing to do it this way. */
9696
9697 if ((reloc_type == BFD_RELOC_32
9698 || reloc_type == BFD_RELOC_X86_64_32S
9699 || reloc_type == BFD_RELOC_64)
9700 && GOT_symbol
9701 && GOT_symbol == i.op[n].imms->X_add_symbol
9702 && (i.op[n].imms->X_op == O_symbol
9703 || (i.op[n].imms->X_op == O_add
9704 && ((symbol_get_value_expression
9705 (i.op[n].imms->X_op_symbol)->X_op)
9706 == O_subtract))))
9707 {
9708 if (!object_64bit)
9709 reloc_type = BFD_RELOC_386_GOTPC;
9710 else if (size == 4)
9711 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9712 else if (size == 8)
9713 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9714 i.has_gotpc_tls_reloc = TRUE;
9715 i.op[n].imms->X_add_number +=
9716 encoding_length (insn_start_frag, insn_start_off, p);
9717 }
9718 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9719 i.op[n].imms, 0, reloc_type);
9720 }
9721 }
9722 }
9723 }
9724 \f
9725 /* x86_cons_fix_new is called via the expression parsing code when a
9726 reloc is needed. We use this hook to get the correct .got reloc. */
9727 static int cons_sign = -1;
9728
9729 void
9730 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9731 expressionS *exp, bfd_reloc_code_real_type r)
9732 {
9733 r = reloc (len, 0, cons_sign, r);
9734
9735 #ifdef TE_PE
9736 if (exp->X_op == O_secrel)
9737 {
9738 exp->X_op = O_symbol;
9739 r = BFD_RELOC_32_SECREL;
9740 }
9741 #endif
9742
9743 fix_new_exp (frag, off, len, exp, 0, r);
9744 }
9745
9746 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9747 purpose of the `.dc.a' internal pseudo-op. */
9748
9749 int
9750 x86_address_bytes (void)
9751 {
9752 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9753 return 4;
9754 return stdoutput->arch_info->bits_per_address / 8;
9755 }
9756
9757 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9758 || defined (LEX_AT)
9759 # define lex_got(reloc, adjust, types) NULL
9760 #else
9761 /* Parse operands of the form
9762 <symbol>@GOTOFF+<nnn>
9763 and similar .plt or .got references.
9764
9765 If we find one, set up the correct relocation in RELOC and copy the
9766 input string, minus the `@GOTOFF' into a malloc'd buffer for
9767 parsing by the calling routine. Return this buffer, and if ADJUST
9768 is non-null set it to the length of the string we removed from the
9769 input line. Otherwise return NULL. */
9770 static char *
9771 lex_got (enum bfd_reloc_code_real *rel,
9772 int *adjust,
9773 i386_operand_type *types)
9774 {
9775 /* Some of the relocations depend on the size of the field to be
9776 relocated. But in our callers i386_immediate and i386_displacement
9777 we don't yet know the operand size (this will be set by insn
9778 matching). Hence we record the word32 relocation here,
9779 and adjust the reloc according to the real size in reloc(). */
9780 static const struct {
9781 const char *str;
9782 int len;
9783 const enum bfd_reloc_code_real rel[2];
9784 const i386_operand_type types64;
9785 } gotrel[] = {
9786 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9787 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9788 BFD_RELOC_SIZE32 },
9789 OPERAND_TYPE_IMM32_64 },
9790 #endif
9791 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9792 BFD_RELOC_X86_64_PLTOFF64 },
9793 OPERAND_TYPE_IMM64 },
9794 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9795 BFD_RELOC_X86_64_PLT32 },
9796 OPERAND_TYPE_IMM32_32S_DISP32 },
9797 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9798 BFD_RELOC_X86_64_GOTPLT64 },
9799 OPERAND_TYPE_IMM64_DISP64 },
9800 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9801 BFD_RELOC_X86_64_GOTOFF64 },
9802 OPERAND_TYPE_IMM64_DISP64 },
9803 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9804 BFD_RELOC_X86_64_GOTPCREL },
9805 OPERAND_TYPE_IMM32_32S_DISP32 },
9806 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9807 BFD_RELOC_X86_64_TLSGD },
9808 OPERAND_TYPE_IMM32_32S_DISP32 },
9809 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9810 _dummy_first_bfd_reloc_code_real },
9811 OPERAND_TYPE_NONE },
9812 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9813 BFD_RELOC_X86_64_TLSLD },
9814 OPERAND_TYPE_IMM32_32S_DISP32 },
9815 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9816 BFD_RELOC_X86_64_GOTTPOFF },
9817 OPERAND_TYPE_IMM32_32S_DISP32 },
9818 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9819 BFD_RELOC_X86_64_TPOFF32 },
9820 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9821 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9822 _dummy_first_bfd_reloc_code_real },
9823 OPERAND_TYPE_NONE },
9824 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9825 BFD_RELOC_X86_64_DTPOFF32 },
9826 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9827 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9828 _dummy_first_bfd_reloc_code_real },
9829 OPERAND_TYPE_NONE },
9830 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9831 _dummy_first_bfd_reloc_code_real },
9832 OPERAND_TYPE_NONE },
9833 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9834 BFD_RELOC_X86_64_GOT32 },
9835 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9836 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9837 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9838 OPERAND_TYPE_IMM32_32S_DISP32 },
9839 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9840 BFD_RELOC_X86_64_TLSDESC_CALL },
9841 OPERAND_TYPE_IMM32_32S_DISP32 },
9842 };
9843 char *cp;
9844 unsigned int j;
9845
9846 #if defined (OBJ_MAYBE_ELF)
9847 if (!IS_ELF)
9848 return NULL;
9849 #endif
9850
9851 for (cp = input_line_pointer; *cp != '@'; cp++)
9852 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9853 return NULL;
9854
9855 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9856 {
9857 int len = gotrel[j].len;
9858 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9859 {
9860 if (gotrel[j].rel[object_64bit] != 0)
9861 {
9862 int first, second;
9863 char *tmpbuf, *past_reloc;
9864
9865 *rel = gotrel[j].rel[object_64bit];
9866
9867 if (types)
9868 {
9869 if (flag_code != CODE_64BIT)
9870 {
9871 types->bitfield.imm32 = 1;
9872 types->bitfield.disp32 = 1;
9873 }
9874 else
9875 *types = gotrel[j].types64;
9876 }
9877
9878 if (j != 0 && GOT_symbol == NULL)
9879 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9880
9881 /* The length of the first part of our input line. */
9882 first = cp - input_line_pointer;
9883
9884 /* The second part goes from after the reloc token until
9885 (and including) an end_of_line char or comma. */
9886 past_reloc = cp + 1 + len;
9887 cp = past_reloc;
9888 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9889 ++cp;
9890 second = cp + 1 - past_reloc;
9891
9892 /* Allocate and copy string. The trailing NUL shouldn't
9893 be necessary, but be safe. */
9894 tmpbuf = XNEWVEC (char, first + second + 2);
9895 memcpy (tmpbuf, input_line_pointer, first);
9896 if (second != 0 && *past_reloc != ' ')
9897 /* Replace the relocation token with ' ', so that
9898 errors like foo@GOTOFF1 will be detected. */
9899 tmpbuf[first++] = ' ';
9900 else
9901 /* Increment length by 1 if the relocation token is
9902 removed. */
9903 len++;
9904 if (adjust)
9905 *adjust = len;
9906 memcpy (tmpbuf + first, past_reloc, second);
9907 tmpbuf[first + second] = '\0';
9908 return tmpbuf;
9909 }
9910
9911 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9912 gotrel[j].str, 1 << (5 + object_64bit));
9913 return NULL;
9914 }
9915 }
9916
9917 /* Might be a symbol version string. Don't as_bad here. */
9918 return NULL;
9919 }
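
/* A rough sketch of the inputs lex_got handles (examples ours, not
   exhaustive):

     movl  foo@GOTOFF(%ebx), %eax      -> BFD_RELOC_386_GOTOFF
     call  bar@PLT                     -> BFD_RELOC_386_PLT32
     movq  baz@GOTPCREL(%rip), %rax    -> BFD_RELOC_X86_64_GOTPCREL

   The "@GOTOFF" etc. token is cut out of the returned buffer so that
   the generic expression parser never sees it. */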
9920 #endif
9921
9922 #ifdef TE_PE
9923 #ifdef lex_got
9924 #undef lex_got
9925 #endif
9926 /* Parse operands of the form
9927 <symbol>@SECREL32+<nnn>
9928
9929 If we find one, set up the correct relocation in RELOC and copy the
9930 input string, minus the `@SECREL32' into a malloc'd buffer for
9931 parsing by the calling routine. Return this buffer, and if ADJUST
9932 is non-null set it to the length of the string we removed from the
9933 input line. Otherwise return NULL.
9934
9935 This function is copied from the ELF version above adjusted for PE targets. */
9936
9937 static char *
9938 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9939 int *adjust ATTRIBUTE_UNUSED,
9940 i386_operand_type *types)
9941 {
9942 static const struct
9943 {
9944 const char *str;
9945 int len;
9946 const enum bfd_reloc_code_real rel[2];
9947 const i386_operand_type types64;
9948 }
9949 gotrel[] =
9950 {
9951 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
9952 BFD_RELOC_32_SECREL },
9953 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9954 };
9955
9956 char *cp;
9957 unsigned j;
9958
9959 for (cp = input_line_pointer; *cp != '@'; cp++)
9960 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9961 return NULL;
9962
9963 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9964 {
9965 int len = gotrel[j].len;
9966
9967 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9968 {
9969 if (gotrel[j].rel[object_64bit] != 0)
9970 {
9971 int first, second;
9972 char *tmpbuf, *past_reloc;
9973
9974 *rel = gotrel[j].rel[object_64bit];
9975 if (adjust)
9976 *adjust = len;
9977
9978 if (types)
9979 {
9980 if (flag_code != CODE_64BIT)
9981 {
9982 types->bitfield.imm32 = 1;
9983 types->bitfield.disp32 = 1;
9984 }
9985 else
9986 *types = gotrel[j].types64;
9987 }
9988
9989 /* The length of the first part of our input line. */
9990 first = cp - input_line_pointer;
9991
9992 /* The second part goes from after the reloc token until
9993 (and including) an end_of_line char or comma. */
9994 past_reloc = cp + 1 + len;
9995 cp = past_reloc;
9996 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9997 ++cp;
9998 second = cp + 1 - past_reloc;
9999
10000 /* Allocate and copy string. The trailing NUL shouldn't
10001 be necessary, but be safe. */
10002 tmpbuf = XNEWVEC (char, first + second + 2);
10003 memcpy (tmpbuf, input_line_pointer, first);
10004 if (second != 0 && *past_reloc != ' ')
10005 /* Replace the relocation token with ' ', so that
10006 errors like foo@SECREL321 will be detected. */
10007 tmpbuf[first++] = ' ';
10008 memcpy (tmpbuf + first, past_reloc, second);
10009 tmpbuf[first + second] = '\0';
10010 return tmpbuf;
10011 }
10012
10013 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10014 gotrel[j].str, 1 << (5 + object_64bit));
10015 return NULL;
10016 }
10017 }
10018
10019 /* Might be a symbol version string. Don't as_bad here. */
10020 return NULL;
10021 }
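
/* For illustration (example ours): on PE targets an operand such as
   "movl foo@SECREL32(%eax), %ecx" comes through here and yields
   BFD_RELOC_32_SECREL. */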
10022
10023 #endif /* TE_PE */
10024
10025 bfd_reloc_code_real_type
10026 x86_cons (expressionS *exp, int size)
10027 {
10028 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10029
10030 intel_syntax = -intel_syntax;
10031
10032 exp->X_md = 0;
10033 if (size == 4 || (object_64bit && size == 8))
10034 {
10035 /* Handle @GOTOFF and the like in an expression. */
10036 char *save;
10037 char *gotfree_input_line;
10038 int adjust = 0;
10039
10040 save = input_line_pointer;
10041 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10042 if (gotfree_input_line)
10043 input_line_pointer = gotfree_input_line;
10044
10045 expression (exp);
10046
10047 if (gotfree_input_line)
10048 {
10049 /* expression () has merrily parsed up to the end of line,
10050 or a comma - in the wrong buffer. Transfer how far
10051 input_line_pointer has moved to the right buffer. */
10052 input_line_pointer = (save
10053 + (input_line_pointer - gotfree_input_line)
10054 + adjust);
10055 free (gotfree_input_line);
10056 if (exp->X_op == O_constant
10057 || exp->X_op == O_absent
10058 || exp->X_op == O_illegal
10059 || exp->X_op == O_register
10060 || exp->X_op == O_big)
10061 {
10062 char c = *input_line_pointer;
10063 *input_line_pointer = 0;
10064 as_bad (_("missing or invalid expression `%s'"), save);
10065 *input_line_pointer = c;
10066 }
10067 else if ((got_reloc == BFD_RELOC_386_PLT32
10068 || got_reloc == BFD_RELOC_X86_64_PLT32)
10069 && exp->X_op != O_symbol)
10070 {
10071 char c = *input_line_pointer;
10072 *input_line_pointer = 0;
10073 as_bad (_("invalid PLT expression `%s'"), save);
10074 *input_line_pointer = c;
10075 }
10076 }
10077 }
10078 else
10079 expression (exp);
10080
10081 intel_syntax = -intel_syntax;
10082
10083 if (intel_syntax)
10084 i386_intel_simplify (exp);
10085
10086 return got_reloc;
10087 }
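
/* For illustration (examples ours): x86_cons is what lets data
   directives carry GOT-relative values, e.g.

     .long  foo@GOTOFF
     .long  bar@GOT

   lex_got strips the @-suffix, expression () parses the remainder in
   the copied buffer, and the chosen relocation is handed back for the
   eventual fixup. */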
10088
10089 static void
10090 signed_cons (int size)
10091 {
10092 if (flag_code == CODE_64BIT)
10093 cons_sign = 1;
10094 cons (size);
10095 cons_sign = -1;
10096 }
10097
10098 #ifdef TE_PE
10099 static void
10100 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10101 {
10102 expressionS exp;
10103
10104 do
10105 {
10106 expression (&exp);
10107 if (exp.X_op == O_symbol)
10108 exp.X_op = O_secrel;
10109
10110 emit_expr (&exp, 4);
10111 }
10112 while (*input_line_pointer++ == ',');
10113
10114 input_line_pointer--;
10115 demand_empty_rest_of_line ();
10116 }
10117 #endif
10118
10119 /* Handle Vector operations. */
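/* For illustration (examples ours): the decorations handled below, in
   AT&T syntax, look like

     vaddps  (%rax){1to16}, %zmm1, %zmm2     broadcast
     vaddps  %zmm0, %zmm1, %zmm2{%k1}        write mask
     vaddps  %zmm0, %zmm1, %zmm2{%k1}{z}     write mask + zeroing

   "{z}" without a mask register and "{%k0}" as a write mask are both
   rejected. */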
10120
10121 static char *
10122 check_VecOperations (char *op_string, char *op_end)
10123 {
10124 const reg_entry *mask;
10125 const char *saved;
10126 char *end_op;
10127
10128 while (*op_string
10129 && (op_end == NULL || op_string < op_end))
10130 {
10131 saved = op_string;
10132 if (*op_string == '{')
10133 {
10134 op_string++;
10135
10136 /* Check broadcasts. */
10137 if (strncmp (op_string, "1to", 3) == 0)
10138 {
10139 int bcst_type;
10140
10141 if (i.broadcast)
10142 goto duplicated_vec_op;
10143
10144 op_string += 3;
10145 if (*op_string == '8')
10146 bcst_type = 8;
10147 else if (*op_string == '4')
10148 bcst_type = 4;
10149 else if (*op_string == '2')
10150 bcst_type = 2;
10151 else if (*op_string == '1'
10152 && *(op_string+1) == '6')
10153 {
10154 bcst_type = 16;
10155 op_string++;
10156 }
10157 else
10158 {
10159 as_bad (_("Unsupported broadcast: `%s'"), saved);
10160 return NULL;
10161 }
10162 op_string++;
10163
10164 broadcast_op.type = bcst_type;
10165 broadcast_op.operand = this_operand;
10166 broadcast_op.bytes = 0;
10167 i.broadcast = &broadcast_op;
10168 }
10169 /* Check masking operation. */
10170 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10171 {
10172 if (mask == &bad_reg)
10173 return NULL;
10174
10175 /* k0 can't be used for write mask. */
10176 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10177 {
10178 as_bad (_("`%s%s' can't be used for write mask"),
10179 register_prefix, mask->reg_name);
10180 return NULL;
10181 }
10182
10183 if (!i.mask)
10184 {
10185 mask_op.mask = mask;
10186 mask_op.zeroing = 0;
10187 mask_op.operand = this_operand;
10188 i.mask = &mask_op;
10189 }
10190 else
10191 {
10192 if (i.mask->mask)
10193 goto duplicated_vec_op;
10194
10195 i.mask->mask = mask;
10196
10197 /* Only "{z}" is allowed here. No need to check
10198 zeroing mask explicitly. */
10199 if (i.mask->operand != this_operand)
10200 {
10201 as_bad (_("invalid write mask `%s'"), saved);
10202 return NULL;
10203 }
10204 }
10205
10206 op_string = end_op;
10207 }
10208 /* Check zeroing-flag for masking operation. */
10209 else if (*op_string == 'z')
10210 {
10211 if (!i.mask)
10212 {
10213 mask_op.mask = NULL;
10214 mask_op.zeroing = 1;
10215 mask_op.operand = this_operand;
10216 i.mask = &mask_op;
10217 }
10218 else
10219 {
10220 if (i.mask->zeroing)
10221 {
10222 duplicated_vec_op:
10223 as_bad (_("duplicated `%s'"), saved);
10224 return NULL;
10225 }
10226
10227 i.mask->zeroing = 1;
10228
10229 /* Only "{%k}" is allowed here. No need to check mask
10230 register explicitly. */
10231 if (i.mask->operand != this_operand)
10232 {
10233 as_bad (_("invalid zeroing-masking `%s'"),
10234 saved);
10235 return NULL;
10236 }
10237 }
10238
10239 op_string++;
10240 }
10241 else
10242 goto unknown_vec_op;
10243
10244 if (*op_string != '}')
10245 {
10246 as_bad (_("missing `}' in `%s'"), saved);
10247 return NULL;
10248 }
10249 op_string++;
10250
10251 /* Strip whitespace since the addition of pseudo prefixes
10252 changed how the scrubber treats '{'. */
10253 if (is_space_char (*op_string))
10254 ++op_string;
10255
10256 continue;
10257 }
10258 unknown_vec_op:
10259 /* We don't know this one. */
10260 as_bad (_("unknown vector operation: `%s'"), saved);
10261 return NULL;
10262 }
10263
10264 if (i.mask && i.mask->zeroing && !i.mask->mask)
10265 {
10266 as_bad (_("zeroing-masking only allowed with write mask"));
10267 return NULL;
10268 }
10269
10270 return op_string;
10271 }
10272
10273 static int
10274 i386_immediate (char *imm_start)
10275 {
10276 char *save_input_line_pointer;
10277 char *gotfree_input_line;
10278 segT exp_seg = 0;
10279 expressionS *exp;
10280 i386_operand_type types;
10281
10282 operand_type_set (&types, ~0);
10283
10284 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10285 {
10286 as_bad (_("at most %d immediate operands are allowed"),
10287 MAX_IMMEDIATE_OPERANDS);
10288 return 0;
10289 }
10290
10291 exp = &im_expressions[i.imm_operands++];
10292 i.op[this_operand].imms = exp;
10293
10294 if (is_space_char (*imm_start))
10295 ++imm_start;
10296
10297 save_input_line_pointer = input_line_pointer;
10298 input_line_pointer = imm_start;
10299
10300 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10301 if (gotfree_input_line)
10302 input_line_pointer = gotfree_input_line;
10303
10304 exp_seg = expression (exp);
10305
10306 SKIP_WHITESPACE ();
10307
10308 /* Handle vector operations. */
10309 if (*input_line_pointer == '{')
10310 {
10311 input_line_pointer = check_VecOperations (input_line_pointer,
10312 NULL);
10313 if (input_line_pointer == NULL)
10314 return 0;
10315 }
10316
10317 if (*input_line_pointer)
10318 as_bad (_("junk `%s' after expression"), input_line_pointer);
10319
10320 input_line_pointer = save_input_line_pointer;
10321 if (gotfree_input_line)
10322 {
10323 free (gotfree_input_line);
10324
10325 if (exp->X_op == O_constant || exp->X_op == O_register)
10326 exp->X_op = O_illegal;
10327 }
10328
10329 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10330 }
10331
10332 static int
10333 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10334 i386_operand_type types, const char *imm_start)
10335 {
10336 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10337 {
10338 if (imm_start)
10339 as_bad (_("missing or invalid immediate expression `%s'"),
10340 imm_start);
10341 return 0;
10342 }
10343 else if (exp->X_op == O_constant)
10344 {
10345 /* Size it properly later. */
10346 i.types[this_operand].bitfield.imm64 = 1;
10347 /* If not 64bit, sign extend val. */
10348 if (flag_code != CODE_64BIT
10349 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10350 exp->X_add_number
10351 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10352 }
10353 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10354 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10355 && exp_seg != absolute_section
10356 && exp_seg != text_section
10357 && exp_seg != data_section
10358 && exp_seg != bss_section
10359 && exp_seg != undefined_section
10360 && !bfd_is_com_section (exp_seg))
10361 {
10362 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10363 return 0;
10364 }
10365 #endif
10366 else if (!intel_syntax && exp_seg == reg_section)
10367 {
10368 if (imm_start)
10369 as_bad (_("illegal immediate register operand %s"), imm_start);
10370 return 0;
10371 }
10372 else
10373 {
10374 /* This is an address. The size of the address will be
10375 determined later, depending on destination register,
10376 suffix, or the default for the section. */
10377 i.types[this_operand].bitfield.imm8 = 1;
10378 i.types[this_operand].bitfield.imm16 = 1;
10379 i.types[this_operand].bitfield.imm32 = 1;
10380 i.types[this_operand].bitfield.imm32s = 1;
10381 i.types[this_operand].bitfield.imm64 = 1;
10382 i.types[this_operand] = operand_type_and (i.types[this_operand],
10383 types);
10384 }
10385
10386 return 1;
10387 }
10388
10389 static char *
10390 i386_scale (char *scale)
10391 {
10392 offsetT val;
10393 char *save = input_line_pointer;
10394
10395 input_line_pointer = scale;
10396 val = get_absolute_expression ();
10397
10398 switch (val)
10399 {
10400 case 1:
10401 i.log2_scale_factor = 0;
10402 break;
10403 case 2:
10404 i.log2_scale_factor = 1;
10405 break;
10406 case 4:
10407 i.log2_scale_factor = 2;
10408 break;
10409 case 8:
10410 i.log2_scale_factor = 3;
10411 break;
10412 default:
10413 {
10414 char sep = *input_line_pointer;
10415
10416 *input_line_pointer = '\0';
10417 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10418 scale);
10419 *input_line_pointer = sep;
10420 input_line_pointer = save;
10421 return NULL;
10422 }
10423 }
10424 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10425 {
10426 as_warn (_("scale factor of %d without an index register"),
10427 1 << i.log2_scale_factor);
10428 i.log2_scale_factor = 0;
10429 }
10430 scale = input_line_pointer;
10431 input_line_pointer = save;
10432 return scale;
10433 }
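
/* For illustration (examples ours): for "(%ebx,%esi,4)" this routine
   is handed the "4" and records log2(4) == 2 in i.log2_scale_factor.
   A scale without an index register, e.g. "(%ebx,2)", only draws a
   warning and the factor is reset to 1. */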
10434
10435 static int
10436 i386_displacement (char *disp_start, char *disp_end)
10437 {
10438 expressionS *exp;
10439 segT exp_seg = 0;
10440 char *save_input_line_pointer;
10441 char *gotfree_input_line;
10442 int override;
10443 i386_operand_type bigdisp, types = anydisp;
10444 int ret;
10445
10446 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10447 {
10448 as_bad (_("at most %d displacement operands are allowed"),
10449 MAX_MEMORY_OPERANDS);
10450 return 0;
10451 }
10452
10453 operand_type_set (&bigdisp, 0);
10454 if (i.jumpabsolute
10455 || i.types[this_operand].bitfield.baseindex
10456 || (current_templates->start->opcode_modifier.jump != JUMP
10457 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10458 {
10459 i386_addressing_mode ();
10460 override = (i.prefix[ADDR_PREFIX] != 0);
10461 if (flag_code == CODE_64BIT)
10462 {
10463 if (!override)
10464 {
10465 bigdisp.bitfield.disp32s = 1;
10466 bigdisp.bitfield.disp64 = 1;
10467 }
10468 else
10469 bigdisp.bitfield.disp32 = 1;
10470 }
10471 else if ((flag_code == CODE_16BIT) ^ override)
10472 bigdisp.bitfield.disp16 = 1;
10473 else
10474 bigdisp.bitfield.disp32 = 1;
10475 }
10476 else
10477 {
10478 /* For PC-relative branches, the width of the displacement may be
10479 dependent upon data size, but is never dependent upon address size.
10480 Also make sure to not unintentionally match against a non-PC-relative
10481 branch template. */
10482 static templates aux_templates;
10483 const insn_template *t = current_templates->start;
10484 bfd_boolean has_intel64 = FALSE;
10485
10486 aux_templates.start = t;
10487 while (++t < current_templates->end)
10488 {
10489 if (t->opcode_modifier.jump
10490 != current_templates->start->opcode_modifier.jump)
10491 break;
10492 if ((t->opcode_modifier.isa64 >= INTEL64))
10493 has_intel64 = TRUE;
10494 }
10495 if (t < current_templates->end)
10496 {
10497 aux_templates.end = t;
10498 current_templates = &aux_templates;
10499 }
10500
10501 override = (i.prefix[DATA_PREFIX] != 0);
10502 if (flag_code == CODE_64BIT)
10503 {
10504 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10505 && (!intel64 || !has_intel64))
10506 bigdisp.bitfield.disp16 = 1;
10507 else
10508 bigdisp.bitfield.disp32s = 1;
10509 }
10510 else
10511 {
10512 if (!override)
10513 override = (i.suffix == (flag_code != CODE_16BIT
10514 ? WORD_MNEM_SUFFIX
10515 : LONG_MNEM_SUFFIX));
10516 bigdisp.bitfield.disp32 = 1;
10517 if ((flag_code == CODE_16BIT) ^ override)
10518 {
10519 bigdisp.bitfield.disp32 = 0;
10520 bigdisp.bitfield.disp16 = 1;
10521 }
10522 }
10523 }
10524 i.types[this_operand] = operand_type_or (i.types[this_operand],
10525 bigdisp);
10526
10527 exp = &disp_expressions[i.disp_operands];
10528 i.op[this_operand].disps = exp;
10529 i.disp_operands++;
10530 save_input_line_pointer = input_line_pointer;
10531 input_line_pointer = disp_start;
10532 END_STRING_AND_SAVE (disp_end);
10533
10534 #ifndef GCC_ASM_O_HACK
10535 #define GCC_ASM_O_HACK 0
10536 #endif
10537 #if GCC_ASM_O_HACK
10538 END_STRING_AND_SAVE (disp_end + 1);
10539 if (i.types[this_operand].bitfield.baseindex
10540 && disp_end[-1] == '+')
10541 {
10542 /* This hack is to avoid a warning when using the "o"
10543 constraint within gcc asm statements.
10544 For instance:
10545
10546 #define _set_tssldt_desc(n,addr,limit,type) \
10547 __asm__ __volatile__ ( \
10548 "movw %w2,%0\n\t" \
10549 "movw %w1,2+%0\n\t" \
10550 "rorl $16,%1\n\t" \
10551 "movb %b1,4+%0\n\t" \
10552 "movb %4,5+%0\n\t" \
10553 "movb $0,6+%0\n\t" \
10554 "movb %h1,7+%0\n\t" \
10555 "rorl $16,%1" \
10556 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10557
10558 This works great except that the output assembler ends
10559 up looking a bit weird if it turns out that there is
10560 no offset. You end up producing code that looks like:
10561
10562 #APP
10563 movw $235,(%eax)
10564 movw %dx,2+(%eax)
10565 rorl $16,%edx
10566 movb %dl,4+(%eax)
10567 movb $137,5+(%eax)
10568 movb $0,6+(%eax)
10569 movb %dh,7+(%eax)
10570 rorl $16,%edx
10571 #NO_APP
10572
10573 So here we provide the missing zero. */
10574
10575 *disp_end = '0';
10576 }
10577 #endif
10578 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10579 if (gotfree_input_line)
10580 input_line_pointer = gotfree_input_line;
10581
10582 exp_seg = expression (exp);
10583
10584 SKIP_WHITESPACE ();
10585 if (*input_line_pointer)
10586 as_bad (_("junk `%s' after expression"), input_line_pointer);
10587 #if GCC_ASM_O_HACK
10588 RESTORE_END_STRING (disp_end + 1);
10589 #endif
10590 input_line_pointer = save_input_line_pointer;
10591 if (gotfree_input_line)
10592 {
10593 free (gotfree_input_line);
10594
10595 if (exp->X_op == O_constant || exp->X_op == O_register)
10596 exp->X_op = O_illegal;
10597 }
10598
10599 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10600
10601 RESTORE_END_STRING (disp_end);
10602
10603 return ret;
10604 }
10605
10606 static int
10607 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10608 i386_operand_type types, const char *disp_start)
10609 {
10610 i386_operand_type bigdisp;
10611 int ret = 1;
10612
10613 /* We do this to make sure that the section symbol is in
10614 the symbol table. We will ultimately change the relocation
10615 to be relative to the beginning of the section. */
10616 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10617 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10618 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10619 {
10620 if (exp->X_op != O_symbol)
10621 goto inv_disp;
10622
10623 if (S_IS_LOCAL (exp->X_add_symbol)
10624 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10625 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10626 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10627 exp->X_op = O_subtract;
10628 exp->X_op_symbol = GOT_symbol;
10629 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10630 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10631 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10632 i.reloc[this_operand] = BFD_RELOC_64;
10633 else
10634 i.reloc[this_operand] = BFD_RELOC_32;
10635 }
10636
10637 else if (exp->X_op == O_absent
10638 || exp->X_op == O_illegal
10639 || exp->X_op == O_big)
10640 {
10641 inv_disp:
10642 as_bad (_("missing or invalid displacement expression `%s'"),
10643 disp_start);
10644 ret = 0;
10645 }
10646
10647 else if (flag_code == CODE_64BIT
10648 && !i.prefix[ADDR_PREFIX]
10649 && exp->X_op == O_constant)
10650 {
10651 /* Since the displacement is sign-extended to 64bit, don't allow
10652 disp32, and turn off disp32s if the value is out of range. */
10653 i.types[this_operand].bitfield.disp32 = 0;
10654 if (!fits_in_signed_long (exp->X_add_number))
10655 {
10656 i.types[this_operand].bitfield.disp32s = 0;
10657 if (i.types[this_operand].bitfield.baseindex)
10658 {
10659 as_bad (_("0x%lx out range of signed 32bit displacement"),
10660 (long) exp->X_add_number);
10661 ret = 0;
10662 }
10663 }
10664 }
10665
10666 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10667 else if (exp->X_op != O_constant
10668 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10669 && exp_seg != absolute_section
10670 && exp_seg != text_section
10671 && exp_seg != data_section
10672 && exp_seg != bss_section
10673 && exp_seg != undefined_section
10674 && !bfd_is_com_section (exp_seg))
10675 {
10676 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10677 ret = 0;
10678 }
10679 #endif
10680
10681 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10682 /* Constants get taken care of by optimize_disp(). */
10683 && exp->X_op != O_constant)
10684 i.types[this_operand].bitfield.disp8 = 1;
10685
10686 /* Check if this is a displacement only operand. */
10687 bigdisp = i.types[this_operand];
10688 bigdisp.bitfield.disp8 = 0;
10689 bigdisp.bitfield.disp16 = 0;
10690 bigdisp.bitfield.disp32 = 0;
10691 bigdisp.bitfield.disp32s = 0;
10692 bigdisp.bitfield.disp64 = 0;
10693 if (operand_type_all_zero (&bigdisp))
10694 i.types[this_operand] = operand_type_and (i.types[this_operand],
10695 types);
10696
10697 return ret;
10698 }
10699
10700 /* Return the active addressing mode, taking address override and
10701 registers forming the address into consideration. Update the
10702 address override prefix if necessary. */
10703
10704 static enum flag_code
10705 i386_addressing_mode (void)
10706 {
10707 enum flag_code addr_mode;
10708
10709 if (i.prefix[ADDR_PREFIX])
10710 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10711 else if (flag_code == CODE_16BIT
10712 && current_templates->start->cpu_flags.bitfield.cpumpx
10713 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10714 from md_assemble() by "is not a valid base/index expression"
10715 when there is a base and/or index. */
10716 && !i.types[this_operand].bitfield.baseindex)
10717 {
10718 /* MPX insn memory operands with neither base nor index must be forced
10719 to use 32-bit addressing in 16-bit mode. */
10720 addr_mode = CODE_32BIT;
10721 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10722 ++i.prefixes;
10723 gas_assert (!i.types[this_operand].bitfield.disp16);
10724 gas_assert (!i.types[this_operand].bitfield.disp32);
10725 }
10726 else
10727 {
10728 addr_mode = flag_code;
10729
10730 #if INFER_ADDR_PREFIX
10731 if (i.mem_operands == 0)
10732 {
10733 /* Infer address prefix from the first memory operand. */
10734 const reg_entry *addr_reg = i.base_reg;
10735
10736 if (addr_reg == NULL)
10737 addr_reg = i.index_reg;
10738
10739 if (addr_reg)
10740 {
10741 if (addr_reg->reg_type.bitfield.dword)
10742 addr_mode = CODE_32BIT;
10743 else if (flag_code != CODE_64BIT
10744 && addr_reg->reg_type.bitfield.word)
10745 addr_mode = CODE_16BIT;
10746
10747 if (addr_mode != flag_code)
10748 {
10749 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10750 i.prefixes += 1;
10751 /* Change the size of any displacement too. At most one
10752 of Disp16 or Disp32 is set.
10753 FIXME. There doesn't seem to be any real need for
10754 separate Disp16 and Disp32 flags. The same goes for
10755 Imm16 and Imm32. Removing them would probably clean
10756 up the code quite a lot. */
10757 if (flag_code != CODE_64BIT
10758 && (i.types[this_operand].bitfield.disp16
10759 || i.types[this_operand].bitfield.disp32))
10760 i.types[this_operand]
10761 = operand_type_xor (i.types[this_operand], disp16_32);
10762 }
10763 }
10764 }
10765 #endif
10766 }
10767
10768 return addr_mode;
10769 }
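
/* For illustration (example ours): in 32-bit code, "movw (%bx), %ax"
   makes the inference above pick CODE_16BIT from the base register
   and emit the 0x67 address-size prefix automatically. */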
10770
10771 /* Make sure the memory operand we've been dealt is valid.
10772 Return 1 on success, 0 on a failure. */
10773
10774 static int
10775 i386_index_check (const char *operand_string)
10776 {
10777 const char *kind = "base/index";
10778 enum flag_code addr_mode = i386_addressing_mode ();
10779
10780 if (current_templates->start->opcode_modifier.isstring
10781 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10782 && (current_templates->end[-1].opcode_modifier.isstring
10783 || i.mem_operands))
10784 {
10785 /* Memory operands of string insns are special in that they only allow
10786 a single register (rDI, rSI, or rBX) as their memory address. */
10787 const reg_entry *expected_reg;
10788 static const char *di_si[][2] =
10789 {
10790 { "esi", "edi" },
10791 { "si", "di" },
10792 { "rsi", "rdi" }
10793 };
10794 static const char *bx[] = { "ebx", "bx", "rbx" };
10795
10796 kind = "string address";
10797
10798 if (current_templates->start->opcode_modifier.repprefixok)
10799 {
10800 int es_op = current_templates->end[-1].opcode_modifier.isstring
10801 - IS_STRING_ES_OP0;
10802 int op = 0;
10803
10804 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10805 || ((!i.mem_operands != !intel_syntax)
10806 && current_templates->end[-1].operand_types[1]
10807 .bitfield.baseindex))
10808 op = 1;
10809 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10810 }
10811 else
10812 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10813
10814 if (i.base_reg != expected_reg
10815 || i.index_reg
10816 || operand_type_check (i.types[this_operand], disp))
10817 {
10818 /* The second memory operand must have the same size as
10819 the first one. */
10820 if (i.mem_operands
10821 && i.base_reg
10822 && !((addr_mode == CODE_64BIT
10823 && i.base_reg->reg_type.bitfield.qword)
10824 || (addr_mode == CODE_32BIT
10825 ? i.base_reg->reg_type.bitfield.dword
10826 : i.base_reg->reg_type.bitfield.word)))
10827 goto bad_address;
10828
10829 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10830 operand_string,
10831 intel_syntax ? '[' : '(',
10832 register_prefix,
10833 expected_reg->reg_name,
10834 intel_syntax ? ']' : ')');
10835 return 1;
10836 }
10837 else
10838 return 1;
10839
10840 bad_address:
10841 as_bad (_("`%s' is not a valid %s expression"),
10842 operand_string, kind);
10843 return 0;
10844 }
10845 else
10846 {
10847 if (addr_mode != CODE_16BIT)
10848 {
10849 /* 32-bit/64-bit checks. */
10850 if ((i.base_reg
10851 && ((addr_mode == CODE_64BIT
10852 ? !i.base_reg->reg_type.bitfield.qword
10853 : !i.base_reg->reg_type.bitfield.dword)
10854 || (i.index_reg && i.base_reg->reg_num == RegIP)
10855 || i.base_reg->reg_num == RegIZ))
10856 || (i.index_reg
10857 && !i.index_reg->reg_type.bitfield.xmmword
10858 && !i.index_reg->reg_type.bitfield.ymmword
10859 && !i.index_reg->reg_type.bitfield.zmmword
10860 && ((addr_mode == CODE_64BIT
10861 ? !i.index_reg->reg_type.bitfield.qword
10862 : !i.index_reg->reg_type.bitfield.dword)
10863 || !i.index_reg->reg_type.bitfield.baseindex)))
10864 goto bad_address;
10865
10866 /* bndmk, bndldx, and bndstx have special restrictions. */
10867 if (current_templates->start->base_opcode == 0xf30f1b
10868 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10869 {
10870 /* They cannot use RIP-relative addressing. */
10871 if (i.base_reg && i.base_reg->reg_num == RegIP)
10872 {
10873 as_bad (_("`%s' cannot be used here"), operand_string);
10874 return 0;
10875 }
10876
10877 /* bndldx and bndstx ignore their scale factor. */
10878 if (current_templates->start->base_opcode != 0xf30f1b
10879 && i.log2_scale_factor)
10880 as_warn (_("register scaling is being ignored here"));
10881 }
10882 }
10883 else
10884 {
10885 /* 16-bit checks. */
10886 if ((i.base_reg
10887 && (!i.base_reg->reg_type.bitfield.word
10888 || !i.base_reg->reg_type.bitfield.baseindex))
10889 || (i.index_reg
10890 && (!i.index_reg->reg_type.bitfield.word
10891 || !i.index_reg->reg_type.bitfield.baseindex
10892 || !(i.base_reg
10893 && i.base_reg->reg_num < 6
10894 && i.index_reg->reg_num >= 6
10895 && i.log2_scale_factor == 0))))
10896 goto bad_address;
10897 }
10898 }
10899 return 1;
10900 }
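
/* For illustration (example ours): for string insns the only accepted
   address is the hard-coded one, so in 32-bit code "stosl %eax, (%edi)"
   passes this check while "stosl %eax, (%ebx)" only provokes the
   "expected `(%edi)'" warning above. */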
10901
10902 /* Handle vector immediates. */
10903
10904 static int
10905 RC_SAE_immediate (const char *imm_start)
10906 {
10907 unsigned int match_found, j;
10908 const char *pstr = imm_start;
10909 expressionS *exp;
10910
10911 if (*pstr != '{')
10912 return 0;
10913
10914 pstr++;
10915 match_found = 0;
10916 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10917 {
10918 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10919 {
10920 if (!i.rounding)
10921 {
10922 rc_op.type = RC_NamesTable[j].type;
10923 rc_op.operand = this_operand;
10924 i.rounding = &rc_op;
10925 }
10926 else
10927 {
10928 as_bad (_("duplicated `%s'"), imm_start);
10929 return 0;
10930 }
10931 pstr += RC_NamesTable[j].len;
10932 match_found = 1;
10933 break;
10934 }
10935 }
10936 if (!match_found)
10937 return 0;
10938
10939 if (*pstr++ != '}')
10940 {
10941 as_bad (_("Missing '}': '%s'"), imm_start);
10942 return 0;
10943 }
10944 /* RC/SAE immediate string should contain nothing more. */
10945 if (*pstr != 0)
10946 {
10947 as_bad (_("Junk after '}': '%s'"), imm_start);
10948 return 0;
10949 }
10950
10951 exp = &im_expressions[i.imm_operands++];
10952 i.op[this_operand].imms = exp;
10953
10954 exp->X_op = O_constant;
10955 exp->X_add_number = 0;
10956 exp->X_add_symbol = (symbolS *) 0;
10957 exp->X_op_symbol = (symbolS *) 0;
10958
10959 i.types[this_operand].bitfield.imm8 = 1;
10960 return 1;
10961 }
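
/* For illustration (examples ours): the {} immediates accepted above
   appear in EVEX rounding-control operands such as

     vaddps      {rn-sae}, %zmm1, %zmm2, %zmm3
     vcvttss2si  {sae}, %xmm1, %eax

   They consume no encoding space of their own; an imm8-style operand
   with value 0 is faked up so that operand matching stays regular. */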
10962
10963 /* Only string instructions can have a second memory operand, so
10964 reduce current_templates to just those if it contains any. */
10965 static int
10966 maybe_adjust_templates (void)
10967 {
10968 const insn_template *t;
10969
10970 gas_assert (i.mem_operands == 1);
10971
10972 for (t = current_templates->start; t < current_templates->end; ++t)
10973 if (t->opcode_modifier.isstring)
10974 break;
10975
10976 if (t < current_templates->end)
10977 {
10978 static templates aux_templates;
10979 bfd_boolean recheck;
10980
10981 aux_templates.start = t;
10982 for (; t < current_templates->end; ++t)
10983 if (!t->opcode_modifier.isstring)
10984 break;
10985 aux_templates.end = t;
10986
10987 /* Determine whether to re-check the first memory operand. */
10988 recheck = (aux_templates.start != current_templates->start
10989 || t != current_templates->end);
10990
10991 current_templates = &aux_templates;
10992
10993 if (recheck)
10994 {
10995 i.mem_operands = 0;
10996 if (i.memop1_string != NULL
10997 && i386_index_check (i.memop1_string) == 0)
10998 return 0;
10999 i.mem_operands = 1;
11000 }
11001 }
11002
11003 return 1;
11004 }
11005
11006 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11007 on error. */
11008
11009 static int
11010 i386_att_operand (char *operand_string)
11011 {
11012 const reg_entry *r;
11013 char *end_op;
11014 char *op_string = operand_string;
11015
11016 if (is_space_char (*op_string))
11017 ++op_string;
11018
11019 /* We check for an absolute prefix (differentiating,
11020 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'). */
11021 if (*op_string == ABSOLUTE_PREFIX)
11022 {
11023 ++op_string;
11024 if (is_space_char (*op_string))
11025 ++op_string;
11026 i.jumpabsolute = TRUE;
11027 }
11028
11029 /* Check if operand is a register. */
11030 if ((r = parse_register (op_string, &end_op)) != NULL)
11031 {
11032 i386_operand_type temp;
11033
11034 if (r == &bad_reg)
11035 return 0;
11036
11037 /* Check for a segment override by searching for ':' after a
11038 segment register. */
11039 op_string = end_op;
11040 if (is_space_char (*op_string))
11041 ++op_string;
11042 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11043 {
11044 switch (r->reg_num)
11045 {
11046 case 0:
11047 i.seg[i.mem_operands] = &es;
11048 break;
11049 case 1:
11050 i.seg[i.mem_operands] = &cs;
11051 break;
11052 case 2:
11053 i.seg[i.mem_operands] = &ss;
11054 break;
11055 case 3:
11056 i.seg[i.mem_operands] = &ds;
11057 break;
11058 case 4:
11059 i.seg[i.mem_operands] = &fs;
11060 break;
11061 case 5:
11062 i.seg[i.mem_operands] = &gs;
11063 break;
11064 }
11065
11066 /* Skip the ':' and whitespace. */
11067 ++op_string;
11068 if (is_space_char (*op_string))
11069 ++op_string;
11070
11071 if (!is_digit_char (*op_string)
11072 && !is_identifier_char (*op_string)
11073 && *op_string != '('
11074 && *op_string != ABSOLUTE_PREFIX)
11075 {
11076 as_bad (_("bad memory operand `%s'"), op_string);
11077 return 0;
11078 }
11079 /* Handle case of %es:*foo. */
11080 if (*op_string == ABSOLUTE_PREFIX)
11081 {
11082 ++op_string;
11083 if (is_space_char (*op_string))
11084 ++op_string;
11085 i.jumpabsolute = TRUE;
11086 }
11087 goto do_memory_reference;
11088 }
11089
11090 /* Handle vector operations. */
11091 if (*op_string == '{')
11092 {
11093 op_string = check_VecOperations (op_string, NULL);
11094 if (op_string == NULL)
11095 return 0;
11096 }
11097
11098 if (*op_string)
11099 {
11100 as_bad (_("junk `%s' after register"), op_string);
11101 return 0;
11102 }
11103 temp = r->reg_type;
11104 temp.bitfield.baseindex = 0;
11105 i.types[this_operand] = operand_type_or (i.types[this_operand],
11106 temp);
11107 i.types[this_operand].bitfield.unspecified = 0;
11108 i.op[this_operand].regs = r;
11109 i.reg_operands++;
11110 }
11111 else if (*op_string == REGISTER_PREFIX)
11112 {
11113 as_bad (_("bad register name `%s'"), op_string);
11114 return 0;
11115 }
11116 else if (*op_string == IMMEDIATE_PREFIX)
11117 {
11118 ++op_string;
11119 if (i.jumpabsolute)
11120 {
11121 as_bad (_("immediate operand illegal with absolute jump"));
11122 return 0;
11123 }
11124 if (!i386_immediate (op_string))
11125 return 0;
11126 }
11127 else if (RC_SAE_immediate (operand_string))
11128 {
11129 /* If it is a RC or SAE immediate, do nothing. */
11130 ;
11131 }
11132 else if (is_digit_char (*op_string)
11133 || is_identifier_char (*op_string)
11134 || *op_string == '"'
11135 || *op_string == '(')
11136 {
11137 /* This is a memory reference of some sort. */
11138 char *base_string;
11139
11140 /* Start and end of displacement string expression (if found). */
11141 char *displacement_string_start;
11142 char *displacement_string_end;
11143 char *vop_start;
11144
11145 do_memory_reference:
11146 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11147 return 0;
11148 if ((i.mem_operands == 1
11149 && !current_templates->start->opcode_modifier.isstring)
11150 || i.mem_operands == 2)
11151 {
11152 as_bad (_("too many memory references for `%s'"),
11153 current_templates->start->name);
11154 return 0;
11155 }
11156
11157 /* Check for base index form. We detect the base index form by
11158 looking for an ')' at the end of the operand, searching
11159 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11160 after the '('. */
11161 base_string = op_string + strlen (op_string);
11162
11163 /* Handle vector operations. */
11164 vop_start = strchr (op_string, '{');
11165 if (vop_start && vop_start < base_string)
11166 {
11167 if (check_VecOperations (vop_start, base_string) == NULL)
11168 return 0;
11169 base_string = vop_start;
11170 }
11171
11172 --base_string;
11173 if (is_space_char (*base_string))
11174 --base_string;
11175
11176 /* If we only have a displacement, set up for it to be parsed later. */
11177 displacement_string_start = op_string;
11178 displacement_string_end = base_string + 1;
11179
11180 if (*base_string == ')')
11181 {
11182 char *temp_string;
11183 unsigned int parens_balanced = 1;
11184 /* We've already checked that the numbers of left & right ()'s are
11185 equal, so this loop will not be infinite. */
11186 do
11187 {
11188 base_string--;
11189 if (*base_string == ')')
11190 parens_balanced++;
11191 if (*base_string == '(')
11192 parens_balanced--;
11193 }
11194 while (parens_balanced);
11195
11196 temp_string = base_string;
11197
11198 /* Skip past '(' and whitespace. */
11199 ++base_string;
11200 if (is_space_char (*base_string))
11201 ++base_string;
11202
11203 if (*base_string == ','
11204 || ((i.base_reg = parse_register (base_string, &end_op))
11205 != NULL))
11206 {
11207 displacement_string_end = temp_string;
11208
11209 i.types[this_operand].bitfield.baseindex = 1;
11210
11211 if (i.base_reg)
11212 {
11213 if (i.base_reg == &bad_reg)
11214 return 0;
11215 base_string = end_op;
11216 if (is_space_char (*base_string))
11217 ++base_string;
11218 }
11219
11220 /* There may be an index reg or scale factor here. */
11221 if (*base_string == ',')
11222 {
11223 ++base_string;
11224 if (is_space_char (*base_string))
11225 ++base_string;
11226
11227 if ((i.index_reg = parse_register (base_string, &end_op))
11228 != NULL)
11229 {
11230 if (i.index_reg == &bad_reg)
11231 return 0;
11232 base_string = end_op;
11233 if (is_space_char (*base_string))
11234 ++base_string;
11235 if (*base_string == ',')
11236 {
11237 ++base_string;
11238 if (is_space_char (*base_string))
11239 ++base_string;
11240 }
11241 else if (*base_string != ')')
11242 {
11243 as_bad (_("expecting `,' or `)' "
11244 "after index register in `%s'"),
11245 operand_string);
11246 return 0;
11247 }
11248 }
11249 else if (*base_string == REGISTER_PREFIX)
11250 {
11251 end_op = strchr (base_string, ',');
11252 if (end_op)
11253 *end_op = '\0';
11254 as_bad (_("bad register name `%s'"), base_string);
11255 return 0;
11256 }
11257
11258 /* Check for scale factor. */
11259 if (*base_string != ')')
11260 {
11261 char *end_scale = i386_scale (base_string);
11262
11263 if (!end_scale)
11264 return 0;
11265
11266 base_string = end_scale;
11267 if (is_space_char (*base_string))
11268 ++base_string;
11269 if (*base_string != ')')
11270 {
11271 as_bad (_("expecting `)' "
11272 "after scale factor in `%s'"),
11273 operand_string);
11274 return 0;
11275 }
11276 }
11277 else if (!i.index_reg)
11278 {
11279 as_bad (_("expecting index register or scale factor "
11280 "after `,'; got '%c'"),
11281 *base_string);
11282 return 0;
11283 }
11284 }
11285 else if (*base_string != ')')
11286 {
11287 as_bad (_("expecting `,' or `)' "
11288 "after base register in `%s'"),
11289 operand_string);
11290 return 0;
11291 }
11292 }
11293 else if (*base_string == REGISTER_PREFIX)
11294 {
11295 end_op = strchr (base_string, ',');
11296 if (end_op)
11297 *end_op = '\0';
11298 as_bad (_("bad register name `%s'"), base_string);
11299 return 0;
11300 }
11301 }
11302
11303 /* If there's an expression beginning the operand, parse it,
11304 assuming displacement_string_start and
11305 displacement_string_end are meaningful. */
11306 if (displacement_string_start != displacement_string_end)
11307 {
11308 if (!i386_displacement (displacement_string_start,
11309 displacement_string_end))
11310 return 0;
11311 }
11312
11313 /* Special case for (%dx) while doing input/output op. */
11314 if (i.base_reg
11315 && i.base_reg->reg_type.bitfield.instance == RegD
11316 && i.base_reg->reg_type.bitfield.word
11317 && i.index_reg == 0
11318 && i.log2_scale_factor == 0
11319 && i.seg[i.mem_operands] == 0
11320 && !operand_type_check (i.types[this_operand], disp))
11321 {
11322 i.types[this_operand] = i.base_reg->reg_type;
11323 return 1;
11324 }
11325
11326 if (i386_index_check (operand_string) == 0)
11327 return 0;
11328 i.flags[this_operand] |= Operand_Mem;
11329 if (i.mem_operands == 0)
11330 i.memop1_string = xstrdup (operand_string);
11331 i.mem_operands++;
11332 }
11333 else
11334 {
11335 /* It's not a memory operand; argh! */
11336 as_bad (_("invalid char %s beginning operand %d `%s'"),
11337 output_invalid (*op_string),
11338 this_operand + 1,
11339 op_string);
11340 return 0;
11341 }
11342 return 1; /* Normal return. */
11343 }
11344 \f
11345 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11346 that an rs_machine_dependent frag may reach. */
11347
11348 unsigned int
11349 i386_frag_max_var (fragS *frag)
11350 {
11351 /* The only relaxable frags are for jumps.
11352 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11353 gas_assert (frag->fr_type == rs_machine_dependent);
11354 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11355 }
11356
11357 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11358 static int
11359 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11360 {
11361 /* STT_GNU_IFUNC symbol must go through PLT. */
11362 if ((symbol_get_bfdsym (fr_symbol)->flags
11363 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11364 return 0;
11365
11366 if (!S_IS_EXTERNAL (fr_symbol))
11367 /* Symbol may be weak or local. */
11368 return !S_IS_WEAK (fr_symbol);
11369
11370 /* Global symbols with non-default visibility can't be preempted. */
11371 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11372 return 1;
11373
11374 if (fr_var != NO_RELOC)
11375 switch ((enum bfd_reloc_code_real) fr_var)
11376 {
11377 case BFD_RELOC_386_PLT32:
11378 case BFD_RELOC_X86_64_PLT32:
11379 /* Symbol with PLT relocation may be preempted. */
11380 return 0;
11381 default:
11382 abort ();
11383 }
11384
11385 /* Global symbols with default visibility in a shared library may be
11386 preempted by another definition. */
11387 return !shared;
11388 }
11389 #endif
11390
11391 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11392 Note: this also works for Skylake and Cascadelake.
11393 ---------------------------------------------------------------------
11394 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11395 | ------ | ----------- | ------- | -------- |
11396 | Jo | N | N | Y |
11397 | Jno | N | N | Y |
11398 | Jc/Jb | Y | N | Y |
11399 | Jae/Jnb | Y | N | Y |
11400 | Je/Jz | Y | Y | Y |
11401 | Jne/Jnz | Y | Y | Y |
11402 | Jna/Jbe | Y | N | Y |
11403 | Ja/Jnbe | Y | N | Y |
11404 | Js | N | N | Y |
11405 | Jns | N | N | Y |
11406 | Jp/Jpe | N | N | Y |
11407 | Jnp/Jpo | N | N | Y |
11408 | Jl/Jnge | Y | Y | Y |
11409 | Jge/Jnl | Y | Y | Y |
11410 | Jle/Jng | Y | Y | Y |
11411 | Jg/Jnle | Y | Y | Y |
11412 --------------------------------------------------------------------- */
11413 static int
11414 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11415 {
11416 if (mf_cmp == mf_cmp_alu_cmp)
11417 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11418 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11419 if (mf_cmp == mf_cmp_incdec)
11420 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11421 || mf_jcc == mf_jcc_jle);
11422 if (mf_cmp == mf_cmp_test_and)
11423 return 1;
11424 return 0;
11425 }
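
/* For illustration (examples ours, per the table above):
   "cmp %eax, %ebx; jne lab" and "test %eax, %eax; js lab" are
   fusible, while "inc %eax; jc lab" is not (INC/DEC leave CF
   untouched). */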
11426
11427 /* Return the next non-empty frag. */
11428
11429 static fragS *
11430 i386_next_non_empty_frag (fragS *fragP)
11431 {
11432 /* There may be a frag with a ".fill 0" when there is no room in
11433 the current frag for frag_grow in output_insn. */
11434 for (fragP = fragP->fr_next;
11435 (fragP != NULL
11436 && fragP->fr_type == rs_fill
11437 && fragP->fr_fix == 0);
11438 fragP = fragP->fr_next)
11439 ;
11440 return fragP;
11441 }
11442
11443 /* Return the next jcc frag after BRANCH_PADDING. */
11444
11445 static fragS *
11446 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11447 {
11448 fragS *branch_fragP;
11449 if (!pad_fragP)
11450 return NULL;
11451
11452 if (pad_fragP->fr_type == rs_machine_dependent
11453 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11454 == BRANCH_PADDING))
11455 {
11456 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11457 if (branch_fragP->fr_type != rs_machine_dependent)
11458 return NULL;
11459 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11460 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11461 pad_fragP->tc_frag_data.mf_type))
11462 return branch_fragP;
11463 }
11464
11465 return NULL;
11466 }
11467
11468 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11469
11470 static void
11471 i386_classify_machine_dependent_frag (fragS *fragP)
11472 {
11473 fragS *cmp_fragP;
11474 fragS *pad_fragP;
11475 fragS *branch_fragP;
11476 fragS *next_fragP;
11477 unsigned int max_prefix_length;
11478
11479 if (fragP->tc_frag_data.classified)
11480 return;
11481
11482 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11483 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11484 for (next_fragP = fragP;
11485 next_fragP != NULL;
11486 next_fragP = next_fragP->fr_next)
11487 {
11488 next_fragP->tc_frag_data.classified = 1;
11489 if (next_fragP->fr_type == rs_machine_dependent)
11490 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11491 {
11492 case BRANCH_PADDING:
11493 /* The BRANCH_PADDING frag must be followed by a branch
11494 frag. */
11495 branch_fragP = i386_next_non_empty_frag (next_fragP);
11496 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11497 break;
11498 case FUSED_JCC_PADDING:
11499 /* Check if this is a fused jcc:
11500 FUSED_JCC_PADDING
11501 CMP like instruction
11502 BRANCH_PADDING
11503 COND_JUMP
11504 */
11505 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11506 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11507 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11508 if (branch_fragP)
11509 {
11510 /* The BRANCH_PADDING frag is merged with the
11511 FUSED_JCC_PADDING frag. */
11512 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11513 /* CMP like instruction size. */
11514 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11515 frag_wane (pad_fragP);
11516 /* Skip to branch_fragP. */
11517 next_fragP = branch_fragP;
11518 }
11519 else if (next_fragP->tc_frag_data.max_prefix_length)
11520 {
11521 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11522 a fused jcc. */
11523 next_fragP->fr_subtype
11524 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11525 next_fragP->tc_frag_data.max_bytes
11526 = next_fragP->tc_frag_data.max_prefix_length;
11527 /* This will be updated in the BRANCH_PREFIX scan. */
11528 next_fragP->tc_frag_data.max_prefix_length = 0;
11529 }
11530 else
11531 frag_wane (next_fragP);
11532 break;
11533 }
11534 }
11535
11536 /* Stop if there is no BRANCH_PREFIX. */
11537 if (!align_branch_prefix_size)
11538 return;
11539
11540 /* Scan for BRANCH_PREFIX. */
11541 for (; fragP != NULL; fragP = fragP->fr_next)
11542 {
11543 if (fragP->fr_type != rs_machine_dependent
11544 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11545 != BRANCH_PREFIX))
11546 continue;
11547
11548 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11549 COND_JUMP_PREFIX. */
11550 max_prefix_length = 0;
11551 for (next_fragP = fragP;
11552 next_fragP != NULL;
11553 next_fragP = next_fragP->fr_next)
11554 {
11555 if (next_fragP->fr_type == rs_fill)
11556 /* Skip rs_fill frags. */
11557 continue;
11558 else if (next_fragP->fr_type != rs_machine_dependent)
11559 /* Stop for all other frags. */
11560 break;
11561
11562 /* rs_machine_dependent frags. */
11563 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11564 == BRANCH_PREFIX)
11565 {
11566 /* Count BRANCH_PREFIX frags. */
11567 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11568 {
11569 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11570 frag_wane (next_fragP);
11571 }
11572 else
11573 max_prefix_length
11574 += next_fragP->tc_frag_data.max_bytes;
11575 }
11576 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11577 == BRANCH_PADDING)
11578 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11579 == FUSED_JCC_PADDING))
11580 {
11581 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11582 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11583 break;
11584 }
11585 else
11586 /* Stop for other rs_machine_dependent frags. */
11587 break;
11588 }
11589
11590 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11591
11592 /* Skip to the next frag. */
11593 fragP = next_fragP;
11594 }
11595 }
11596
11597 /* Compute padding size for
11598
11599 FUSED_JCC_PADDING
11600 CMP like instruction
11601 BRANCH_PADDING
11602 COND_JUMP/UNCOND_JUMP
11603
11604 or
11605
11606 BRANCH_PADDING
11607 COND_JUMP/UNCOND_JUMP
11608 */
11609
11610 static int
11611 i386_branch_padding_size (fragS *fragP, offsetT address)
11612 {
11613 unsigned int offset, size, padding_size;
11614 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11615
11616 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11617 if (!address)
11618 address = fragP->fr_address;
11619 address += fragP->fr_fix;
11620
11621 /* CMP like instruction size. */
11622 size = fragP->tc_frag_data.cmp_size;
11623
11624 /* The base size of the branch frag. */
11625 size += branch_fragP->fr_fix;
11626
11627 /* Add opcode and displacement bytes for the rs_machine_dependent
11628 branch frag. */
11629 if (branch_fragP->fr_type == rs_machine_dependent)
11630 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11631
11632 /* Check if branch is within boundary and doesn't end at the last
11633 byte. */
11634 offset = address & ((1U << align_branch_power) - 1);
11635 if ((offset + size) >= (1U << align_branch_power))
11636 /* Padding needed to avoid crossing boundary. */
11637 padding_size = (1U << align_branch_power) - offset;
11638 else
11639 /* No padding needed. */
11640 padding_size = 0;
11641
11642 /* The return value may be saved in tc_frag_data.length, which is
11643 an unsigned byte. */
11644 if (!fits_in_unsigned_byte (padding_size))
11645 abort ();
11646
11647 return padding_size;
11648 }
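/* A worked example for the computation above (illustrative numbers):
   with align_branch_power = 5 (a 32-byte boundary), a padding frag whose
   code starts at address 0x7c and a 6-byte branch give
   offset = 0x7c & 31 = 28 and offset + size = 34 >= 32, so
   padding_size = 32 - 28 = 4.  Starting at 0x78 instead gives
   24 + 6 = 30 < 32 and padding_size = 0.  */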
11649
11650 /* i386_generic_table_relax_frag()
11651
11652 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11653 grow/shrink padding to align branch frags. Hand others to
11654 relax_frag(). */
11655
11656 long
11657 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11658 {
11659 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11660 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11661 {
11662 long padding_size = i386_branch_padding_size (fragP, 0);
11663 long grow = padding_size - fragP->tc_frag_data.length;
11664
11665 /* When the BRANCH_PREFIX frag is used, the computed address
11666 must match the actual address and there should be no padding. */
11667 if (fragP->tc_frag_data.padding_address
11668 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11669 || padding_size))
11670 abort ();
11671
11672 /* Update the padding size. */
11673 if (grow)
11674 fragP->tc_frag_data.length = padding_size;
11675
11676 return grow;
11677 }
11678 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11679 {
11680 fragS *padding_fragP, *next_fragP;
11681 long padding_size, left_size, last_size;
11682
11683 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11684 if (!padding_fragP)
11685 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11686 return (fragP->tc_frag_data.length
11687 - fragP->tc_frag_data.last_length);
11688
11689 /* Compute the relative address of the padding frag the very first
11690 time, when the BRANCH_PREFIX frag sizes are all zero. */
11691 if (!fragP->tc_frag_data.padding_address)
11692 fragP->tc_frag_data.padding_address
11693 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11694
11695 /* First update the last length from the previous iteration. */
11696 left_size = fragP->tc_frag_data.prefix_length;
11697 for (next_fragP = fragP;
11698 next_fragP != padding_fragP;
11699 next_fragP = next_fragP->fr_next)
11700 if (next_fragP->fr_type == rs_machine_dependent
11701 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11702 == BRANCH_PREFIX))
11703 {
11704 if (left_size)
11705 {
11706 int max = next_fragP->tc_frag_data.max_bytes;
11707 if (max)
11708 {
11709 int size;
11710 if (max > left_size)
11711 size = left_size;
11712 else
11713 size = max;
11714 left_size -= size;
11715 next_fragP->tc_frag_data.last_length = size;
11716 }
11717 }
11718 else
11719 next_fragP->tc_frag_data.last_length = 0;
11720 }
11721
11722 /* Check the padding size for the padding frag. */
11723 padding_size = i386_branch_padding_size
11724 (padding_fragP, (fragP->fr_address
11725 + fragP->tc_frag_data.padding_address));
11726
11727 last_size = fragP->tc_frag_data.prefix_length;
11728 /* Check if there is a change from the last iteration. */
11729 if (padding_size == last_size)
11730 {
11731 /* Update the expected address of the padding frag. */
11732 padding_fragP->tc_frag_data.padding_address
11733 = (fragP->fr_address + padding_size
11734 + fragP->tc_frag_data.padding_address);
11735 return 0;
11736 }
11737
11738 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11739 {
11740 /* No padding if there is insufficient room. Clear the
11741 expected address of the padding frag. */
11742 padding_fragP->tc_frag_data.padding_address = 0;
11743 padding_size = 0;
11744 }
11745 else
11746 /* Store the expected address of the padding frag. */
11747 padding_fragP->tc_frag_data.padding_address
11748 = (fragP->fr_address + padding_size
11749 + fragP->tc_frag_data.padding_address);
11750
11751 fragP->tc_frag_data.prefix_length = padding_size;
11752
11753 /* Update the length for the current iteration. */
11754 left_size = padding_size;
11755 for (next_fragP = fragP;
11756 next_fragP != padding_fragP;
11757 next_fragP = next_fragP->fr_next)
11758 if (next_fragP->fr_type == rs_machine_dependent
11759 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11760 == BRANCH_PREFIX))
11761 {
11762 if (left_size)
11763 {
11764 int max = next_fragP->tc_frag_data.max_bytes;
11765 if (max)
11766 {
11767 int size;
11768 if (max > left_size)
11769 size = left_size;
11770 else
11771 size = max;
11772 left_size -= size;
11773 next_fragP->tc_frag_data.length = size;
11774 }
11775 }
11776 else
11777 next_fragP->tc_frag_data.length = 0;
11778 }
11779
11780 return (fragP->tc_frag_data.length
11781 - fragP->tc_frag_data.last_length);
11782 }
11783 return relax_frag (segment, fragP, stretch);
11784 }
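/* Illustration of the return contract shared with relax_frag(): the
   value returned is the growth relative to the previous pass.  For the
   BRANCH_PADDING arm above, if the previous pass recorded
   tc_frag_data.length = 3 and this pass computes padding_size = 5, the
   function returns 5 - 3 = 2; once addresses stop moving the same
   computation yields 0 and relaxation converges.  */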
11785
11786 /* md_estimate_size_before_relax()
11787
11788 Called just before relax() for rs_machine_dependent frags. The x86
11789 assembler uses these frags to handle variable size jump
11790 instructions.
11791
11792 Any symbol that is now undefined will not become defined.
11793 Return the correct fr_subtype in the frag.
11794 Return the initial "guess for variable size of frag" to caller.
11795 The guess is actually the growth beyond the fixed part. Whatever
11796 we do to grow the fixed or variable part contributes to our
11797 returned value. */
11798
11799 int
11800 md_estimate_size_before_relax (fragS *fragP, segT segment)
11801 {
11802 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11803 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11804 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11805 {
11806 i386_classify_machine_dependent_frag (fragP);
11807 return fragP->tc_frag_data.length;
11808 }
11809
11810 /* We've already got fragP->fr_subtype right; all we have to do is
11811 check for un-relaxable symbols. On an ELF system, we can't relax
11812 an externally visible symbol, because it may be overridden by a
11813 shared library. */
11814 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11815 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11816 || (IS_ELF
11817 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11818 fragP->fr_var))
11819 #endif
11820 #if defined (OBJ_COFF) && defined (TE_PE)
11821 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11822 && S_IS_WEAK (fragP->fr_symbol))
11823 #endif
11824 )
11825 {
11826 /* Symbol is undefined in this segment, or we need to keep a
11827 reloc so that weak symbols can be overridden. */
11828 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11829 enum bfd_reloc_code_real reloc_type;
11830 unsigned char *opcode;
11831 int old_fr_fix;
11832
11833 if (fragP->fr_var != NO_RELOC)
11834 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11835 else if (size == 2)
11836 reloc_type = BFD_RELOC_16_PCREL;
11837 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11838 else if (need_plt32_p (fragP->fr_symbol))
11839 reloc_type = BFD_RELOC_X86_64_PLT32;
11840 #endif
11841 else
11842 reloc_type = BFD_RELOC_32_PCREL;
11843
11844 old_fr_fix = fragP->fr_fix;
11845 opcode = (unsigned char *) fragP->fr_opcode;
11846
11847 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11848 {
11849 case UNCOND_JUMP:
11850 /* Make jmp (0xeb) a (d)word displacement jump. */
11851 opcode[0] = 0xe9;
11852 fragP->fr_fix += size;
11853 fix_new (fragP, old_fr_fix, size,
11854 fragP->fr_symbol,
11855 fragP->fr_offset, 1,
11856 reloc_type);
11857 break;
11858
11859 case COND_JUMP86:
11860 if (size == 2
11861 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11862 {
11863 /* Negate the condition, and branch past an
11864 unconditional jump. */
11865 opcode[0] ^= 1;
11866 opcode[1] = 3;
11867 /* Insert an unconditional jump. */
11868 opcode[2] = 0xe9;
11869 /* We added two extra opcode bytes, and have a two byte
11870 offset. */
11871 fragP->fr_fix += 2 + 2;
11872 fix_new (fragP, old_fr_fix + 2, 2,
11873 fragP->fr_symbol,
11874 fragP->fr_offset, 1,
11875 reloc_type);
11876 break;
11877 }
11878 /* Fall through. */
11879
11880 case COND_JUMP:
11881 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11882 {
11883 fixS *fixP;
11884
11885 fragP->fr_fix += 1;
11886 fixP = fix_new (fragP, old_fr_fix, 1,
11887 fragP->fr_symbol,
11888 fragP->fr_offset, 1,
11889 BFD_RELOC_8_PCREL);
11890 fixP->fx_signed = 1;
11891 break;
11892 }
11893
11894 /* This changes the byte-displacement jump 0x7N
11895 to the (d)word-displacement jump 0x0f,0x8N. */
11896 opcode[1] = opcode[0] + 0x10;
11897 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11898 /* We've added an opcode byte. */
11899 fragP->fr_fix += 1 + size;
11900 fix_new (fragP, old_fr_fix + 1, size,
11901 fragP->fr_symbol,
11902 fragP->fr_offset, 1,
11903 reloc_type);
11904 break;
11905
11906 default:
11907 BAD_CASE (fragP->fr_subtype);
11908 break;
11909 }
11910 frag_wane (fragP);
11911 return fragP->fr_fix - old_fr_fix;
11912 }
11913
11914 /* Guess size depending on current relax state. Initially the relax
11915 state will correspond to a short jump and we return 1, because
11916 the variable part of the frag (the branch offset) is one byte
11917 long. However, we can relax a section more than once and in that
11918 case we must either set fr_subtype back to the unrelaxed state,
11919 or return the value for the appropriate branch. */
11920 return md_relax_table[fragP->fr_subtype].rlx_length;
11921 }
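/* Encoding examples for the promotions above (standard IA-32
   encodings): an unconditional short `jmp' 0xEB disp8 is rewritten to
   0xE9 disp32 (disp16 with CODE16), and a conditional short `je'
   0x74 disp8 becomes the two-byte form 0x0F 0x84 disp32, i.e.
   opcode[1] = opcode[0] + 0x10 after the TWO_BYTE_OPCODE_ESCAPE.  */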
11922
11923 /* Called after relax() is finished.
11924
11925 In: Address of frag.
11926 fr_type == rs_machine_dependent.
11927 fr_subtype is what the address relaxed to.
11928
11929 Out: Any fixSs and constants are set up.
11930 Caller will turn frag into a ".space 0". */
11931
11932 void
11933 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11934 fragS *fragP)
11935 {
11936 unsigned char *opcode;
11937 unsigned char *where_to_put_displacement = NULL;
11938 offsetT target_address;
11939 offsetT opcode_address;
11940 unsigned int extension = 0;
11941 offsetT displacement_from_opcode_start;
11942
11943 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11944 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11945 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11946 {
11947 /* Generate nop padding. */
11948 unsigned int size = fragP->tc_frag_data.length;
11949 if (size)
11950 {
11951 if (size > fragP->tc_frag_data.max_bytes)
11952 abort ();
11953
11954 if (flag_debug)
11955 {
11956 const char *msg;
11957 const char *branch = "branch";
11958 const char *prefix = "";
11959 fragS *padding_fragP;
11960 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11961 == BRANCH_PREFIX)
11962 {
11963 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11964 switch (fragP->tc_frag_data.default_prefix)
11965 {
11966 default:
11967 abort ();
11968 break;
11969 case CS_PREFIX_OPCODE:
11970 prefix = " cs";
11971 break;
11972 case DS_PREFIX_OPCODE:
11973 prefix = " ds";
11974 break;
11975 case ES_PREFIX_OPCODE:
11976 prefix = " es";
11977 break;
11978 case FS_PREFIX_OPCODE:
11979 prefix = " fs";
11980 break;
11981 case GS_PREFIX_OPCODE:
11982 prefix = " gs";
11983 break;
11984 case SS_PREFIX_OPCODE:
11985 prefix = " ss";
11986 break;
11987 }
11988 if (padding_fragP)
11989 msg = _("%s:%u: add %d%s at 0x%llx to align "
11990 "%s within %d-byte boundary\n");
11991 else
11992 msg = _("%s:%u: add additional %d%s at 0x%llx to "
11993 "align %s within %d-byte boundary\n");
11994 }
11995 else
11996 {
11997 padding_fragP = fragP;
11998 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11999 "%s within %d-byte boundary\n");
12000 }
12001
12002 if (padding_fragP)
12003 switch (padding_fragP->tc_frag_data.branch_type)
12004 {
12005 case align_branch_jcc:
12006 branch = "jcc";
12007 break;
12008 case align_branch_fused:
12009 branch = "fused jcc";
12010 break;
12011 case align_branch_jmp:
12012 branch = "jmp";
12013 break;
12014 case align_branch_call:
12015 branch = "call";
12016 break;
12017 case align_branch_indirect:
12018 branch = "indirect branch";
12019 break;
12020 case align_branch_ret:
12021 branch = "ret";
12022 break;
12023 default:
12024 break;
12025 }
12026
12027 fprintf (stdout, msg,
12028 fragP->fr_file, fragP->fr_line, size, prefix,
12029 (long long) fragP->fr_address, branch,
12030 1 << align_branch_power);
12031 }
12032 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12033 memset (fragP->fr_opcode,
12034 fragP->tc_frag_data.default_prefix, size);
12035 else
12036 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12037 size, 0);
12038 fragP->fr_fix += size;
12039 }
12040 return;
12041 }
12042
12043 opcode = (unsigned char *) fragP->fr_opcode;
12044
12045 /* Address we want to reach in file space. */
12046 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12047
12048 /* Address opcode resides at in file space. */
12049 opcode_address = fragP->fr_address + fragP->fr_fix;
12050
12051 /* Displacement from opcode start to fill into instruction. */
12052 displacement_from_opcode_start = target_address - opcode_address;
12053
12054 if ((fragP->fr_subtype & BIG) == 0)
12055 {
12056 /* Don't have to change opcode. */
12057 extension = 1; /* 1 opcode + 1 displacement */
12058 where_to_put_displacement = &opcode[1];
12059 }
12060 else
12061 {
12062 if (no_cond_jump_promotion
12063 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12064 as_warn_where (fragP->fr_file, fragP->fr_line,
12065 _("long jump required"));
12066
12067 switch (fragP->fr_subtype)
12068 {
12069 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12070 extension = 4; /* 1 opcode + 4 displacement */
12071 opcode[0] = 0xe9;
12072 where_to_put_displacement = &opcode[1];
12073 break;
12074
12075 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12076 extension = 2; /* 1 opcode + 2 displacement */
12077 opcode[0] = 0xe9;
12078 where_to_put_displacement = &opcode[1];
12079 break;
12080
12081 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12082 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12083 extension = 5; /* 2 opcode + 4 displacement */
12084 opcode[1] = opcode[0] + 0x10;
12085 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12086 where_to_put_displacement = &opcode[2];
12087 break;
12088
12089 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12090 extension = 3; /* 2 opcode + 2 displacement */
12091 opcode[1] = opcode[0] + 0x10;
12092 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12093 where_to_put_displacement = &opcode[2];
12094 break;
12095
12096 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12097 extension = 4;
12098 opcode[0] ^= 1;
12099 opcode[1] = 3;
12100 opcode[2] = 0xe9;
12101 where_to_put_displacement = &opcode[3];
12102 break;
12103
12104 default:
12105 BAD_CASE (fragP->fr_subtype);
12106 break;
12107 }
12108 }
12109
12110 /* If the size is less than four we are sure that the operand fits,
12111 but if it's 4, then it could be that the displacement is larger
12112 than +/- 2GB. */
12113 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12114 && object_64bit
12115 && ((addressT) (displacement_from_opcode_start - extension
12116 + ((addressT) 1 << 31))
12117 > (((addressT) 2 << 31) - 1)))
12118 {
12119 as_bad_where (fragP->fr_file, fragP->fr_line,
12120 _("jump target out of range"));
12121 /* Make us emit 0. */
12122 displacement_from_opcode_start = extension;
12123 }
12124 /* Now put displacement after opcode. */
12125 md_number_to_chars ((char *) where_to_put_displacement,
12126 (valueT) (displacement_from_opcode_start - extension),
12127 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12128 fragP->fr_fix += extension;
12129 }
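/* Worked example for the COND_JUMP86/BIG16 case above: a 16-bit
   `jne' (0x75 disp8) whose target is out of byte range becomes

	0x74 0x03		condition inverted to je, disp8 = 3,
				skipping the 3-byte jmp below
	0xE9 disp16		jmp to the real target

   five bytes in total, matching extension = 4: four bytes added beyond
   the original opcode byte already counted in fr_fix.  */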
12130 \f
12131 /* Apply a fixup (fixP) to segment data, once it has been determined
12132 by our caller that we have all the info we need to fix it up.
12133
12134 Parameter valP is the pointer to the value of the bits.
12135
12136 On the 386, immediates, displacements, and data pointers are all in
12137 the same (little-endian) format, so we don't need to care about which
12138 we are handling. */
12139
12140 void
12141 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12142 {
12143 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12144 valueT value = *valP;
12145
12146 #if !defined (TE_Mach)
12147 if (fixP->fx_pcrel)
12148 {
12149 switch (fixP->fx_r_type)
12150 {
12151 default:
12152 break;
12153
12154 case BFD_RELOC_64:
12155 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12156 break;
12157 case BFD_RELOC_32:
12158 case BFD_RELOC_X86_64_32S:
12159 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12160 break;
12161 case BFD_RELOC_16:
12162 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12163 break;
12164 case BFD_RELOC_8:
12165 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12166 break;
12167 }
12168 }
12169
12170 if (fixP->fx_addsy != NULL
12171 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12172 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12173 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12174 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12175 && !use_rela_relocations)
12176 {
12177 /* This is a hack. There should be a better way to handle this.
12178 This covers for the fact that bfd_install_relocation will
12179 subtract the current location (for partial_inplace, PC relative
12180 relocations); see more below. */
12181 #ifndef OBJ_AOUT
12182 if (IS_ELF
12183 #ifdef TE_PE
12184 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12185 #endif
12186 )
12187 value += fixP->fx_where + fixP->fx_frag->fr_address;
12188 #endif
12189 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12190 if (IS_ELF)
12191 {
12192 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12193
12194 if ((sym_seg == seg
12195 || (symbol_section_p (fixP->fx_addsy)
12196 && sym_seg != absolute_section))
12197 && !generic_force_reloc (fixP))
12198 {
12199 /* Yes, we add the values in twice. This is because
12200 bfd_install_relocation subtracts them out again. I think
12201 bfd_install_relocation is broken, but I don't dare change
12202 it. FIXME. */
12203 value += fixP->fx_where + fixP->fx_frag->fr_address;
12204 }
12205 }
12206 #endif
12207 #if defined (OBJ_COFF) && defined (TE_PE)
12208 /* For some reason, the PE format does not store a
12209 section address offset for a PC relative symbol. */
12210 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12211 || S_IS_WEAK (fixP->fx_addsy))
12212 value += md_pcrel_from (fixP);
12213 #endif
12214 }
12215 #if defined (OBJ_COFF) && defined (TE_PE)
12216 if (fixP->fx_addsy != NULL
12217 && S_IS_WEAK (fixP->fx_addsy)
12218 /* PR 16858: Do not modify weak function references. */
12219 && ! fixP->fx_pcrel)
12220 {
12221 #if !defined (TE_PEP)
12222 /* For x86 PE weak function symbols are neither PC-relative
12223 nor do they set S_IS_FUNCTION. So the only reliable way
12224 to detect them is to check the flags of their containing
12225 section. */
12226 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12227 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12228 ;
12229 else
12230 #endif
12231 value -= S_GET_VALUE (fixP->fx_addsy);
12232 }
12233 #endif
12234
12235 /* Fix a few things - the dynamic linker expects certain values here,
12236 and we must not disappoint it. */
12237 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12238 if (IS_ELF && fixP->fx_addsy)
12239 switch (fixP->fx_r_type)
12240 {
12241 case BFD_RELOC_386_PLT32:
12242 case BFD_RELOC_X86_64_PLT32:
12243 /* Make the jump instruction point to the address of the operand.
12244 At runtime we merely add the offset to the actual PLT entry.
12245 NB: Subtract the offset size only for jump instructions. */
12246 if (fixP->fx_pcrel)
12247 value = -4;
12248 break;
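	/* Example (illustrative): `call foo@PLT' assembles to 0xE8 plus a
	   4-byte displacement measured from the end of the instruction,
	   i.e. 4 bytes past the field the relocation points at, which is
	   why the addend above is fixed at -4.  */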
12249
12250 case BFD_RELOC_386_TLS_GD:
12251 case BFD_RELOC_386_TLS_LDM:
12252 case BFD_RELOC_386_TLS_IE_32:
12253 case BFD_RELOC_386_TLS_IE:
12254 case BFD_RELOC_386_TLS_GOTIE:
12255 case BFD_RELOC_386_TLS_GOTDESC:
12256 case BFD_RELOC_X86_64_TLSGD:
12257 case BFD_RELOC_X86_64_TLSLD:
12258 case BFD_RELOC_X86_64_GOTTPOFF:
12259 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12260 value = 0; /* Fully resolved at runtime. No addend. */
12261 /* Fallthrough */
12262 case BFD_RELOC_386_TLS_LE:
12263 case BFD_RELOC_386_TLS_LDO_32:
12264 case BFD_RELOC_386_TLS_LE_32:
12265 case BFD_RELOC_X86_64_DTPOFF32:
12266 case BFD_RELOC_X86_64_DTPOFF64:
12267 case BFD_RELOC_X86_64_TPOFF32:
12268 case BFD_RELOC_X86_64_TPOFF64:
12269 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12270 break;
12271
12272 case BFD_RELOC_386_TLS_DESC_CALL:
12273 case BFD_RELOC_X86_64_TLSDESC_CALL:
12274 value = 0; /* Fully resolved at runtime. No addend. */
12275 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12276 fixP->fx_done = 0;
12277 return;
12278
12279 case BFD_RELOC_VTABLE_INHERIT:
12280 case BFD_RELOC_VTABLE_ENTRY:
12281 fixP->fx_done = 0;
12282 return;
12283
12284 default:
12285 break;
12286 }
12287 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12288 *valP = value;
12289 #endif /* !defined (TE_Mach) */
12290
12291 /* Are we finished with this relocation now? */
12292 if (fixP->fx_addsy == NULL)
12293 fixP->fx_done = 1;
12294 #if defined (OBJ_COFF) && defined (TE_PE)
12295 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12296 {
12297 fixP->fx_done = 0;
12298 /* Remember value for tc_gen_reloc. */
12299 fixP->fx_addnumber = value;
12300 /* Clear out the frag for now. */
12301 value = 0;
12302 }
12303 #endif
12304 else if (use_rela_relocations)
12305 {
12306 fixP->fx_no_overflow = 1;
12307 /* Remember value for tc_gen_reloc. */
12308 fixP->fx_addnumber = value;
12309 value = 0;
12310 }
12311
12312 md_number_to_chars (p, value, fixP->fx_size);
12313 }
12314 \f
12315 const char *
12316 md_atof (int type, char *litP, int *sizeP)
12317 {
12318 /* This outputs the LITTLENUMs in REVERSE order;
12319 in accord with the little-endian 386. */
12320 return ieee_md_atof (type, litP, sizeP, FALSE);
12321 }
12322 \f
12323 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12324
12325 static char *
12326 output_invalid (int c)
12327 {
12328 if (ISPRINT (c))
12329 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12330 "'%c'", c);
12331 else
12332 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12333 "(0x%x)", (unsigned char) c);
12334 return output_invalid_buf;
12335 }
12336
12337 /* Verify that @r can be used in the current context. */
12338
12339 static bfd_boolean check_register (const reg_entry *r)
12340 {
12341 if (allow_pseudo_reg)
12342 return TRUE;
12343
12344 if (operand_type_all_zero (&r->reg_type))
12345 return FALSE;
12346
12347 if ((r->reg_type.bitfield.dword
12348 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12349 || r->reg_type.bitfield.class == RegCR
12350 || r->reg_type.bitfield.class == RegDR)
12351 && !cpu_arch_flags.bitfield.cpui386)
12352 return FALSE;
12353
12354 if (r->reg_type.bitfield.class == RegTR
12355 && (flag_code == CODE_64BIT
12356 || !cpu_arch_flags.bitfield.cpui386
12357 || cpu_arch_isa_flags.bitfield.cpui586
12358 || cpu_arch_isa_flags.bitfield.cpui686))
12359 return FALSE;
12360
12361 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12362 return FALSE;
12363
12364 if (!cpu_arch_flags.bitfield.cpuavx512f)
12365 {
12366 if (r->reg_type.bitfield.zmmword
12367 || r->reg_type.bitfield.class == RegMask)
12368 return FALSE;
12369
12370 if (!cpu_arch_flags.bitfield.cpuavx)
12371 {
12372 if (r->reg_type.bitfield.ymmword)
12373 return FALSE;
12374
12375 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12376 return FALSE;
12377 }
12378 }
12379
12380 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12381 return FALSE;
12382
12383 /* Don't allow the fake index register unless allow_index_reg is non-zero. */
12384 if (!allow_index_reg && r->reg_num == RegIZ)
12385 return FALSE;
12386
12387 /* Upper 16 vector registers are only available with VREX in 64bit
12388 mode, and require EVEX encoding. */
12389 if (r->reg_flags & RegVRex)
12390 {
12391 if (!cpu_arch_flags.bitfield.cpuavx512f
12392 || flag_code != CODE_64BIT)
12393 return FALSE;
12394
12395 i.vec_encoding = vex_encoding_evex;
12396 }
12397
12398 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12399 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12400 && flag_code != CODE_64BIT)
12401 return FALSE;
12402
12403 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12404 && !intel_syntax)
12405 return FALSE;
12406
12407 return TRUE;
12408 }
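/* Illustrations of the checks above: %cr0 is rejected unless .i386 is
   enabled, %r8 carries RegRex and is rejected outside CODE_64BIT,
   %zmm0 and the mask registers need AVX512F, %ymm0 needs AVX, and the
   fake %eiz/%riz index registers are only accepted when -mindex-reg
   was given.  */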
12409
12410 /* REG_STRING starts *before* REGISTER_PREFIX. */
12411
12412 static const reg_entry *
12413 parse_real_register (char *reg_string, char **end_op)
12414 {
12415 char *s = reg_string;
12416 char *p;
12417 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12418 const reg_entry *r;
12419
12420 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12421 if (*s == REGISTER_PREFIX)
12422 ++s;
12423
12424 if (is_space_char (*s))
12425 ++s;
12426
12427 p = reg_name_given;
12428 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12429 {
12430 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12431 return (const reg_entry *) NULL;
12432 s++;
12433 }
12434
12435 /* For naked regs, make sure that we are not dealing with an identifier.
12436 This prevents confusing an identifier like `eax_var' with register
12437 `eax'. */
12438 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12439 return (const reg_entry *) NULL;
12440
12441 *end_op = s;
12442
12443 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
12444
12445 /* Handle floating point regs, allowing spaces in the (i) part. */
12446 if (r == i386_regtab /* %st is first entry of table */)
12447 {
12448 if (!cpu_arch_flags.bitfield.cpu8087
12449 && !cpu_arch_flags.bitfield.cpu287
12450 && !cpu_arch_flags.bitfield.cpu387
12451 && !allow_pseudo_reg)
12452 return (const reg_entry *) NULL;
12453
12454 if (is_space_char (*s))
12455 ++s;
12456 if (*s == '(')
12457 {
12458 ++s;
12459 if (is_space_char (*s))
12460 ++s;
12461 if (*s >= '0' && *s <= '7')
12462 {
12463 int fpr = *s - '0';
12464 ++s;
12465 if (is_space_char (*s))
12466 ++s;
12467 if (*s == ')')
12468 {
12469 *end_op = s + 1;
12470 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
12471 know (r);
12472 return r + fpr;
12473 }
12474 }
12475 /* We have "%st(" then garbage. */
12476 return (const reg_entry *) NULL;
12477 }
12478 }
12479
12480 return r && check_register (r) ? r : NULL;
12481 }
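/* Example: given the input "%st ( 3 )", the code above tolerates the
   embedded spaces, finds the %st(0) table entry, and returns that entry
   advanced by 3, with *end_op left just past the closing
   parenthesis.  */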
12482
12483 /* REG_STRING starts *before* REGISTER_PREFIX. */
12484
12485 static const reg_entry *
12486 parse_register (char *reg_string, char **end_op)
12487 {
12488 const reg_entry *r;
12489
12490 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12491 r = parse_real_register (reg_string, end_op);
12492 else
12493 r = NULL;
12494 if (!r)
12495 {
12496 char *save = input_line_pointer;
12497 char c;
12498 symbolS *symbolP;
12499
12500 input_line_pointer = reg_string;
12501 c = get_symbol_name (&reg_string);
12502 symbolP = symbol_find (reg_string);
12503 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12504 {
12505 const expressionS *e = symbol_get_value_expression (symbolP);
12506
12507 know (e->X_op == O_register);
12508 know (e->X_add_number >= 0
12509 && (valueT) e->X_add_number < i386_regtab_size);
12510 r = i386_regtab + e->X_add_number;
12511 if (!check_register (r))
12512 {
12513 as_bad (_("register '%s%s' cannot be used here"),
12514 register_prefix, r->reg_name);
12515 r = &bad_reg;
12516 }
12517 *end_op = input_line_pointer;
12518 }
12519 *input_line_pointer = c;
12520 input_line_pointer = save;
12521 }
12522 return r;
12523 }
12524
12525 int
12526 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12527 {
12528 const reg_entry *r;
12529 char *end = input_line_pointer;
12530
12531 *end = *nextcharP;
12532 r = parse_register (name, &input_line_pointer);
12533 if (r && end <= input_line_pointer)
12534 {
12535 *nextcharP = *input_line_pointer;
12536 *input_line_pointer = 0;
12537 if (r != &bad_reg)
12538 {
12539 e->X_op = O_register;
12540 e->X_add_number = r - i386_regtab;
12541 }
12542 else
12543 e->X_op = O_illegal;
12544 return 1;
12545 }
12546 input_line_pointer = end;
12547 *end = 0;
12548 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12549 }
12550
12551 void
12552 md_operand (expressionS *e)
12553 {
12554 char *end;
12555 const reg_entry *r;
12556
12557 switch (*input_line_pointer)
12558 {
12559 case REGISTER_PREFIX:
12560 r = parse_real_register (input_line_pointer, &end);
12561 if (r)
12562 {
12563 e->X_op = O_register;
12564 e->X_add_number = r - i386_regtab;
12565 input_line_pointer = end;
12566 }
12567 break;
12568
12569 case '[':
12570 gas_assert (intel_syntax);
12571 end = input_line_pointer++;
12572 expression (e);
12573 if (*input_line_pointer == ']')
12574 {
12575 ++input_line_pointer;
12576 e->X_op_symbol = make_expr_symbol (e);
12577 e->X_add_symbol = NULL;
12578 e->X_add_number = 0;
12579 e->X_op = O_index;
12580 }
12581 else
12582 {
12583 e->X_op = O_absent;
12584 input_line_pointer = end;
12585 }
12586 break;
12587 }
12588 }
12589
12590 \f
12591 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12592 const char *md_shortopts = "kVQ:sqnO::";
12593 #else
12594 const char *md_shortopts = "qnO::";
12595 #endif
12596
12597 #define OPTION_32 (OPTION_MD_BASE + 0)
12598 #define OPTION_64 (OPTION_MD_BASE + 1)
12599 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12600 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12601 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12602 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12603 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12604 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12605 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12606 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12607 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12608 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12609 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12610 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12611 #define OPTION_X32 (OPTION_MD_BASE + 14)
12612 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12613 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12614 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12615 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12616 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12617 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12618 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12619 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12620 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12621 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12622 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12623 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12624 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12625 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12626 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12627 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12628 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12629 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12630 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12631
12632 struct option md_longopts[] =
12633 {
12634 {"32", no_argument, NULL, OPTION_32},
12635 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12636 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12637 {"64", no_argument, NULL, OPTION_64},
12638 #endif
12639 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12640 {"x32", no_argument, NULL, OPTION_X32},
12641 {"mshared", no_argument, NULL, OPTION_MSHARED},
12642 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12643 #endif
12644 {"divide", no_argument, NULL, OPTION_DIVIDE},
12645 {"march", required_argument, NULL, OPTION_MARCH},
12646 {"mtune", required_argument, NULL, OPTION_MTUNE},
12647 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12648 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12649 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12650 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12651 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12652 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12653 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12654 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12655 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12656 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12657 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12658 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12659 # if defined (TE_PE) || defined (TE_PEP)
12660 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12661 #endif
12662 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12663 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12664 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12665 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12666 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12667 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12668 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12669 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12670 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12671 {"mlfence-before-indirect-branch", required_argument, NULL,
12672 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12673 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12674 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12675 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12676 {NULL, no_argument, NULL, 0}
12677 };
12678 size_t md_longopts_size = sizeof (md_longopts);
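/* Illustrative invocation (not from the sources):
   `as -malign-branch-boundary=32 -malign-branch=jcc+fused+jmp
   -malign-branch-prefix-size=5 foo.s' selects the same configuration
   as the single convenience switch -mbranches-within-32B-boundaries
   handled below.  */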
12679
12680 int
12681 md_parse_option (int c, const char *arg)
12682 {
12683 unsigned int j;
12684 char *arch, *next, *saved, *type;
12685
12686 switch (c)
12687 {
12688 case 'n':
12689 optimize_align_code = 0;
12690 break;
12691
12692 case 'q':
12693 quiet_warnings = 1;
12694 break;
12695
12696 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12697 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12698 should be emitted or not. FIXME: Not implemented. */
12699 case 'Q':
12700 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12701 return 0;
12702 break;
12703
12704 /* -V: SVR4 argument to print version ID. */
12705 case 'V':
12706 print_version_id ();
12707 break;
12708
12709 /* -k: Ignore for FreeBSD compatibility. */
12710 case 'k':
12711 break;
12712
12713 case 's':
12714 /* -s: On i386 Solaris, this tells the native assembler to use
12715 .stab instead of .stab.excl. We always use .stab anyhow. */
12716 break;
12717
12718 case OPTION_MSHARED:
12719 shared = 1;
12720 break;
12721
12722 case OPTION_X86_USED_NOTE:
12723 if (strcasecmp (arg, "yes") == 0)
12724 x86_used_note = 1;
12725 else if (strcasecmp (arg, "no") == 0)
12726 x86_used_note = 0;
12727 else
12728 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12729 break;
12730
12731
12732 #endif
12733 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12734 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12735 case OPTION_64:
12736 {
12737 const char **list, **l;
12738
12739 list = bfd_target_list ();
12740 for (l = list; *l != NULL; l++)
12741 if (CONST_STRNEQ (*l, "elf64-x86-64")
12742 || strcmp (*l, "coff-x86-64") == 0
12743 || strcmp (*l, "pe-x86-64") == 0
12744 || strcmp (*l, "pei-x86-64") == 0
12745 || strcmp (*l, "mach-o-x86-64") == 0)
12746 {
12747 default_arch = "x86_64";
12748 break;
12749 }
12750 if (*l == NULL)
12751 as_fatal (_("no compiled in support for x86_64"));
12752 free (list);
12753 }
12754 break;
12755 #endif
12756
12757 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12758 case OPTION_X32:
12759 if (IS_ELF)
12760 {
12761 const char **list, **l;
12762
12763 list = bfd_target_list ();
12764 for (l = list; *l != NULL; l++)
12765 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12766 {
12767 default_arch = "x86_64:32";
12768 break;
12769 }
12770 if (*l == NULL)
12771 as_fatal (_("no compiled in support for 32bit x86_64"));
12772 free (list);
12773 }
12774 else
12775 as_fatal (_("32bit x86_64 is only supported for ELF"));
12776 break;
12777 #endif
12778
12779 case OPTION_32:
12780 default_arch = "i386";
12781 break;
12782
12783 case OPTION_DIVIDE:
12784 #ifdef SVR4_COMMENT_CHARS
12785 {
12786 char *n, *t;
12787 const char *s;
12788
12789 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12790 t = n;
12791 for (s = i386_comment_chars; *s != '\0'; s++)
12792 if (*s != '/')
12793 *t++ = *s;
12794 *t = '\0';
12795 i386_comment_chars = n;
12796 }
12797 #endif
12798 break;
12799
12800 case OPTION_MARCH:
12801 saved = xstrdup (arg);
12802 arch = saved;
12803 /* Allow -march=+nosse. */
12804 if (*arch == '+')
12805 arch++;
12806 do
12807 {
12808 if (*arch == '.')
12809 as_fatal (_("invalid -march= option: `%s'"), arg);
12810 next = strchr (arch, '+');
12811 if (next)
12812 *next++ = '\0';
12813 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12814 {
12815 if (strcmp (arch, cpu_arch [j].name) == 0)
12816 {
12817 /* Processor. */
12818 if (! cpu_arch[j].flags.bitfield.cpui386)
12819 continue;
12820
12821 cpu_arch_name = cpu_arch[j].name;
12822 cpu_sub_arch_name = NULL;
12823 cpu_arch_flags = cpu_arch[j].flags;
12824 cpu_arch_isa = cpu_arch[j].type;
12825 cpu_arch_isa_flags = cpu_arch[j].flags;
12826 if (!cpu_arch_tune_set)
12827 {
12828 cpu_arch_tune = cpu_arch_isa;
12829 cpu_arch_tune_flags = cpu_arch_isa_flags;
12830 }
12831 break;
12832 }
12833 else if (*cpu_arch [j].name == '.'
12834 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12835 {
12836 /* ISA extension. */
12837 i386_cpu_flags flags;
12838
12839 flags = cpu_flags_or (cpu_arch_flags,
12840 cpu_arch[j].flags);
12841
12842 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12843 {
12844 if (cpu_sub_arch_name)
12845 {
12846 char *name = cpu_sub_arch_name;
12847 cpu_sub_arch_name = concat (name,
12848 cpu_arch[j].name,
12849 (const char *) NULL);
12850 free (name);
12851 }
12852 else
12853 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12854 cpu_arch_flags = flags;
12855 cpu_arch_isa_flags = flags;
12856 }
12857 else
12858 cpu_arch_isa_flags
12859 = cpu_flags_or (cpu_arch_isa_flags,
12860 cpu_arch[j].flags);
12861 break;
12862 }
12863 }
12864
12865 if (j >= ARRAY_SIZE (cpu_arch))
12866 {
12867 /* Disable an ISA extension. */
12868 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12869 if (strcmp (arch, cpu_noarch [j].name) == 0)
12870 {
12871 i386_cpu_flags flags;
12872
12873 flags = cpu_flags_and_not (cpu_arch_flags,
12874 cpu_noarch[j].flags);
12875 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12876 {
12877 if (cpu_sub_arch_name)
12878 {
12879 char *name = cpu_sub_arch_name;
12880 cpu_sub_arch_name = concat (name, arch,
12881 (const char *) NULL);
12882 free (name);
12883 }
12884 else
12885 cpu_sub_arch_name = xstrdup (arch);
12886 cpu_arch_flags = flags;
12887 cpu_arch_isa_flags = flags;
12888 }
12889 break;
12890 }
12891
12892 if (j >= ARRAY_SIZE (cpu_noarch))
12893 j = ARRAY_SIZE (cpu_arch);
12894 }
12895
12896 if (j >= ARRAY_SIZE (cpu_arch))
12897 as_fatal (_("invalid -march= option: `%s'"), arg);
12898
12899 arch = next;
12900 }
12901 while (next != NULL);
12902 free (saved);
12903 break;
12904
12905 case OPTION_MTUNE:
12906 if (*arg == '.')
12907 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12908 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12909 {
12910 if (strcmp (arg, cpu_arch [j].name) == 0)
12911 {
12912 cpu_arch_tune_set = 1;
12913 cpu_arch_tune = cpu_arch [j].type;
12914 cpu_arch_tune_flags = cpu_arch[j].flags;
12915 break;
12916 }
12917 }
12918 if (j >= ARRAY_SIZE (cpu_arch))
12919 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12920 break;
12921
12922 case OPTION_MMNEMONIC:
12923 if (strcasecmp (arg, "att") == 0)
12924 intel_mnemonic = 0;
12925 else if (strcasecmp (arg, "intel") == 0)
12926 intel_mnemonic = 1;
12927 else
12928 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12929 break;
12930
12931 case OPTION_MSYNTAX:
12932 if (strcasecmp (arg, "att") == 0)
12933 intel_syntax = 0;
12934 else if (strcasecmp (arg, "intel") == 0)
12935 intel_syntax = 1;
12936 else
12937 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12938 break;
12939
12940 case OPTION_MINDEX_REG:
12941 allow_index_reg = 1;
12942 break;
12943
12944 case OPTION_MNAKED_REG:
12945 allow_naked_reg = 1;
12946 break;
12947
12948 case OPTION_MSSE2AVX:
12949 sse2avx = 1;
12950 break;
12951
12952 case OPTION_MSSE_CHECK:
12953 if (strcasecmp (arg, "error") == 0)
12954 sse_check = check_error;
12955 else if (strcasecmp (arg, "warning") == 0)
12956 sse_check = check_warning;
12957 else if (strcasecmp (arg, "none") == 0)
12958 sse_check = check_none;
12959 else
12960 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12961 break;
12962
12963 case OPTION_MOPERAND_CHECK:
12964 if (strcasecmp (arg, "error") == 0)
12965 operand_check = check_error;
12966 else if (strcasecmp (arg, "warning") == 0)
12967 operand_check = check_warning;
12968 else if (strcasecmp (arg, "none") == 0)
12969 operand_check = check_none;
12970 else
12971 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12972 break;
12973
12974 case OPTION_MAVXSCALAR:
12975 if (strcasecmp (arg, "128") == 0)
12976 avxscalar = vex128;
12977 else if (strcasecmp (arg, "256") == 0)
12978 avxscalar = vex256;
12979 else
12980 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12981 break;
12982
12983 case OPTION_MVEXWIG:
12984 if (strcmp (arg, "0") == 0)
12985 vexwig = vexw0;
12986 else if (strcmp (arg, "1") == 0)
12987 vexwig = vexw1;
12988 else
12989 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12990 break;
12991
12992 case OPTION_MADD_BND_PREFIX:
12993 add_bnd_prefix = 1;
12994 break;
12995
12996 case OPTION_MEVEXLIG:
12997 if (strcmp (arg, "128") == 0)
12998 evexlig = evexl128;
12999 else if (strcmp (arg, "256") == 0)
13000 evexlig = evexl256;
13001 else if (strcmp (arg, "512") == 0)
13002 evexlig = evexl512;
13003 else
13004 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13005 break;
13006
13007 case OPTION_MEVEXRCIG:
13008 if (strcmp (arg, "rne") == 0)
13009 evexrcig = rne;
13010 else if (strcmp (arg, "rd") == 0)
13011 evexrcig = rd;
13012 else if (strcmp (arg, "ru") == 0)
13013 evexrcig = ru;
13014 else if (strcmp (arg, "rz") == 0)
13015 evexrcig = rz;
13016 else
13017 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13018 break;
13019
13020 case OPTION_MEVEXWIG:
13021 if (strcmp (arg, "0") == 0)
13022 evexwig = evexw0;
13023 else if (strcmp (arg, "1") == 0)
13024 evexwig = evexw1;
13025 else
13026 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13027 break;
13028
13029 # if defined (TE_PE) || defined (TE_PEP)
13030 case OPTION_MBIG_OBJ:
13031 use_big_obj = 1;
13032 break;
13033 #endif
13034
13035 case OPTION_MOMIT_LOCK_PREFIX:
13036 if (strcasecmp (arg, "yes") == 0)
13037 omit_lock_prefix = 1;
13038 else if (strcasecmp (arg, "no") == 0)
13039 omit_lock_prefix = 0;
13040 else
13041 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13042 break;
13043
13044 case OPTION_MFENCE_AS_LOCK_ADD:
13045 if (strcasecmp (arg, "yes") == 0)
13046 avoid_fence = 1;
13047 else if (strcasecmp (arg, "no") == 0)
13048 avoid_fence = 0;
13049 else
13050 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13051 break;
13052
13053 case OPTION_MLFENCE_AFTER_LOAD:
13054 if (strcasecmp (arg, "yes") == 0)
13055 lfence_after_load = 1;
13056 else if (strcasecmp (arg, "no") == 0)
13057 lfence_after_load = 0;
13058 else
13059 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13060 break;
13061
13062 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13063 if (strcasecmp (arg, "all") == 0)
13064 {
13065 lfence_before_indirect_branch = lfence_branch_all;
13066 if (lfence_before_ret == lfence_before_ret_none)
13067 lfence_before_ret = lfence_before_ret_shl;
13068 }
13069 else if (strcasecmp (arg, "memory") == 0)
13070 lfence_before_indirect_branch = lfence_branch_memory;
13071 else if (strcasecmp (arg, "register") == 0)
13072 lfence_before_indirect_branch = lfence_branch_register;
13073 else if (strcasecmp (arg, "none") == 0)
13074 lfence_before_indirect_branch = lfence_branch_none;
13075 else
13076 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13077 arg);
13078 break;
13079
13080 case OPTION_MLFENCE_BEFORE_RET:
13081 if (strcasecmp (arg, "or") == 0)
13082 lfence_before_ret = lfence_before_ret_or;
13083 else if (strcasecmp (arg, "not") == 0)
13084 lfence_before_ret = lfence_before_ret_not;
13085 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13086 lfence_before_ret = lfence_before_ret_shl;
13087 else if (strcasecmp (arg, "none") == 0)
13088 lfence_before_ret = lfence_before_ret_none;
13089 else
13090 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13091 arg);
13092 break;
13093
13094 case OPTION_MRELAX_RELOCATIONS:
13095 if (strcasecmp (arg, "yes") == 0)
13096 generate_relax_relocations = 1;
13097 else if (strcasecmp (arg, "no") == 0)
13098 generate_relax_relocations = 0;
13099 else
13100 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13101 break;
13102
13103 case OPTION_MALIGN_BRANCH_BOUNDARY:
13104 {
13105 char *end;
13106 long int align = strtoul (arg, &end, 0);
13107 if (*end == '\0')
13108 {
13109 if (align == 0)
13110 {
13111 align_branch_power = 0;
13112 break;
13113 }
13114 else if (align >= 16)
13115 {
13116 int align_power;
13117 for (align_power = 0;
13118 (align & 1) == 0;
13119 align >>= 1, align_power++)
13120 continue;
13121 /* Limit alignment power to 31. */
13122 if (align == 1 && align_power < 32)
13123 {
13124 align_branch_power = align_power;
13125 break;
13126 }
13127 }
13128 }
13129 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13130 }
13131 break;
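      /* Worked example for the conversion above:
	 -malign-branch-boundary=32 gives align = 32 = 0b100000; five
	 right shifts reach align == 1 with align_power = 5, so
	 align_branch_power = 5.  A value that is not a power of two, or
	 is nonzero but below 16, falls through to as_fatal.  */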
13132
13133 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13134 {
13135 char *end;
13136 int align = strtoul (arg, &end, 0);
13137 /* Some processors only support 5 prefixes. */
13138 if (*end == '\0' && align >= 0 && align < 6)
13139 {
13140 align_branch_prefix_size = align;
13141 break;
13142 }
13143 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13144 arg);
13145 }
13146 break;
13147
13148 case OPTION_MALIGN_BRANCH:
13149 align_branch = 0;
13150 saved = xstrdup (arg);
13151 type = saved;
13152 do
13153 {
13154 next = strchr (type, '+');
13155 if (next)
13156 *next++ = '\0';
13157 if (strcasecmp (type, "jcc") == 0)
13158 align_branch |= align_branch_jcc_bit;
13159 else if (strcasecmp (type, "fused") == 0)
13160 align_branch |= align_branch_fused_bit;
13161 else if (strcasecmp (type, "jmp") == 0)
13162 align_branch |= align_branch_jmp_bit;
13163 else if (strcasecmp (type, "call") == 0)
13164 align_branch |= align_branch_call_bit;
13165 else if (strcasecmp (type, "ret") == 0)
13166 align_branch |= align_branch_ret_bit;
13167 else if (strcasecmp (type, "indirect") == 0)
13168 align_branch |= align_branch_indirect_bit;
13169 else
13170 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13171 type = next;
13172 }
13173 while (next != NULL);
13174 free (saved);
13175 break;
13176
13177 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13178 align_branch_power = 5;
13179 align_branch_prefix_size = 5;
13180 align_branch = (align_branch_jcc_bit
13181 | align_branch_fused_bit
13182 | align_branch_jmp_bit);
13183 break;
13184
13185 case OPTION_MAMD64:
13186 isa64 = amd64;
13187 break;
13188
13189 case OPTION_MINTEL64:
13190 isa64 = intel64;
13191 break;
13192
13193 case 'O':
13194 if (arg == NULL)
13195 {
13196 optimize = 1;
13197 /* Turn off -Os. */
13198 optimize_for_space = 0;
13199 }
13200 else if (*arg == 's')
13201 {
13202 optimize_for_space = 1;
13203 /* Turn on all encoding optimizations. */
13204 optimize = INT_MAX;
13205 }
13206 else
13207 {
13208 optimize = atoi (arg);
13209 /* Turn off -Os. */
13210 optimize_for_space = 0;
13211 }
13212 break;
13213
13214 default:
13215 return 0;
13216 }
13217 return 1;
13218 }
13219
13220 #define MESSAGE_TEMPLATE \
13221 " "
13222
13223 static char *
13224 output_message (FILE *stream, char *p, char *message, char *start,
13225 int *left_p, const char *name, int len)
13226 {
13227 int size = sizeof (MESSAGE_TEMPLATE);
13228 int left = *left_p;
13229
13230 /* Reserve 2 spaces for ", " or ",\0" */
13231 left -= len + 2;
13232
13233 /* Check if there is any room. */
13234 if (left >= 0)
13235 {
13236 if (p != start)
13237 {
13238 *p++ = ',';
13239 *p++ = ' ';
13240 }
13241 p = mempcpy (p, name, len);
13242 }
13243 else
13244 {
13245 /* Output the current message now and start a new one. */
13246 *p++ = ',';
13247 *p = '\0';
13248 fprintf (stream, "%s\n", message);
13249 p = start;
13250 left = size - (start - message) - len - 2;
13251
13252 gas_assert (left >= 0);
13253
13254 p = mempcpy (p, name, len);
13255 }
13256
13257 *left_p = left;
13258 return p;
13259 }
13260
13261 static void
13262 show_arch (FILE *stream, int ext, int check)
13263 {
13264 static char message[] = MESSAGE_TEMPLATE;
13265 char *start = message + 27;
13266 char *p;
13267 int size = sizeof (MESSAGE_TEMPLATE);
13268 int left;
13269 const char *name;
13270 int len;
13271 unsigned int j;
13272
13273 p = start;
13274 left = size - (start - message);
13275 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13276 {
13277 /* Should it be skipped? */
13278 if (cpu_arch [j].skip)
13279 continue;
13280
13281 name = cpu_arch [j].name;
13282 len = cpu_arch [j].len;
13283 if (*name == '.')
13284 {
13285 /* It is an extension. Skip if we aren't asked to show it. */
13286 if (ext)
13287 {
13288 name++;
13289 len--;
13290 }
13291 else
13292 continue;
13293 }
13294 else if (ext)
13295 {
13296 /* It is a processor. Skip if we only show extensions. */
13297 continue;
13298 }
13299 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13300 {
13301 /* It is an impossible processor - skip. */
13302 continue;
13303 }
13304
13305 p = output_message (stream, p, message, start, &left, name, len);
13306 }
13307
13308 /* Display disabled extensions. */
13309 if (ext)
13310 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13311 {
13312 name = cpu_noarch [j].name;
13313 len = cpu_noarch [j].len;
13314 p = output_message (stream, p, message, start, &left, name,
13315 len);
13316 }
13317
13318 *p = '\0';
13319 fprintf (stream, "%s\n", message);
13320 }
13321
13322 void
13323 md_show_usage (FILE *stream)
13324 {
13325 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13326 fprintf (stream, _("\
13327 -Qy, -Qn ignored\n\
13328 -V print assembler version number\n\
13329 -k ignored\n"));
13330 #endif
13331 fprintf (stream, _("\
13332 -n Do not optimize code alignment\n\
13333 -q quieten some warnings\n"));
13334 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13335 fprintf (stream, _("\
13336 -s ignored\n"));
13337 #endif
13338 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13339 || defined (TE_PE) || defined (TE_PEP))
13340 fprintf (stream, _("\
13341 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13342 #endif
13343 #ifdef SVR4_COMMENT_CHARS
13344 fprintf (stream, _("\
13345 --divide do not treat `/' as a comment character\n"));
13346 #else
13347 fprintf (stream, _("\
13348 --divide ignored\n"));
13349 #endif
13350 fprintf (stream, _("\
13351 -march=CPU[,+EXTENSION...]\n\
13352 generate code for CPU and EXTENSION, CPU is one of:\n"));
13353 show_arch (stream, 0, 1);
13354 fprintf (stream, _("\
13355 EXTENSION is combination of:\n"));
13356 show_arch (stream, 1, 0);
13357 fprintf (stream, _("\
13358 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13359 show_arch (stream, 0, 0);
13360 fprintf (stream, _("\
13361 -msse2avx encode SSE instructions with VEX prefix\n"));
13362 fprintf (stream, _("\
13363 -msse-check=[none|error|warning] (default: warning)\n\
13364 check SSE instructions\n"));
13365 fprintf (stream, _("\
13366 -moperand-check=[none|error|warning] (default: warning)\n\
13367 check operand combinations for validity\n"));
13368 fprintf (stream, _("\
13369 -mavxscalar=[128|256] (default: 128)\n\
13370 encode scalar AVX instructions with specific vector\n\
13371 length\n"));
13372 fprintf (stream, _("\
13373 -mvexwig=[0|1] (default: 0)\n\
13374 encode VEX instructions with specific VEX.W value\n\
13375 for VEX.W bit ignored instructions\n"));
13376 fprintf (stream, _("\
13377 -mevexlig=[128|256|512] (default: 128)\n\
13378 encode scalar EVEX instructions with specific vector\n\
13379 length\n"));
13380 fprintf (stream, _("\
13381 -mevexwig=[0|1] (default: 0)\n\
13382 encode EVEX instructions with specific EVEX.W value\n\
13383 for EVEX.W bit ignored instructions\n"));
13384 fprintf (stream, _("\
13385 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13386 encode EVEX instructions with specific EVEX.RC value\n\
13387 for SAE-only ignored instructions\n"));
13388 fprintf (stream, _("\
13389 -mmnemonic=[att|intel] "));
13390 if (SYSV386_COMPAT)
13391 fprintf (stream, _("(default: att)\n"));
13392 else
13393 fprintf (stream, _("(default: intel)\n"));
13394 fprintf (stream, _("\
13395 use AT&T/Intel mnemonic\n"));
13396 fprintf (stream, _("\
13397 -msyntax=[att|intel] (default: att)\n\
13398 use AT&T/Intel syntax\n"));
13399 fprintf (stream, _("\
13400 -mindex-reg support pseudo index registers\n"));
13401 fprintf (stream, _("\
13402 -mnaked-reg don't require `%%' prefix for registers\n"));
13403 fprintf (stream, _("\
13404 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13405 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13406 fprintf (stream, _("\
13407 -mshared disable branch optimization for shared code\n"));
13408 fprintf (stream, _("\
13409 -mx86-used-note=[no|yes] "));
13410 if (DEFAULT_X86_USED_NOTE)
13411 fprintf (stream, _("(default: yes)\n"));
13412 else
13413 fprintf (stream, _("(default: no)\n"));
13414 fprintf (stream, _("\
13415 generate x86 used ISA and feature properties\n"));
13416 #endif
13417 #if defined (TE_PE) || defined (TE_PEP)
13418 fprintf (stream, _("\
13419 -mbig-obj generate big object files\n"));
13420 #endif
13421 fprintf (stream, _("\
13422 -momit-lock-prefix=[no|yes] (default: no)\n\
13423 strip all lock prefixes\n"));
13424 fprintf (stream, _("\
13425 -mfence-as-lock-add=[no|yes] (default: no)\n\
13426 encode lfence, mfence and sfence as\n\
13427 lock addl $0x0, (%%{re}sp)\n"));
13428 fprintf (stream, _("\
13429 -mrelax-relocations=[no|yes] "));
13430 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13431 fprintf (stream, _("(default: yes)\n"));
13432 else
13433 fprintf (stream, _("(default: no)\n"));
13434 fprintf (stream, _("\
13435 generate relax relocations\n"));
13436 fprintf (stream, _("\
13437 -malign-branch-boundary=NUM (default: 0)\n\
13438 align branches within NUM byte boundary\n"));
13439 fprintf (stream, _("\
13440 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13441 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13442 indirect\n\
13443 specify types of branches to align\n"));
13444 fprintf (stream, _("\
13445 -malign-branch-prefix-size=NUM (default: 5)\n\
13446 align branches with NUM prefixes per instruction\n"));
13447 fprintf (stream, _("\
13448 -mbranches-within-32B-boundaries\n\
13449 align branches within 32 byte boundary\n"));
13450 fprintf (stream, _("\
13451 -mlfence-after-load=[no|yes] (default: no)\n\
13452 generate lfence after load\n"));
13453 fprintf (stream, _("\
13454 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13455 generate lfence before indirect near branch\n"));
13456 fprintf (stream, _("\
13457 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13458 generate lfence before ret\n"));
13459 fprintf (stream, _("\
13460 -mamd64 accept only AMD64 ISA [default]\n"));
13461 fprintf (stream, _("\
13462 -mintel64 accept only Intel64 ISA\n"));
13463 }

#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
     || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
     || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))

/* Pick the target format to use.  */

const char *
i386_target_format (void)
{
  if (!strncmp (default_arch, "x86_64", 6))
    {
      update_code_flag (CODE_64BIT, 1);
      if (default_arch[6] == '\0')
        x86_elf_abi = X86_64_ABI;
      else
        x86_elf_abi = X86_64_X32_ABI;
    }
  else if (!strcmp (default_arch, "i386"))
    update_code_flag (CODE_32BIT, 1);
  else if (!strcmp (default_arch, "iamcu"))
    {
      update_code_flag (CODE_32BIT, 1);
      if (cpu_arch_isa == PROCESSOR_UNKNOWN)
        {
          static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
          cpu_arch_name = "iamcu";
          cpu_sub_arch_name = NULL;
          cpu_arch_flags = iamcu_flags;
          cpu_arch_isa = PROCESSOR_IAMCU;
          cpu_arch_isa_flags = iamcu_flags;
          if (!cpu_arch_tune_set)
            {
              cpu_arch_tune = cpu_arch_isa;
              cpu_arch_tune_flags = cpu_arch_isa_flags;
            }
        }
      else if (cpu_arch_isa != PROCESSOR_IAMCU)
        as_fatal (_("Intel MCU doesn't support `%s' architecture"),
                  cpu_arch_name);
    }
  else
    as_fatal (_("unknown architecture"));

  if (cpu_flags_all_zero (&cpu_arch_isa_flags))
    cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
  if (cpu_flags_all_zero (&cpu_arch_tune_flags))
    cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;

  switch (OUTPUT_FLAVOR)
    {
#if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
    case bfd_target_aout_flavour:
      return AOUT_TARGET_FORMAT;
#endif
#if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
# if defined (TE_PE) || defined (TE_PEP)
    case bfd_target_coff_flavour:
      if (flag_code == CODE_64BIT)
        return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
      else
        return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
# elif defined (TE_GO32)
    case bfd_target_coff_flavour:
      return "coff-go32";
# else
    case bfd_target_coff_flavour:
      return "coff-i386";
# endif
#endif
#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
    case bfd_target_elf_flavour:
      {
        const char *format;

        switch (x86_elf_abi)
          {
          default:
            format = ELF_TARGET_FORMAT;
#ifndef TE_SOLARIS
            tls_get_addr = "___tls_get_addr";
#endif
            break;
          case X86_64_ABI:
            use_rela_relocations = 1;
            object_64bit = 1;
#ifndef TE_SOLARIS
            tls_get_addr = "__tls_get_addr";
#endif
            format = ELF_TARGET_FORMAT64;
            break;
          case X86_64_X32_ABI:
            use_rela_relocations = 1;
            object_64bit = 1;
#ifndef TE_SOLARIS
            tls_get_addr = "__tls_get_addr";
#endif
            disallow_64bit_reloc = 1;
            format = ELF_TARGET_FORMAT32;
            break;
          }
        if (cpu_arch_isa == PROCESSOR_L1OM)
          {
            if (x86_elf_abi != X86_64_ABI)
              as_fatal (_("Intel L1OM is 64bit only"));
            return ELF_TARGET_L1OM_FORMAT;
          }
        else if (cpu_arch_isa == PROCESSOR_K1OM)
          {
            if (x86_elf_abi != X86_64_ABI)
              as_fatal (_("Intel K1OM is 64bit only"));
            return ELF_TARGET_K1OM_FORMAT;
          }
        else if (cpu_arch_isa == PROCESSOR_IAMCU)
          {
            if (x86_elf_abi != I386_ABI)
              as_fatal (_("Intel MCU is 32bit only"));
            return ELF_TARGET_IAMCU_FORMAT;
          }
        else
          return format;
      }
#endif
#if defined (OBJ_MACH_O)
    case bfd_target_mach_o_flavour:
      if (flag_code == CODE_64BIT)
        {
          use_rela_relocations = 1;
          object_64bit = 1;
          return "mach-o-x86-64";
        }
      else
        return "mach-o-i386";
#endif
    default:
      abort ();
      return NULL;
    }
}

#endif /* OBJ_MAYBE_ more than one */
\f
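/* Implement md_undefined_symbol: lazily create the special
   _GLOBAL_OFFSET_TABLE_ symbol the first time it is referenced;
   all other undefined symbols are left to the generic code.  */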
symbolS *
md_undefined_symbol (char *name)
{
  if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
      && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
      && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
      && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
    {
      if (!GOT_symbol)
        {
          if (symbol_find (name))
            as_bad (_("GOT already in symbol table"));
          GOT_symbol = symbol_new (name, undefined_section,
                                   (valueT) 0, &zero_address_frag);
        }
      return GOT_symbol;
    }
  return 0;
}

/* Round up a section size to the appropriate boundary.  */

valueT
md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
{
#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
  if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
    {
      /* For a.out, force the section size to be aligned.  If we don't do
         this, BFD will align it for us, but it will not write out the
         final bytes of the section.  This may be a bug in BFD, but it is
         easier to fix it here since that is how the other a.out targets
         work.  */
      int align;

      align = bfd_section_alignment (segment);
      size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
    }
#endif

  return size;
}

/* On the i386, PC-relative offsets are relative to the start of the
   next instruction.  That is, the address of the offset, plus its
   size, since the offset is always the last part of the insn.  */

long
md_pcrel_from (fixS *fixP)
{
  return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
}

#ifndef I386COFF

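/* Handle the .bss pseudo-op: switch output to the bss section, using
   the optional absolute expression as the subsection number.  */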
static void
s_bss (int ignore ATTRIBUTE_UNUSED)
{
  int temp;

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  if (IS_ELF)
    obj_elf_section_change_hook ();
#endif
  temp = get_absolute_expression ();
  subseg_set (bss_section, (subsegT) temp);
  demand_empty_rest_of_line ();
}

#endif

/* Remember constant directive.  */

void
i386_cons_align (int ignore ATTRIBUTE_UNUSED)
{
  if (last_insn.kind != last_insn_directive
      && (bfd_section_flags (now_seg) & SEC_CODE))
    {
      last_insn.seg = now_seg;
      last_insn.kind = last_insn_directive;
      last_insn.name = "constant directive";
      last_insn.file = as_where (&last_insn.line);
      if (lfence_before_ret != lfence_before_ret_none)
        {
          if (lfence_before_indirect_branch != lfence_branch_none)
            as_warn (_("constant directive skips -mlfence-before-ret "
                       "and -mlfence-before-indirect-branch"));
          else
            as_warn (_("constant directive skips -mlfence-before-ret"));
        }
      else if (lfence_before_indirect_branch != lfence_branch_none)
        as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
    }
}

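/* Massage fixups before they are turned into relocations: rewrite
   fixups against the GOT symbol into the matching GOT-relative
   relocation types, and relax 386 GOT32 to GOT32X where the
   instruction permits it.  */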
void
i386_validate_fix (fixS *fixp)
{
  if (fixp->fx_subsy)
    {
      if (fixp->fx_subsy == GOT_symbol)
        {
          if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
            {
              if (!object_64bit)
                abort ();
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
              if (fixp->fx_tcbit2)
                fixp->fx_r_type = (fixp->fx_tcbit
                                   ? BFD_RELOC_X86_64_REX_GOTPCRELX
                                   : BFD_RELOC_X86_64_GOTPCRELX);
              else
#endif
                fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
            }
          else
            {
              if (!object_64bit)
                fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
              else
                fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
            }
          fixp->fx_subsy = 0;
        }
    }
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  else if (!object_64bit)
    {
      if (fixp->fx_r_type == BFD_RELOC_386_GOT32
          && fixp->fx_tcbit2)
        fixp->fx_r_type = BFD_RELOC_386_GOT32X;
    }
#endif
}

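/* Translate an internal fixup into a BFD relocation for the object
   writer, diagnosing relocation types that the output format cannot
   represent.  */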
arelent *
tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
{
  arelent *rel;
  bfd_reloc_code_real_type code;

  switch (fixp->fx_r_type)
    {
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
    case BFD_RELOC_SIZE32:
    case BFD_RELOC_SIZE64:
      if (S_IS_DEFINED (fixp->fx_addsy)
          && !S_IS_EXTERNAL (fixp->fx_addsy))
        {
          /* Resolve size relocation against local symbol to size of
             the symbol plus addend.  */
          valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
          if (fixp->fx_r_type == BFD_RELOC_SIZE32
              && !fits_in_unsigned_long (value))
            as_bad_where (fixp->fx_file, fixp->fx_line,
                          _("symbol size computation overflow"));
          fixp->fx_addsy = NULL;
          fixp->fx_subsy = NULL;
          md_apply_fix (fixp, (valueT *) &value, NULL);
          return NULL;
        }
#endif
      /* Fall through.  */

    case BFD_RELOC_X86_64_PLT32:
    case BFD_RELOC_X86_64_GOT32:
    case BFD_RELOC_X86_64_GOTPCREL:
    case BFD_RELOC_X86_64_GOTPCRELX:
    case BFD_RELOC_X86_64_REX_GOTPCRELX:
    case BFD_RELOC_386_PLT32:
    case BFD_RELOC_386_GOT32:
    case BFD_RELOC_386_GOT32X:
    case BFD_RELOC_386_GOTOFF:
    case BFD_RELOC_386_GOTPC:
    case BFD_RELOC_386_TLS_GD:
    case BFD_RELOC_386_TLS_LDM:
    case BFD_RELOC_386_TLS_LDO_32:
    case BFD_RELOC_386_TLS_IE_32:
    case BFD_RELOC_386_TLS_IE:
    case BFD_RELOC_386_TLS_GOTIE:
    case BFD_RELOC_386_TLS_LE_32:
    case BFD_RELOC_386_TLS_LE:
    case BFD_RELOC_386_TLS_GOTDESC:
    case BFD_RELOC_386_TLS_DESC_CALL:
    case BFD_RELOC_X86_64_TLSGD:
    case BFD_RELOC_X86_64_TLSLD:
    case BFD_RELOC_X86_64_DTPOFF32:
    case BFD_RELOC_X86_64_DTPOFF64:
    case BFD_RELOC_X86_64_GOTTPOFF:
    case BFD_RELOC_X86_64_TPOFF32:
    case BFD_RELOC_X86_64_TPOFF64:
    case BFD_RELOC_X86_64_GOTOFF64:
    case BFD_RELOC_X86_64_GOTPC32:
    case BFD_RELOC_X86_64_GOT64:
    case BFD_RELOC_X86_64_GOTPCREL64:
    case BFD_RELOC_X86_64_GOTPC64:
    case BFD_RELOC_X86_64_GOTPLT64:
    case BFD_RELOC_X86_64_PLTOFF64:
    case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
    case BFD_RELOC_X86_64_TLSDESC_CALL:
    case BFD_RELOC_RVA:
    case BFD_RELOC_VTABLE_ENTRY:
    case BFD_RELOC_VTABLE_INHERIT:
#ifdef TE_PE
    case BFD_RELOC_32_SECREL:
#endif
      code = fixp->fx_r_type;
      break;
    case BFD_RELOC_X86_64_32S:
      if (!fixp->fx_pcrel)
        {
          /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
          code = fixp->fx_r_type;
          break;
        }
      /* Fall through.  */
    default:
      if (fixp->fx_pcrel)
        {
          switch (fixp->fx_size)
            {
            default:
              as_bad_where (fixp->fx_file, fixp->fx_line,
                            _("cannot do %d byte pc-relative relocation"),
                            fixp->fx_size);
              code = BFD_RELOC_32_PCREL;
              break;
            case 1: code = BFD_RELOC_8_PCREL;  break;
            case 2: code = BFD_RELOC_16_PCREL; break;
            case 4: code = BFD_RELOC_32_PCREL; break;
#ifdef BFD64
            case 8: code = BFD_RELOC_64_PCREL; break;
#endif
            }
        }
      else
        {
          switch (fixp->fx_size)
            {
            default:
              as_bad_where (fixp->fx_file, fixp->fx_line,
                            _("cannot do %d byte relocation"),
                            fixp->fx_size);
              code = BFD_RELOC_32;
              break;
            case 1: code = BFD_RELOC_8;  break;
            case 2: code = BFD_RELOC_16; break;
            case 4: code = BFD_RELOC_32; break;
#ifdef BFD64
            case 8: code = BFD_RELOC_64; break;
#endif
            }
        }
      break;
    }

  if ((code == BFD_RELOC_32
       || code == BFD_RELOC_32_PCREL
       || code == BFD_RELOC_X86_64_32S)
      && GOT_symbol
      && fixp->fx_addsy == GOT_symbol)
    {
      if (!object_64bit)
        code = BFD_RELOC_386_GOTPC;
      else
        code = BFD_RELOC_X86_64_GOTPC32;
    }
  if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
      && GOT_symbol
      && fixp->fx_addsy == GOT_symbol)
    {
      code = BFD_RELOC_X86_64_GOTPC64;
    }

  rel = XNEW (arelent);
  rel->sym_ptr_ptr = XNEW (asymbol *);
  *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);

  rel->address = fixp->fx_frag->fr_address + fixp->fx_where;

  if (!use_rela_relocations)
    {
      /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
         vtable entry to be used in the relocation's section offset.  */
      if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
        rel->address = fixp->fx_offset;
#if defined (OBJ_COFF) && defined (TE_PE)
      else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
        rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
      else
#endif
      rel->addend = 0;
    }
  /* Use rela relocations in 64-bit mode.  */
  else
    {
      if (disallow_64bit_reloc)
        switch (code)
          {
          case BFD_RELOC_X86_64_DTPOFF64:
          case BFD_RELOC_X86_64_TPOFF64:
          case BFD_RELOC_64_PCREL:
          case BFD_RELOC_X86_64_GOTOFF64:
          case BFD_RELOC_X86_64_GOT64:
          case BFD_RELOC_X86_64_GOTPCREL64:
          case BFD_RELOC_X86_64_GOTPC64:
          case BFD_RELOC_X86_64_GOTPLT64:
          case BFD_RELOC_X86_64_PLTOFF64:
            as_bad_where (fixp->fx_file, fixp->fx_line,
                          _("cannot represent relocation type %s in x32 mode"),
                          bfd_get_reloc_code_name (code));
            break;
          default:
            break;
          }

      if (!fixp->fx_pcrel)
        rel->addend = fixp->fx_offset;
      else
        switch (code)
          {
          case BFD_RELOC_X86_64_PLT32:
          case BFD_RELOC_X86_64_GOT32:
          case BFD_RELOC_X86_64_GOTPCREL:
          case BFD_RELOC_X86_64_GOTPCRELX:
          case BFD_RELOC_X86_64_REX_GOTPCRELX:
          case BFD_RELOC_X86_64_TLSGD:
          case BFD_RELOC_X86_64_TLSLD:
          case BFD_RELOC_X86_64_GOTTPOFF:
          case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
          case BFD_RELOC_X86_64_TLSDESC_CALL:
            rel->addend = fixp->fx_offset - fixp->fx_size;
            break;
          default:
            rel->addend = (section->vma
                           - fixp->fx_size
                           + fixp->fx_addnumber
                           + md_pcrel_from (fixp));
            break;
          }
    }

  rel->howto = bfd_reloc_type_lookup (stdoutput, code);
  if (rel->howto == NULL)
    {
      as_bad_where (fixp->fx_file, fixp->fx_line,
                    _("cannot represent relocation type %s"),
                    bfd_get_reloc_code_name (code));
      /* Set howto to a garbage value so that we can keep going.  */
      rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
      gas_assert (rel->howto != NULL);
    }

  return rel;
}

#include "tc-i386-intel.c"

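/* Parse a register name in a CFI directive operand and replace the
   expression with the register's DWARF2 number.  */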
void
tc_x86_parse_to_dw2regnum (expressionS *exp)
{
  int saved_naked_reg;
  char saved_register_dot;

  saved_naked_reg = allow_naked_reg;
  allow_naked_reg = 1;
  saved_register_dot = register_chars['.'];
  register_chars['.'] = '.';
  allow_pseudo_reg = 1;
  expression_and_evaluate (exp);
  allow_pseudo_reg = 0;
  register_chars['.'] = saved_register_dot;
  allow_naked_reg = saved_naked_reg;

  if (exp->X_op == O_register && exp->X_add_number >= 0)
    {
      if ((addressT) exp->X_add_number < i386_regtab_size)
        {
          exp->X_op = O_constant;
          exp->X_add_number = i386_regtab[exp->X_add_number]
                              .dw2_regnum[flag_code >> 1];
        }
      else
        exp->X_op = O_illegal;
    }
}

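/* Emit the initial CFI instructions of a frame: define the CFA
   relative to the stack pointer and record where the return address
   is saved.  */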
void
tc_x86_frame_initial_instructions (void)
{
  static unsigned int sp_regno[2];

  if (!sp_regno[flag_code >> 1])
    {
      char *saved_input = input_line_pointer;
      char sp[][4] = {"esp", "rsp"};
      expressionS exp;

      input_line_pointer = sp[flag_code >> 1];
      tc_x86_parse_to_dw2regnum (&exp);
      gas_assert (exp.X_op == O_constant);
      sp_regno[flag_code >> 1] = exp.X_add_number;
      input_line_pointer = saved_input;
    }

  cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
  cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
}

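/* Return the size in bytes of DWARF addresses; x32 uses 32-bit
   addresses even though the target word size is 64 bits.  */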
int
x86_dwarf2_addr_size (void)
{
#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
  if (x86_elf_abi == X86_64_X32_ABI)
    return 4;
#endif
  return bfd_arch_bits_per_address (stdoutput) / 8;
}

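/* Map the section type keyword "unwind" onto SHT_X86_64_UNWIND in
   64-bit mode; anything else is left to the generic code.  */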
int
i386_elf_section_type (const char *str, size_t len)
{
  if (flag_code == CODE_64BIT
      && len == sizeof ("unwind") - 1
      && strncmp (str, "unwind", 6) == 0)
    return SHT_X86_64_UNWIND;

  return -1;
}

#ifdef TE_SOLARIS
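/* On Solaris, force 64-bit .eh_frame sections to the
   SHT_X86_64_UNWIND section type.  */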
void
i386_solaris_fix_up_eh_frame (segT sec)
{
  if (flag_code == CODE_64BIT)
    elf_section_type (sec) = SHT_X86_64_UNWIND;
}
#endif

#ifdef TE_PE
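/* Emit a section-relative (secrel) offset for a symbol, as used by
   DWARF debug information on PE targets.  */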
void
tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
{
  expressionS exp;

  exp.X_op = O_secrel;
  exp.X_add_symbol = symbol;
  exp.X_add_number = 0;
  emit_expr (&exp, size);
}
#endif

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */

bfd_vma
x86_64_section_letter (int letter, const char **ptr_msg)
{
  if (flag_code == CODE_64BIT)
    {
      if (letter == 'l')
        return SHF_X86_64_LARGE;

      *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
    }
  else
    *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
  return -1;
}

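/* Recognize the bare "large" keyword in a .section directive and map
   it to SHF_X86_64_LARGE.  */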
bfd_vma
x86_64_section_word (char *str, size_t len)
{
  if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
    return SHF_X86_64_LARGE;

  return -1;
}

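/* Implement the .largecomm directive, which takes the same operands
   as .comm (e.g. ".largecomm sym, 4096, 16"): outside of 64-bit mode
   it degrades to a plain .comm, while in 64-bit mode the symbol is
   allocated to the large common section (or .lbss when local).  */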
static void
handle_large_common (int small ATTRIBUTE_UNUSED)
{
  if (flag_code != CODE_64BIT)
    {
      s_comm_internal (0, elf_common_parse);
      as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
    }
  else
    {
      static segT lbss_section;
      asection *saved_com_section_ptr = elf_com_section_ptr;
      asection *saved_bss_section = bss_section;

      if (lbss_section == NULL)
        {
          flagword applicable;
          segT seg = now_seg;
          subsegT subseg = now_subseg;

          /* The .lbss section is for local .largecomm symbols.  */
          lbss_section = subseg_new (".lbss", 0);
          applicable = bfd_applicable_section_flags (stdoutput);
          bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
          seg_info (lbss_section)->bss = 1;

          subseg_set (seg, subseg);
        }

      elf_com_section_ptr = &_bfd_elf_large_com_section;
      bss_section = lbss_section;

      s_comm_internal (0, elf_common_parse);

      elf_com_section_ptr = saved_com_section_ptr;
      bss_section = saved_bss_section;
    }
}
#endif /* OBJ_ELF || OBJ_MAYBE_ELF */