x86: StaticRounding implies SAE
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2019 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef REGISTER_WARNINGS
48 #define REGISTER_WARNINGS 1
49 #endif
50
51 #ifndef INFER_ADDR_PREFIX
52 #define INFER_ADDR_PREFIX 1
53 #endif
54
55 #ifndef DEFAULT_ARCH
56 #define DEFAULT_ARCH "i386"
57 #endif
58
59 #ifndef INLINE
60 #if __GNUC__ >= 2
61 #define INLINE __inline__
62 #else
63 #define INLINE
64 #endif
65 #endif
66
67 /* Prefixes will be emitted in the order defined below.
68 WAIT_PREFIX must be the first prefix since FWAIT is really is an
69 instruction, and so must come before any prefixes.
70 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
71 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
72 #define WAIT_PREFIX 0
73 #define SEG_PREFIX 1
74 #define ADDR_PREFIX 2
75 #define DATA_PREFIX 3
76 #define REP_PREFIX 4
77 #define HLE_PREFIX REP_PREFIX
78 #define BND_PREFIX REP_PREFIX
79 #define LOCK_PREFIX 5
80 #define REX_PREFIX 6 /* must come last. */
81 #define MAX_PREFIXES 7 /* max prefixes per opcode */
82
83 /* we define the syntax here (modulo base,index,scale syntax) */
84 #define REGISTER_PREFIX '%'
85 #define IMMEDIATE_PREFIX '$'
86 #define ABSOLUTE_PREFIX '*'
87
88 /* these are the instruction mnemonic suffixes in AT&T syntax or
89 memory operand size in Intel syntax. */
90 #define WORD_MNEM_SUFFIX 'w'
91 #define BYTE_MNEM_SUFFIX 'b'
92 #define SHORT_MNEM_SUFFIX 's'
93 #define LONG_MNEM_SUFFIX 'l'
94 #define QWORD_MNEM_SUFFIX 'q'
95 /* Intel Syntax. Use a non-ascii letter since since it never appears
96 in instructions. */
97 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
98
99 #define END_OF_INSN '\0'
100
101 /*
102 'templates' is for grouping together 'template' structures for opcodes
103 of the same name. This is only used for storing the insns in the grand
104 ole hash table of insns.
105 The templates themselves start at START and range up to (but not including)
106 END.
107 */
108 typedef struct
109 {
110 const insn_template *start;
111 const insn_template *end;
112 }
113 templates;
114
115 /* 386 operand encoding bytes: see 386 book for details of this. */
116 typedef struct
117 {
118 unsigned int regmem; /* codes register or memory operand */
119 unsigned int reg; /* codes register operand (or extended opcode) */
120 unsigned int mode; /* how to interpret regmem & reg */
121 }
122 modrm_byte;
123
124 /* x86-64 extension prefix. */
125 typedef int rex_byte;
126
127 /* 386 opcode byte to code indirect addressing. */
128 typedef struct
129 {
130 unsigned base;
131 unsigned index;
132 unsigned scale;
133 }
134 sib_byte;
135
136 /* x86 arch names, types and features */
137 typedef struct
138 {
139 const char *name; /* arch name */
140 unsigned int len; /* arch string length */
141 enum processor_type type; /* arch type */
142 i386_cpu_flags flags; /* cpu feature flags */
143 unsigned int skip; /* show_arch should skip this. */
144 }
145 arch_entry;
146
147 /* Used to turn off indicated flags. */
148 typedef struct
149 {
150 const char *name; /* arch name */
151 unsigned int len; /* arch string length */
152 i386_cpu_flags flags; /* cpu feature flags */
153 }
154 noarch_entry;
155
156 static void update_code_flag (int, int);
157 static void set_code_flag (int);
158 static void set_16bit_gcc_code_flag (int);
159 static void set_intel_syntax (int);
160 static void set_intel_mnemonic (int);
161 static void set_allow_index_reg (int);
162 static void set_check (int);
163 static void set_cpu_arch (int);
164 #ifdef TE_PE
165 static void pe_directive_secrel (int);
166 #endif
167 static void signed_cons (int);
168 static char *output_invalid (int c);
169 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
170 const char *);
171 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
172 const char *);
173 static int i386_att_operand (char *);
174 static int i386_intel_operand (char *, int);
175 static int i386_intel_simplify (expressionS *);
176 static int i386_intel_parse_name (const char *, expressionS *);
177 static const reg_entry *parse_register (char *, char **);
178 static char *parse_insn (char *, char *);
179 static char *parse_operands (char *, const char *);
180 static void swap_operands (void);
181 static void swap_2_operands (int, int);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* This struct describes rounding control and SAE in the instruction. */
214 struct RC_Operation
215 {
216 enum rc_type
217 {
218 rne = 0,
219 rd,
220 ru,
221 rz,
222 saeonly
223 } type;
224 int operand;
225 };
226
227 static struct RC_Operation rc_op;
228
229 /* The struct describes masking, applied to OPERAND in the instruction.
230 MASK is a pointer to the corresponding mask register. ZEROING tells
231 whether merging or zeroing mask is used. */
232 struct Mask_Operation
233 {
234 const reg_entry *mask;
235 unsigned int zeroing;
236 /* The operand where this operation is associated. */
237 int operand;
238 };
239
240 static struct Mask_Operation mask_op;
241
242 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
243 broadcast factor. */
244 struct Broadcast_Operation
245 {
246 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
247 int type;
248
249 /* Index of broadcasted operand. */
250 int operand;
251
252 /* Number of bytes to broadcast. */
253 int bytes;
254 };
255
256 static struct Broadcast_Operation broadcast_op;
257
258 /* VEX prefix. */
259 typedef struct
260 {
261 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
262 unsigned char bytes[4];
263 unsigned int length;
264 /* Destination or source register specifier. */
265 const reg_entry *register_specifier;
266 } vex_prefix;
267
268 /* 'md_assemble ()' gathers together information and puts it into a
269 i386_insn. */
270
271 union i386_op
272 {
273 expressionS *disps;
274 expressionS *imms;
275 const reg_entry *regs;
276 };
277
278 enum i386_error
279 {
280 operand_size_mismatch,
281 operand_type_mismatch,
282 register_type_mismatch,
283 number_of_operands_mismatch,
284 invalid_instruction_suffix,
285 bad_imm4,
286 unsupported_with_intel_mnemonic,
287 unsupported_syntax,
288 unsupported,
289 invalid_vsib_address,
290 invalid_vector_register_set,
291 unsupported_vector_index_register,
292 unsupported_broadcast,
293 broadcast_needed,
294 unsupported_masking,
295 mask_not_on_destination,
296 no_default_mask,
297 unsupported_rc_sae,
298 rc_sae_operand_not_last_imm,
299 invalid_register_operand,
300 };
301
302 struct _i386_insn
303 {
304 /* TM holds the template for the insn were currently assembling. */
305 insn_template tm;
306
307 /* SUFFIX holds the instruction size suffix for byte, word, dword
308 or qword, if given. */
309 char suffix;
310
311 /* OPERANDS gives the number of given operands. */
312 unsigned int operands;
313
314 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
315 of given register, displacement, memory operands and immediate
316 operands. */
317 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
318
319 /* TYPES [i] is the type (see above #defines) which tells us how to
320 use OP[i] for the corresponding operand. */
321 i386_operand_type types[MAX_OPERANDS];
322
323 /* Displacement expression, immediate expression, or register for each
324 operand. */
325 union i386_op op[MAX_OPERANDS];
326
327 /* Flags for operands. */
328 unsigned int flags[MAX_OPERANDS];
329 #define Operand_PCrel 1
330 #define Operand_Mem 2
331
332 /* Relocation type for operand */
333 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
334
335 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
336 the base index byte below. */
337 const reg_entry *base_reg;
338 const reg_entry *index_reg;
339 unsigned int log2_scale_factor;
340
341 /* SEG gives the seg_entries of this insn. They are zero unless
342 explicit segment overrides are given. */
343 const seg_entry *seg[2];
344
345 /* Copied first memory operand string, for re-checking. */
346 char *memop1_string;
347
348 /* PREFIX holds all the given prefix opcodes (usually null).
349 PREFIXES is the number of prefix opcodes. */
350 unsigned int prefixes;
351 unsigned char prefix[MAX_PREFIXES];
352
353 /* Has MMX register operands. */
354 bfd_boolean has_regmmx;
355
356 /* Has XMM register operands. */
357 bfd_boolean has_regxmm;
358
359 /* Has YMM register operands. */
360 bfd_boolean has_regymm;
361
362 /* Has ZMM register operands. */
363 bfd_boolean has_regzmm;
364
365 /* RM and SIB are the modrm byte and the sib byte where the
366 addressing modes of this insn are encoded. */
367 modrm_byte rm;
368 rex_byte rex;
369 rex_byte vrex;
370 sib_byte sib;
371 vex_prefix vex;
372
373 /* Masking attributes. */
374 struct Mask_Operation *mask;
375
376 /* Rounding control and SAE attributes. */
377 struct RC_Operation *rounding;
378
379 /* Broadcasting attributes. */
380 struct Broadcast_Operation *broadcast;
381
382 /* Compressed disp8*N attribute. */
383 unsigned int memshift;
384
385 /* Prefer load or store in encoding. */
386 enum
387 {
388 dir_encoding_default = 0,
389 dir_encoding_load,
390 dir_encoding_store,
391 dir_encoding_swap
392 } dir_encoding;
393
394 /* Prefer 8bit or 32bit displacement in encoding. */
395 enum
396 {
397 disp_encoding_default = 0,
398 disp_encoding_8bit,
399 disp_encoding_32bit
400 } disp_encoding;
401
402 /* Prefer the REX byte in encoding. */
403 bfd_boolean rex_encoding;
404
405 /* Disable instruction size optimization. */
406 bfd_boolean no_optimize;
407
408 /* How to encode vector instructions. */
409 enum
410 {
411 vex_encoding_default = 0,
412 vex_encoding_vex2,
413 vex_encoding_vex3,
414 vex_encoding_evex
415 } vec_encoding;
416
417 /* REP prefix. */
418 const char *rep_prefix;
419
420 /* HLE prefix. */
421 const char *hle_prefix;
422
423 /* Have BND prefix. */
424 const char *bnd_prefix;
425
426 /* Have NOTRACK prefix. */
427 const char *notrack_prefix;
428
429 /* Error message. */
430 enum i386_error error;
431 };
432
433 typedef struct _i386_insn i386_insn;
434
435 /* Link RC type with corresponding string, that'll be looked for in
436 asm. */
437 struct RC_name
438 {
439 enum rc_type type;
440 const char *name;
441 unsigned int len;
442 };
443
444 static const struct RC_name RC_NamesTable[] =
445 {
446 { rne, STRING_COMMA_LEN ("rn-sae") },
447 { rd, STRING_COMMA_LEN ("rd-sae") },
448 { ru, STRING_COMMA_LEN ("ru-sae") },
449 { rz, STRING_COMMA_LEN ("rz-sae") },
450 { saeonly, STRING_COMMA_LEN ("sae") },
451 };
452
453 /* List of chars besides those in app.c:symbol_chars that can start an
454 operand. Used to prevent the scrubber eating vital white-space. */
455 const char extra_symbol_chars[] = "*%-([{}"
456 #ifdef LEX_AT
457 "@"
458 #endif
459 #ifdef LEX_QM
460 "?"
461 #endif
462 ;
463
464 #if (defined (TE_I386AIX) \
465 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
466 && !defined (TE_GNU) \
467 && !defined (TE_LINUX) \
468 && !defined (TE_NACL) \
469 && !defined (TE_FreeBSD) \
470 && !defined (TE_DragonFly) \
471 && !defined (TE_NetBSD)))
472 /* This array holds the chars that always start a comment. If the
473 pre-processor is disabled, these aren't very useful. The option
474 --divide will remove '/' from this list. */
475 const char *i386_comment_chars = "#/";
476 #define SVR4_COMMENT_CHARS 1
477 #define PREFIX_SEPARATOR '\\'
478
479 #else
480 const char *i386_comment_chars = "#";
481 #define PREFIX_SEPARATOR '/'
482 #endif
483
484 /* This array holds the chars that only start a comment at the beginning of
485 a line. If the line seems to have the form '# 123 filename'
486 .line and .file directives will appear in the pre-processed output.
487 Note that input_file.c hand checks for '#' at the beginning of the
488 first line of the input file. This is because the compiler outputs
489 #NO_APP at the beginning of its output.
490 Also note that comments started like this one will always work if
491 '/' isn't otherwise defined. */
492 const char line_comment_chars[] = "#/";
493
494 const char line_separator_chars[] = ";";
495
496 /* Chars that can be used to separate mant from exp in floating point
497 nums. */
498 const char EXP_CHARS[] = "eE";
499
500 /* Chars that mean this number is a floating point constant
501 As in 0f12.456
502 or 0d1.2345e12. */
503 const char FLT_CHARS[] = "fFdDxX";
504
505 /* Tables for lexical analysis. */
506 static char mnemonic_chars[256];
507 static char register_chars[256];
508 static char operand_chars[256];
509 static char identifier_chars[256];
510 static char digit_chars[256];
511
512 /* Lexical macros. */
513 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
514 #define is_operand_char(x) (operand_chars[(unsigned char) x])
515 #define is_register_char(x) (register_chars[(unsigned char) x])
516 #define is_space_char(x) ((x) == ' ')
517 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
518 #define is_digit_char(x) (digit_chars[(unsigned char) x])
519
520 /* All non-digit non-letter characters that may occur in an operand. */
521 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
522
523 /* md_assemble() always leaves the strings it's passed unaltered. To
524 effect this we maintain a stack of saved characters that we've smashed
525 with '\0's (indicating end of strings for various sub-fields of the
526 assembler instruction). */
527 static char save_stack[32];
528 static char *save_stack_p;
529 #define END_STRING_AND_SAVE(s) \
530 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
531 #define RESTORE_END_STRING(s) \
532 do { *(s) = *--save_stack_p; } while (0)
533
534 /* The instruction we're assembling. */
535 static i386_insn i;
536
537 /* Possible templates for current insn. */
538 static const templates *current_templates;
539
540 /* Per instruction expressionS buffers: max displacements & immediates. */
541 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
542 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
543
544 /* Current operand we are working on. */
545 static int this_operand = -1;
546
547 /* We support four different modes. FLAG_CODE variable is used to distinguish
548 these. */
549
550 enum flag_code {
551 CODE_32BIT,
552 CODE_16BIT,
553 CODE_64BIT };
554
555 static enum flag_code flag_code;
556 static unsigned int object_64bit;
557 static unsigned int disallow_64bit_reloc;
558 static int use_rela_relocations = 0;
559
560 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
561 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
562 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
563
564 /* The ELF ABI to use. */
565 enum x86_elf_abi
566 {
567 I386_ABI,
568 X86_64_ABI,
569 X86_64_X32_ABI
570 };
571
572 static enum x86_elf_abi x86_elf_abi = I386_ABI;
573 #endif
574
575 #if defined (TE_PE) || defined (TE_PEP)
576 /* Use big object file format. */
577 static int use_big_obj = 0;
578 #endif
579
580 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
581 /* 1 if generating code for a shared library. */
582 static int shared = 0;
583 #endif
584
585 /* 1 for intel syntax,
586 0 if att syntax. */
587 static int intel_syntax = 0;
588
589 /* 1 for Intel64 ISA,
590 0 if AMD64 ISA. */
591 static int intel64;
592
593 /* 1 for intel mnemonic,
594 0 if att mnemonic. */
595 static int intel_mnemonic = !SYSV386_COMPAT;
596
597 /* 1 if pseudo registers are permitted. */
598 static int allow_pseudo_reg = 0;
599
600 /* 1 if register prefix % not required. */
601 static int allow_naked_reg = 0;
602
603 /* 1 if the assembler should add BND prefix for all control-transferring
604 instructions supporting it, even if this prefix wasn't specified
605 explicitly. */
606 static int add_bnd_prefix = 0;
607
608 /* 1 if pseudo index register, eiz/riz, is allowed . */
609 static int allow_index_reg = 0;
610
611 /* 1 if the assembler should ignore LOCK prefix, even if it was
612 specified explicitly. */
613 static int omit_lock_prefix = 0;
614
615 /* 1 if the assembler should encode lfence, mfence, and sfence as
616 "lock addl $0, (%{re}sp)". */
617 static int avoid_fence = 0;
618
619 /* 1 if the assembler should generate relax relocations. */
620
621 static int generate_relax_relocations
622 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
623
624 static enum check_kind
625 {
626 check_none = 0,
627 check_warning,
628 check_error
629 }
630 sse_check, operand_check = check_warning;
631
632 /* Optimization:
633 1. Clear the REX_W bit with register operand if possible.
634 2. Above plus use 128bit vector instruction to clear the full vector
635 register.
636 */
637 static int optimize = 0;
638
639 /* Optimization:
640 1. Clear the REX_W bit with register operand if possible.
641 2. Above plus use 128bit vector instruction to clear the full vector
642 register.
643 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
644 "testb $imm7,%r8".
645 */
646 static int optimize_for_space = 0;
647
648 /* Register prefix used for error message. */
649 static const char *register_prefix = "%";
650
651 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
652 leave, push, and pop instructions so that gcc has the same stack
653 frame as in 32 bit mode. */
654 static char stackop_size = '\0';
655
656 /* Non-zero to optimize code alignment. */
657 int optimize_align_code = 1;
658
659 /* Non-zero to quieten some warnings. */
660 static int quiet_warnings = 0;
661
662 /* CPU name. */
663 static const char *cpu_arch_name = NULL;
664 static char *cpu_sub_arch_name = NULL;
665
666 /* CPU feature flags. */
667 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
668
669 /* If we have selected a cpu we are generating instructions for. */
670 static int cpu_arch_tune_set = 0;
671
672 /* Cpu we are generating instructions for. */
673 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
674
675 /* CPU feature flags of cpu we are generating instructions for. */
676 static i386_cpu_flags cpu_arch_tune_flags;
677
678 /* CPU instruction set architecture used. */
679 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
680
681 /* CPU feature flags of instruction set architecture used. */
682 i386_cpu_flags cpu_arch_isa_flags;
683
684 /* If set, conditional jumps are not automatically promoted to handle
685 larger than a byte offset. */
686 static unsigned int no_cond_jump_promotion = 0;
687
688 /* Encode SSE instructions with VEX prefix. */
689 static unsigned int sse2avx;
690
691 /* Encode scalar AVX instructions with specific vector length. */
692 static enum
693 {
694 vex128 = 0,
695 vex256
696 } avxscalar;
697
698 /* Encode VEX WIG instructions with specific vex.w. */
699 static enum
700 {
701 vexw0 = 0,
702 vexw1
703 } vexwig;
704
705 /* Encode scalar EVEX LIG instructions with specific vector length. */
706 static enum
707 {
708 evexl128 = 0,
709 evexl256,
710 evexl512
711 } evexlig;
712
713 /* Encode EVEX WIG instructions with specific evex.w. */
714 static enum
715 {
716 evexw0 = 0,
717 evexw1
718 } evexwig;
719
720 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
721 static enum rc_type evexrcig = rne;
722
723 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
724 static symbolS *GOT_symbol;
725
726 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
727 unsigned int x86_dwarf2_return_column;
728
729 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
730 int x86_cie_data_alignment;
731
732 /* Interface to relax_segment.
733 There are 3 major relax states for 386 jump insns because the
734 different types of jumps add different sizes to frags when we're
735 figuring out what sort of jump to choose to reach a given label. */
736
737 /* Types. */
738 #define UNCOND_JUMP 0
739 #define COND_JUMP 1
740 #define COND_JUMP86 2
741
742 /* Sizes. */
743 #define CODE16 1
744 #define SMALL 0
745 #define SMALL16 (SMALL | CODE16)
746 #define BIG 2
747 #define BIG16 (BIG | CODE16)
748
749 #ifndef INLINE
750 #ifdef __GNUC__
751 #define INLINE __inline__
752 #else
753 #define INLINE
754 #endif
755 #endif
756
757 #define ENCODE_RELAX_STATE(type, size) \
758 ((relax_substateT) (((type) << 2) | (size)))
759 #define TYPE_FROM_RELAX_STATE(s) \
760 ((s) >> 2)
761 #define DISP_SIZE_FROM_RELAX_STATE(s) \
762 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
763
764 /* This table is used by relax_frag to promote short jumps to long
765 ones where necessary. SMALL (short) jumps may be promoted to BIG
766 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
767 don't allow a short jump in a 32 bit code segment to be promoted to
768 a 16 bit offset jump because it's slower (requires data size
769 prefix), and doesn't work, unless the destination is in the bottom
770 64k of the code segment (The top 16 bits of eip are zeroed). */
771
772 const relax_typeS md_relax_table[] =
773 {
774 /* The fields are:
775 1) most positive reach of this state,
776 2) most negative reach of this state,
777 3) how many bytes this mode will have in the variable part of the frag
778 4) which index into the table to try if we can't fit into this one. */
779
780 /* UNCOND_JUMP states. */
781 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
782 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
783 /* dword jmp adds 4 bytes to frag:
784 0 extra opcode bytes, 4 displacement bytes. */
785 {0, 0, 4, 0},
786 /* word jmp adds 2 byte2 to frag:
787 0 extra opcode bytes, 2 displacement bytes. */
788 {0, 0, 2, 0},
789
790 /* COND_JUMP states. */
791 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
792 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
793 /* dword conditionals adds 5 bytes to frag:
794 1 extra opcode byte, 4 displacement bytes. */
795 {0, 0, 5, 0},
796 /* word conditionals add 3 bytes to frag:
797 1 extra opcode byte, 2 displacement bytes. */
798 {0, 0, 3, 0},
799
800 /* COND_JUMP86 states. */
801 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
802 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
803 /* dword conditionals adds 5 bytes to frag:
804 1 extra opcode byte, 4 displacement bytes. */
805 {0, 0, 5, 0},
806 /* word conditionals add 4 bytes to frag:
807 1 displacement byte and a 3 byte long branch insn. */
808 {0, 0, 4, 0}
809 };
810
811 static const arch_entry cpu_arch[] =
812 {
813 /* Do not replace the first two entries - i386_target_format()
814 relies on them being there in this order. */
815 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
816 CPU_GENERIC32_FLAGS, 0 },
817 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
818 CPU_GENERIC64_FLAGS, 0 },
819 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
820 CPU_NONE_FLAGS, 0 },
821 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
822 CPU_I186_FLAGS, 0 },
823 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
824 CPU_I286_FLAGS, 0 },
825 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
826 CPU_I386_FLAGS, 0 },
827 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
828 CPU_I486_FLAGS, 0 },
829 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
830 CPU_I586_FLAGS, 0 },
831 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
832 CPU_I686_FLAGS, 0 },
833 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
834 CPU_I586_FLAGS, 0 },
835 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
836 CPU_PENTIUMPRO_FLAGS, 0 },
837 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
838 CPU_P2_FLAGS, 0 },
839 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
840 CPU_P3_FLAGS, 0 },
841 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
842 CPU_P4_FLAGS, 0 },
843 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
844 CPU_CORE_FLAGS, 0 },
845 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
846 CPU_NOCONA_FLAGS, 0 },
847 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
848 CPU_CORE_FLAGS, 1 },
849 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
850 CPU_CORE_FLAGS, 0 },
851 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
852 CPU_CORE2_FLAGS, 1 },
853 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
854 CPU_CORE2_FLAGS, 0 },
855 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
856 CPU_COREI7_FLAGS, 0 },
857 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
858 CPU_L1OM_FLAGS, 0 },
859 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
860 CPU_K1OM_FLAGS, 0 },
861 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
862 CPU_IAMCU_FLAGS, 0 },
863 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
864 CPU_K6_FLAGS, 0 },
865 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
866 CPU_K6_2_FLAGS, 0 },
867 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
868 CPU_ATHLON_FLAGS, 0 },
869 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
870 CPU_K8_FLAGS, 1 },
871 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
872 CPU_K8_FLAGS, 0 },
873 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
874 CPU_K8_FLAGS, 0 },
875 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
876 CPU_AMDFAM10_FLAGS, 0 },
877 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
878 CPU_BDVER1_FLAGS, 0 },
879 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
880 CPU_BDVER2_FLAGS, 0 },
881 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
882 CPU_BDVER3_FLAGS, 0 },
883 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
884 CPU_BDVER4_FLAGS, 0 },
885 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
886 CPU_ZNVER1_FLAGS, 0 },
887 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
888 CPU_ZNVER2_FLAGS, 0 },
889 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
890 CPU_BTVER1_FLAGS, 0 },
891 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
892 CPU_BTVER2_FLAGS, 0 },
893 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
894 CPU_8087_FLAGS, 0 },
895 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
896 CPU_287_FLAGS, 0 },
897 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
898 CPU_387_FLAGS, 0 },
899 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
900 CPU_687_FLAGS, 0 },
901 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
902 CPU_CMOV_FLAGS, 0 },
903 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
904 CPU_FXSR_FLAGS, 0 },
905 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
906 CPU_MMX_FLAGS, 0 },
907 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
908 CPU_SSE_FLAGS, 0 },
909 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
910 CPU_SSE2_FLAGS, 0 },
911 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
912 CPU_SSE3_FLAGS, 0 },
913 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
914 CPU_SSSE3_FLAGS, 0 },
915 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
916 CPU_SSE4_1_FLAGS, 0 },
917 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
918 CPU_SSE4_2_FLAGS, 0 },
919 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
920 CPU_SSE4_2_FLAGS, 0 },
921 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
922 CPU_AVX_FLAGS, 0 },
923 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
924 CPU_AVX2_FLAGS, 0 },
925 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
926 CPU_AVX512F_FLAGS, 0 },
927 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
928 CPU_AVX512CD_FLAGS, 0 },
929 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
930 CPU_AVX512ER_FLAGS, 0 },
931 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
932 CPU_AVX512PF_FLAGS, 0 },
933 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
934 CPU_AVX512DQ_FLAGS, 0 },
935 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
936 CPU_AVX512BW_FLAGS, 0 },
937 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
938 CPU_AVX512VL_FLAGS, 0 },
939 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
940 CPU_VMX_FLAGS, 0 },
941 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
942 CPU_VMFUNC_FLAGS, 0 },
943 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
944 CPU_SMX_FLAGS, 0 },
945 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
946 CPU_XSAVE_FLAGS, 0 },
947 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
948 CPU_XSAVEOPT_FLAGS, 0 },
949 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
950 CPU_XSAVEC_FLAGS, 0 },
951 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
952 CPU_XSAVES_FLAGS, 0 },
953 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
954 CPU_AES_FLAGS, 0 },
955 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
956 CPU_PCLMUL_FLAGS, 0 },
957 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
958 CPU_PCLMUL_FLAGS, 1 },
959 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
960 CPU_FSGSBASE_FLAGS, 0 },
961 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
962 CPU_RDRND_FLAGS, 0 },
963 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
964 CPU_F16C_FLAGS, 0 },
965 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
966 CPU_BMI2_FLAGS, 0 },
967 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
968 CPU_FMA_FLAGS, 0 },
969 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
970 CPU_FMA4_FLAGS, 0 },
971 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
972 CPU_XOP_FLAGS, 0 },
973 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
974 CPU_LWP_FLAGS, 0 },
975 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
976 CPU_MOVBE_FLAGS, 0 },
977 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
978 CPU_CX16_FLAGS, 0 },
979 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
980 CPU_EPT_FLAGS, 0 },
981 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
982 CPU_LZCNT_FLAGS, 0 },
983 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
984 CPU_HLE_FLAGS, 0 },
985 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
986 CPU_RTM_FLAGS, 0 },
987 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
988 CPU_INVPCID_FLAGS, 0 },
989 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
990 CPU_CLFLUSH_FLAGS, 0 },
991 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
992 CPU_NOP_FLAGS, 0 },
993 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
994 CPU_SYSCALL_FLAGS, 0 },
995 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
996 CPU_RDTSCP_FLAGS, 0 },
997 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
998 CPU_3DNOW_FLAGS, 0 },
999 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1000 CPU_3DNOWA_FLAGS, 0 },
1001 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1002 CPU_PADLOCK_FLAGS, 0 },
1003 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1004 CPU_SVME_FLAGS, 1 },
1005 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1006 CPU_SVME_FLAGS, 0 },
1007 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1008 CPU_SSE4A_FLAGS, 0 },
1009 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1010 CPU_ABM_FLAGS, 0 },
1011 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1012 CPU_BMI_FLAGS, 0 },
1013 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1014 CPU_TBM_FLAGS, 0 },
1015 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1016 CPU_ADX_FLAGS, 0 },
1017 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1018 CPU_RDSEED_FLAGS, 0 },
1019 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1020 CPU_PRFCHW_FLAGS, 0 },
1021 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1022 CPU_SMAP_FLAGS, 0 },
1023 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1024 CPU_MPX_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1026 CPU_SHA_FLAGS, 0 },
1027 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1028 CPU_CLFLUSHOPT_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1030 CPU_PREFETCHWT1_FLAGS, 0 },
1031 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1032 CPU_SE1_FLAGS, 0 },
1033 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1034 CPU_CLWB_FLAGS, 0 },
1035 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1036 CPU_AVX512IFMA_FLAGS, 0 },
1037 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1038 CPU_AVX512VBMI_FLAGS, 0 },
1039 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1040 CPU_AVX512_4FMAPS_FLAGS, 0 },
1041 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1042 CPU_AVX512_4VNNIW_FLAGS, 0 },
1043 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1044 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1045 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1046 CPU_AVX512_VBMI2_FLAGS, 0 },
1047 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1048 CPU_AVX512_VNNI_FLAGS, 0 },
1049 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1050 CPU_AVX512_BITALG_FLAGS, 0 },
1051 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1052 CPU_CLZERO_FLAGS, 0 },
1053 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1054 CPU_MWAITX_FLAGS, 0 },
1055 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1056 CPU_OSPKE_FLAGS, 0 },
1057 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1058 CPU_RDPID_FLAGS, 0 },
1059 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1060 CPU_PTWRITE_FLAGS, 0 },
1061 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1062 CPU_IBT_FLAGS, 0 },
1063 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1064 CPU_SHSTK_FLAGS, 0 },
1065 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1066 CPU_GFNI_FLAGS, 0 },
1067 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1068 CPU_VAES_FLAGS, 0 },
1069 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1070 CPU_VPCLMULQDQ_FLAGS, 0 },
1071 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1072 CPU_WBNOINVD_FLAGS, 0 },
1073 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1074 CPU_PCONFIG_FLAGS, 0 },
1075 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1076 CPU_WAITPKG_FLAGS, 0 },
1077 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1078 CPU_CLDEMOTE_FLAGS, 0 },
1079 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1080 CPU_MOVDIRI_FLAGS, 0 },
1081 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1082 CPU_MOVDIR64B_FLAGS, 0 },
1083 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1084 CPU_AVX512_BF16_FLAGS, 0 },
1085 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1086 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1087 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1088 CPU_ENQCMD_FLAGS, 0 },
1089 };
1090
1091 static const noarch_entry cpu_noarch[] =
1092 {
1093 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1094 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1095 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1096 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1097 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1098 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1099 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1100 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1101 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1102 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1103 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1104 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1105 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1106 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1107 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1108 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1109 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1110 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1111 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1112 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1113 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1114 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1115 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1116 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1117 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1118 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1119 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1120 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1121 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1122 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1123 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1124 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1125 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1126 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1127 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1128 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1129 { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1130 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1131 };
1132
1133 #ifdef I386COFF
1134 /* Like s_lcomm_internal in gas/read.c but the alignment string
1135 is allowed to be optional. */
1136
1137 static symbolS *
1138 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1139 {
1140 addressT align = 0;
1141
1142 SKIP_WHITESPACE ();
1143
1144 if (needs_align
1145 && *input_line_pointer == ',')
1146 {
1147 align = parse_align (needs_align - 1);
1148
1149 if (align == (addressT) -1)
1150 return NULL;
1151 }
1152 else
1153 {
1154 if (size >= 8)
1155 align = 3;
1156 else if (size >= 4)
1157 align = 2;
1158 else if (size >= 2)
1159 align = 1;
1160 else
1161 align = 0;
1162 }
1163
1164 bss_alloc (symbolP, size, align);
1165 return symbolP;
1166 }
1167
1168 static void
1169 pe_lcomm (int needs_align)
1170 {
1171 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1172 }
1173 #endif
1174
1175 const pseudo_typeS md_pseudo_table[] =
1176 {
1177 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1178 {"align", s_align_bytes, 0},
1179 #else
1180 {"align", s_align_ptwo, 0},
1181 #endif
1182 {"arch", set_cpu_arch, 0},
1183 #ifndef I386COFF
1184 {"bss", s_bss, 0},
1185 #else
1186 {"lcomm", pe_lcomm, 1},
1187 #endif
1188 {"ffloat", float_cons, 'f'},
1189 {"dfloat", float_cons, 'd'},
1190 {"tfloat", float_cons, 'x'},
1191 {"value", cons, 2},
1192 {"slong", signed_cons, 4},
1193 {"noopt", s_ignore, 0},
1194 {"optim", s_ignore, 0},
1195 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1196 {"code16", set_code_flag, CODE_16BIT},
1197 {"code32", set_code_flag, CODE_32BIT},
1198 #ifdef BFD64
1199 {"code64", set_code_flag, CODE_64BIT},
1200 #endif
1201 {"intel_syntax", set_intel_syntax, 1},
1202 {"att_syntax", set_intel_syntax, 0},
1203 {"intel_mnemonic", set_intel_mnemonic, 1},
1204 {"att_mnemonic", set_intel_mnemonic, 0},
1205 {"allow_index_reg", set_allow_index_reg, 1},
1206 {"disallow_index_reg", set_allow_index_reg, 0},
1207 {"sse_check", set_check, 0},
1208 {"operand_check", set_check, 1},
1209 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1210 {"largecomm", handle_large_common, 0},
1211 #else
1212 {"file", dwarf2_directive_file, 0},
1213 {"loc", dwarf2_directive_loc, 0},
1214 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1215 #endif
1216 #ifdef TE_PE
1217 {"secrel32", pe_directive_secrel, 0},
1218 #endif
1219 {0, 0, 0}
1220 };
1221
1222 /* For interface with expression (). */
1223 extern char *input_line_pointer;
1224
1225 /* Hash table for instruction mnemonic lookup. */
1226 static struct hash_control *op_hash;
1227
1228 /* Hash table for register lookup. */
1229 static struct hash_control *reg_hash;
1230 \f
1231 /* Various efficient no-op patterns for aligning code labels.
1232 Note: Don't try to assemble the instructions in the comments.
1233 0L and 0w are not legal. */
1234 static const unsigned char f32_1[] =
1235 {0x90}; /* nop */
1236 static const unsigned char f32_2[] =
1237 {0x66,0x90}; /* xchg %ax,%ax */
1238 static const unsigned char f32_3[] =
1239 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1240 static const unsigned char f32_4[] =
1241 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1242 static const unsigned char f32_6[] =
1243 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1244 static const unsigned char f32_7[] =
1245 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1246 static const unsigned char f16_3[] =
1247 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1248 static const unsigned char f16_4[] =
1249 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1250 static const unsigned char jump_disp8[] =
1251 {0xeb}; /* jmp disp8 */
1252 static const unsigned char jump32_disp32[] =
1253 {0xe9}; /* jmp disp32 */
1254 static const unsigned char jump16_disp32[] =
1255 {0x66,0xe9}; /* jmp disp32 */
1256 /* 32-bit NOPs patterns. */
1257 static const unsigned char *const f32_patt[] = {
1258 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1259 };
1260 /* 16-bit NOPs patterns. */
1261 static const unsigned char *const f16_patt[] = {
1262 f32_1, f32_2, f16_3, f16_4
1263 };
1264 /* nopl (%[re]ax) */
1265 static const unsigned char alt_3[] =
1266 {0x0f,0x1f,0x00};
1267 /* nopl 0(%[re]ax) */
1268 static const unsigned char alt_4[] =
1269 {0x0f,0x1f,0x40,0x00};
1270 /* nopl 0(%[re]ax,%[re]ax,1) */
1271 static const unsigned char alt_5[] =
1272 {0x0f,0x1f,0x44,0x00,0x00};
1273 /* nopw 0(%[re]ax,%[re]ax,1) */
1274 static const unsigned char alt_6[] =
1275 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1276 /* nopl 0L(%[re]ax) */
1277 static const unsigned char alt_7[] =
1278 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1279 /* nopl 0L(%[re]ax,%[re]ax,1) */
1280 static const unsigned char alt_8[] =
1281 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1282 /* nopw 0L(%[re]ax,%[re]ax,1) */
1283 static const unsigned char alt_9[] =
1284 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1285 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1286 static const unsigned char alt_10[] =
1287 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1288 /* data16 nopw %cs:0L(%eax,%eax,1) */
1289 static const unsigned char alt_11[] =
1290 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1291 /* 32-bit and 64-bit NOPs patterns. */
1292 static const unsigned char *const alt_patt[] = {
1293 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1294 alt_9, alt_10, alt_11
1295 };
1296
1297 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1298 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1299
1300 static void
1301 i386_output_nops (char *where, const unsigned char *const *patt,
1302 int count, int max_single_nop_size)
1303
1304 {
1305 /* Place the longer NOP first. */
1306 int last;
1307 int offset;
1308 const unsigned char *nops;
1309
1310 if (max_single_nop_size < 1)
1311 {
1312 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1313 max_single_nop_size);
1314 return;
1315 }
1316
1317 nops = patt[max_single_nop_size - 1];
1318
1319 /* Use the smaller one if the requsted one isn't available. */
1320 if (nops == NULL)
1321 {
1322 max_single_nop_size--;
1323 nops = patt[max_single_nop_size - 1];
1324 }
1325
1326 last = count % max_single_nop_size;
1327
1328 count -= last;
1329 for (offset = 0; offset < count; offset += max_single_nop_size)
1330 memcpy (where + offset, nops, max_single_nop_size);
1331
1332 if (last)
1333 {
1334 nops = patt[last - 1];
1335 if (nops == NULL)
1336 {
1337 /* Use the smaller one plus one-byte NOP if the needed one
1338 isn't available. */
1339 last--;
1340 nops = patt[last - 1];
1341 memcpy (where + offset, nops, last);
1342 where[offset + last] = *patt[0];
1343 }
1344 else
1345 memcpy (where + offset, nops, last);
1346 }
1347 }
1348
1349 static INLINE int
1350 fits_in_imm7 (offsetT num)
1351 {
1352 return (num & 0x7f) == num;
1353 }
1354
1355 static INLINE int
1356 fits_in_imm31 (offsetT num)
1357 {
1358 return (num & 0x7fffffff) == num;
1359 }
1360
1361 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1362 single NOP instruction LIMIT. */
1363
1364 void
1365 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1366 {
1367 const unsigned char *const *patt = NULL;
1368 int max_single_nop_size;
1369 /* Maximum number of NOPs before switching to jump over NOPs. */
1370 int max_number_of_nops;
1371
1372 switch (fragP->fr_type)
1373 {
1374 case rs_fill_nop:
1375 case rs_align_code:
1376 break;
1377 default:
1378 return;
1379 }
1380
1381 /* We need to decide which NOP sequence to use for 32bit and
1382 64bit. When -mtune= is used:
1383
1384 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1385 PROCESSOR_GENERIC32, f32_patt will be used.
1386 2. For the rest, alt_patt will be used.
1387
1388 When -mtune= isn't used, alt_patt will be used if
1389 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1390 be used.
1391
1392 When -march= or .arch is used, we can't use anything beyond
1393 cpu_arch_isa_flags. */
1394
1395 if (flag_code == CODE_16BIT)
1396 {
1397 patt = f16_patt;
1398 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1399 /* Limit number of NOPs to 2 in 16-bit mode. */
1400 max_number_of_nops = 2;
1401 }
1402 else
1403 {
1404 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1405 {
1406 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1407 switch (cpu_arch_tune)
1408 {
1409 case PROCESSOR_UNKNOWN:
1410 /* We use cpu_arch_isa_flags to check if we SHOULD
1411 optimize with nops. */
1412 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1413 patt = alt_patt;
1414 else
1415 patt = f32_patt;
1416 break;
1417 case PROCESSOR_PENTIUM4:
1418 case PROCESSOR_NOCONA:
1419 case PROCESSOR_CORE:
1420 case PROCESSOR_CORE2:
1421 case PROCESSOR_COREI7:
1422 case PROCESSOR_L1OM:
1423 case PROCESSOR_K1OM:
1424 case PROCESSOR_GENERIC64:
1425 case PROCESSOR_K6:
1426 case PROCESSOR_ATHLON:
1427 case PROCESSOR_K8:
1428 case PROCESSOR_AMDFAM10:
1429 case PROCESSOR_BD:
1430 case PROCESSOR_ZNVER:
1431 case PROCESSOR_BT:
1432 patt = alt_patt;
1433 break;
1434 case PROCESSOR_I386:
1435 case PROCESSOR_I486:
1436 case PROCESSOR_PENTIUM:
1437 case PROCESSOR_PENTIUMPRO:
1438 case PROCESSOR_IAMCU:
1439 case PROCESSOR_GENERIC32:
1440 patt = f32_patt;
1441 break;
1442 }
1443 }
1444 else
1445 {
1446 switch (fragP->tc_frag_data.tune)
1447 {
1448 case PROCESSOR_UNKNOWN:
1449 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1450 PROCESSOR_UNKNOWN. */
1451 abort ();
1452 break;
1453
1454 case PROCESSOR_I386:
1455 case PROCESSOR_I486:
1456 case PROCESSOR_PENTIUM:
1457 case PROCESSOR_IAMCU:
1458 case PROCESSOR_K6:
1459 case PROCESSOR_ATHLON:
1460 case PROCESSOR_K8:
1461 case PROCESSOR_AMDFAM10:
1462 case PROCESSOR_BD:
1463 case PROCESSOR_ZNVER:
1464 case PROCESSOR_BT:
1465 case PROCESSOR_GENERIC32:
1466 /* We use cpu_arch_isa_flags to check if we CAN optimize
1467 with nops. */
1468 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1469 patt = alt_patt;
1470 else
1471 patt = f32_patt;
1472 break;
1473 case PROCESSOR_PENTIUMPRO:
1474 case PROCESSOR_PENTIUM4:
1475 case PROCESSOR_NOCONA:
1476 case PROCESSOR_CORE:
1477 case PROCESSOR_CORE2:
1478 case PROCESSOR_COREI7:
1479 case PROCESSOR_L1OM:
1480 case PROCESSOR_K1OM:
1481 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1482 patt = alt_patt;
1483 else
1484 patt = f32_patt;
1485 break;
1486 case PROCESSOR_GENERIC64:
1487 patt = alt_patt;
1488 break;
1489 }
1490 }
1491
1492 if (patt == f32_patt)
1493 {
1494 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1495 /* Limit number of NOPs to 2 for older processors. */
1496 max_number_of_nops = 2;
1497 }
1498 else
1499 {
1500 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1501 /* Limit number of NOPs to 7 for newer processors. */
1502 max_number_of_nops = 7;
1503 }
1504 }
1505
1506 if (limit == 0)
1507 limit = max_single_nop_size;
1508
1509 if (fragP->fr_type == rs_fill_nop)
1510 {
1511 /* Output NOPs for .nop directive. */
1512 if (limit > max_single_nop_size)
1513 {
1514 as_bad_where (fragP->fr_file, fragP->fr_line,
1515 _("invalid single nop size: %d "
1516 "(expect within [0, %d])"),
1517 limit, max_single_nop_size);
1518 return;
1519 }
1520 }
1521 else
1522 fragP->fr_var = count;
1523
1524 if ((count / max_single_nop_size) > max_number_of_nops)
1525 {
1526 /* Generate jump over NOPs. */
1527 offsetT disp = count - 2;
1528 if (fits_in_imm7 (disp))
1529 {
1530 /* Use "jmp disp8" if possible. */
1531 count = disp;
1532 where[0] = jump_disp8[0];
1533 where[1] = count;
1534 where += 2;
1535 }
1536 else
1537 {
1538 unsigned int size_of_jump;
1539
1540 if (flag_code == CODE_16BIT)
1541 {
1542 where[0] = jump16_disp32[0];
1543 where[1] = jump16_disp32[1];
1544 size_of_jump = 2;
1545 }
1546 else
1547 {
1548 where[0] = jump32_disp32[0];
1549 size_of_jump = 1;
1550 }
1551
1552 count -= size_of_jump + 4;
1553 if (!fits_in_imm31 (count))
1554 {
1555 as_bad_where (fragP->fr_file, fragP->fr_line,
1556 _("jump over nop padding out of range"));
1557 return;
1558 }
1559
1560 md_number_to_chars (where + size_of_jump, count, 4);
1561 where += size_of_jump + 4;
1562 }
1563 }
1564
1565 /* Generate multiple NOPs. */
1566 i386_output_nops (where, patt, count, limit);
1567 }
1568
1569 static INLINE int
1570 operand_type_all_zero (const union i386_operand_type *x)
1571 {
1572 switch (ARRAY_SIZE(x->array))
1573 {
1574 case 3:
1575 if (x->array[2])
1576 return 0;
1577 /* Fall through. */
1578 case 2:
1579 if (x->array[1])
1580 return 0;
1581 /* Fall through. */
1582 case 1:
1583 return !x->array[0];
1584 default:
1585 abort ();
1586 }
1587 }
1588
1589 static INLINE void
1590 operand_type_set (union i386_operand_type *x, unsigned int v)
1591 {
1592 switch (ARRAY_SIZE(x->array))
1593 {
1594 case 3:
1595 x->array[2] = v;
1596 /* Fall through. */
1597 case 2:
1598 x->array[1] = v;
1599 /* Fall through. */
1600 case 1:
1601 x->array[0] = v;
1602 /* Fall through. */
1603 break;
1604 default:
1605 abort ();
1606 }
1607 }
1608
1609 static INLINE int
1610 operand_type_equal (const union i386_operand_type *x,
1611 const union i386_operand_type *y)
1612 {
1613 switch (ARRAY_SIZE(x->array))
1614 {
1615 case 3:
1616 if (x->array[2] != y->array[2])
1617 return 0;
1618 /* Fall through. */
1619 case 2:
1620 if (x->array[1] != y->array[1])
1621 return 0;
1622 /* Fall through. */
1623 case 1:
1624 return x->array[0] == y->array[0];
1625 break;
1626 default:
1627 abort ();
1628 }
1629 }
1630
1631 static INLINE int
1632 cpu_flags_all_zero (const union i386_cpu_flags *x)
1633 {
1634 switch (ARRAY_SIZE(x->array))
1635 {
1636 case 4:
1637 if (x->array[3])
1638 return 0;
1639 /* Fall through. */
1640 case 3:
1641 if (x->array[2])
1642 return 0;
1643 /* Fall through. */
1644 case 2:
1645 if (x->array[1])
1646 return 0;
1647 /* Fall through. */
1648 case 1:
1649 return !x->array[0];
1650 default:
1651 abort ();
1652 }
1653 }
1654
1655 static INLINE int
1656 cpu_flags_equal (const union i386_cpu_flags *x,
1657 const union i386_cpu_flags *y)
1658 {
1659 switch (ARRAY_SIZE(x->array))
1660 {
1661 case 4:
1662 if (x->array[3] != y->array[3])
1663 return 0;
1664 /* Fall through. */
1665 case 3:
1666 if (x->array[2] != y->array[2])
1667 return 0;
1668 /* Fall through. */
1669 case 2:
1670 if (x->array[1] != y->array[1])
1671 return 0;
1672 /* Fall through. */
1673 case 1:
1674 return x->array[0] == y->array[0];
1675 break;
1676 default:
1677 abort ();
1678 }
1679 }
1680
1681 static INLINE int
1682 cpu_flags_check_cpu64 (i386_cpu_flags f)
1683 {
1684 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1685 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1686 }
1687
1688 static INLINE i386_cpu_flags
1689 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1690 {
1691 switch (ARRAY_SIZE (x.array))
1692 {
1693 case 4:
1694 x.array [3] &= y.array [3];
1695 /* Fall through. */
1696 case 3:
1697 x.array [2] &= y.array [2];
1698 /* Fall through. */
1699 case 2:
1700 x.array [1] &= y.array [1];
1701 /* Fall through. */
1702 case 1:
1703 x.array [0] &= y.array [0];
1704 break;
1705 default:
1706 abort ();
1707 }
1708 return x;
1709 }
1710
1711 static INLINE i386_cpu_flags
1712 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1713 {
1714 switch (ARRAY_SIZE (x.array))
1715 {
1716 case 4:
1717 x.array [3] |= y.array [3];
1718 /* Fall through. */
1719 case 3:
1720 x.array [2] |= y.array [2];
1721 /* Fall through. */
1722 case 2:
1723 x.array [1] |= y.array [1];
1724 /* Fall through. */
1725 case 1:
1726 x.array [0] |= y.array [0];
1727 break;
1728 default:
1729 abort ();
1730 }
1731 return x;
1732 }
1733
1734 static INLINE i386_cpu_flags
1735 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1736 {
1737 switch (ARRAY_SIZE (x.array))
1738 {
1739 case 4:
1740 x.array [3] &= ~y.array [3];
1741 /* Fall through. */
1742 case 3:
1743 x.array [2] &= ~y.array [2];
1744 /* Fall through. */
1745 case 2:
1746 x.array [1] &= ~y.array [1];
1747 /* Fall through. */
1748 case 1:
1749 x.array [0] &= ~y.array [0];
1750 break;
1751 default:
1752 abort ();
1753 }
1754 return x;
1755 }
1756
1757 #define CPU_FLAGS_ARCH_MATCH 0x1
1758 #define CPU_FLAGS_64BIT_MATCH 0x2
1759
1760 #define CPU_FLAGS_PERFECT_MATCH \
1761 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1762
1763 /* Return CPU flags match bits. */
1764
1765 static int
1766 cpu_flags_match (const insn_template *t)
1767 {
1768 i386_cpu_flags x = t->cpu_flags;
1769 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1770
1771 x.bitfield.cpu64 = 0;
1772 x.bitfield.cpuno64 = 0;
1773
1774 if (cpu_flags_all_zero (&x))
1775 {
1776 /* This instruction is available on all archs. */
1777 match |= CPU_FLAGS_ARCH_MATCH;
1778 }
1779 else
1780 {
1781 /* This instruction is available only on some archs. */
1782 i386_cpu_flags cpu = cpu_arch_flags;
1783
1784 /* AVX512VL is no standalone feature - match it and then strip it. */
1785 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1786 return match;
1787 x.bitfield.cpuavx512vl = 0;
1788
1789 cpu = cpu_flags_and (x, cpu);
1790 if (!cpu_flags_all_zero (&cpu))
1791 {
1792 if (x.bitfield.cpuavx)
1793 {
1794 /* We need to check a few extra flags with AVX. */
1795 if (cpu.bitfield.cpuavx
1796 && (!t->opcode_modifier.sse2avx || sse2avx)
1797 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1798 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1799 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1800 match |= CPU_FLAGS_ARCH_MATCH;
1801 }
1802 else if (x.bitfield.cpuavx512f)
1803 {
1804 /* We need to check a few extra flags with AVX512F. */
1805 if (cpu.bitfield.cpuavx512f
1806 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1807 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1808 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1809 match |= CPU_FLAGS_ARCH_MATCH;
1810 }
1811 else
1812 match |= CPU_FLAGS_ARCH_MATCH;
1813 }
1814 }
1815 return match;
1816 }
1817
1818 static INLINE i386_operand_type
1819 operand_type_and (i386_operand_type x, i386_operand_type y)
1820 {
1821 switch (ARRAY_SIZE (x.array))
1822 {
1823 case 3:
1824 x.array [2] &= y.array [2];
1825 /* Fall through. */
1826 case 2:
1827 x.array [1] &= y.array [1];
1828 /* Fall through. */
1829 case 1:
1830 x.array [0] &= y.array [0];
1831 break;
1832 default:
1833 abort ();
1834 }
1835 return x;
1836 }
1837
1838 static INLINE i386_operand_type
1839 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1840 {
1841 switch (ARRAY_SIZE (x.array))
1842 {
1843 case 3:
1844 x.array [2] &= ~y.array [2];
1845 /* Fall through. */
1846 case 2:
1847 x.array [1] &= ~y.array [1];
1848 /* Fall through. */
1849 case 1:
1850 x.array [0] &= ~y.array [0];
1851 break;
1852 default:
1853 abort ();
1854 }
1855 return x;
1856 }
1857
1858 static INLINE i386_operand_type
1859 operand_type_or (i386_operand_type x, i386_operand_type y)
1860 {
1861 switch (ARRAY_SIZE (x.array))
1862 {
1863 case 3:
1864 x.array [2] |= y.array [2];
1865 /* Fall through. */
1866 case 2:
1867 x.array [1] |= y.array [1];
1868 /* Fall through. */
1869 case 1:
1870 x.array [0] |= y.array [0];
1871 break;
1872 default:
1873 abort ();
1874 }
1875 return x;
1876 }
1877
1878 static INLINE i386_operand_type
1879 operand_type_xor (i386_operand_type x, i386_operand_type y)
1880 {
1881 switch (ARRAY_SIZE (x.array))
1882 {
1883 case 3:
1884 x.array [2] ^= y.array [2];
1885 /* Fall through. */
1886 case 2:
1887 x.array [1] ^= y.array [1];
1888 /* Fall through. */
1889 case 1:
1890 x.array [0] ^= y.array [0];
1891 break;
1892 default:
1893 abort ();
1894 }
1895 return x;
1896 }
1897
1898 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1899 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1900 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1901 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1902 static const i386_operand_type anydisp
1903 = OPERAND_TYPE_ANYDISP;
1904 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1905 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1906 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1907 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1908 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1909 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1910 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1911 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1912 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1913 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1914 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1915 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
1916
1917 enum operand_type
1918 {
1919 reg,
1920 imm,
1921 disp,
1922 anymem
1923 };
1924
1925 static INLINE int
1926 operand_type_check (i386_operand_type t, enum operand_type c)
1927 {
1928 switch (c)
1929 {
1930 case reg:
1931 return t.bitfield.reg;
1932
1933 case imm:
1934 return (t.bitfield.imm8
1935 || t.bitfield.imm8s
1936 || t.bitfield.imm16
1937 || t.bitfield.imm32
1938 || t.bitfield.imm32s
1939 || t.bitfield.imm64);
1940
1941 case disp:
1942 return (t.bitfield.disp8
1943 || t.bitfield.disp16
1944 || t.bitfield.disp32
1945 || t.bitfield.disp32s
1946 || t.bitfield.disp64);
1947
1948 case anymem:
1949 return (t.bitfield.disp8
1950 || t.bitfield.disp16
1951 || t.bitfield.disp32
1952 || t.bitfield.disp32s
1953 || t.bitfield.disp64
1954 || t.bitfield.baseindex);
1955
1956 default:
1957 abort ();
1958 }
1959
1960 return 0;
1961 }
1962
1963 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
1964 between operand GIVEN and opeand WANTED for instruction template T. */
1965
1966 static INLINE int
1967 match_operand_size (const insn_template *t, unsigned int wanted,
1968 unsigned int given)
1969 {
1970 return !((i.types[given].bitfield.byte
1971 && !t->operand_types[wanted].bitfield.byte)
1972 || (i.types[given].bitfield.word
1973 && !t->operand_types[wanted].bitfield.word)
1974 || (i.types[given].bitfield.dword
1975 && !t->operand_types[wanted].bitfield.dword)
1976 || (i.types[given].bitfield.qword
1977 && !t->operand_types[wanted].bitfield.qword)
1978 || (i.types[given].bitfield.tbyte
1979 && !t->operand_types[wanted].bitfield.tbyte));
1980 }
1981
1982 /* Return 1 if there is no conflict in SIMD register between operand
1983 GIVEN and opeand WANTED for instruction template T. */
1984
1985 static INLINE int
1986 match_simd_size (const insn_template *t, unsigned int wanted,
1987 unsigned int given)
1988 {
1989 return !((i.types[given].bitfield.xmmword
1990 && !t->operand_types[wanted].bitfield.xmmword)
1991 || (i.types[given].bitfield.ymmword
1992 && !t->operand_types[wanted].bitfield.ymmword)
1993 || (i.types[given].bitfield.zmmword
1994 && !t->operand_types[wanted].bitfield.zmmword));
1995 }
1996
1997 /* Return 1 if there is no conflict in any size between operand GIVEN
1998 and opeand WANTED for instruction template T. */
1999
2000 static INLINE int
2001 match_mem_size (const insn_template *t, unsigned int wanted,
2002 unsigned int given)
2003 {
2004 return (match_operand_size (t, wanted, given)
2005 && !((i.types[given].bitfield.unspecified
2006 && !i.broadcast
2007 && !t->operand_types[wanted].bitfield.unspecified)
2008 || (i.types[given].bitfield.fword
2009 && !t->operand_types[wanted].bitfield.fword)
2010 /* For scalar opcode templates to allow register and memory
2011 operands at the same time, some special casing is needed
2012 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2013 down-conversion vpmov*. */
2014 || ((t->operand_types[wanted].bitfield.regsimd
2015 && !t->opcode_modifier.broadcast
2016 && (t->operand_types[wanted].bitfield.byte
2017 || t->operand_types[wanted].bitfield.word
2018 || t->operand_types[wanted].bitfield.dword
2019 || t->operand_types[wanted].bitfield.qword))
2020 ? (i.types[given].bitfield.xmmword
2021 || i.types[given].bitfield.ymmword
2022 || i.types[given].bitfield.zmmword)
2023 : !match_simd_size(t, wanted, given))));
2024 }
2025
2026 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2027 operands for instruction template T, and it has MATCH_REVERSE set if there
2028 is no size conflict on any operands for the template with operands reversed
2029 (and the template allows for reversing in the first place). */
2030
2031 #define MATCH_STRAIGHT 1
2032 #define MATCH_REVERSE 2
2033
2034 static INLINE unsigned int
2035 operand_size_match (const insn_template *t)
2036 {
2037 unsigned int j, match = MATCH_STRAIGHT;
2038
2039 /* Don't check jump instructions. */
2040 if (t->opcode_modifier.jump
2041 || t->opcode_modifier.jumpbyte
2042 || t->opcode_modifier.jumpdword
2043 || t->opcode_modifier.jumpintersegment)
2044 return match;
2045
2046 /* Check memory and accumulator operand size. */
2047 for (j = 0; j < i.operands; j++)
2048 {
2049 if (!i.types[j].bitfield.reg && !i.types[j].bitfield.regsimd
2050 && t->operand_types[j].bitfield.anysize)
2051 continue;
2052
2053 if (t->operand_types[j].bitfield.reg
2054 && !match_operand_size (t, j, j))
2055 {
2056 match = 0;
2057 break;
2058 }
2059
2060 if (t->operand_types[j].bitfield.regsimd
2061 && !match_simd_size (t, j, j))
2062 {
2063 match = 0;
2064 break;
2065 }
2066
2067 if (t->operand_types[j].bitfield.acc
2068 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2069 {
2070 match = 0;
2071 break;
2072 }
2073
2074 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2075 {
2076 match = 0;
2077 break;
2078 }
2079 }
2080
2081 if (!t->opcode_modifier.d)
2082 {
2083 mismatch:
2084 if (!match)
2085 i.error = operand_size_mismatch;
2086 return match;
2087 }
2088
2089 /* Check reverse. */
2090 gas_assert (i.operands >= 2 && i.operands <= 3);
2091
2092 for (j = 0; j < i.operands; j++)
2093 {
2094 unsigned int given = i.operands - j - 1;
2095
2096 if (t->operand_types[j].bitfield.reg
2097 && !match_operand_size (t, j, given))
2098 goto mismatch;
2099
2100 if (t->operand_types[j].bitfield.regsimd
2101 && !match_simd_size (t, j, given))
2102 goto mismatch;
2103
2104 if (t->operand_types[j].bitfield.acc
2105 && (!match_operand_size (t, j, given)
2106 || !match_simd_size (t, j, given)))
2107 goto mismatch;
2108
2109 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2110 goto mismatch;
2111 }
2112
2113 return match | MATCH_REVERSE;
2114 }
2115
2116 static INLINE int
2117 operand_type_match (i386_operand_type overlap,
2118 i386_operand_type given)
2119 {
2120 i386_operand_type temp = overlap;
2121
2122 temp.bitfield.jumpabsolute = 0;
2123 temp.bitfield.unspecified = 0;
2124 temp.bitfield.byte = 0;
2125 temp.bitfield.word = 0;
2126 temp.bitfield.dword = 0;
2127 temp.bitfield.fword = 0;
2128 temp.bitfield.qword = 0;
2129 temp.bitfield.tbyte = 0;
2130 temp.bitfield.xmmword = 0;
2131 temp.bitfield.ymmword = 0;
2132 temp.bitfield.zmmword = 0;
2133 if (operand_type_all_zero (&temp))
2134 goto mismatch;
2135
2136 if (given.bitfield.baseindex == overlap.bitfield.baseindex
2137 && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
2138 return 1;
2139
2140 mismatch:
2141 i.error = operand_type_mismatch;
2142 return 0;
2143 }
2144
2145 /* If given types g0 and g1 are registers they must be of the same type
2146 unless the expected operand type register overlap is null.
2147 Memory operand size of certain SIMD instructions is also being checked
2148 here. */
2149
2150 static INLINE int
2151 operand_type_register_match (i386_operand_type g0,
2152 i386_operand_type t0,
2153 i386_operand_type g1,
2154 i386_operand_type t1)
2155 {
2156 if (!g0.bitfield.reg
2157 && !g0.bitfield.regsimd
2158 && (!operand_type_check (g0, anymem)
2159 || g0.bitfield.unspecified
2160 || !t0.bitfield.regsimd))
2161 return 1;
2162
2163 if (!g1.bitfield.reg
2164 && !g1.bitfield.regsimd
2165 && (!operand_type_check (g1, anymem)
2166 || g1.bitfield.unspecified
2167 || !t1.bitfield.regsimd))
2168 return 1;
2169
2170 if (g0.bitfield.byte == g1.bitfield.byte
2171 && g0.bitfield.word == g1.bitfield.word
2172 && g0.bitfield.dword == g1.bitfield.dword
2173 && g0.bitfield.qword == g1.bitfield.qword
2174 && g0.bitfield.xmmword == g1.bitfield.xmmword
2175 && g0.bitfield.ymmword == g1.bitfield.ymmword
2176 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2177 return 1;
2178
2179 if (!(t0.bitfield.byte & t1.bitfield.byte)
2180 && !(t0.bitfield.word & t1.bitfield.word)
2181 && !(t0.bitfield.dword & t1.bitfield.dword)
2182 && !(t0.bitfield.qword & t1.bitfield.qword)
2183 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2184 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2185 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2186 return 1;
2187
2188 i.error = register_type_mismatch;
2189
2190 return 0;
2191 }
2192
2193 static INLINE unsigned int
2194 register_number (const reg_entry *r)
2195 {
2196 unsigned int nr = r->reg_num;
2197
2198 if (r->reg_flags & RegRex)
2199 nr += 8;
2200
2201 if (r->reg_flags & RegVRex)
2202 nr += 16;
2203
2204 return nr;
2205 }
2206
2207 static INLINE unsigned int
2208 mode_from_disp_size (i386_operand_type t)
2209 {
2210 if (t.bitfield.disp8)
2211 return 1;
2212 else if (t.bitfield.disp16
2213 || t.bitfield.disp32
2214 || t.bitfield.disp32s)
2215 return 2;
2216 else
2217 return 0;
2218 }
2219
2220 static INLINE int
2221 fits_in_signed_byte (addressT num)
2222 {
2223 return num + 0x80 <= 0xff;
2224 }
2225
2226 static INLINE int
2227 fits_in_unsigned_byte (addressT num)
2228 {
2229 return num <= 0xff;
2230 }
2231
2232 static INLINE int
2233 fits_in_unsigned_word (addressT num)
2234 {
2235 return num <= 0xffff;
2236 }
2237
2238 static INLINE int
2239 fits_in_signed_word (addressT num)
2240 {
2241 return num + 0x8000 <= 0xffff;
2242 }
2243
2244 static INLINE int
2245 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2246 {
2247 #ifndef BFD64
2248 return 1;
2249 #else
2250 return num + 0x80000000 <= 0xffffffff;
2251 #endif
2252 } /* fits_in_signed_long() */
2253
2254 static INLINE int
2255 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2256 {
2257 #ifndef BFD64
2258 return 1;
2259 #else
2260 return num <= 0xffffffff;
2261 #endif
2262 } /* fits_in_unsigned_long() */
2263
2264 static INLINE int
2265 fits_in_disp8 (offsetT num)
2266 {
2267 int shift = i.memshift;
2268 unsigned int mask;
2269
2270 if (shift == -1)
2271 abort ();
2272
2273 mask = (1 << shift) - 1;
2274
2275 /* Return 0 if NUM isn't properly aligned. */
2276 if ((num & mask))
2277 return 0;
2278
2279 /* Check if NUM will fit in 8bit after shift. */
2280 return fits_in_signed_byte (num >> shift);
2281 }
2282
2283 static INLINE int
2284 fits_in_imm4 (offsetT num)
2285 {
2286 return (num & 0xf) == num;
2287 }
2288
2289 static i386_operand_type
2290 smallest_imm_type (offsetT num)
2291 {
2292 i386_operand_type t;
2293
2294 operand_type_set (&t, 0);
2295 t.bitfield.imm64 = 1;
2296
2297 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2298 {
2299 /* This code is disabled on the 486 because all the Imm1 forms
2300 in the opcode table are slower on the i486. They're the
2301 versions with the implicitly specified single-position
2302 displacement, which has another syntax if you really want to
2303 use that form. */
2304 t.bitfield.imm1 = 1;
2305 t.bitfield.imm8 = 1;
2306 t.bitfield.imm8s = 1;
2307 t.bitfield.imm16 = 1;
2308 t.bitfield.imm32 = 1;
2309 t.bitfield.imm32s = 1;
2310 }
2311 else if (fits_in_signed_byte (num))
2312 {
2313 t.bitfield.imm8 = 1;
2314 t.bitfield.imm8s = 1;
2315 t.bitfield.imm16 = 1;
2316 t.bitfield.imm32 = 1;
2317 t.bitfield.imm32s = 1;
2318 }
2319 else if (fits_in_unsigned_byte (num))
2320 {
2321 t.bitfield.imm8 = 1;
2322 t.bitfield.imm16 = 1;
2323 t.bitfield.imm32 = 1;
2324 t.bitfield.imm32s = 1;
2325 }
2326 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2327 {
2328 t.bitfield.imm16 = 1;
2329 t.bitfield.imm32 = 1;
2330 t.bitfield.imm32s = 1;
2331 }
2332 else if (fits_in_signed_long (num))
2333 {
2334 t.bitfield.imm32 = 1;
2335 t.bitfield.imm32s = 1;
2336 }
2337 else if (fits_in_unsigned_long (num))
2338 t.bitfield.imm32 = 1;
2339
2340 return t;
2341 }
2342
2343 static offsetT
2344 offset_in_range (offsetT val, int size)
2345 {
2346 addressT mask;
2347
2348 switch (size)
2349 {
2350 case 1: mask = ((addressT) 1 << 8) - 1; break;
2351 case 2: mask = ((addressT) 1 << 16) - 1; break;
2352 case 4: mask = ((addressT) 2 << 31) - 1; break;
2353 #ifdef BFD64
2354 case 8: mask = ((addressT) 2 << 63) - 1; break;
2355 #endif
2356 default: abort ();
2357 }
2358
2359 #ifdef BFD64
2360 /* If BFD64, sign extend val for 32bit address mode. */
2361 if (flag_code != CODE_64BIT
2362 || i.prefix[ADDR_PREFIX])
2363 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2364 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2365 #endif
2366
2367 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2368 {
2369 char buf1[40], buf2[40];
2370
2371 sprint_value (buf1, val);
2372 sprint_value (buf2, val & mask);
2373 as_warn (_("%s shortened to %s"), buf1, buf2);
2374 }
2375 return val & mask;
2376 }
2377
2378 enum PREFIX_GROUP
2379 {
2380 PREFIX_EXIST = 0,
2381 PREFIX_LOCK,
2382 PREFIX_REP,
2383 PREFIX_DS,
2384 PREFIX_OTHER
2385 };
2386
2387 /* Returns
2388 a. PREFIX_EXIST if attempting to add a prefix where one from the
2389 same class already exists.
2390 b. PREFIX_LOCK if lock prefix is added.
2391 c. PREFIX_REP if rep/repne prefix is added.
2392 d. PREFIX_DS if ds prefix is added.
2393 e. PREFIX_OTHER if other prefix is added.
2394 */
2395
2396 static enum PREFIX_GROUP
2397 add_prefix (unsigned int prefix)
2398 {
2399 enum PREFIX_GROUP ret = PREFIX_OTHER;
2400 unsigned int q;
2401
2402 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2403 && flag_code == CODE_64BIT)
2404 {
2405 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2406 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2407 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2408 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2409 ret = PREFIX_EXIST;
2410 q = REX_PREFIX;
2411 }
2412 else
2413 {
2414 switch (prefix)
2415 {
2416 default:
2417 abort ();
2418
2419 case DS_PREFIX_OPCODE:
2420 ret = PREFIX_DS;
2421 /* Fall through. */
2422 case CS_PREFIX_OPCODE:
2423 case ES_PREFIX_OPCODE:
2424 case FS_PREFIX_OPCODE:
2425 case GS_PREFIX_OPCODE:
2426 case SS_PREFIX_OPCODE:
2427 q = SEG_PREFIX;
2428 break;
2429
2430 case REPNE_PREFIX_OPCODE:
2431 case REPE_PREFIX_OPCODE:
2432 q = REP_PREFIX;
2433 ret = PREFIX_REP;
2434 break;
2435
2436 case LOCK_PREFIX_OPCODE:
2437 q = LOCK_PREFIX;
2438 ret = PREFIX_LOCK;
2439 break;
2440
2441 case FWAIT_OPCODE:
2442 q = WAIT_PREFIX;
2443 break;
2444
2445 case ADDR_PREFIX_OPCODE:
2446 q = ADDR_PREFIX;
2447 break;
2448
2449 case DATA_PREFIX_OPCODE:
2450 q = DATA_PREFIX;
2451 break;
2452 }
2453 if (i.prefix[q] != 0)
2454 ret = PREFIX_EXIST;
2455 }
2456
2457 if (ret)
2458 {
2459 if (!i.prefix[q])
2460 ++i.prefixes;
2461 i.prefix[q] |= prefix;
2462 }
2463 else
2464 as_bad (_("same type of prefix used twice"));
2465
2466 return ret;
2467 }
2468
2469 static void
2470 update_code_flag (int value, int check)
2471 {
2472 PRINTF_LIKE ((*as_error));
2473
2474 flag_code = (enum flag_code) value;
2475 if (flag_code == CODE_64BIT)
2476 {
2477 cpu_arch_flags.bitfield.cpu64 = 1;
2478 cpu_arch_flags.bitfield.cpuno64 = 0;
2479 }
2480 else
2481 {
2482 cpu_arch_flags.bitfield.cpu64 = 0;
2483 cpu_arch_flags.bitfield.cpuno64 = 1;
2484 }
2485 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2486 {
2487 if (check)
2488 as_error = as_fatal;
2489 else
2490 as_error = as_bad;
2491 (*as_error) (_("64bit mode not supported on `%s'."),
2492 cpu_arch_name ? cpu_arch_name : default_arch);
2493 }
2494 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2495 {
2496 if (check)
2497 as_error = as_fatal;
2498 else
2499 as_error = as_bad;
2500 (*as_error) (_("32bit mode not supported on `%s'."),
2501 cpu_arch_name ? cpu_arch_name : default_arch);
2502 }
2503 stackop_size = '\0';
2504 }
2505
2506 static void
2507 set_code_flag (int value)
2508 {
2509 update_code_flag (value, 0);
2510 }
2511
2512 static void
2513 set_16bit_gcc_code_flag (int new_code_flag)
2514 {
2515 flag_code = (enum flag_code) new_code_flag;
2516 if (flag_code != CODE_16BIT)
2517 abort ();
2518 cpu_arch_flags.bitfield.cpu64 = 0;
2519 cpu_arch_flags.bitfield.cpuno64 = 1;
2520 stackop_size = LONG_MNEM_SUFFIX;
2521 }
2522
2523 static void
2524 set_intel_syntax (int syntax_flag)
2525 {
2526 /* Find out if register prefixing is specified. */
2527 int ask_naked_reg = 0;
2528
2529 SKIP_WHITESPACE ();
2530 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2531 {
2532 char *string;
2533 int e = get_symbol_name (&string);
2534
2535 if (strcmp (string, "prefix") == 0)
2536 ask_naked_reg = 1;
2537 else if (strcmp (string, "noprefix") == 0)
2538 ask_naked_reg = -1;
2539 else
2540 as_bad (_("bad argument to syntax directive."));
2541 (void) restore_line_pointer (e);
2542 }
2543 demand_empty_rest_of_line ();
2544
2545 intel_syntax = syntax_flag;
2546
2547 if (ask_naked_reg == 0)
2548 allow_naked_reg = (intel_syntax
2549 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2550 else
2551 allow_naked_reg = (ask_naked_reg < 0);
2552
2553 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2554
2555 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2556 identifier_chars['$'] = intel_syntax ? '$' : 0;
2557 register_prefix = allow_naked_reg ? "" : "%";
2558 }
2559
2560 static void
2561 set_intel_mnemonic (int mnemonic_flag)
2562 {
2563 intel_mnemonic = mnemonic_flag;
2564 }
2565
2566 static void
2567 set_allow_index_reg (int flag)
2568 {
2569 allow_index_reg = flag;
2570 }
2571
2572 static void
2573 set_check (int what)
2574 {
2575 enum check_kind *kind;
2576 const char *str;
2577
2578 if (what)
2579 {
2580 kind = &operand_check;
2581 str = "operand";
2582 }
2583 else
2584 {
2585 kind = &sse_check;
2586 str = "sse";
2587 }
2588
2589 SKIP_WHITESPACE ();
2590
2591 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2592 {
2593 char *string;
2594 int e = get_symbol_name (&string);
2595
2596 if (strcmp (string, "none") == 0)
2597 *kind = check_none;
2598 else if (strcmp (string, "warning") == 0)
2599 *kind = check_warning;
2600 else if (strcmp (string, "error") == 0)
2601 *kind = check_error;
2602 else
2603 as_bad (_("bad argument to %s_check directive."), str);
2604 (void) restore_line_pointer (e);
2605 }
2606 else
2607 as_bad (_("missing argument for %s_check directive"), str);
2608
2609 demand_empty_rest_of_line ();
2610 }
2611
2612 static void
2613 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2614 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2615 {
2616 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2617 static const char *arch;
2618
2619 /* Intel LIOM is only supported on ELF. */
2620 if (!IS_ELF)
2621 return;
2622
2623 if (!arch)
2624 {
2625 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2626 use default_arch. */
2627 arch = cpu_arch_name;
2628 if (!arch)
2629 arch = default_arch;
2630 }
2631
2632 /* If we are targeting Intel MCU, we must enable it. */
2633 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2634 || new_flag.bitfield.cpuiamcu)
2635 return;
2636
2637 /* If we are targeting Intel L1OM, we must enable it. */
2638 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2639 || new_flag.bitfield.cpul1om)
2640 return;
2641
2642 /* If we are targeting Intel K1OM, we must enable it. */
2643 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2644 || new_flag.bitfield.cpuk1om)
2645 return;
2646
2647 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2648 #endif
2649 }
2650
2651 static void
2652 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2653 {
2654 SKIP_WHITESPACE ();
2655
2656 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2657 {
2658 char *string;
2659 int e = get_symbol_name (&string);
2660 unsigned int j;
2661 i386_cpu_flags flags;
2662
2663 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2664 {
2665 if (strcmp (string, cpu_arch[j].name) == 0)
2666 {
2667 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2668
2669 if (*string != '.')
2670 {
2671 cpu_arch_name = cpu_arch[j].name;
2672 cpu_sub_arch_name = NULL;
2673 cpu_arch_flags = cpu_arch[j].flags;
2674 if (flag_code == CODE_64BIT)
2675 {
2676 cpu_arch_flags.bitfield.cpu64 = 1;
2677 cpu_arch_flags.bitfield.cpuno64 = 0;
2678 }
2679 else
2680 {
2681 cpu_arch_flags.bitfield.cpu64 = 0;
2682 cpu_arch_flags.bitfield.cpuno64 = 1;
2683 }
2684 cpu_arch_isa = cpu_arch[j].type;
2685 cpu_arch_isa_flags = cpu_arch[j].flags;
2686 if (!cpu_arch_tune_set)
2687 {
2688 cpu_arch_tune = cpu_arch_isa;
2689 cpu_arch_tune_flags = cpu_arch_isa_flags;
2690 }
2691 break;
2692 }
2693
2694 flags = cpu_flags_or (cpu_arch_flags,
2695 cpu_arch[j].flags);
2696
2697 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2698 {
2699 if (cpu_sub_arch_name)
2700 {
2701 char *name = cpu_sub_arch_name;
2702 cpu_sub_arch_name = concat (name,
2703 cpu_arch[j].name,
2704 (const char *) NULL);
2705 free (name);
2706 }
2707 else
2708 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2709 cpu_arch_flags = flags;
2710 cpu_arch_isa_flags = flags;
2711 }
2712 else
2713 cpu_arch_isa_flags
2714 = cpu_flags_or (cpu_arch_isa_flags,
2715 cpu_arch[j].flags);
2716 (void) restore_line_pointer (e);
2717 demand_empty_rest_of_line ();
2718 return;
2719 }
2720 }
2721
2722 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2723 {
2724 /* Disable an ISA extension. */
2725 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2726 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2727 {
2728 flags = cpu_flags_and_not (cpu_arch_flags,
2729 cpu_noarch[j].flags);
2730 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2731 {
2732 if (cpu_sub_arch_name)
2733 {
2734 char *name = cpu_sub_arch_name;
2735 cpu_sub_arch_name = concat (name, string,
2736 (const char *) NULL);
2737 free (name);
2738 }
2739 else
2740 cpu_sub_arch_name = xstrdup (string);
2741 cpu_arch_flags = flags;
2742 cpu_arch_isa_flags = flags;
2743 }
2744 (void) restore_line_pointer (e);
2745 demand_empty_rest_of_line ();
2746 return;
2747 }
2748
2749 j = ARRAY_SIZE (cpu_arch);
2750 }
2751
2752 if (j >= ARRAY_SIZE (cpu_arch))
2753 as_bad (_("no such architecture: `%s'"), string);
2754
2755 *input_line_pointer = e;
2756 }
2757 else
2758 as_bad (_("missing cpu architecture"));
2759
2760 no_cond_jump_promotion = 0;
2761 if (*input_line_pointer == ','
2762 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2763 {
2764 char *string;
2765 char e;
2766
2767 ++input_line_pointer;
2768 e = get_symbol_name (&string);
2769
2770 if (strcmp (string, "nojumps") == 0)
2771 no_cond_jump_promotion = 1;
2772 else if (strcmp (string, "jumps") == 0)
2773 ;
2774 else
2775 as_bad (_("no such architecture modifier: `%s'"), string);
2776
2777 (void) restore_line_pointer (e);
2778 }
2779
2780 demand_empty_rest_of_line ();
2781 }
2782
2783 enum bfd_architecture
2784 i386_arch (void)
2785 {
2786 if (cpu_arch_isa == PROCESSOR_L1OM)
2787 {
2788 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2789 || flag_code != CODE_64BIT)
2790 as_fatal (_("Intel L1OM is 64bit ELF only"));
2791 return bfd_arch_l1om;
2792 }
2793 else if (cpu_arch_isa == PROCESSOR_K1OM)
2794 {
2795 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2796 || flag_code != CODE_64BIT)
2797 as_fatal (_("Intel K1OM is 64bit ELF only"));
2798 return bfd_arch_k1om;
2799 }
2800 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2801 {
2802 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2803 || flag_code == CODE_64BIT)
2804 as_fatal (_("Intel MCU is 32bit ELF only"));
2805 return bfd_arch_iamcu;
2806 }
2807 else
2808 return bfd_arch_i386;
2809 }
2810
2811 unsigned long
2812 i386_mach (void)
2813 {
2814 if (!strncmp (default_arch, "x86_64", 6))
2815 {
2816 if (cpu_arch_isa == PROCESSOR_L1OM)
2817 {
2818 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2819 || default_arch[6] != '\0')
2820 as_fatal (_("Intel L1OM is 64bit ELF only"));
2821 return bfd_mach_l1om;
2822 }
2823 else if (cpu_arch_isa == PROCESSOR_K1OM)
2824 {
2825 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2826 || default_arch[6] != '\0')
2827 as_fatal (_("Intel K1OM is 64bit ELF only"));
2828 return bfd_mach_k1om;
2829 }
2830 else if (default_arch[6] == '\0')
2831 return bfd_mach_x86_64;
2832 else
2833 return bfd_mach_x64_32;
2834 }
2835 else if (!strcmp (default_arch, "i386")
2836 || !strcmp (default_arch, "iamcu"))
2837 {
2838 if (cpu_arch_isa == PROCESSOR_IAMCU)
2839 {
2840 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2841 as_fatal (_("Intel MCU is 32bit ELF only"));
2842 return bfd_mach_i386_iamcu;
2843 }
2844 else
2845 return bfd_mach_i386_i386;
2846 }
2847 else
2848 as_fatal (_("unknown architecture"));
2849 }
2850 \f
2851 void
2852 md_begin (void)
2853 {
2854 const char *hash_err;
2855
2856 /* Support pseudo prefixes like {disp32}. */
2857 lex_type ['{'] = LEX_BEGIN_NAME;
2858
2859 /* Initialize op_hash hash table. */
2860 op_hash = hash_new ();
2861
2862 {
2863 const insn_template *optab;
2864 templates *core_optab;
2865
2866 /* Setup for loop. */
2867 optab = i386_optab;
2868 core_optab = XNEW (templates);
2869 core_optab->start = optab;
2870
2871 while (1)
2872 {
2873 ++optab;
2874 if (optab->name == NULL
2875 || strcmp (optab->name, (optab - 1)->name) != 0)
2876 {
2877 /* different name --> ship out current template list;
2878 add to hash table; & begin anew. */
2879 core_optab->end = optab;
2880 hash_err = hash_insert (op_hash,
2881 (optab - 1)->name,
2882 (void *) core_optab);
2883 if (hash_err)
2884 {
2885 as_fatal (_("can't hash %s: %s"),
2886 (optab - 1)->name,
2887 hash_err);
2888 }
2889 if (optab->name == NULL)
2890 break;
2891 core_optab = XNEW (templates);
2892 core_optab->start = optab;
2893 }
2894 }
2895 }
2896
2897 /* Initialize reg_hash hash table. */
2898 reg_hash = hash_new ();
2899 {
2900 const reg_entry *regtab;
2901 unsigned int regtab_size = i386_regtab_size;
2902
2903 for (regtab = i386_regtab; regtab_size--; regtab++)
2904 {
2905 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2906 if (hash_err)
2907 as_fatal (_("can't hash %s: %s"),
2908 regtab->reg_name,
2909 hash_err);
2910 }
2911 }
2912
2913 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
2914 {
2915 int c;
2916 char *p;
2917
2918 for (c = 0; c < 256; c++)
2919 {
2920 if (ISDIGIT (c))
2921 {
2922 digit_chars[c] = c;
2923 mnemonic_chars[c] = c;
2924 register_chars[c] = c;
2925 operand_chars[c] = c;
2926 }
2927 else if (ISLOWER (c))
2928 {
2929 mnemonic_chars[c] = c;
2930 register_chars[c] = c;
2931 operand_chars[c] = c;
2932 }
2933 else if (ISUPPER (c))
2934 {
2935 mnemonic_chars[c] = TOLOWER (c);
2936 register_chars[c] = mnemonic_chars[c];
2937 operand_chars[c] = c;
2938 }
2939 else if (c == '{' || c == '}')
2940 {
2941 mnemonic_chars[c] = c;
2942 operand_chars[c] = c;
2943 }
2944
2945 if (ISALPHA (c) || ISDIGIT (c))
2946 identifier_chars[c] = c;
2947 else if (c >= 128)
2948 {
2949 identifier_chars[c] = c;
2950 operand_chars[c] = c;
2951 }
2952 }
2953
2954 #ifdef LEX_AT
2955 identifier_chars['@'] = '@';
2956 #endif
2957 #ifdef LEX_QM
2958 identifier_chars['?'] = '?';
2959 operand_chars['?'] = '?';
2960 #endif
2961 digit_chars['-'] = '-';
2962 mnemonic_chars['_'] = '_';
2963 mnemonic_chars['-'] = '-';
2964 mnemonic_chars['.'] = '.';
2965 identifier_chars['_'] = '_';
2966 identifier_chars['.'] = '.';
2967
2968 for (p = operand_special_chars; *p != '\0'; p++)
2969 operand_chars[(unsigned char) *p] = *p;
2970 }
2971
2972 if (flag_code == CODE_64BIT)
2973 {
2974 #if defined (OBJ_COFF) && defined (TE_PE)
2975 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2976 ? 32 : 16);
2977 #else
2978 x86_dwarf2_return_column = 16;
2979 #endif
2980 x86_cie_data_alignment = -8;
2981 }
2982 else
2983 {
2984 x86_dwarf2_return_column = 8;
2985 x86_cie_data_alignment = -4;
2986 }
2987 }
2988
2989 void
2990 i386_print_statistics (FILE *file)
2991 {
2992 hash_print_statistics (file, "i386 opcode", op_hash);
2993 hash_print_statistics (file, "i386 register", reg_hash);
2994 }
2995 \f
2996 #ifdef DEBUG386
2997
2998 /* Debugging routines for md_assemble. */
2999 static void pte (insn_template *);
3000 static void pt (i386_operand_type);
3001 static void pe (expressionS *);
3002 static void ps (symbolS *);
3003
3004 static void
3005 pi (const char *line, i386_insn *x)
3006 {
3007 unsigned int j;
3008
3009 fprintf (stdout, "%s: template ", line);
3010 pte (&x->tm);
3011 fprintf (stdout, " address: base %s index %s scale %x\n",
3012 x->base_reg ? x->base_reg->reg_name : "none",
3013 x->index_reg ? x->index_reg->reg_name : "none",
3014 x->log2_scale_factor);
3015 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3016 x->rm.mode, x->rm.reg, x->rm.regmem);
3017 fprintf (stdout, " sib: base %x index %x scale %x\n",
3018 x->sib.base, x->sib.index, x->sib.scale);
3019 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3020 (x->rex & REX_W) != 0,
3021 (x->rex & REX_R) != 0,
3022 (x->rex & REX_X) != 0,
3023 (x->rex & REX_B) != 0);
3024 for (j = 0; j < x->operands; j++)
3025 {
3026 fprintf (stdout, " #%d: ", j + 1);
3027 pt (x->types[j]);
3028 fprintf (stdout, "\n");
3029 if (x->types[j].bitfield.reg
3030 || x->types[j].bitfield.regmmx
3031 || x->types[j].bitfield.regsimd
3032 || x->types[j].bitfield.sreg2
3033 || x->types[j].bitfield.sreg3
3034 || x->types[j].bitfield.control
3035 || x->types[j].bitfield.debug
3036 || x->types[j].bitfield.test)
3037 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3038 if (operand_type_check (x->types[j], imm))
3039 pe (x->op[j].imms);
3040 if (operand_type_check (x->types[j], disp))
3041 pe (x->op[j].disps);
3042 }
3043 }
3044
3045 static void
3046 pte (insn_template *t)
3047 {
3048 unsigned int j;
3049 fprintf (stdout, " %d operands ", t->operands);
3050 fprintf (stdout, "opcode %x ", t->base_opcode);
3051 if (t->extension_opcode != None)
3052 fprintf (stdout, "ext %x ", t->extension_opcode);
3053 if (t->opcode_modifier.d)
3054 fprintf (stdout, "D");
3055 if (t->opcode_modifier.w)
3056 fprintf (stdout, "W");
3057 fprintf (stdout, "\n");
3058 for (j = 0; j < t->operands; j++)
3059 {
3060 fprintf (stdout, " #%d type ", j + 1);
3061 pt (t->operand_types[j]);
3062 fprintf (stdout, "\n");
3063 }
3064 }
3065
3066 static void
3067 pe (expressionS *e)
3068 {
3069 fprintf (stdout, " operation %d\n", e->X_op);
3070 fprintf (stdout, " add_number %ld (%lx)\n",
3071 (long) e->X_add_number, (long) e->X_add_number);
3072 if (e->X_add_symbol)
3073 {
3074 fprintf (stdout, " add_symbol ");
3075 ps (e->X_add_symbol);
3076 fprintf (stdout, "\n");
3077 }
3078 if (e->X_op_symbol)
3079 {
3080 fprintf (stdout, " op_symbol ");
3081 ps (e->X_op_symbol);
3082 fprintf (stdout, "\n");
3083 }
3084 }
3085
3086 static void
3087 ps (symbolS *s)
3088 {
3089 fprintf (stdout, "%s type %s%s",
3090 S_GET_NAME (s),
3091 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3092 segment_name (S_GET_SEGMENT (s)));
3093 }
3094
3095 static struct type_name
3096 {
3097 i386_operand_type mask;
3098 const char *name;
3099 }
3100 const type_names[] =
3101 {
3102 { OPERAND_TYPE_REG8, "r8" },
3103 { OPERAND_TYPE_REG16, "r16" },
3104 { OPERAND_TYPE_REG32, "r32" },
3105 { OPERAND_TYPE_REG64, "r64" },
3106 { OPERAND_TYPE_ACC8, "acc8" },
3107 { OPERAND_TYPE_ACC16, "acc16" },
3108 { OPERAND_TYPE_ACC32, "acc32" },
3109 { OPERAND_TYPE_ACC64, "acc64" },
3110 { OPERAND_TYPE_IMM8, "i8" },
3111 { OPERAND_TYPE_IMM8, "i8s" },
3112 { OPERAND_TYPE_IMM16, "i16" },
3113 { OPERAND_TYPE_IMM32, "i32" },
3114 { OPERAND_TYPE_IMM32S, "i32s" },
3115 { OPERAND_TYPE_IMM64, "i64" },
3116 { OPERAND_TYPE_IMM1, "i1" },
3117 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3118 { OPERAND_TYPE_DISP8, "d8" },
3119 { OPERAND_TYPE_DISP16, "d16" },
3120 { OPERAND_TYPE_DISP32, "d32" },
3121 { OPERAND_TYPE_DISP32S, "d32s" },
3122 { OPERAND_TYPE_DISP64, "d64" },
3123 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3124 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3125 { OPERAND_TYPE_CONTROL, "control reg" },
3126 { OPERAND_TYPE_TEST, "test reg" },
3127 { OPERAND_TYPE_DEBUG, "debug reg" },
3128 { OPERAND_TYPE_FLOATREG, "FReg" },
3129 { OPERAND_TYPE_FLOATACC, "FAcc" },
3130 { OPERAND_TYPE_SREG2, "SReg2" },
3131 { OPERAND_TYPE_SREG3, "SReg3" },
3132 { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
3133 { OPERAND_TYPE_REGMMX, "rMMX" },
3134 { OPERAND_TYPE_REGXMM, "rXMM" },
3135 { OPERAND_TYPE_REGYMM, "rYMM" },
3136 { OPERAND_TYPE_REGZMM, "rZMM" },
3137 { OPERAND_TYPE_REGMASK, "Mask reg" },
3138 { OPERAND_TYPE_ESSEG, "es" },
3139 };
3140
3141 static void
3142 pt (i386_operand_type t)
3143 {
3144 unsigned int j;
3145 i386_operand_type a;
3146
3147 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3148 {
3149 a = operand_type_and (t, type_names[j].mask);
3150 if (operand_type_equal (&a, &type_names[j].mask))
3151 fprintf (stdout, "%s, ", type_names[j].name);
3152 }
3153 fflush (stdout);
3154 }
3155
3156 #endif /* DEBUG386 */
3157 \f
3158 static bfd_reloc_code_real_type
3159 reloc (unsigned int size,
3160 int pcrel,
3161 int sign,
3162 bfd_reloc_code_real_type other)
3163 {
3164 if (other != NO_RELOC)
3165 {
3166 reloc_howto_type *rel;
3167
3168 if (size == 8)
3169 switch (other)
3170 {
3171 case BFD_RELOC_X86_64_GOT32:
3172 return BFD_RELOC_X86_64_GOT64;
3173 break;
3174 case BFD_RELOC_X86_64_GOTPLT64:
3175 return BFD_RELOC_X86_64_GOTPLT64;
3176 break;
3177 case BFD_RELOC_X86_64_PLTOFF64:
3178 return BFD_RELOC_X86_64_PLTOFF64;
3179 break;
3180 case BFD_RELOC_X86_64_GOTPC32:
3181 other = BFD_RELOC_X86_64_GOTPC64;
3182 break;
3183 case BFD_RELOC_X86_64_GOTPCREL:
3184 other = BFD_RELOC_X86_64_GOTPCREL64;
3185 break;
3186 case BFD_RELOC_X86_64_TPOFF32:
3187 other = BFD_RELOC_X86_64_TPOFF64;
3188 break;
3189 case BFD_RELOC_X86_64_DTPOFF32:
3190 other = BFD_RELOC_X86_64_DTPOFF64;
3191 break;
3192 default:
3193 break;
3194 }
3195
3196 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3197 if (other == BFD_RELOC_SIZE32)
3198 {
3199 if (size == 8)
3200 other = BFD_RELOC_SIZE64;
3201 if (pcrel)
3202 {
3203 as_bad (_("there are no pc-relative size relocations"));
3204 return NO_RELOC;
3205 }
3206 }
3207 #endif
3208
3209 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3210 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3211 sign = -1;
3212
3213 rel = bfd_reloc_type_lookup (stdoutput, other);
3214 if (!rel)
3215 as_bad (_("unknown relocation (%u)"), other);
3216 else if (size != bfd_get_reloc_size (rel))
3217 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3218 bfd_get_reloc_size (rel),
3219 size);
3220 else if (pcrel && !rel->pc_relative)
3221 as_bad (_("non-pc-relative relocation for pc-relative field"));
3222 else if ((rel->complain_on_overflow == complain_overflow_signed
3223 && !sign)
3224 || (rel->complain_on_overflow == complain_overflow_unsigned
3225 && sign > 0))
3226 as_bad (_("relocated field and relocation type differ in signedness"));
3227 else
3228 return other;
3229 return NO_RELOC;
3230 }
3231
3232 if (pcrel)
3233 {
3234 if (!sign)
3235 as_bad (_("there are no unsigned pc-relative relocations"));
3236 switch (size)
3237 {
3238 case 1: return BFD_RELOC_8_PCREL;
3239 case 2: return BFD_RELOC_16_PCREL;
3240 case 4: return BFD_RELOC_32_PCREL;
3241 case 8: return BFD_RELOC_64_PCREL;
3242 }
3243 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3244 }
3245 else
3246 {
3247 if (sign > 0)
3248 switch (size)
3249 {
3250 case 4: return BFD_RELOC_X86_64_32S;
3251 }
3252 else
3253 switch (size)
3254 {
3255 case 1: return BFD_RELOC_8;
3256 case 2: return BFD_RELOC_16;
3257 case 4: return BFD_RELOC_32;
3258 case 8: return BFD_RELOC_64;
3259 }
3260 as_bad (_("cannot do %s %u byte relocation"),
3261 sign > 0 ? "signed" : "unsigned", size);
3262 }
3263
3264 return NO_RELOC;
3265 }
3266
3267 /* Here we decide which fixups can be adjusted to make them relative to
3268 the beginning of the section instead of the symbol. Basically we need
3269 to make sure that the dynamic relocations are done correctly, so in
3270 some cases we force the original symbol to be used. */
3271
3272 int
3273 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3274 {
3275 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3276 if (!IS_ELF)
3277 return 1;
3278
3279 /* Don't adjust pc-relative references to merge sections in 64-bit
3280 mode. */
3281 if (use_rela_relocations
3282 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3283 && fixP->fx_pcrel)
3284 return 0;
3285
3286 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3287 and changed later by validate_fix. */
3288 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3289 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3290 return 0;
3291
3292 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3293 for size relocations. */
3294 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3295 || fixP->fx_r_type == BFD_RELOC_SIZE64
3296 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3297 || fixP->fx_r_type == BFD_RELOC_386_PLT32
3298 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3299 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3300 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3301 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3302 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3303 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3304 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3305 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3306 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3307 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3308 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3309 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3310 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3311 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3312 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3313 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3314 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3315 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3316 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3317 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3318 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3319 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3320 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3321 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3322 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3323 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3324 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3325 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3326 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3327 return 0;
3328 #endif
3329 return 1;
3330 }
3331
3332 static int
3333 intel_float_operand (const char *mnemonic)
3334 {
3335 /* Note that the value returned is meaningful only for opcodes with (memory)
3336 operands, hence the code here is free to improperly handle opcodes that
3337 have no operands (for better performance and smaller code). */
3338
3339 if (mnemonic[0] != 'f')
3340 return 0; /* non-math */
3341
3342 switch (mnemonic[1])
3343 {
3344 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3345 the fs segment override prefix not currently handled because no
3346 call path can make opcodes without operands get here */
3347 case 'i':
3348 return 2 /* integer op */;
3349 case 'l':
3350 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3351 return 3; /* fldcw/fldenv */
3352 break;
3353 case 'n':
3354 if (mnemonic[2] != 'o' /* fnop */)
3355 return 3; /* non-waiting control op */
3356 break;
3357 case 'r':
3358 if (mnemonic[2] == 's')
3359 return 3; /* frstor/frstpm */
3360 break;
3361 case 's':
3362 if (mnemonic[2] == 'a')
3363 return 3; /* fsave */
3364 if (mnemonic[2] == 't')
3365 {
3366 switch (mnemonic[3])
3367 {
3368 case 'c': /* fstcw */
3369 case 'd': /* fstdw */
3370 case 'e': /* fstenv */
3371 case 's': /* fsts[gw] */
3372 return 3;
3373 }
3374 }
3375 break;
3376 case 'x':
3377 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3378 return 0; /* fxsave/fxrstor are not really math ops */
3379 break;
3380 }
3381
3382 return 1;
3383 }
3384
3385 /* Build the VEX prefix. */
3386
3387 static void
3388 build_vex_prefix (const insn_template *t)
3389 {
3390 unsigned int register_specifier;
3391 unsigned int implied_prefix;
3392 unsigned int vector_length;
3393 unsigned int w;
3394
3395 /* Check register specifier. */
3396 if (i.vex.register_specifier)
3397 {
3398 register_specifier =
3399 ~register_number (i.vex.register_specifier) & 0xf;
3400 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3401 }
3402 else
3403 register_specifier = 0xf;
3404
3405 /* Use 2-byte VEX prefix by swapping destination and source operand
3406 if there are more than 1 register operand. */
3407 if (i.reg_operands > 1
3408 && i.vec_encoding != vex_encoding_vex3
3409 && i.dir_encoding == dir_encoding_default
3410 && i.operands == i.reg_operands
3411 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3412 && i.tm.opcode_modifier.vexopcode == VEX0F
3413 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3414 && i.rex == REX_B)
3415 {
3416 unsigned int xchg = i.operands - 1;
3417 union i386_op temp_op;
3418 i386_operand_type temp_type;
3419
3420 temp_type = i.types[xchg];
3421 i.types[xchg] = i.types[0];
3422 i.types[0] = temp_type;
3423 temp_op = i.op[xchg];
3424 i.op[xchg] = i.op[0];
3425 i.op[0] = temp_op;
3426
3427 gas_assert (i.rm.mode == 3);
3428
3429 i.rex = REX_R;
3430 xchg = i.rm.regmem;
3431 i.rm.regmem = i.rm.reg;
3432 i.rm.reg = xchg;
3433
3434 if (i.tm.opcode_modifier.d)
3435 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3436 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3437 else /* Use the next insn. */
3438 i.tm = t[1];
3439 }
3440
3441 if (i.tm.opcode_modifier.vex == VEXScalar)
3442 vector_length = avxscalar;
3443 else if (i.tm.opcode_modifier.vex == VEX256)
3444 vector_length = 1;
3445 else
3446 {
3447 unsigned int op;
3448
3449 /* Determine vector length from the last multi-length vector
3450 operand. */
3451 vector_length = 0;
3452 for (op = t->operands; op--;)
3453 if (t->operand_types[op].bitfield.xmmword
3454 && t->operand_types[op].bitfield.ymmword
3455 && i.types[op].bitfield.ymmword)
3456 {
3457 vector_length = 1;
3458 break;
3459 }
3460 }
3461
3462 switch ((i.tm.base_opcode >> 8) & 0xff)
3463 {
3464 case 0:
3465 implied_prefix = 0;
3466 break;
3467 case DATA_PREFIX_OPCODE:
3468 implied_prefix = 1;
3469 break;
3470 case REPE_PREFIX_OPCODE:
3471 implied_prefix = 2;
3472 break;
3473 case REPNE_PREFIX_OPCODE:
3474 implied_prefix = 3;
3475 break;
3476 default:
3477 abort ();
3478 }
3479
3480 /* Check the REX.W bit and VEXW. */
3481 if (i.tm.opcode_modifier.vexw == VEXWIG)
3482 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3483 else if (i.tm.opcode_modifier.vexw)
3484 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3485 else
3486 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3487
3488 /* Use 2-byte VEX prefix if possible. */
3489 if (w == 0
3490 && i.vec_encoding != vex_encoding_vex3
3491 && i.tm.opcode_modifier.vexopcode == VEX0F
3492 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3493 {
3494 /* 2-byte VEX prefix. */
3495 unsigned int r;
3496
3497 i.vex.length = 2;
3498 i.vex.bytes[0] = 0xc5;
3499
3500 /* Check the REX.R bit. */
3501 r = (i.rex & REX_R) ? 0 : 1;
3502 i.vex.bytes[1] = (r << 7
3503 | register_specifier << 3
3504 | vector_length << 2
3505 | implied_prefix);
3506 }
3507 else
3508 {
3509 /* 3-byte VEX prefix. */
3510 unsigned int m;
3511
3512 i.vex.length = 3;
3513
3514 switch (i.tm.opcode_modifier.vexopcode)
3515 {
3516 case VEX0F:
3517 m = 0x1;
3518 i.vex.bytes[0] = 0xc4;
3519 break;
3520 case VEX0F38:
3521 m = 0x2;
3522 i.vex.bytes[0] = 0xc4;
3523 break;
3524 case VEX0F3A:
3525 m = 0x3;
3526 i.vex.bytes[0] = 0xc4;
3527 break;
3528 case XOP08:
3529 m = 0x8;
3530 i.vex.bytes[0] = 0x8f;
3531 break;
3532 case XOP09:
3533 m = 0x9;
3534 i.vex.bytes[0] = 0x8f;
3535 break;
3536 case XOP0A:
3537 m = 0xa;
3538 i.vex.bytes[0] = 0x8f;
3539 break;
3540 default:
3541 abort ();
3542 }
3543
3544 /* The high 3 bits of the second VEX byte are 1's compliment
3545 of RXB bits from REX. */
3546 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3547
3548 i.vex.bytes[2] = (w << 7
3549 | register_specifier << 3
3550 | vector_length << 2
3551 | implied_prefix);
3552 }
3553 }
3554
3555 static INLINE bfd_boolean
3556 is_evex_encoding (const insn_template *t)
3557 {
3558 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3559 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3560 || t->opcode_modifier.sae;
3561 }
3562
3563 static INLINE bfd_boolean
3564 is_any_vex_encoding (const insn_template *t)
3565 {
3566 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3567 || is_evex_encoding (t);
3568 }
3569
3570 /* Build the EVEX prefix. */
3571
3572 static void
3573 build_evex_prefix (void)
3574 {
3575 unsigned int register_specifier;
3576 unsigned int implied_prefix;
3577 unsigned int m, w;
3578 rex_byte vrex_used = 0;
3579
3580 /* Check register specifier. */
3581 if (i.vex.register_specifier)
3582 {
3583 gas_assert ((i.vrex & REX_X) == 0);
3584
3585 register_specifier = i.vex.register_specifier->reg_num;
3586 if ((i.vex.register_specifier->reg_flags & RegRex))
3587 register_specifier += 8;
3588 /* The upper 16 registers are encoded in the fourth byte of the
3589 EVEX prefix. */
3590 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3591 i.vex.bytes[3] = 0x8;
3592 register_specifier = ~register_specifier & 0xf;
3593 }
3594 else
3595 {
3596 register_specifier = 0xf;
3597
3598 /* Encode upper 16 vector index register in the fourth byte of
3599 the EVEX prefix. */
3600 if (!(i.vrex & REX_X))
3601 i.vex.bytes[3] = 0x8;
3602 else
3603 vrex_used |= REX_X;
3604 }
3605
3606 switch ((i.tm.base_opcode >> 8) & 0xff)
3607 {
3608 case 0:
3609 implied_prefix = 0;
3610 break;
3611 case DATA_PREFIX_OPCODE:
3612 implied_prefix = 1;
3613 break;
3614 case REPE_PREFIX_OPCODE:
3615 implied_prefix = 2;
3616 break;
3617 case REPNE_PREFIX_OPCODE:
3618 implied_prefix = 3;
3619 break;
3620 default:
3621 abort ();
3622 }
3623
3624 /* 4 byte EVEX prefix. */
3625 i.vex.length = 4;
3626 i.vex.bytes[0] = 0x62;
3627
3628 /* mmmm bits. */
3629 switch (i.tm.opcode_modifier.vexopcode)
3630 {
3631 case VEX0F:
3632 m = 1;
3633 break;
3634 case VEX0F38:
3635 m = 2;
3636 break;
3637 case VEX0F3A:
3638 m = 3;
3639 break;
3640 default:
3641 abort ();
3642 break;
3643 }
3644
3645 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3646 bits from REX. */
3647 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3648
3649 /* The fifth bit of the second EVEX byte is 1's compliment of the
3650 REX_R bit in VREX. */
3651 if (!(i.vrex & REX_R))
3652 i.vex.bytes[1] |= 0x10;
3653 else
3654 vrex_used |= REX_R;
3655
3656 if ((i.reg_operands + i.imm_operands) == i.operands)
3657 {
3658 /* When all operands are registers, the REX_X bit in REX is not
3659 used. We reuse it to encode the upper 16 registers, which is
3660 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3661 as 1's compliment. */
3662 if ((i.vrex & REX_B))
3663 {
3664 vrex_used |= REX_B;
3665 i.vex.bytes[1] &= ~0x40;
3666 }
3667 }
3668
3669 /* EVEX instructions shouldn't need the REX prefix. */
3670 i.vrex &= ~vrex_used;
3671 gas_assert (i.vrex == 0);
3672
3673 /* Check the REX.W bit and VEXW. */
3674 if (i.tm.opcode_modifier.vexw == VEXWIG)
3675 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3676 else if (i.tm.opcode_modifier.vexw)
3677 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3678 else
3679 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3680
3681 /* Encode the U bit. */
3682 implied_prefix |= 0x4;
3683
3684 /* The third byte of the EVEX prefix. */
3685 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3686
3687 /* The fourth byte of the EVEX prefix. */
3688 /* The zeroing-masking bit. */
3689 if (i.mask && i.mask->zeroing)
3690 i.vex.bytes[3] |= 0x80;
3691
3692 /* Don't always set the broadcast bit if there is no RC. */
3693 if (!i.rounding)
3694 {
3695 /* Encode the vector length. */
3696 unsigned int vec_length;
3697
3698 if (!i.tm.opcode_modifier.evex
3699 || i.tm.opcode_modifier.evex == EVEXDYN)
3700 {
3701 unsigned int op;
3702
3703 /* Determine vector length from the last multi-length vector
3704 operand. */
3705 vec_length = 0;
3706 for (op = i.operands; op--;)
3707 if (i.tm.operand_types[op].bitfield.xmmword
3708 + i.tm.operand_types[op].bitfield.ymmword
3709 + i.tm.operand_types[op].bitfield.zmmword > 1)
3710 {
3711 if (i.types[op].bitfield.zmmword)
3712 {
3713 i.tm.opcode_modifier.evex = EVEX512;
3714 break;
3715 }
3716 else if (i.types[op].bitfield.ymmword)
3717 {
3718 i.tm.opcode_modifier.evex = EVEX256;
3719 break;
3720 }
3721 else if (i.types[op].bitfield.xmmword)
3722 {
3723 i.tm.opcode_modifier.evex = EVEX128;
3724 break;
3725 }
3726 else if (i.broadcast && (int) op == i.broadcast->operand)
3727 {
3728 switch (i.broadcast->bytes)
3729 {
3730 case 64:
3731 i.tm.opcode_modifier.evex = EVEX512;
3732 break;
3733 case 32:
3734 i.tm.opcode_modifier.evex = EVEX256;
3735 break;
3736 case 16:
3737 i.tm.opcode_modifier.evex = EVEX128;
3738 break;
3739 default:
3740 abort ();
3741 }
3742 break;
3743 }
3744 }
3745
3746 if (op >= MAX_OPERANDS)
3747 abort ();
3748 }
3749
3750 switch (i.tm.opcode_modifier.evex)
3751 {
3752 case EVEXLIG: /* LL' is ignored */
3753 vec_length = evexlig << 5;
3754 break;
3755 case EVEX128:
3756 vec_length = 0 << 5;
3757 break;
3758 case EVEX256:
3759 vec_length = 1 << 5;
3760 break;
3761 case EVEX512:
3762 vec_length = 2 << 5;
3763 break;
3764 default:
3765 abort ();
3766 break;
3767 }
3768 i.vex.bytes[3] |= vec_length;
3769 /* Encode the broadcast bit. */
3770 if (i.broadcast)
3771 i.vex.bytes[3] |= 0x10;
3772 }
3773 else
3774 {
3775 if (i.rounding->type != saeonly)
3776 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3777 else
3778 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3779 }
3780
3781 if (i.mask && i.mask->mask)
3782 i.vex.bytes[3] |= i.mask->mask->reg_num;
3783 }
3784
3785 static void
3786 process_immext (void)
3787 {
3788 expressionS *exp;
3789
3790 if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3791 && i.operands > 0)
3792 {
3793 /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3794 with an opcode suffix which is coded in the same place as an
3795 8-bit immediate field would be.
3796 Here we check those operands and remove them afterwards. */
3797 unsigned int x;
3798
3799 for (x = 0; x < i.operands; x++)
3800 if (register_number (i.op[x].regs) != x)
3801 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3802 register_prefix, i.op[x].regs->reg_name, x + 1,
3803 i.tm.name);
3804
3805 i.operands = 0;
3806 }
3807
3808 if (i.tm.cpu_flags.bitfield.cpumwaitx && i.operands > 0)
3809 {
3810 /* MONITORX/MWAITX instructions have fixed operands with an opcode
3811 suffix which is coded in the same place as an 8-bit immediate
3812 field would be.
3813 Here we check those operands and remove them afterwards. */
3814 unsigned int x;
3815
3816 if (i.operands != 3)
3817 abort();
3818
3819 for (x = 0; x < 2; x++)
3820 if (register_number (i.op[x].regs) != x)
3821 goto bad_register_operand;
3822
3823 /* Check for third operand for mwaitx/monitorx insn. */
3824 if (register_number (i.op[x].regs)
3825 != (x + (i.tm.extension_opcode == 0xfb)))
3826 {
3827 bad_register_operand:
3828 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3829 register_prefix, i.op[x].regs->reg_name, x+1,
3830 i.tm.name);
3831 }
3832
3833 i.operands = 0;
3834 }
3835
3836 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3837 which is coded in the same place as an 8-bit immediate field
3838 would be. Here we fake an 8-bit immediate operand from the
3839 opcode suffix stored in tm.extension_opcode.
3840
3841 AVX instructions also use this encoding, for some of
3842 3 argument instructions. */
3843
3844 gas_assert (i.imm_operands <= 1
3845 && (i.operands <= 2
3846 || (is_any_vex_encoding (&i.tm)
3847 && i.operands <= 4)));
3848
3849 exp = &im_expressions[i.imm_operands++];
3850 i.op[i.operands].imms = exp;
3851 i.types[i.operands] = imm8;
3852 i.operands++;
3853 exp->X_op = O_constant;
3854 exp->X_add_number = i.tm.extension_opcode;
3855 i.tm.extension_opcode = None;
3856 }
3857
3858
3859 static int
3860 check_hle (void)
3861 {
3862 switch (i.tm.opcode_modifier.hleprefixok)
3863 {
3864 default:
3865 abort ();
3866 case HLEPrefixNone:
3867 as_bad (_("invalid instruction `%s' after `%s'"),
3868 i.tm.name, i.hle_prefix);
3869 return 0;
3870 case HLEPrefixLock:
3871 if (i.prefix[LOCK_PREFIX])
3872 return 1;
3873 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3874 return 0;
3875 case HLEPrefixAny:
3876 return 1;
3877 case HLEPrefixRelease:
3878 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3879 {
3880 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3881 i.tm.name);
3882 return 0;
3883 }
3884 if (i.mem_operands == 0
3885 || !operand_type_check (i.types[i.operands - 1], anymem))
3886 {
3887 as_bad (_("memory destination needed for instruction `%s'"
3888 " after `xrelease'"), i.tm.name);
3889 return 0;
3890 }
3891 return 1;
3892 }
3893 }
3894
3895 /* Try the shortest encoding by shortening operand size. */
3896
3897 static void
3898 optimize_encoding (void)
3899 {
3900 unsigned int j;
3901
3902 if (optimize_for_space
3903 && i.reg_operands == 1
3904 && i.imm_operands == 1
3905 && !i.types[1].bitfield.byte
3906 && i.op[0].imms->X_op == O_constant
3907 && fits_in_imm7 (i.op[0].imms->X_add_number)
3908 && ((i.tm.base_opcode == 0xa8
3909 && i.tm.extension_opcode == None)
3910 || (i.tm.base_opcode == 0xf6
3911 && i.tm.extension_opcode == 0x0)))
3912 {
3913 /* Optimize: -Os:
3914 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
3915 */
3916 unsigned int base_regnum = i.op[1].regs->reg_num;
3917 if (flag_code == CODE_64BIT || base_regnum < 4)
3918 {
3919 i.types[1].bitfield.byte = 1;
3920 /* Ignore the suffix. */
3921 i.suffix = 0;
3922 if (base_regnum >= 4
3923 && !(i.op[1].regs->reg_flags & RegRex))
3924 {
3925 /* Handle SP, BP, SI and DI registers. */
3926 if (i.types[1].bitfield.word)
3927 j = 16;
3928 else if (i.types[1].bitfield.dword)
3929 j = 32;
3930 else
3931 j = 48;
3932 i.op[1].regs -= j;
3933 }
3934 }
3935 }
3936 else if (flag_code == CODE_64BIT
3937 && ((i.types[1].bitfield.qword
3938 && i.reg_operands == 1
3939 && i.imm_operands == 1
3940 && i.op[0].imms->X_op == O_constant
3941 && ((i.tm.base_opcode == 0xb0
3942 && i.tm.extension_opcode == None
3943 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
3944 || (fits_in_imm31 (i.op[0].imms->X_add_number)
3945 && (((i.tm.base_opcode == 0x24
3946 || i.tm.base_opcode == 0xa8)
3947 && i.tm.extension_opcode == None)
3948 || (i.tm.base_opcode == 0x80
3949 && i.tm.extension_opcode == 0x4)
3950 || ((i.tm.base_opcode == 0xf6
3951 || i.tm.base_opcode == 0xc6)
3952 && i.tm.extension_opcode == 0x0)))
3953 || (fits_in_imm7 (i.op[0].imms->X_add_number)
3954 && i.tm.base_opcode == 0x83
3955 && i.tm.extension_opcode == 0x4)))
3956 || (i.types[0].bitfield.qword
3957 && ((i.reg_operands == 2
3958 && i.op[0].regs == i.op[1].regs
3959 && ((i.tm.base_opcode == 0x30
3960 || i.tm.base_opcode == 0x28)
3961 && i.tm.extension_opcode == None))
3962 || (i.reg_operands == 1
3963 && i.operands == 1
3964 && i.tm.base_opcode == 0x30
3965 && i.tm.extension_opcode == None)))))
3966 {
3967 /* Optimize: -O:
3968 andq $imm31, %r64 -> andl $imm31, %r32
3969 andq $imm7, %r64 -> andl $imm7, %r32
3970 testq $imm31, %r64 -> testl $imm31, %r32
3971 xorq %r64, %r64 -> xorl %r32, %r32
3972 subq %r64, %r64 -> subl %r32, %r32
3973 movq $imm31, %r64 -> movl $imm31, %r32
3974 movq $imm32, %r64 -> movl $imm32, %r32
3975 */
3976 i.tm.opcode_modifier.norex64 = 1;
3977 if (i.tm.base_opcode == 0xb0 || i.tm.base_opcode == 0xc6)
3978 {
3979 /* Handle
3980 movq $imm31, %r64 -> movl $imm31, %r32
3981 movq $imm32, %r64 -> movl $imm32, %r32
3982 */
3983 i.tm.operand_types[0].bitfield.imm32 = 1;
3984 i.tm.operand_types[0].bitfield.imm32s = 0;
3985 i.tm.operand_types[0].bitfield.imm64 = 0;
3986 i.types[0].bitfield.imm32 = 1;
3987 i.types[0].bitfield.imm32s = 0;
3988 i.types[0].bitfield.imm64 = 0;
3989 i.types[1].bitfield.dword = 1;
3990 i.types[1].bitfield.qword = 0;
3991 if (i.tm.base_opcode == 0xc6)
3992 {
3993 /* Handle
3994 movq $imm31, %r64 -> movl $imm31, %r32
3995 */
3996 i.tm.base_opcode = 0xb0;
3997 i.tm.extension_opcode = None;
3998 i.tm.opcode_modifier.shortform = 1;
3999 i.tm.opcode_modifier.modrm = 0;
4000 }
4001 }
4002 }
4003 else if (i.reg_operands == 3
4004 && i.op[0].regs == i.op[1].regs
4005 && !i.types[2].bitfield.xmmword
4006 && (i.tm.opcode_modifier.vex
4007 || ((!i.mask || i.mask->zeroing)
4008 && !i.rounding
4009 && is_evex_encoding (&i.tm)
4010 && (i.vec_encoding != vex_encoding_evex
4011 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4012 || i.tm.cpu_flags.bitfield.cpuavx512vl
4013 || (i.tm.operand_types[2].bitfield.zmmword
4014 && i.types[2].bitfield.ymmword))))
4015 && ((i.tm.base_opcode == 0x55
4016 || i.tm.base_opcode == 0x6655
4017 || i.tm.base_opcode == 0x66df
4018 || i.tm.base_opcode == 0x57
4019 || i.tm.base_opcode == 0x6657
4020 || i.tm.base_opcode == 0x66ef
4021 || i.tm.base_opcode == 0x66f8
4022 || i.tm.base_opcode == 0x66f9
4023 || i.tm.base_opcode == 0x66fa
4024 || i.tm.base_opcode == 0x66fb
4025 || i.tm.base_opcode == 0x42
4026 || i.tm.base_opcode == 0x6642
4027 || i.tm.base_opcode == 0x47
4028 || i.tm.base_opcode == 0x6647)
4029 && i.tm.extension_opcode == None))
4030 {
4031 /* Optimize: -O1:
4032 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4033 vpsubq and vpsubw:
4034 EVEX VOP %zmmM, %zmmM, %zmmN
4035 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4036 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4037 EVEX VOP %ymmM, %ymmM, %ymmN
4038 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4039 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4040 VEX VOP %ymmM, %ymmM, %ymmN
4041 -> VEX VOP %xmmM, %xmmM, %xmmN
4042 VOP, one of vpandn and vpxor:
4043 VEX VOP %ymmM, %ymmM, %ymmN
4044 -> VEX VOP %xmmM, %xmmM, %xmmN
4045 VOP, one of vpandnd and vpandnq:
4046 EVEX VOP %zmmM, %zmmM, %zmmN
4047 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4048 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4049 EVEX VOP %ymmM, %ymmM, %ymmN
4050 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4051 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4052 VOP, one of vpxord and vpxorq:
4053 EVEX VOP %zmmM, %zmmM, %zmmN
4054 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4055 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4056 EVEX VOP %ymmM, %ymmM, %ymmN
4057 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4058 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4059 VOP, one of kxord and kxorq:
4060 VEX VOP %kM, %kM, %kN
4061 -> VEX kxorw %kM, %kM, %kN
4062 VOP, one of kandnd and kandnq:
4063 VEX VOP %kM, %kM, %kN
4064 -> VEX kandnw %kM, %kM, %kN
4065 */
4066 if (is_evex_encoding (&i.tm))
4067 {
4068 if (i.vec_encoding != vex_encoding_evex)
4069 {
4070 i.tm.opcode_modifier.vex = VEX128;
4071 i.tm.opcode_modifier.vexw = VEXW0;
4072 i.tm.opcode_modifier.evex = 0;
4073 }
4074 else if (optimize > 1)
4075 i.tm.opcode_modifier.evex = EVEX128;
4076 else
4077 return;
4078 }
4079 else if (i.tm.operand_types[0].bitfield.regmask)
4080 {
4081 i.tm.base_opcode &= 0xff;
4082 i.tm.opcode_modifier.vexw = VEXW0;
4083 }
4084 else
4085 i.tm.opcode_modifier.vex = VEX128;
4086
4087 if (i.tm.opcode_modifier.vex)
4088 for (j = 0; j < 3; j++)
4089 {
4090 i.types[j].bitfield.xmmword = 1;
4091 i.types[j].bitfield.ymmword = 0;
4092 }
4093 }
4094 else if (i.vec_encoding != vex_encoding_evex
4095 && !i.types[0].bitfield.zmmword
4096 && !i.types[1].bitfield.zmmword
4097 && !i.mask
4098 && !i.broadcast
4099 && is_evex_encoding (&i.tm)
4100 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4101 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4102 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4103 || (i.tm.base_opcode & ~4) == 0x66db
4104 || (i.tm.base_opcode & ~4) == 0x66eb)
4105 && i.tm.extension_opcode == None)
4106 {
4107 /* Optimize: -O1:
4108 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4109 vmovdqu32 and vmovdqu64:
4110 EVEX VOP %xmmM, %xmmN
4111 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4112 EVEX VOP %ymmM, %ymmN
4113 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4114 EVEX VOP %xmmM, mem
4115 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4116 EVEX VOP %ymmM, mem
4117 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4118 EVEX VOP mem, %xmmN
4119 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4120 EVEX VOP mem, %ymmN
4121 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4122 VOP, one of vpand, vpandn, vpor, vpxor:
4123 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4124 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4125 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4126 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4127 EVEX VOP{d,q} mem, %xmmM, %xmmN
4128 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4129 EVEX VOP{d,q} mem, %ymmM, %ymmN
4130 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4131 */
4132 for (j = 0; j < i.operands; j++)
4133 if (operand_type_check (i.types[j], disp)
4134 && i.op[j].disps->X_op == O_constant)
4135 {
4136 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4137 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4138 bytes, we choose EVEX Disp8 over VEX Disp32. */
4139 int evex_disp8, vex_disp8;
4140 unsigned int memshift = i.memshift;
4141 offsetT n = i.op[j].disps->X_add_number;
4142
4143 evex_disp8 = fits_in_disp8 (n);
4144 i.memshift = 0;
4145 vex_disp8 = fits_in_disp8 (n);
4146 if (evex_disp8 != vex_disp8)
4147 {
4148 i.memshift = memshift;
4149 return;
4150 }
4151
4152 i.types[j].bitfield.disp8 = vex_disp8;
4153 break;
4154 }
4155 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4156 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4157 i.tm.opcode_modifier.vex
4158 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4159 i.tm.opcode_modifier.vexw = VEXW0;
4160 i.tm.opcode_modifier.evex = 0;
4161 i.tm.opcode_modifier.masking = 0;
4162 i.tm.opcode_modifier.broadcast = 0;
4163 i.tm.opcode_modifier.disp8memshift = 0;
4164 i.memshift = 0;
4165 if (j < i.operands)
4166 i.types[j].bitfield.disp8
4167 = fits_in_disp8 (i.op[j].disps->X_add_number);
4168 }
4169 }
4170
4171 /* This is the guts of the machine-dependent assembler. LINE points to a
4172 machine dependent instruction. This function is supposed to emit
4173 the frags/bytes it assembles to. */
4174
4175 void
4176 md_assemble (char *line)
4177 {
4178 unsigned int j;
4179 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4180 const insn_template *t;
4181
4182 /* Initialize globals. */
4183 memset (&i, '\0', sizeof (i));
4184 for (j = 0; j < MAX_OPERANDS; j++)
4185 i.reloc[j] = NO_RELOC;
4186 memset (disp_expressions, '\0', sizeof (disp_expressions));
4187 memset (im_expressions, '\0', sizeof (im_expressions));
4188 save_stack_p = save_stack;
4189
4190 /* First parse an instruction mnemonic & call i386_operand for the operands.
4191 We assume that the scrubber has arranged it so that line[0] is the valid
4192 start of a (possibly prefixed) mnemonic. */
4193
4194 line = parse_insn (line, mnemonic);
4195 if (line == NULL)
4196 return;
4197 mnem_suffix = i.suffix;
4198
4199 line = parse_operands (line, mnemonic);
4200 this_operand = -1;
4201 xfree (i.memop1_string);
4202 i.memop1_string = NULL;
4203 if (line == NULL)
4204 return;
4205
4206 /* Now we've parsed the mnemonic into a set of templates, and have the
4207 operands at hand. */
4208
4209 /* All intel opcodes have reversed operands except for "bound" and
4210 "enter". We also don't reverse intersegment "jmp" and "call"
4211 instructions with 2 immediate operands so that the immediate segment
4212 precedes the offset, as it does when in AT&T mode. */
4213 if (intel_syntax
4214 && i.operands > 1
4215 && (strcmp (mnemonic, "bound") != 0)
4216 && (strcmp (mnemonic, "invlpga") != 0)
4217 && !(operand_type_check (i.types[0], imm)
4218 && operand_type_check (i.types[1], imm)))
4219 swap_operands ();
4220
4221 /* The order of the immediates should be reversed
4222 for 2 immediates extrq and insertq instructions */
4223 if (i.imm_operands == 2
4224 && (strcmp (mnemonic, "extrq") == 0
4225 || strcmp (mnemonic, "insertq") == 0))
4226 swap_2_operands (0, 1);
4227
4228 if (i.imm_operands)
4229 optimize_imm ();
4230
4231 /* Don't optimize displacement for movabs since it only takes 64bit
4232 displacement. */
4233 if (i.disp_operands
4234 && i.disp_encoding != disp_encoding_32bit
4235 && (flag_code != CODE_64BIT
4236 || strcmp (mnemonic, "movabs") != 0))
4237 optimize_disp ();
4238
4239 /* Next, we find a template that matches the given insn,
4240 making sure the overlap of the given operands types is consistent
4241 with the template operand types. */
4242
4243 if (!(t = match_template (mnem_suffix)))
4244 return;
4245
4246 if (sse_check != check_none
4247 && !i.tm.opcode_modifier.noavx
4248 && !i.tm.cpu_flags.bitfield.cpuavx
4249 && (i.tm.cpu_flags.bitfield.cpusse
4250 || i.tm.cpu_flags.bitfield.cpusse2
4251 || i.tm.cpu_flags.bitfield.cpusse3
4252 || i.tm.cpu_flags.bitfield.cpussse3
4253 || i.tm.cpu_flags.bitfield.cpusse4_1
4254 || i.tm.cpu_flags.bitfield.cpusse4_2
4255 || i.tm.cpu_flags.bitfield.cpupclmul
4256 || i.tm.cpu_flags.bitfield.cpuaes
4257 || i.tm.cpu_flags.bitfield.cpugfni))
4258 {
4259 (sse_check == check_warning
4260 ? as_warn
4261 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4262 }
4263
4264 /* Zap movzx and movsx suffix. The suffix has been set from
4265 "word ptr" or "byte ptr" on the source operand in Intel syntax
4266 or extracted from mnemonic in AT&T syntax. But we'll use
4267 the destination register to choose the suffix for encoding. */
4268 if ((i.tm.base_opcode & ~9) == 0x0fb6)
4269 {
4270 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
4271 there is no suffix, the default will be byte extension. */
4272 if (i.reg_operands != 2
4273 && !i.suffix
4274 && intel_syntax)
4275 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4276
4277 i.suffix = 0;
4278 }
4279
4280 if (i.tm.opcode_modifier.fwait)
4281 if (!add_prefix (FWAIT_OPCODE))
4282 return;
4283
4284 /* Check if REP prefix is OK. */
4285 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4286 {
4287 as_bad (_("invalid instruction `%s' after `%s'"),
4288 i.tm.name, i.rep_prefix);
4289 return;
4290 }
4291
4292 /* Check for lock without a lockable instruction. Destination operand
4293 must be memory unless it is xchg (0x86). */
4294 if (i.prefix[LOCK_PREFIX]
4295 && (!i.tm.opcode_modifier.islockable
4296 || i.mem_operands == 0
4297 || (i.tm.base_opcode != 0x86
4298 && !operand_type_check (i.types[i.operands - 1], anymem))))
4299 {
4300 as_bad (_("expecting lockable instruction after `lock'"));
4301 return;
4302 }
4303
4304 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4305 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4306 {
4307 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4308 return;
4309 }
4310
4311 /* Check if HLE prefix is OK. */
4312 if (i.hle_prefix && !check_hle ())
4313 return;
4314
4315 /* Check BND prefix. */
4316 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4317 as_bad (_("expecting valid branch instruction after `bnd'"));
4318
4319 /* Check NOTRACK prefix. */
4320 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4321 as_bad (_("expecting indirect branch instruction after `notrack'"));
4322
4323 if (i.tm.cpu_flags.bitfield.cpumpx)
4324 {
4325 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4326 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4327 else if (flag_code != CODE_16BIT
4328 ? i.prefix[ADDR_PREFIX]
4329 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4330 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4331 }
4332
4333 /* Insert BND prefix. */
4334 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4335 {
4336 if (!i.prefix[BND_PREFIX])
4337 add_prefix (BND_PREFIX_OPCODE);
4338 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4339 {
4340 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4341 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4342 }
4343 }
4344
4345 /* Check string instruction segment overrides. */
4346 if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
4347 {
4348 if (!check_string ())
4349 return;
4350 i.disp_operands = 0;
4351 }
4352
4353 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4354 optimize_encoding ();
4355
4356 if (!process_suffix ())
4357 return;
4358
4359 /* Update operand types. */
4360 for (j = 0; j < i.operands; j++)
4361 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4362
4363 /* Make still unresolved immediate matches conform to size of immediate
4364 given in i.suffix. */
4365 if (!finalize_imm ())
4366 return;
4367
4368 if (i.types[0].bitfield.imm1)
4369 i.imm_operands = 0; /* kludge for shift insns. */
4370
4371 /* We only need to check those implicit registers for instructions
4372 with 3 operands or less. */
4373 if (i.operands <= 3)
4374 for (j = 0; j < i.operands; j++)
4375 if (i.types[j].bitfield.inoutportreg
4376 || i.types[j].bitfield.shiftcount
4377 || (i.types[j].bitfield.acc && !i.types[j].bitfield.xmmword))
4378 i.reg_operands--;
4379
4380 /* ImmExt should be processed after SSE2AVX. */
4381 if (!i.tm.opcode_modifier.sse2avx
4382 && i.tm.opcode_modifier.immext)
4383 process_immext ();
4384
4385 /* For insns with operands there are more diddles to do to the opcode. */
4386 if (i.operands)
4387 {
4388 if (!process_operands ())
4389 return;
4390 }
4391 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4392 {
4393 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4394 as_warn (_("translating to `%sp'"), i.tm.name);
4395 }
4396
4397 if (is_any_vex_encoding (&i.tm))
4398 {
4399 if (!cpu_arch_flags.bitfield.cpui286)
4400 {
4401 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4402 i.tm.name);
4403 return;
4404 }
4405
4406 if (i.tm.opcode_modifier.vex)
4407 build_vex_prefix (t);
4408 else
4409 build_evex_prefix ();
4410 }
4411
4412 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4413 instructions may define INT_OPCODE as well, so avoid this corner
4414 case for those instructions that use MODRM. */
4415 if (i.tm.base_opcode == INT_OPCODE
4416 && !i.tm.opcode_modifier.modrm
4417 && i.op[0].imms->X_add_number == 3)
4418 {
4419 i.tm.base_opcode = INT3_OPCODE;
4420 i.imm_operands = 0;
4421 }
4422
4423 if ((i.tm.opcode_modifier.jump
4424 || i.tm.opcode_modifier.jumpbyte
4425 || i.tm.opcode_modifier.jumpdword)
4426 && i.op[0].disps->X_op == O_constant)
4427 {
4428 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4429 the absolute address given by the constant. Since ix86 jumps and
4430 calls are pc relative, we need to generate a reloc. */
4431 i.op[0].disps->X_add_symbol = &abs_symbol;
4432 i.op[0].disps->X_op = O_symbol;
4433 }
4434
4435 if (i.tm.opcode_modifier.rex64)
4436 i.rex |= REX_W;
4437
4438 /* For 8 bit registers we need an empty rex prefix. Also if the
4439 instruction already has a prefix, we need to convert old
4440 registers to new ones. */
4441
4442 if ((i.types[0].bitfield.reg && i.types[0].bitfield.byte
4443 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4444 || (i.types[1].bitfield.reg && i.types[1].bitfield.byte
4445 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4446 || (((i.types[0].bitfield.reg && i.types[0].bitfield.byte)
4447 || (i.types[1].bitfield.reg && i.types[1].bitfield.byte))
4448 && i.rex != 0))
4449 {
4450 int x;
4451
4452 i.rex |= REX_OPCODE;
4453 for (x = 0; x < 2; x++)
4454 {
4455 /* Look for 8 bit operand that uses old registers. */
4456 if (i.types[x].bitfield.reg && i.types[x].bitfield.byte
4457 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4458 {
4459 /* In case it is "hi" register, give up. */
4460 if (i.op[x].regs->reg_num > 3)
4461 as_bad (_("can't encode register '%s%s' in an "
4462 "instruction requiring REX prefix."),
4463 register_prefix, i.op[x].regs->reg_name);
4464
4465 /* Otherwise it is equivalent to the extended register.
4466 Since the encoding doesn't change this is merely
4467 cosmetic cleanup for debug output. */
4468
4469 i.op[x].regs = i.op[x].regs + 8;
4470 }
4471 }
4472 }
4473
4474 if (i.rex == 0 && i.rex_encoding)
4475 {
4476 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4477 that uses legacy register. If it is "hi" register, don't add
4478 the REX_OPCODE byte. */
4479 int x;
4480 for (x = 0; x < 2; x++)
4481 if (i.types[x].bitfield.reg
4482 && i.types[x].bitfield.byte
4483 && (i.op[x].regs->reg_flags & RegRex64) == 0
4484 && i.op[x].regs->reg_num > 3)
4485 {
4486 i.rex_encoding = FALSE;
4487 break;
4488 }
4489
4490 if (i.rex_encoding)
4491 i.rex = REX_OPCODE;
4492 }
4493
4494 if (i.rex != 0)
4495 add_prefix (REX_OPCODE | i.rex);
4496
4497 /* We are ready to output the insn. */
4498 output_insn ();
4499 }
4500
4501 static char *
4502 parse_insn (char *line, char *mnemonic)
4503 {
4504 char *l = line;
4505 char *token_start = l;
4506 char *mnem_p;
4507 int supported;
4508 const insn_template *t;
4509 char *dot_p = NULL;
4510
4511 while (1)
4512 {
4513 mnem_p = mnemonic;
4514 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4515 {
4516 if (*mnem_p == '.')
4517 dot_p = mnem_p;
4518 mnem_p++;
4519 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4520 {
4521 as_bad (_("no such instruction: `%s'"), token_start);
4522 return NULL;
4523 }
4524 l++;
4525 }
4526 if (!is_space_char (*l)
4527 && *l != END_OF_INSN
4528 && (intel_syntax
4529 || (*l != PREFIX_SEPARATOR
4530 && *l != ',')))
4531 {
4532 as_bad (_("invalid character %s in mnemonic"),
4533 output_invalid (*l));
4534 return NULL;
4535 }
4536 if (token_start == l)
4537 {
4538 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4539 as_bad (_("expecting prefix; got nothing"));
4540 else
4541 as_bad (_("expecting mnemonic; got nothing"));
4542 return NULL;
4543 }
4544
4545 /* Look up instruction (or prefix) via hash table. */
4546 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4547
4548 if (*l != END_OF_INSN
4549 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4550 && current_templates
4551 && current_templates->start->opcode_modifier.isprefix)
4552 {
4553 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4554 {
4555 as_bad ((flag_code != CODE_64BIT
4556 ? _("`%s' is only supported in 64-bit mode")
4557 : _("`%s' is not supported in 64-bit mode")),
4558 current_templates->start->name);
4559 return NULL;
4560 }
4561 /* If we are in 16-bit mode, do not allow addr16 or data16.
4562 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4563 if ((current_templates->start->opcode_modifier.size == SIZE16
4564 || current_templates->start->opcode_modifier.size == SIZE32)
4565 && flag_code != CODE_64BIT
4566 && ((current_templates->start->opcode_modifier.size == SIZE32)
4567 ^ (flag_code == CODE_16BIT)))
4568 {
4569 as_bad (_("redundant %s prefix"),
4570 current_templates->start->name);
4571 return NULL;
4572 }
4573 if (current_templates->start->opcode_length == 0)
4574 {
4575 /* Handle pseudo prefixes. */
4576 switch (current_templates->start->base_opcode)
4577 {
4578 case 0x0:
4579 /* {disp8} */
4580 i.disp_encoding = disp_encoding_8bit;
4581 break;
4582 case 0x1:
4583 /* {disp32} */
4584 i.disp_encoding = disp_encoding_32bit;
4585 break;
4586 case 0x2:
4587 /* {load} */
4588 i.dir_encoding = dir_encoding_load;
4589 break;
4590 case 0x3:
4591 /* {store} */
4592 i.dir_encoding = dir_encoding_store;
4593 break;
4594 case 0x4:
4595 /* {vex2} */
4596 i.vec_encoding = vex_encoding_vex2;
4597 break;
4598 case 0x5:
4599 /* {vex3} */
4600 i.vec_encoding = vex_encoding_vex3;
4601 break;
4602 case 0x6:
4603 /* {evex} */
4604 i.vec_encoding = vex_encoding_evex;
4605 break;
4606 case 0x7:
4607 /* {rex} */
4608 i.rex_encoding = TRUE;
4609 break;
4610 case 0x8:
4611 /* {nooptimize} */
4612 i.no_optimize = TRUE;
4613 break;
4614 default:
4615 abort ();
4616 }
4617 }
4618 else
4619 {
4620 /* Add prefix, checking for repeated prefixes. */
4621 switch (add_prefix (current_templates->start->base_opcode))
4622 {
4623 case PREFIX_EXIST:
4624 return NULL;
4625 case PREFIX_DS:
4626 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4627 i.notrack_prefix = current_templates->start->name;
4628 break;
4629 case PREFIX_REP:
4630 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4631 i.hle_prefix = current_templates->start->name;
4632 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4633 i.bnd_prefix = current_templates->start->name;
4634 else
4635 i.rep_prefix = current_templates->start->name;
4636 break;
4637 default:
4638 break;
4639 }
4640 }
4641 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4642 token_start = ++l;
4643 }
4644 else
4645 break;
4646 }
4647
4648 if (!current_templates)
4649 {
4650 /* Deprecated functionality (new code should use pseudo-prefixes instead):
4651 Check if we should swap operand or force 32bit displacement in
4652 encoding. */
4653 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4654 i.dir_encoding = dir_encoding_swap;
4655 else if (mnem_p - 3 == dot_p
4656 && dot_p[1] == 'd'
4657 && dot_p[2] == '8')
4658 i.disp_encoding = disp_encoding_8bit;
4659 else if (mnem_p - 4 == dot_p
4660 && dot_p[1] == 'd'
4661 && dot_p[2] == '3'
4662 && dot_p[3] == '2')
4663 i.disp_encoding = disp_encoding_32bit;
4664 else
4665 goto check_suffix;
4666 mnem_p = dot_p;
4667 *dot_p = '\0';
4668 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4669 }
4670
4671 if (!current_templates)
4672 {
4673 check_suffix:
4674 if (mnem_p > mnemonic)
4675 {
4676 /* See if we can get a match by trimming off a suffix. */
4677 switch (mnem_p[-1])
4678 {
4679 case WORD_MNEM_SUFFIX:
4680 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4681 i.suffix = SHORT_MNEM_SUFFIX;
4682 else
4683 /* Fall through. */
4684 case BYTE_MNEM_SUFFIX:
4685 case QWORD_MNEM_SUFFIX:
4686 i.suffix = mnem_p[-1];
4687 mnem_p[-1] = '\0';
4688 current_templates = (const templates *) hash_find (op_hash,
4689 mnemonic);
4690 break;
4691 case SHORT_MNEM_SUFFIX:
4692 case LONG_MNEM_SUFFIX:
4693 if (!intel_syntax)
4694 {
4695 i.suffix = mnem_p[-1];
4696 mnem_p[-1] = '\0';
4697 current_templates = (const templates *) hash_find (op_hash,
4698 mnemonic);
4699 }
4700 break;
4701
4702 /* Intel Syntax. */
4703 case 'd':
4704 if (intel_syntax)
4705 {
4706 if (intel_float_operand (mnemonic) == 1)
4707 i.suffix = SHORT_MNEM_SUFFIX;
4708 else
4709 i.suffix = LONG_MNEM_SUFFIX;
4710 mnem_p[-1] = '\0';
4711 current_templates = (const templates *) hash_find (op_hash,
4712 mnemonic);
4713 }
4714 break;
4715 }
4716 }
4717
4718 if (!current_templates)
4719 {
4720 as_bad (_("no such instruction: `%s'"), token_start);
4721 return NULL;
4722 }
4723 }
4724
4725 if (current_templates->start->opcode_modifier.jump
4726 || current_templates->start->opcode_modifier.jumpbyte)
4727 {
4728 /* Check for a branch hint. We allow ",pt" and ",pn" for
4729 predict taken and predict not taken respectively.
4730 I'm not sure that branch hints actually do anything on loop
4731 and jcxz insns (JumpByte) for current Pentium4 chips. They
4732 may work in the future and it doesn't hurt to accept them
4733 now. */
4734 if (l[0] == ',' && l[1] == 'p')
4735 {
4736 if (l[2] == 't')
4737 {
4738 if (!add_prefix (DS_PREFIX_OPCODE))
4739 return NULL;
4740 l += 3;
4741 }
4742 else if (l[2] == 'n')
4743 {
4744 if (!add_prefix (CS_PREFIX_OPCODE))
4745 return NULL;
4746 l += 3;
4747 }
4748 }
4749 }
4750 /* Any other comma loses. */
4751 if (*l == ',')
4752 {
4753 as_bad (_("invalid character %s in mnemonic"),
4754 output_invalid (*l));
4755 return NULL;
4756 }
4757
4758 /* Check if instruction is supported on specified architecture. */
4759 supported = 0;
4760 for (t = current_templates->start; t < current_templates->end; ++t)
4761 {
4762 supported |= cpu_flags_match (t);
4763 if (supported == CPU_FLAGS_PERFECT_MATCH)
4764 {
4765 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4766 as_warn (_("use .code16 to ensure correct addressing mode"));
4767
4768 return l;
4769 }
4770 }
4771
4772 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4773 as_bad (flag_code == CODE_64BIT
4774 ? _("`%s' is not supported in 64-bit mode")
4775 : _("`%s' is only supported in 64-bit mode"),
4776 current_templates->start->name);
4777 else
4778 as_bad (_("`%s' is not supported on `%s%s'"),
4779 current_templates->start->name,
4780 cpu_arch_name ? cpu_arch_name : default_arch,
4781 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4782
4783 return NULL;
4784 }
4785
4786 static char *
4787 parse_operands (char *l, const char *mnemonic)
4788 {
4789 char *token_start;
4790
4791 /* 1 if operand is pending after ','. */
4792 unsigned int expecting_operand = 0;
4793
4794 /* Non-zero if operand parens not balanced. */
4795 unsigned int paren_not_balanced;
4796
4797 while (*l != END_OF_INSN)
4798 {
4799 /* Skip optional white space before operand. */
4800 if (is_space_char (*l))
4801 ++l;
4802 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4803 {
4804 as_bad (_("invalid character %s before operand %d"),
4805 output_invalid (*l),
4806 i.operands + 1);
4807 return NULL;
4808 }
4809 token_start = l; /* After white space. */
4810 paren_not_balanced = 0;
4811 while (paren_not_balanced || *l != ',')
4812 {
4813 if (*l == END_OF_INSN)
4814 {
4815 if (paren_not_balanced)
4816 {
4817 if (!intel_syntax)
4818 as_bad (_("unbalanced parenthesis in operand %d."),
4819 i.operands + 1);
4820 else
4821 as_bad (_("unbalanced brackets in operand %d."),
4822 i.operands + 1);
4823 return NULL;
4824 }
4825 else
4826 break; /* we are done */
4827 }
4828 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4829 {
4830 as_bad (_("invalid character %s in operand %d"),
4831 output_invalid (*l),
4832 i.operands + 1);
4833 return NULL;
4834 }
4835 if (!intel_syntax)
4836 {
4837 if (*l == '(')
4838 ++paren_not_balanced;
4839 if (*l == ')')
4840 --paren_not_balanced;
4841 }
4842 else
4843 {
4844 if (*l == '[')
4845 ++paren_not_balanced;
4846 if (*l == ']')
4847 --paren_not_balanced;
4848 }
4849 l++;
4850 }
4851 if (l != token_start)
4852 { /* Yes, we've read in another operand. */
4853 unsigned int operand_ok;
4854 this_operand = i.operands++;
4855 if (i.operands > MAX_OPERANDS)
4856 {
4857 as_bad (_("spurious operands; (%d operands/instruction max)"),
4858 MAX_OPERANDS);
4859 return NULL;
4860 }
4861 i.types[this_operand].bitfield.unspecified = 1;
4862 /* Now parse operand adding info to 'i' as we go along. */
4863 END_STRING_AND_SAVE (l);
4864
4865 if (i.mem_operands > 1)
4866 {
4867 as_bad (_("too many memory references for `%s'"),
4868 mnemonic);
4869 return 0;
4870 }
4871
4872 if (intel_syntax)
4873 operand_ok =
4874 i386_intel_operand (token_start,
4875 intel_float_operand (mnemonic));
4876 else
4877 operand_ok = i386_att_operand (token_start);
4878
4879 RESTORE_END_STRING (l);
4880 if (!operand_ok)
4881 return NULL;
4882 }
4883 else
4884 {
4885 if (expecting_operand)
4886 {
4887 expecting_operand_after_comma:
4888 as_bad (_("expecting operand after ','; got nothing"));
4889 return NULL;
4890 }
4891 if (*l == ',')
4892 {
4893 as_bad (_("expecting operand before ','; got nothing"));
4894 return NULL;
4895 }
4896 }
4897
4898 /* Now *l must be either ',' or END_OF_INSN. */
4899 if (*l == ',')
4900 {
4901 if (*++l == END_OF_INSN)
4902 {
4903 /* Just skip it, if it's \n complain. */
4904 goto expecting_operand_after_comma;
4905 }
4906 expecting_operand = 1;
4907 }
4908 }
4909 return l;
4910 }
4911
4912 static void
4913 swap_2_operands (int xchg1, int xchg2)
4914 {
4915 union i386_op temp_op;
4916 i386_operand_type temp_type;
4917 unsigned int temp_flags;
4918 enum bfd_reloc_code_real temp_reloc;
4919
4920 temp_type = i.types[xchg2];
4921 i.types[xchg2] = i.types[xchg1];
4922 i.types[xchg1] = temp_type;
4923
4924 temp_flags = i.flags[xchg2];
4925 i.flags[xchg2] = i.flags[xchg1];
4926 i.flags[xchg1] = temp_flags;
4927
4928 temp_op = i.op[xchg2];
4929 i.op[xchg2] = i.op[xchg1];
4930 i.op[xchg1] = temp_op;
4931
4932 temp_reloc = i.reloc[xchg2];
4933 i.reloc[xchg2] = i.reloc[xchg1];
4934 i.reloc[xchg1] = temp_reloc;
4935
4936 if (i.mask)
4937 {
4938 if (i.mask->operand == xchg1)
4939 i.mask->operand = xchg2;
4940 else if (i.mask->operand == xchg2)
4941 i.mask->operand = xchg1;
4942 }
4943 if (i.broadcast)
4944 {
4945 if (i.broadcast->operand == xchg1)
4946 i.broadcast->operand = xchg2;
4947 else if (i.broadcast->operand == xchg2)
4948 i.broadcast->operand = xchg1;
4949 }
4950 if (i.rounding)
4951 {
4952 if (i.rounding->operand == xchg1)
4953 i.rounding->operand = xchg2;
4954 else if (i.rounding->operand == xchg2)
4955 i.rounding->operand = xchg1;
4956 }
4957 }
4958
4959 static void
4960 swap_operands (void)
4961 {
4962 switch (i.operands)
4963 {
4964 case 5:
4965 case 4:
4966 swap_2_operands (1, i.operands - 2);
4967 /* Fall through. */
4968 case 3:
4969 case 2:
4970 swap_2_operands (0, i.operands - 1);
4971 break;
4972 default:
4973 abort ();
4974 }
4975
4976 if (i.mem_operands == 2)
4977 {
4978 const seg_entry *temp_seg;
4979 temp_seg = i.seg[0];
4980 i.seg[0] = i.seg[1];
4981 i.seg[1] = temp_seg;
4982 }
4983 }
4984
4985 /* Try to ensure constant immediates are represented in the smallest
4986 opcode possible. */
4987 static void
4988 optimize_imm (void)
4989 {
4990 char guess_suffix = 0;
4991 int op;
4992
4993 if (i.suffix)
4994 guess_suffix = i.suffix;
4995 else if (i.reg_operands)
4996 {
4997 /* Figure out a suffix from the last register operand specified.
4998 We can't do this properly yet, ie. excluding InOutPortReg,
4999 but the following works for instructions with immediates.
5000 In any case, we can't set i.suffix yet. */
5001 for (op = i.operands; --op >= 0;)
5002 if (i.types[op].bitfield.reg && i.types[op].bitfield.byte)
5003 {
5004 guess_suffix = BYTE_MNEM_SUFFIX;
5005 break;
5006 }
5007 else if (i.types[op].bitfield.reg && i.types[op].bitfield.word)
5008 {
5009 guess_suffix = WORD_MNEM_SUFFIX;
5010 break;
5011 }
5012 else if (i.types[op].bitfield.reg && i.types[op].bitfield.dword)
5013 {
5014 guess_suffix = LONG_MNEM_SUFFIX;
5015 break;
5016 }
5017 else if (i.types[op].bitfield.reg && i.types[op].bitfield.qword)
5018 {
5019 guess_suffix = QWORD_MNEM_SUFFIX;
5020 break;
5021 }
5022 }
5023 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5024 guess_suffix = WORD_MNEM_SUFFIX;
5025
5026 for (op = i.operands; --op >= 0;)
5027 if (operand_type_check (i.types[op], imm))
5028 {
5029 switch (i.op[op].imms->X_op)
5030 {
5031 case O_constant:
5032 /* If a suffix is given, this operand may be shortened. */
5033 switch (guess_suffix)
5034 {
5035 case LONG_MNEM_SUFFIX:
5036 i.types[op].bitfield.imm32 = 1;
5037 i.types[op].bitfield.imm64 = 1;
5038 break;
5039 case WORD_MNEM_SUFFIX:
5040 i.types[op].bitfield.imm16 = 1;
5041 i.types[op].bitfield.imm32 = 1;
5042 i.types[op].bitfield.imm32s = 1;
5043 i.types[op].bitfield.imm64 = 1;
5044 break;
5045 case BYTE_MNEM_SUFFIX:
5046 i.types[op].bitfield.imm8 = 1;
5047 i.types[op].bitfield.imm8s = 1;
5048 i.types[op].bitfield.imm16 = 1;
5049 i.types[op].bitfield.imm32 = 1;
5050 i.types[op].bitfield.imm32s = 1;
5051 i.types[op].bitfield.imm64 = 1;
5052 break;
5053 }
5054
5055 /* If this operand is at most 16 bits, convert it
5056 to a signed 16 bit number before trying to see
5057 whether it will fit in an even smaller size.
5058 This allows a 16-bit operand such as $0xffe0 to
5059 be recognised as within Imm8S range. */
5060 if ((i.types[op].bitfield.imm16)
5061 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5062 {
5063 i.op[op].imms->X_add_number =
5064 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5065 }
5066 #ifdef BFD64
5067 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5068 if ((i.types[op].bitfield.imm32)
5069 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5070 == 0))
5071 {
5072 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5073 ^ ((offsetT) 1 << 31))
5074 - ((offsetT) 1 << 31));
5075 }
5076 #endif
5077 i.types[op]
5078 = operand_type_or (i.types[op],
5079 smallest_imm_type (i.op[op].imms->X_add_number));
5080
5081 /* We must avoid matching of Imm32 templates when 64bit
5082 only immediate is available. */
5083 if (guess_suffix == QWORD_MNEM_SUFFIX)
5084 i.types[op].bitfield.imm32 = 0;
5085 break;
5086
5087 case O_absent:
5088 case O_register:
5089 abort ();
5090
5091 /* Symbols and expressions. */
5092 default:
5093 /* Convert symbolic operand to proper sizes for matching, but don't
5094 prevent matching a set of insns that only supports sizes other
5095 than those matching the insn suffix. */
5096 {
5097 i386_operand_type mask, allowed;
5098 const insn_template *t;
5099
5100 operand_type_set (&mask, 0);
5101 operand_type_set (&allowed, 0);
5102
5103 for (t = current_templates->start;
5104 t < current_templates->end;
5105 ++t)
5106 allowed = operand_type_or (allowed,
5107 t->operand_types[op]);
5108 switch (guess_suffix)
5109 {
5110 case QWORD_MNEM_SUFFIX:
5111 mask.bitfield.imm64 = 1;
5112 mask.bitfield.imm32s = 1;
5113 break;
5114 case LONG_MNEM_SUFFIX:
5115 mask.bitfield.imm32 = 1;
5116 break;
5117 case WORD_MNEM_SUFFIX:
5118 mask.bitfield.imm16 = 1;
5119 break;
5120 case BYTE_MNEM_SUFFIX:
5121 mask.bitfield.imm8 = 1;
5122 break;
5123 default:
5124 break;
5125 }
5126 allowed = operand_type_and (mask, allowed);
5127 if (!operand_type_all_zero (&allowed))
5128 i.types[op] = operand_type_and (i.types[op], mask);
5129 }
5130 break;
5131 }
5132 }
5133 }
5134
5135 /* Try to use the smallest displacement type too. */
5136 static void
5137 optimize_disp (void)
5138 {
5139 int op;
5140
5141 for (op = i.operands; --op >= 0;)
5142 if (operand_type_check (i.types[op], disp))
5143 {
5144 if (i.op[op].disps->X_op == O_constant)
5145 {
5146 offsetT op_disp = i.op[op].disps->X_add_number;
5147
5148 if (i.types[op].bitfield.disp16
5149 && (op_disp & ~(offsetT) 0xffff) == 0)
5150 {
5151 /* If this operand is at most 16 bits, convert
5152 to a signed 16 bit number and don't use 64bit
5153 displacement. */
5154 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5155 i.types[op].bitfield.disp64 = 0;
5156 }
5157 #ifdef BFD64
5158 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5159 if (i.types[op].bitfield.disp32
5160 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5161 {
5162 /* If this operand is at most 32 bits, convert
5163 to a signed 32 bit number and don't use 64bit
5164 displacement. */
5165 op_disp &= (((offsetT) 2 << 31) - 1);
5166 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5167 i.types[op].bitfield.disp64 = 0;
5168 }
5169 #endif
5170 if (!op_disp && i.types[op].bitfield.baseindex)
5171 {
5172 i.types[op].bitfield.disp8 = 0;
5173 i.types[op].bitfield.disp16 = 0;
5174 i.types[op].bitfield.disp32 = 0;
5175 i.types[op].bitfield.disp32s = 0;
5176 i.types[op].bitfield.disp64 = 0;
5177 i.op[op].disps = 0;
5178 i.disp_operands--;
5179 }
5180 else if (flag_code == CODE_64BIT)
5181 {
5182 if (fits_in_signed_long (op_disp))
5183 {
5184 i.types[op].bitfield.disp64 = 0;
5185 i.types[op].bitfield.disp32s = 1;
5186 }
5187 if (i.prefix[ADDR_PREFIX]
5188 && fits_in_unsigned_long (op_disp))
5189 i.types[op].bitfield.disp32 = 1;
5190 }
5191 if ((i.types[op].bitfield.disp32
5192 || i.types[op].bitfield.disp32s
5193 || i.types[op].bitfield.disp16)
5194 && fits_in_disp8 (op_disp))
5195 i.types[op].bitfield.disp8 = 1;
5196 }
5197 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5198 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5199 {
5200 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5201 i.op[op].disps, 0, i.reloc[op]);
5202 i.types[op].bitfield.disp8 = 0;
5203 i.types[op].bitfield.disp16 = 0;
5204 i.types[op].bitfield.disp32 = 0;
5205 i.types[op].bitfield.disp32s = 0;
5206 i.types[op].bitfield.disp64 = 0;
5207 }
5208 else
5209 /* We only support 64bit displacement on constants. */
5210 i.types[op].bitfield.disp64 = 0;
5211 }
5212 }
5213
5214 /* Return 1 if there is a match in broadcast bytes between operand
5215 GIVEN and instruction template T. */
5216
5217 static INLINE int
5218 match_broadcast_size (const insn_template *t, unsigned int given)
5219 {
5220 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5221 && i.types[given].bitfield.byte)
5222 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5223 && i.types[given].bitfield.word)
5224 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5225 && i.types[given].bitfield.dword)
5226 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5227 && i.types[given].bitfield.qword));
5228 }
5229
5230 /* Check if operands are valid for the instruction. */
5231
5232 static int
5233 check_VecOperands (const insn_template *t)
5234 {
5235 unsigned int op;
5236 i386_cpu_flags cpu;
5237 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5238
5239 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5240 any one operand are implicity requiring AVX512VL support if the actual
5241 operand size is YMMword or XMMword. Since this function runs after
5242 template matching, there's no need to check for YMMword/XMMword in
5243 the template. */
5244 cpu = cpu_flags_and (t->cpu_flags, avx512);
5245 if (!cpu_flags_all_zero (&cpu)
5246 && !t->cpu_flags.bitfield.cpuavx512vl
5247 && !cpu_arch_flags.bitfield.cpuavx512vl)
5248 {
5249 for (op = 0; op < t->operands; ++op)
5250 {
5251 if (t->operand_types[op].bitfield.zmmword
5252 && (i.types[op].bitfield.ymmword
5253 || i.types[op].bitfield.xmmword))
5254 {
5255 i.error = unsupported;
5256 return 1;
5257 }
5258 }
5259 }
5260
5261 /* Without VSIB byte, we can't have a vector register for index. */
5262 if (!t->opcode_modifier.vecsib
5263 && i.index_reg
5264 && (i.index_reg->reg_type.bitfield.xmmword
5265 || i.index_reg->reg_type.bitfield.ymmword
5266 || i.index_reg->reg_type.bitfield.zmmword))
5267 {
5268 i.error = unsupported_vector_index_register;
5269 return 1;
5270 }
5271
5272 /* Check if default mask is allowed. */
5273 if (t->opcode_modifier.nodefmask
5274 && (!i.mask || i.mask->mask->reg_num == 0))
5275 {
5276 i.error = no_default_mask;
5277 return 1;
5278 }
5279
5280 /* For VSIB byte, we need a vector register for index, and all vector
5281 registers must be distinct. */
5282 if (t->opcode_modifier.vecsib)
5283 {
5284 if (!i.index_reg
5285 || !((t->opcode_modifier.vecsib == VecSIB128
5286 && i.index_reg->reg_type.bitfield.xmmword)
5287 || (t->opcode_modifier.vecsib == VecSIB256
5288 && i.index_reg->reg_type.bitfield.ymmword)
5289 || (t->opcode_modifier.vecsib == VecSIB512
5290 && i.index_reg->reg_type.bitfield.zmmword)))
5291 {
5292 i.error = invalid_vsib_address;
5293 return 1;
5294 }
5295
5296 gas_assert (i.reg_operands == 2 || i.mask);
5297 if (i.reg_operands == 2 && !i.mask)
5298 {
5299 gas_assert (i.types[0].bitfield.regsimd);
5300 gas_assert (i.types[0].bitfield.xmmword
5301 || i.types[0].bitfield.ymmword);
5302 gas_assert (i.types[2].bitfield.regsimd);
5303 gas_assert (i.types[2].bitfield.xmmword
5304 || i.types[2].bitfield.ymmword);
5305 if (operand_check == check_none)
5306 return 0;
5307 if (register_number (i.op[0].regs)
5308 != register_number (i.index_reg)
5309 && register_number (i.op[2].regs)
5310 != register_number (i.index_reg)
5311 && register_number (i.op[0].regs)
5312 != register_number (i.op[2].regs))
5313 return 0;
5314 if (operand_check == check_error)
5315 {
5316 i.error = invalid_vector_register_set;
5317 return 1;
5318 }
5319 as_warn (_("mask, index, and destination registers should be distinct"));
5320 }
5321 else if (i.reg_operands == 1 && i.mask)
5322 {
5323 if (i.types[1].bitfield.regsimd
5324 && (i.types[1].bitfield.xmmword
5325 || i.types[1].bitfield.ymmword
5326 || i.types[1].bitfield.zmmword)
5327 && (register_number (i.op[1].regs)
5328 == register_number (i.index_reg)))
5329 {
5330 if (operand_check == check_error)
5331 {
5332 i.error = invalid_vector_register_set;
5333 return 1;
5334 }
5335 if (operand_check != check_none)
5336 as_warn (_("index and destination registers should be distinct"));
5337 }
5338 }
5339 }
5340
5341 /* Check if broadcast is supported by the instruction and is applied
5342 to the memory operand. */
5343 if (i.broadcast)
5344 {
5345 i386_operand_type type, overlap;
5346
5347 /* Check if specified broadcast is supported in this instruction,
5348 and its broadcast bytes match the memory operand. */
5349 op = i.broadcast->operand;
5350 if (!t->opcode_modifier.broadcast
5351 || !(i.flags[op] & Operand_Mem)
5352 || (!i.types[op].bitfield.unspecified
5353 && !match_broadcast_size (t, op)))
5354 {
5355 bad_broadcast:
5356 i.error = unsupported_broadcast;
5357 return 1;
5358 }
5359
5360 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5361 * i.broadcast->type);
5362 operand_type_set (&type, 0);
5363 switch (i.broadcast->bytes)
5364 {
5365 case 2:
5366 type.bitfield.word = 1;
5367 break;
5368 case 4:
5369 type.bitfield.dword = 1;
5370 break;
5371 case 8:
5372 type.bitfield.qword = 1;
5373 break;
5374 case 16:
5375 type.bitfield.xmmword = 1;
5376 break;
5377 case 32:
5378 type.bitfield.ymmword = 1;
5379 break;
5380 case 64:
5381 type.bitfield.zmmword = 1;
5382 break;
5383 default:
5384 goto bad_broadcast;
5385 }
5386
5387 overlap = operand_type_and (type, t->operand_types[op]);
5388 if (operand_type_all_zero (&overlap))
5389 goto bad_broadcast;
5390
5391 if (t->opcode_modifier.checkregsize)
5392 {
5393 unsigned int j;
5394
5395 type.bitfield.baseindex = 1;
5396 for (j = 0; j < i.operands; ++j)
5397 {
5398 if (j != op
5399 && !operand_type_register_match(i.types[j],
5400 t->operand_types[j],
5401 type,
5402 t->operand_types[op]))
5403 goto bad_broadcast;
5404 }
5405 }
5406 }
5407 /* If broadcast is supported in this instruction, we need to check if
5408 operand of one-element size isn't specified without broadcast. */
5409 else if (t->opcode_modifier.broadcast && i.mem_operands)
5410 {
5411 /* Find memory operand. */
5412 for (op = 0; op < i.operands; op++)
5413 if (operand_type_check (i.types[op], anymem))
5414 break;
5415 gas_assert (op < i.operands);
5416 /* Check size of the memory operand. */
5417 if (match_broadcast_size (t, op))
5418 {
5419 i.error = broadcast_needed;
5420 return 1;
5421 }
5422 }
5423 else
5424 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5425
5426 /* Check if requested masking is supported. */
5427 if (i.mask)
5428 {
5429 switch (t->opcode_modifier.masking)
5430 {
5431 case BOTH_MASKING:
5432 break;
5433 case MERGING_MASKING:
5434 if (i.mask->zeroing)
5435 {
5436 case 0:
5437 i.error = unsupported_masking;
5438 return 1;
5439 }
5440 break;
5441 case DYNAMIC_MASKING:
5442 /* Memory destinations allow only merging masking. */
5443 if (i.mask->zeroing && i.mem_operands)
5444 {
5445 /* Find memory operand. */
5446 for (op = 0; op < i.operands; op++)
5447 if (i.flags[op] & Operand_Mem)
5448 break;
5449 gas_assert (op < i.operands);
5450 if (op == i.operands - 1)
5451 {
5452 i.error = unsupported_masking;
5453 return 1;
5454 }
5455 }
5456 break;
5457 default:
5458 abort ();
5459 }
5460 }
5461
5462 /* Check if masking is applied to dest operand. */
5463 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5464 {
5465 i.error = mask_not_on_destination;
5466 return 1;
5467 }
5468
5469 /* Check RC/SAE. */
5470 if (i.rounding)
5471 {
5472 if (!t->opcode_modifier.sae
5473 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5474 {
5475 i.error = unsupported_rc_sae;
5476 return 1;
5477 }
5478 /* If the instruction has several immediate operands and one of
5479 them is rounding, the rounding operand should be the last
5480 immediate operand. */
5481 if (i.imm_operands > 1
5482 && i.rounding->operand != (int) (i.imm_operands - 1))
5483 {
5484 i.error = rc_sae_operand_not_last_imm;
5485 return 1;
5486 }
5487 }
5488
5489 /* Check vector Disp8 operand. */
5490 if (t->opcode_modifier.disp8memshift
5491 && i.disp_encoding != disp_encoding_32bit)
5492 {
5493 if (i.broadcast)
5494 i.memshift = t->opcode_modifier.broadcast - 1;
5495 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5496 i.memshift = t->opcode_modifier.disp8memshift;
5497 else
5498 {
5499 const i386_operand_type *type = NULL;
5500
5501 i.memshift = 0;
5502 for (op = 0; op < i.operands; op++)
5503 if (operand_type_check (i.types[op], anymem))
5504 {
5505 if (t->opcode_modifier.evex == EVEXLIG)
5506 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5507 else if (t->operand_types[op].bitfield.xmmword
5508 + t->operand_types[op].bitfield.ymmword
5509 + t->operand_types[op].bitfield.zmmword <= 1)
5510 type = &t->operand_types[op];
5511 else if (!i.types[op].bitfield.unspecified)
5512 type = &i.types[op];
5513 }
5514 else if (i.types[op].bitfield.regsimd
5515 && t->opcode_modifier.evex != EVEXLIG)
5516 {
5517 if (i.types[op].bitfield.zmmword)
5518 i.memshift = 6;
5519 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5520 i.memshift = 5;
5521 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5522 i.memshift = 4;
5523 }
5524
5525 if (type)
5526 {
5527 if (type->bitfield.zmmword)
5528 i.memshift = 6;
5529 else if (type->bitfield.ymmword)
5530 i.memshift = 5;
5531 else if (type->bitfield.xmmword)
5532 i.memshift = 4;
5533 }
5534
5535 /* For the check in fits_in_disp8(). */
5536 if (i.memshift == 0)
5537 i.memshift = -1;
5538 }
5539
5540 for (op = 0; op < i.operands; op++)
5541 if (operand_type_check (i.types[op], disp)
5542 && i.op[op].disps->X_op == O_constant)
5543 {
5544 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5545 {
5546 i.types[op].bitfield.disp8 = 1;
5547 return 0;
5548 }
5549 i.types[op].bitfield.disp8 = 0;
5550 }
5551 }
5552
5553 i.memshift = 0;
5554
5555 return 0;
5556 }
5557
5558 /* Check if operands are valid for the instruction. Update VEX
5559 operand types. */
5560
5561 static int
5562 VEX_check_operands (const insn_template *t)
5563 {
5564 if (i.vec_encoding == vex_encoding_evex)
5565 {
5566 /* This instruction must be encoded with EVEX prefix. */
5567 if (!is_evex_encoding (t))
5568 {
5569 i.error = unsupported;
5570 return 1;
5571 }
5572 return 0;
5573 }
5574
5575 if (!t->opcode_modifier.vex)
5576 {
5577 /* This instruction template doesn't have VEX prefix. */
5578 if (i.vec_encoding != vex_encoding_default)
5579 {
5580 i.error = unsupported;
5581 return 1;
5582 }
5583 return 0;
5584 }
5585
5586 /* Only check VEX_Imm4, which must be the first operand. */
5587 if (t->operand_types[0].bitfield.vec_imm4)
5588 {
5589 if (i.op[0].imms->X_op != O_constant
5590 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5591 {
5592 i.error = bad_imm4;
5593 return 1;
5594 }
5595
5596 /* Turn off Imm8 so that update_imm won't complain. */
5597 i.types[0] = vec_imm4;
5598 }
5599
5600 return 0;
5601 }
5602
5603 static const insn_template *
5604 match_template (char mnem_suffix)
5605 {
5606 /* Points to template once we've found it. */
5607 const insn_template *t;
5608 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5609 i386_operand_type overlap4;
5610 unsigned int found_reverse_match;
5611 i386_opcode_modifier suffix_check, mnemsuf_check;
5612 i386_operand_type operand_types [MAX_OPERANDS];
5613 int addr_prefix_disp;
5614 unsigned int j;
5615 unsigned int found_cpu_match, size_match;
5616 unsigned int check_register;
5617 enum i386_error specific_error = 0;
5618
5619 #if MAX_OPERANDS != 5
5620 # error "MAX_OPERANDS must be 5."
5621 #endif
5622
5623 found_reverse_match = 0;
5624 addr_prefix_disp = -1;
5625
5626 memset (&suffix_check, 0, sizeof (suffix_check));
5627 if (intel_syntax && i.broadcast)
5628 /* nothing */;
5629 else if (i.suffix == BYTE_MNEM_SUFFIX)
5630 suffix_check.no_bsuf = 1;
5631 else if (i.suffix == WORD_MNEM_SUFFIX)
5632 suffix_check.no_wsuf = 1;
5633 else if (i.suffix == SHORT_MNEM_SUFFIX)
5634 suffix_check.no_ssuf = 1;
5635 else if (i.suffix == LONG_MNEM_SUFFIX)
5636 suffix_check.no_lsuf = 1;
5637 else if (i.suffix == QWORD_MNEM_SUFFIX)
5638 suffix_check.no_qsuf = 1;
5639 else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5640 suffix_check.no_ldsuf = 1;
5641
5642 memset (&mnemsuf_check, 0, sizeof (mnemsuf_check));
5643 if (intel_syntax)
5644 {
5645 switch (mnem_suffix)
5646 {
5647 case BYTE_MNEM_SUFFIX: mnemsuf_check.no_bsuf = 1; break;
5648 case WORD_MNEM_SUFFIX: mnemsuf_check.no_wsuf = 1; break;
5649 case SHORT_MNEM_SUFFIX: mnemsuf_check.no_ssuf = 1; break;
5650 case LONG_MNEM_SUFFIX: mnemsuf_check.no_lsuf = 1; break;
5651 case QWORD_MNEM_SUFFIX: mnemsuf_check.no_qsuf = 1; break;
5652 }
5653 }
5654
5655 /* Must have right number of operands. */
5656 i.error = number_of_operands_mismatch;
5657
5658 for (t = current_templates->start; t < current_templates->end; t++)
5659 {
5660 addr_prefix_disp = -1;
5661 found_reverse_match = 0;
5662
5663 if (i.operands != t->operands)
5664 continue;
5665
5666 /* Check processor support. */
5667 i.error = unsupported;
5668 found_cpu_match = (cpu_flags_match (t)
5669 == CPU_FLAGS_PERFECT_MATCH);
5670 if (!found_cpu_match)
5671 continue;
5672
5673 /* Check AT&T mnemonic. */
5674 i.error = unsupported_with_intel_mnemonic;
5675 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5676 continue;
5677
5678 /* Check AT&T/Intel syntax and Intel64/AMD64 ISA. */
5679 i.error = unsupported_syntax;
5680 if ((intel_syntax && t->opcode_modifier.attsyntax)
5681 || (!intel_syntax && t->opcode_modifier.intelsyntax)
5682 || (intel64 && t->opcode_modifier.amd64)
5683 || (!intel64 && t->opcode_modifier.intel64))
5684 continue;
5685
5686 /* Check the suffix, except for some instructions in intel mode. */
5687 i.error = invalid_instruction_suffix;
5688 if ((!intel_syntax || !t->opcode_modifier.ignoresize)
5689 && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5690 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5691 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5692 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5693 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5694 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
5695 continue;
5696 /* In Intel mode all mnemonic suffixes must be explicitly allowed. */
5697 if ((t->opcode_modifier.no_bsuf && mnemsuf_check.no_bsuf)
5698 || (t->opcode_modifier.no_wsuf && mnemsuf_check.no_wsuf)
5699 || (t->opcode_modifier.no_lsuf && mnemsuf_check.no_lsuf)
5700 || (t->opcode_modifier.no_ssuf && mnemsuf_check.no_ssuf)
5701 || (t->opcode_modifier.no_qsuf && mnemsuf_check.no_qsuf)
5702 || (t->opcode_modifier.no_ldsuf && mnemsuf_check.no_ldsuf))
5703 continue;
5704
5705 size_match = operand_size_match (t);
5706 if (!size_match)
5707 continue;
5708
5709 for (j = 0; j < MAX_OPERANDS; j++)
5710 operand_types[j] = t->operand_types[j];
5711
5712 /* In general, don't allow 64-bit operands in 32-bit mode. */
5713 if (i.suffix == QWORD_MNEM_SUFFIX
5714 && flag_code != CODE_64BIT
5715 && (intel_syntax
5716 ? (!t->opcode_modifier.ignoresize
5717 && !t->opcode_modifier.broadcast
5718 && !intel_float_operand (t->name))
5719 : intel_float_operand (t->name) != 2)
5720 && ((!operand_types[0].bitfield.regmmx
5721 && !operand_types[0].bitfield.regsimd)
5722 || (!operand_types[t->operands > 1].bitfield.regmmx
5723 && !operand_types[t->operands > 1].bitfield.regsimd))
5724 && (t->base_opcode != 0x0fc7
5725 || t->extension_opcode != 1 /* cmpxchg8b */))
5726 continue;
5727
5728 /* In general, don't allow 32-bit operands on pre-386. */
5729 else if (i.suffix == LONG_MNEM_SUFFIX
5730 && !cpu_arch_flags.bitfield.cpui386
5731 && (intel_syntax
5732 ? (!t->opcode_modifier.ignoresize
5733 && !intel_float_operand (t->name))
5734 : intel_float_operand (t->name) != 2)
5735 && ((!operand_types[0].bitfield.regmmx
5736 && !operand_types[0].bitfield.regsimd)
5737 || (!operand_types[t->operands > 1].bitfield.regmmx
5738 && !operand_types[t->operands > 1].bitfield.regsimd)))
5739 continue;
5740
5741 /* Do not verify operands when there are none. */
5742 else
5743 {
5744 if (!t->operands)
5745 /* We've found a match; break out of loop. */
5746 break;
5747 }
5748
5749 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
5750 into Disp32/Disp16/Disp32 operand. */
5751 if (i.prefix[ADDR_PREFIX] != 0)
5752 {
5753 /* There should be only one Disp operand. */
5754 switch (flag_code)
5755 {
5756 case CODE_16BIT:
5757 for (j = 0; j < MAX_OPERANDS; j++)
5758 {
5759 if (operand_types[j].bitfield.disp16)
5760 {
5761 addr_prefix_disp = j;
5762 operand_types[j].bitfield.disp32 = 1;
5763 operand_types[j].bitfield.disp16 = 0;
5764 break;
5765 }
5766 }
5767 break;
5768 case CODE_32BIT:
5769 for (j = 0; j < MAX_OPERANDS; j++)
5770 {
5771 if (operand_types[j].bitfield.disp32)
5772 {
5773 addr_prefix_disp = j;
5774 operand_types[j].bitfield.disp32 = 0;
5775 operand_types[j].bitfield.disp16 = 1;
5776 break;
5777 }
5778 }
5779 break;
5780 case CODE_64BIT:
5781 for (j = 0; j < MAX_OPERANDS; j++)
5782 {
5783 if (operand_types[j].bitfield.disp64)
5784 {
5785 addr_prefix_disp = j;
5786 operand_types[j].bitfield.disp64 = 0;
5787 operand_types[j].bitfield.disp32 = 1;
5788 break;
5789 }
5790 }
5791 break;
5792 }
5793 }
5794
5795 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5796 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5797 continue;
5798
5799 /* We check register size if needed. */
5800 if (t->opcode_modifier.checkregsize)
5801 {
5802 check_register = (1 << t->operands) - 1;
5803 if (i.broadcast)
5804 check_register &= ~(1 << i.broadcast->operand);
5805 }
5806 else
5807 check_register = 0;
5808
5809 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5810 switch (t->operands)
5811 {
5812 case 1:
5813 if (!operand_type_match (overlap0, i.types[0]))
5814 continue;
5815 break;
5816 case 2:
5817 /* xchg %eax, %eax is a special case. It is an alias for nop
5818 only in 32bit mode and we can use opcode 0x90. In 64bit
5819 mode, we can't use 0x90 for xchg %eax, %eax since it should
5820 zero-extend %eax to %rax. */
5821 if (flag_code == CODE_64BIT
5822 && t->base_opcode == 0x90
5823 && i.types[0].bitfield.acc && i.types[0].bitfield.dword
5824 && i.types[1].bitfield.acc && i.types[1].bitfield.dword)
5825 continue;
5826 /* xrelease mov %eax, <disp> is another special case. It must not
5827 match the accumulator-only encoding of mov. */
5828 if (flag_code != CODE_64BIT
5829 && i.hle_prefix
5830 && t->base_opcode == 0xa0
5831 && i.types[0].bitfield.acc
5832 && operand_type_check (i.types[1], anymem))
5833 continue;
5834 /* Fall through. */
5835
5836 case 3:
5837 if (!(size_match & MATCH_STRAIGHT))
5838 goto check_reverse;
5839 /* Reverse direction of operands if swapping is possible in the first
5840 place (operands need to be symmetric) and
5841 - the load form is requested, and the template is a store form,
5842 - the store form is requested, and the template is a load form,
5843 - the non-default (swapped) form is requested. */
5844 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5845 if (t->opcode_modifier.d && i.reg_operands == i.operands
5846 && !operand_type_all_zero (&overlap1))
5847 switch (i.dir_encoding)
5848 {
5849 case dir_encoding_load:
5850 if (operand_type_check (operand_types[i.operands - 1], anymem)
5851 || operand_types[i.operands - 1].bitfield.regmem)
5852 goto check_reverse;
5853 break;
5854
5855 case dir_encoding_store:
5856 if (!operand_type_check (operand_types[i.operands - 1], anymem)
5857 && !operand_types[i.operands - 1].bitfield.regmem)
5858 goto check_reverse;
5859 break;
5860
5861 case dir_encoding_swap:
5862 goto check_reverse;
5863
5864 case dir_encoding_default:
5865 break;
5866 }
5867 /* If we want store form, we skip the current load. */
5868 if ((i.dir_encoding == dir_encoding_store
5869 || i.dir_encoding == dir_encoding_swap)
5870 && i.mem_operands == 0
5871 && t->opcode_modifier.load)
5872 continue;
5873 /* Fall through. */
5874 case 4:
5875 case 5:
5876 overlap1 = operand_type_and (i.types[1], operand_types[1]);
5877 if (!operand_type_match (overlap0, i.types[0])
5878 || !operand_type_match (overlap1, i.types[1])
5879 || ((check_register & 3) == 3
5880 && !operand_type_register_match (i.types[0],
5881 operand_types[0],
5882 i.types[1],
5883 operand_types[1])))
5884 {
5885 /* Check if other direction is valid ... */
5886 if (!t->opcode_modifier.d)
5887 continue;
5888
5889 check_reverse:
5890 if (!(size_match & MATCH_REVERSE))
5891 continue;
5892 /* Try reversing direction of operands. */
5893 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
5894 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
5895 if (!operand_type_match (overlap0, i.types[0])
5896 || !operand_type_match (overlap1, i.types[i.operands - 1])
5897 || (check_register
5898 && !operand_type_register_match (i.types[0],
5899 operand_types[i.operands - 1],
5900 i.types[i.operands - 1],
5901 operand_types[0])))
5902 {
5903 /* Does not match either direction. */
5904 continue;
5905 }
5906 /* found_reverse_match holds which of D or FloatR
5907 we've found. */
5908 if (!t->opcode_modifier.d)
5909 found_reverse_match = 0;
5910 else if (operand_types[0].bitfield.tbyte)
5911 found_reverse_match = Opcode_FloatD;
5912 else if (operand_types[0].bitfield.xmmword
5913 || operand_types[i.operands - 1].bitfield.xmmword
5914 || operand_types[0].bitfield.regmmx
5915 || operand_types[i.operands - 1].bitfield.regmmx
5916 || is_any_vex_encoding(t))
5917 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
5918 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
5919 else
5920 found_reverse_match = Opcode_D;
5921 if (t->opcode_modifier.floatr)
5922 found_reverse_match |= Opcode_FloatR;
5923 }
5924 else
5925 {
5926 /* Found a forward 2 operand match here. */
5927 switch (t->operands)
5928 {
5929 case 5:
5930 overlap4 = operand_type_and (i.types[4],
5931 operand_types[4]);
5932 /* Fall through. */
5933 case 4:
5934 overlap3 = operand_type_and (i.types[3],
5935 operand_types[3]);
5936 /* Fall through. */
5937 case 3:
5938 overlap2 = operand_type_and (i.types[2],
5939 operand_types[2]);
5940 break;
5941 }
5942
5943 switch (t->operands)
5944 {
5945 case 5:
5946 if (!operand_type_match (overlap4, i.types[4])
5947 || !operand_type_register_match (i.types[3],
5948 operand_types[3],
5949 i.types[4],
5950 operand_types[4]))
5951 continue;
5952 /* Fall through. */
5953 case 4:
5954 if (!operand_type_match (overlap3, i.types[3])
5955 || ((check_register & 0xa) == 0xa
5956 && !operand_type_register_match (i.types[1],
5957 operand_types[1],
5958 i.types[3],
5959 operand_types[3]))
5960 || ((check_register & 0xc) == 0xc
5961 && !operand_type_register_match (i.types[2],
5962 operand_types[2],
5963 i.types[3],
5964 operand_types[3])))
5965 continue;
5966 /* Fall through. */
5967 case 3:
5968 /* Here we make use of the fact that there are no
5969 reverse match 3 operand instructions. */
5970 if (!operand_type_match (overlap2, i.types[2])
5971 || ((check_register & 5) == 5
5972 && !operand_type_register_match (i.types[0],
5973 operand_types[0],
5974 i.types[2],
5975 operand_types[2]))
5976 || ((check_register & 6) == 6
5977 && !operand_type_register_match (i.types[1],
5978 operand_types[1],
5979 i.types[2],
5980 operand_types[2])))
5981 continue;
5982 break;
5983 }
5984 }
5985 /* Found either forward/reverse 2, 3 or 4 operand match here:
5986 slip through to break. */
5987 }
5988 if (!found_cpu_match)
5989 continue;
5990
5991 /* Check if vector and VEX operands are valid. */
5992 if (check_VecOperands (t) || VEX_check_operands (t))
5993 {
5994 specific_error = i.error;
5995 continue;
5996 }
5997
5998 /* We've found a match; break out of loop. */
5999 break;
6000 }
6001
6002 if (t == current_templates->end)
6003 {
6004 /* We found no match. */
6005 const char *err_msg;
6006 switch (specific_error ? specific_error : i.error)
6007 {
6008 default:
6009 abort ();
6010 case operand_size_mismatch:
6011 err_msg = _("operand size mismatch");
6012 break;
6013 case operand_type_mismatch:
6014 err_msg = _("operand type mismatch");
6015 break;
6016 case register_type_mismatch:
6017 err_msg = _("register type mismatch");
6018 break;
6019 case number_of_operands_mismatch:
6020 err_msg = _("number of operands mismatch");
6021 break;
6022 case invalid_instruction_suffix:
6023 err_msg = _("invalid instruction suffix");
6024 break;
6025 case bad_imm4:
6026 err_msg = _("constant doesn't fit in 4 bits");
6027 break;
6028 case unsupported_with_intel_mnemonic:
6029 err_msg = _("unsupported with Intel mnemonic");
6030 break;
6031 case unsupported_syntax:
6032 err_msg = _("unsupported syntax");
6033 break;
6034 case unsupported:
6035 as_bad (_("unsupported instruction `%s'"),
6036 current_templates->start->name);
6037 return NULL;
6038 case invalid_vsib_address:
6039 err_msg = _("invalid VSIB address");
6040 break;
6041 case invalid_vector_register_set:
6042 err_msg = _("mask, index, and destination registers must be distinct");
6043 break;
6044 case unsupported_vector_index_register:
6045 err_msg = _("unsupported vector index register");
6046 break;
6047 case unsupported_broadcast:
6048 err_msg = _("unsupported broadcast");
6049 break;
6050 case broadcast_needed:
6051 err_msg = _("broadcast is needed for operand of such type");
6052 break;
6053 case unsupported_masking:
6054 err_msg = _("unsupported masking");
6055 break;
6056 case mask_not_on_destination:
6057 err_msg = _("mask not on destination operand");
6058 break;
6059 case no_default_mask:
6060 err_msg = _("default mask isn't allowed");
6061 break;
6062 case unsupported_rc_sae:
6063 err_msg = _("unsupported static rounding/sae");
6064 break;
6065 case rc_sae_operand_not_last_imm:
6066 if (intel_syntax)
6067 err_msg = _("RC/SAE operand must precede immediate operands");
6068 else
6069 err_msg = _("RC/SAE operand must follow immediate operands");
6070 break;
6071 case invalid_register_operand:
6072 err_msg = _("invalid register operand");
6073 break;
6074 }
6075 as_bad (_("%s for `%s'"), err_msg,
6076 current_templates->start->name);
6077 return NULL;
6078 }
6079
6080 if (!quiet_warnings)
6081 {
6082 if (!intel_syntax
6083 && (i.types[0].bitfield.jumpabsolute
6084 != operand_types[0].bitfield.jumpabsolute))
6085 {
6086 as_warn (_("indirect %s without `*'"), t->name);
6087 }
6088
6089 if (t->opcode_modifier.isprefix
6090 && t->opcode_modifier.ignoresize)
6091 {
6092 /* Warn them that a data or address size prefix doesn't
6093 affect assembly of the next line of code. */
6094 as_warn (_("stand-alone `%s' prefix"), t->name);
6095 }
6096 }
6097
6098 /* Copy the template we found. */
6099 i.tm = *t;
6100
6101 if (addr_prefix_disp != -1)
6102 i.tm.operand_types[addr_prefix_disp]
6103 = operand_types[addr_prefix_disp];
6104
6105 if (found_reverse_match)
6106 {
6107 /* If we found a reverse match we must alter the opcode
6108 direction bit. found_reverse_match holds bits to change
6109 (different for int & float insns). */
6110
6111 i.tm.base_opcode ^= found_reverse_match;
6112
6113 i.tm.operand_types[0] = operand_types[i.operands - 1];
6114 i.tm.operand_types[i.operands - 1] = operand_types[0];
6115 }
6116
6117 return t;
6118 }
6119
6120 static int
6121 check_string (void)
6122 {
6123 int mem_op = operand_type_check (i.types[0], anymem) ? 0 : 1;
6124 if (i.tm.operand_types[mem_op].bitfield.esseg)
6125 {
6126 if (i.seg[0] != NULL && i.seg[0] != &es)
6127 {
6128 as_bad (_("`%s' operand %d must use `%ses' segment"),
6129 i.tm.name,
6130 mem_op + 1,
6131 register_prefix);
6132 return 0;
6133 }
6134 /* There's only ever one segment override allowed per instruction.
6135 This instruction possibly has a legal segment override on the
6136 second operand, so copy the segment to where non-string
6137 instructions store it, allowing common code. */
6138 i.seg[0] = i.seg[1];
6139 }
6140 else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
6141 {
6142 if (i.seg[1] != NULL && i.seg[1] != &es)
6143 {
6144 as_bad (_("`%s' operand %d must use `%ses' segment"),
6145 i.tm.name,
6146 mem_op + 2,
6147 register_prefix);
6148 return 0;
6149 }
6150 }
6151 return 1;
6152 }
6153
6154 static int
6155 process_suffix (void)
6156 {
6157 /* If matched instruction specifies an explicit instruction mnemonic
6158 suffix, use it. */
6159 if (i.tm.opcode_modifier.size == SIZE16)
6160 i.suffix = WORD_MNEM_SUFFIX;
6161 else if (i.tm.opcode_modifier.size == SIZE32)
6162 i.suffix = LONG_MNEM_SUFFIX;
6163 else if (i.tm.opcode_modifier.size == SIZE64)
6164 i.suffix = QWORD_MNEM_SUFFIX;
6165 else if (i.reg_operands)
6166 {
6167 /* If there's no instruction mnemonic suffix we try to invent one
6168 based on register operands. */
6169 if (!i.suffix)
6170 {
6171 /* We take i.suffix from the last register operand specified,
6172 Destination register type is more significant than source
6173 register type. crc32 in SSE4.2 prefers source register
6174 type. */
6175 if (i.tm.base_opcode == 0xf20f38f0 && i.types[0].bitfield.reg)
6176 {
6177 if (i.types[0].bitfield.byte)
6178 i.suffix = BYTE_MNEM_SUFFIX;
6179 else if (i.types[0].bitfield.word)
6180 i.suffix = WORD_MNEM_SUFFIX;
6181 else if (i.types[0].bitfield.dword)
6182 i.suffix = LONG_MNEM_SUFFIX;
6183 else if (i.types[0].bitfield.qword)
6184 i.suffix = QWORD_MNEM_SUFFIX;
6185 }
6186
6187 if (!i.suffix)
6188 {
6189 int op;
6190
6191 if (i.tm.base_opcode == 0xf20f38f0)
6192 {
6193 /* We have to know the operand size for crc32. */
6194 as_bad (_("ambiguous memory operand size for `%s`"),
6195 i.tm.name);
6196 return 0;
6197 }
6198
6199 for (op = i.operands; --op >= 0;)
6200 if (!i.tm.operand_types[op].bitfield.inoutportreg
6201 && !i.tm.operand_types[op].bitfield.shiftcount)
6202 {
6203 if (!i.types[op].bitfield.reg)
6204 continue;
6205 if (i.types[op].bitfield.byte)
6206 i.suffix = BYTE_MNEM_SUFFIX;
6207 else if (i.types[op].bitfield.word)
6208 i.suffix = WORD_MNEM_SUFFIX;
6209 else if (i.types[op].bitfield.dword)
6210 i.suffix = LONG_MNEM_SUFFIX;
6211 else if (i.types[op].bitfield.qword)
6212 i.suffix = QWORD_MNEM_SUFFIX;
6213 else
6214 continue;
6215 break;
6216 }
6217 }
6218 }
6219 else if (i.suffix == BYTE_MNEM_SUFFIX)
6220 {
6221 if (intel_syntax
6222 && i.tm.opcode_modifier.ignoresize
6223 && i.tm.opcode_modifier.no_bsuf)
6224 i.suffix = 0;
6225 else if (!check_byte_reg ())
6226 return 0;
6227 }
6228 else if (i.suffix == LONG_MNEM_SUFFIX)
6229 {
6230 if (intel_syntax
6231 && i.tm.opcode_modifier.ignoresize
6232 && i.tm.opcode_modifier.no_lsuf
6233 && !i.tm.opcode_modifier.todword
6234 && !i.tm.opcode_modifier.toqword)
6235 i.suffix = 0;
6236 else if (!check_long_reg ())
6237 return 0;
6238 }
6239 else if (i.suffix == QWORD_MNEM_SUFFIX)
6240 {
6241 if (intel_syntax
6242 && i.tm.opcode_modifier.ignoresize
6243 && i.tm.opcode_modifier.no_qsuf
6244 && !i.tm.opcode_modifier.todword
6245 && !i.tm.opcode_modifier.toqword)
6246 i.suffix = 0;
6247 else if (!check_qword_reg ())
6248 return 0;
6249 }
6250 else if (i.suffix == WORD_MNEM_SUFFIX)
6251 {
6252 if (intel_syntax
6253 && i.tm.opcode_modifier.ignoresize
6254 && i.tm.opcode_modifier.no_wsuf)
6255 i.suffix = 0;
6256 else if (!check_word_reg ())
6257 return 0;
6258 }
6259 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6260 /* Do nothing if the instruction is going to ignore the prefix. */
6261 ;
6262 else
6263 abort ();
6264 }
6265 else if (i.tm.opcode_modifier.defaultsize
6266 && !i.suffix
6267 /* exclude fldenv/frstor/fsave/fstenv */
6268 && i.tm.opcode_modifier.no_ssuf)
6269 {
6270 if (stackop_size == LONG_MNEM_SUFFIX
6271 && i.tm.base_opcode == 0xcf)
6272 {
6273 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6274 .code16gcc directive to support 16-bit mode with
6275 32-bit address. For IRET without a suffix, generate
6276 16-bit IRET (opcode 0xcf) to return from an interrupt
6277 handler. */
6278 i.suffix = WORD_MNEM_SUFFIX;
6279 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6280 }
6281 else
6282 i.suffix = stackop_size;
6283 }
6284 else if (intel_syntax
6285 && !i.suffix
6286 && (i.tm.operand_types[0].bitfield.jumpabsolute
6287 || i.tm.opcode_modifier.jumpbyte
6288 || i.tm.opcode_modifier.jumpintersegment
6289 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6290 && i.tm.extension_opcode <= 3)))
6291 {
6292 switch (flag_code)
6293 {
6294 case CODE_64BIT:
6295 if (!i.tm.opcode_modifier.no_qsuf)
6296 {
6297 i.suffix = QWORD_MNEM_SUFFIX;
6298 break;
6299 }
6300 /* Fall through. */
6301 case CODE_32BIT:
6302 if (!i.tm.opcode_modifier.no_lsuf)
6303 i.suffix = LONG_MNEM_SUFFIX;
6304 break;
6305 case CODE_16BIT:
6306 if (!i.tm.opcode_modifier.no_wsuf)
6307 i.suffix = WORD_MNEM_SUFFIX;
6308 break;
6309 }
6310 }
6311
6312 if (!i.suffix)
6313 {
6314 if (!intel_syntax)
6315 {
6316 if (i.tm.opcode_modifier.w)
6317 {
6318 as_bad (_("no instruction mnemonic suffix given and "
6319 "no register operands; can't size instruction"));
6320 return 0;
6321 }
6322 }
6323 else
6324 {
6325 unsigned int suffixes;
6326
6327 suffixes = !i.tm.opcode_modifier.no_bsuf;
6328 if (!i.tm.opcode_modifier.no_wsuf)
6329 suffixes |= 1 << 1;
6330 if (!i.tm.opcode_modifier.no_lsuf)
6331 suffixes |= 1 << 2;
6332 if (!i.tm.opcode_modifier.no_ldsuf)
6333 suffixes |= 1 << 3;
6334 if (!i.tm.opcode_modifier.no_ssuf)
6335 suffixes |= 1 << 4;
6336 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6337 suffixes |= 1 << 5;
6338
6339 /* There are more than suffix matches. */
6340 if (i.tm.opcode_modifier.w
6341 || ((suffixes & (suffixes - 1))
6342 && !i.tm.opcode_modifier.defaultsize
6343 && !i.tm.opcode_modifier.ignoresize))
6344 {
6345 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6346 return 0;
6347 }
6348 }
6349 }
6350
6351 /* Change the opcode based on the operand size given by i.suffix. */
6352 switch (i.suffix)
6353 {
6354 /* Size floating point instruction. */
6355 case LONG_MNEM_SUFFIX:
6356 if (i.tm.opcode_modifier.floatmf)
6357 {
6358 i.tm.base_opcode ^= 4;
6359 break;
6360 }
6361 /* fall through */
6362 case WORD_MNEM_SUFFIX:
6363 case QWORD_MNEM_SUFFIX:
6364 /* It's not a byte, select word/dword operation. */
6365 if (i.tm.opcode_modifier.w)
6366 {
6367 if (i.tm.opcode_modifier.shortform)
6368 i.tm.base_opcode |= 8;
6369 else
6370 i.tm.base_opcode |= 1;
6371 }
6372 /* fall through */
6373 case SHORT_MNEM_SUFFIX:
6374 /* Now select between word & dword operations via the operand
6375 size prefix, except for instructions that will ignore this
6376 prefix anyway. */
6377 if (i.reg_operands > 0
6378 && i.types[0].bitfield.reg
6379 && i.tm.opcode_modifier.addrprefixopreg
6380 && (i.tm.opcode_modifier.immext
6381 || i.operands == 1))
6382 {
6383 /* The address size override prefix changes the size of the
6384 first operand. */
6385 if ((flag_code == CODE_32BIT
6386 && i.op[0].regs->reg_type.bitfield.word)
6387 || (flag_code != CODE_32BIT
6388 && i.op[0].regs->reg_type.bitfield.dword))
6389 if (!add_prefix (ADDR_PREFIX_OPCODE))
6390 return 0;
6391 }
6392 else if (i.suffix != QWORD_MNEM_SUFFIX
6393 && !i.tm.opcode_modifier.ignoresize
6394 && !i.tm.opcode_modifier.floatmf
6395 && !is_any_vex_encoding (&i.tm)
6396 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6397 || (flag_code == CODE_64BIT
6398 && i.tm.opcode_modifier.jumpbyte)))
6399 {
6400 unsigned int prefix = DATA_PREFIX_OPCODE;
6401
6402 if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
6403 prefix = ADDR_PREFIX_OPCODE;
6404
6405 if (!add_prefix (prefix))
6406 return 0;
6407 }
6408
6409 /* Set mode64 for an operand. */
6410 if (i.suffix == QWORD_MNEM_SUFFIX
6411 && flag_code == CODE_64BIT
6412 && !i.tm.opcode_modifier.norex64
6413 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6414 need rex64. */
6415 && ! (i.operands == 2
6416 && i.tm.base_opcode == 0x90
6417 && i.tm.extension_opcode == None
6418 && i.types[0].bitfield.acc && i.types[0].bitfield.qword
6419 && i.types[1].bitfield.acc && i.types[1].bitfield.qword))
6420 i.rex |= REX_W;
6421
6422 break;
6423 }
6424
6425 if (i.reg_operands != 0
6426 && i.operands > 1
6427 && i.tm.opcode_modifier.addrprefixopreg
6428 && !i.tm.opcode_modifier.immext)
6429 {
6430 /* Check invalid register operand when the address size override
6431 prefix changes the size of register operands. */
6432 unsigned int op;
6433 enum { need_word, need_dword, need_qword } need;
6434
6435 if (flag_code == CODE_32BIT)
6436 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6437 else
6438 {
6439 if (i.prefix[ADDR_PREFIX])
6440 need = need_dword;
6441 else
6442 need = flag_code == CODE_64BIT ? need_qword : need_word;
6443 }
6444
6445 for (op = 0; op < i.operands; op++)
6446 if (i.types[op].bitfield.reg
6447 && ((need == need_word
6448 && !i.op[op].regs->reg_type.bitfield.word)
6449 || (need == need_dword
6450 && !i.op[op].regs->reg_type.bitfield.dword)
6451 || (need == need_qword
6452 && !i.op[op].regs->reg_type.bitfield.qword)))
6453 {
6454 as_bad (_("invalid register operand size for `%s'"),
6455 i.tm.name);
6456 return 0;
6457 }
6458 }
6459
6460 return 1;
6461 }
6462
6463 static int
6464 check_byte_reg (void)
6465 {
6466 int op;
6467
6468 for (op = i.operands; --op >= 0;)
6469 {
6470 /* Skip non-register operands. */
6471 if (!i.types[op].bitfield.reg)
6472 continue;
6473
6474 /* If this is an eight bit register, it's OK. If it's the 16 or
6475 32 bit version of an eight bit register, we will just use the
6476 low portion, and that's OK too. */
6477 if (i.types[op].bitfield.byte)
6478 continue;
6479
6480 /* I/O port address operands are OK too. */
6481 if (i.tm.operand_types[op].bitfield.inoutportreg)
6482 continue;
6483
6484 /* crc32 doesn't generate this warning. */
6485 if (i.tm.base_opcode == 0xf20f38f0)
6486 continue;
6487
6488 if ((i.types[op].bitfield.word
6489 || i.types[op].bitfield.dword
6490 || i.types[op].bitfield.qword)
6491 && i.op[op].regs->reg_num < 4
6492 /* Prohibit these changes in 64bit mode, since the lowering
6493 would be more complicated. */
6494 && flag_code != CODE_64BIT)
6495 {
6496 #if REGISTER_WARNINGS
6497 if (!quiet_warnings)
6498 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6499 register_prefix,
6500 (i.op[op].regs + (i.types[op].bitfield.word
6501 ? REGNAM_AL - REGNAM_AX
6502 : REGNAM_AL - REGNAM_EAX))->reg_name,
6503 register_prefix,
6504 i.op[op].regs->reg_name,
6505 i.suffix);
6506 #endif
6507 continue;
6508 }
6509 /* Any other register is bad. */
6510 if (i.types[op].bitfield.reg
6511 || i.types[op].bitfield.regmmx
6512 || i.types[op].bitfield.regsimd
6513 || i.types[op].bitfield.sreg2
6514 || i.types[op].bitfield.sreg3
6515 || i.types[op].bitfield.control
6516 || i.types[op].bitfield.debug
6517 || i.types[op].bitfield.test)
6518 {
6519 as_bad (_("`%s%s' not allowed with `%s%c'"),
6520 register_prefix,
6521 i.op[op].regs->reg_name,
6522 i.tm.name,
6523 i.suffix);
6524 return 0;
6525 }
6526 }
6527 return 1;
6528 }
6529
6530 static int
6531 check_long_reg (void)
6532 {
6533 int op;
6534
6535 for (op = i.operands; --op >= 0;)
6536 /* Skip non-register operands. */
6537 if (!i.types[op].bitfield.reg)
6538 continue;
6539 /* Reject eight bit registers, except where the template requires
6540 them. (eg. movzb) */
6541 else if (i.types[op].bitfield.byte
6542 && (i.tm.operand_types[op].bitfield.reg
6543 || i.tm.operand_types[op].bitfield.acc)
6544 && (i.tm.operand_types[op].bitfield.word
6545 || i.tm.operand_types[op].bitfield.dword))
6546 {
6547 as_bad (_("`%s%s' not allowed with `%s%c'"),
6548 register_prefix,
6549 i.op[op].regs->reg_name,
6550 i.tm.name,
6551 i.suffix);
6552 return 0;
6553 }
6554 /* Warn if the e prefix on a general reg is missing. */
6555 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6556 && i.types[op].bitfield.word
6557 && (i.tm.operand_types[op].bitfield.reg
6558 || i.tm.operand_types[op].bitfield.acc)
6559 && i.tm.operand_types[op].bitfield.dword)
6560 {
6561 /* Prohibit these changes in the 64bit mode, since the
6562 lowering is more complicated. */
6563 if (flag_code == CODE_64BIT)
6564 {
6565 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6566 register_prefix, i.op[op].regs->reg_name,
6567 i.suffix);
6568 return 0;
6569 }
6570 #if REGISTER_WARNINGS
6571 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6572 register_prefix,
6573 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6574 register_prefix, i.op[op].regs->reg_name, i.suffix);
6575 #endif
6576 }
6577 /* Warn if the r prefix on a general reg is present. */
6578 else if (i.types[op].bitfield.qword
6579 && (i.tm.operand_types[op].bitfield.reg
6580 || i.tm.operand_types[op].bitfield.acc)
6581 && i.tm.operand_types[op].bitfield.dword)
6582 {
6583 if (intel_syntax
6584 && i.tm.opcode_modifier.toqword
6585 && !i.types[0].bitfield.regsimd)
6586 {
6587 /* Convert to QWORD. We want REX byte. */
6588 i.suffix = QWORD_MNEM_SUFFIX;
6589 }
6590 else
6591 {
6592 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6593 register_prefix, i.op[op].regs->reg_name,
6594 i.suffix);
6595 return 0;
6596 }
6597 }
6598 return 1;
6599 }
6600
6601 static int
6602 check_qword_reg (void)
6603 {
6604 int op;
6605
6606 for (op = i.operands; --op >= 0; )
6607 /* Skip non-register operands. */
6608 if (!i.types[op].bitfield.reg)
6609 continue;
6610 /* Reject eight bit registers, except where the template requires
6611 them. (eg. movzb) */
6612 else if (i.types[op].bitfield.byte
6613 && (i.tm.operand_types[op].bitfield.reg
6614 || i.tm.operand_types[op].bitfield.acc)
6615 && (i.tm.operand_types[op].bitfield.word
6616 || i.tm.operand_types[op].bitfield.dword))
6617 {
6618 as_bad (_("`%s%s' not allowed with `%s%c'"),
6619 register_prefix,
6620 i.op[op].regs->reg_name,
6621 i.tm.name,
6622 i.suffix);
6623 return 0;
6624 }
6625 /* Warn if the r prefix on a general reg is missing. */
6626 else if ((i.types[op].bitfield.word
6627 || i.types[op].bitfield.dword)
6628 && (i.tm.operand_types[op].bitfield.reg
6629 || i.tm.operand_types[op].bitfield.acc)
6630 && i.tm.operand_types[op].bitfield.qword)
6631 {
6632 /* Prohibit these changes in the 64bit mode, since the
6633 lowering is more complicated. */
6634 if (intel_syntax
6635 && i.tm.opcode_modifier.todword
6636 && !i.types[0].bitfield.regsimd)
6637 {
6638 /* Convert to DWORD. We don't want REX byte. */
6639 i.suffix = LONG_MNEM_SUFFIX;
6640 }
6641 else
6642 {
6643 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6644 register_prefix, i.op[op].regs->reg_name,
6645 i.suffix);
6646 return 0;
6647 }
6648 }
6649 return 1;
6650 }
6651
6652 static int
6653 check_word_reg (void)
6654 {
6655 int op;
6656 for (op = i.operands; --op >= 0;)
6657 /* Skip non-register operands. */
6658 if (!i.types[op].bitfield.reg)
6659 continue;
6660 /* Reject eight bit registers, except where the template requires
6661 them. (eg. movzb) */
6662 else if (i.types[op].bitfield.byte
6663 && (i.tm.operand_types[op].bitfield.reg
6664 || i.tm.operand_types[op].bitfield.acc)
6665 && (i.tm.operand_types[op].bitfield.word
6666 || i.tm.operand_types[op].bitfield.dword))
6667 {
6668 as_bad (_("`%s%s' not allowed with `%s%c'"),
6669 register_prefix,
6670 i.op[op].regs->reg_name,
6671 i.tm.name,
6672 i.suffix);
6673 return 0;
6674 }
6675 /* Warn if the e or r prefix on a general reg is present. */
6676 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6677 && (i.types[op].bitfield.dword
6678 || i.types[op].bitfield.qword)
6679 && (i.tm.operand_types[op].bitfield.reg
6680 || i.tm.operand_types[op].bitfield.acc)
6681 && i.tm.operand_types[op].bitfield.word)
6682 {
6683 /* Prohibit these changes in the 64bit mode, since the
6684 lowering is more complicated. */
6685 if (flag_code == CODE_64BIT)
6686 {
6687 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6688 register_prefix, i.op[op].regs->reg_name,
6689 i.suffix);
6690 return 0;
6691 }
6692 #if REGISTER_WARNINGS
6693 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6694 register_prefix,
6695 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6696 register_prefix, i.op[op].regs->reg_name, i.suffix);
6697 #endif
6698 }
6699 return 1;
6700 }
6701
6702 static int
6703 update_imm (unsigned int j)
6704 {
6705 i386_operand_type overlap = i.types[j];
6706 if ((overlap.bitfield.imm8
6707 || overlap.bitfield.imm8s
6708 || overlap.bitfield.imm16
6709 || overlap.bitfield.imm32
6710 || overlap.bitfield.imm32s
6711 || overlap.bitfield.imm64)
6712 && !operand_type_equal (&overlap, &imm8)
6713 && !operand_type_equal (&overlap, &imm8s)
6714 && !operand_type_equal (&overlap, &imm16)
6715 && !operand_type_equal (&overlap, &imm32)
6716 && !operand_type_equal (&overlap, &imm32s)
6717 && !operand_type_equal (&overlap, &imm64))
6718 {
6719 if (i.suffix)
6720 {
6721 i386_operand_type temp;
6722
6723 operand_type_set (&temp, 0);
6724 if (i.suffix == BYTE_MNEM_SUFFIX)
6725 {
6726 temp.bitfield.imm8 = overlap.bitfield.imm8;
6727 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6728 }
6729 else if (i.suffix == WORD_MNEM_SUFFIX)
6730 temp.bitfield.imm16 = overlap.bitfield.imm16;
6731 else if (i.suffix == QWORD_MNEM_SUFFIX)
6732 {
6733 temp.bitfield.imm64 = overlap.bitfield.imm64;
6734 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6735 }
6736 else
6737 temp.bitfield.imm32 = overlap.bitfield.imm32;
6738 overlap = temp;
6739 }
6740 else if (operand_type_equal (&overlap, &imm16_32_32s)
6741 || operand_type_equal (&overlap, &imm16_32)
6742 || operand_type_equal (&overlap, &imm16_32s))
6743 {
6744 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6745 overlap = imm16;
6746 else
6747 overlap = imm32s;
6748 }
6749 if (!operand_type_equal (&overlap, &imm8)
6750 && !operand_type_equal (&overlap, &imm8s)
6751 && !operand_type_equal (&overlap, &imm16)
6752 && !operand_type_equal (&overlap, &imm32)
6753 && !operand_type_equal (&overlap, &imm32s)
6754 && !operand_type_equal (&overlap, &imm64))
6755 {
6756 as_bad (_("no instruction mnemonic suffix given; "
6757 "can't determine immediate size"));
6758 return 0;
6759 }
6760 }
6761 i.types[j] = overlap;
6762
6763 return 1;
6764 }
6765
6766 static int
6767 finalize_imm (void)
6768 {
6769 unsigned int j, n;
6770
6771 /* Update the first 2 immediate operands. */
6772 n = i.operands > 2 ? 2 : i.operands;
6773 if (n)
6774 {
6775 for (j = 0; j < n; j++)
6776 if (update_imm (j) == 0)
6777 return 0;
6778
6779 /* The 3rd operand can't be immediate operand. */
6780 gas_assert (operand_type_check (i.types[2], imm) == 0);
6781 }
6782
6783 return 1;
6784 }
6785
6786 static int
6787 process_operands (void)
6788 {
6789 /* Default segment register this instruction will use for memory
6790 accesses. 0 means unknown. This is only for optimizing out
6791 unnecessary segment overrides. */
6792 const seg_entry *default_seg = 0;
6793
6794 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6795 {
6796 unsigned int dupl = i.operands;
6797 unsigned int dest = dupl - 1;
6798 unsigned int j;
6799
6800 /* The destination must be an xmm register. */
6801 gas_assert (i.reg_operands
6802 && MAX_OPERANDS > dupl
6803 && operand_type_equal (&i.types[dest], &regxmm));
6804
6805 if (i.tm.operand_types[0].bitfield.acc
6806 && i.tm.operand_types[0].bitfield.xmmword)
6807 {
6808 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6809 {
6810 /* Keep xmm0 for instructions with VEX prefix and 3
6811 sources. */
6812 i.tm.operand_types[0].bitfield.acc = 0;
6813 i.tm.operand_types[0].bitfield.regsimd = 1;
6814 goto duplicate;
6815 }
6816 else
6817 {
6818 /* We remove the first xmm0 and keep the number of
6819 operands unchanged, which in fact duplicates the
6820 destination. */
6821 for (j = 1; j < i.operands; j++)
6822 {
6823 i.op[j - 1] = i.op[j];
6824 i.types[j - 1] = i.types[j];
6825 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6826 }
6827 }
6828 }
6829 else if (i.tm.opcode_modifier.implicit1stxmm0)
6830 {
6831 gas_assert ((MAX_OPERANDS - 1) > dupl
6832 && (i.tm.opcode_modifier.vexsources
6833 == VEX3SOURCES));
6834
6835 /* Add the implicit xmm0 for instructions with VEX prefix
6836 and 3 sources. */
6837 for (j = i.operands; j > 0; j--)
6838 {
6839 i.op[j] = i.op[j - 1];
6840 i.types[j] = i.types[j - 1];
6841 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6842 }
6843 i.op[0].regs
6844 = (const reg_entry *) hash_find (reg_hash, "xmm0");
6845 i.types[0] = regxmm;
6846 i.tm.operand_types[0] = regxmm;
6847
6848 i.operands += 2;
6849 i.reg_operands += 2;
6850 i.tm.operands += 2;
6851
6852 dupl++;
6853 dest++;
6854 i.op[dupl] = i.op[dest];
6855 i.types[dupl] = i.types[dest];
6856 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6857 }
6858 else
6859 {
6860 duplicate:
6861 i.operands++;
6862 i.reg_operands++;
6863 i.tm.operands++;
6864
6865 i.op[dupl] = i.op[dest];
6866 i.types[dupl] = i.types[dest];
6867 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6868 }
6869
6870 if (i.tm.opcode_modifier.immext)
6871 process_immext ();
6872 }
6873 else if (i.tm.operand_types[0].bitfield.acc
6874 && i.tm.operand_types[0].bitfield.xmmword)
6875 {
6876 unsigned int j;
6877
6878 for (j = 1; j < i.operands; j++)
6879 {
6880 i.op[j - 1] = i.op[j];
6881 i.types[j - 1] = i.types[j];
6882
6883 /* We need to adjust fields in i.tm since they are used by
6884 build_modrm_byte. */
6885 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
6886 }
6887
6888 i.operands--;
6889 i.reg_operands--;
6890 i.tm.operands--;
6891 }
6892 else if (i.tm.opcode_modifier.implicitquadgroup)
6893 {
6894 unsigned int regnum, first_reg_in_group, last_reg_in_group;
6895
6896 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
6897 gas_assert (i.operands >= 2 && i.types[1].bitfield.regsimd);
6898 regnum = register_number (i.op[1].regs);
6899 first_reg_in_group = regnum & ~3;
6900 last_reg_in_group = first_reg_in_group + 3;
6901 if (regnum != first_reg_in_group)
6902 as_warn (_("source register `%s%s' implicitly denotes"
6903 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
6904 register_prefix, i.op[1].regs->reg_name,
6905 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
6906 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
6907 i.tm.name);
6908 }
6909 else if (i.tm.opcode_modifier.regkludge)
6910 {
6911 /* The imul $imm, %reg instruction is converted into
6912 imul $imm, %reg, %reg, and the clr %reg instruction
6913 is converted into xor %reg, %reg. */
6914
6915 unsigned int first_reg_op;
6916
6917 if (operand_type_check (i.types[0], reg))
6918 first_reg_op = 0;
6919 else
6920 first_reg_op = 1;
6921 /* Pretend we saw the extra register operand. */
6922 gas_assert (i.reg_operands == 1
6923 && i.op[first_reg_op + 1].regs == 0);
6924 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
6925 i.types[first_reg_op + 1] = i.types[first_reg_op];
6926 i.operands++;
6927 i.reg_operands++;
6928 }
6929
6930 if (i.tm.opcode_modifier.shortform)
6931 {
6932 if (i.types[0].bitfield.sreg2
6933 || i.types[0].bitfield.sreg3)
6934 {
6935 if (i.tm.base_opcode == POP_SEG_SHORT
6936 && i.op[0].regs->reg_num == 1)
6937 {
6938 as_bad (_("you can't `pop %scs'"), register_prefix);
6939 return 0;
6940 }
6941 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
6942 if ((i.op[0].regs->reg_flags & RegRex) != 0)
6943 i.rex |= REX_B;
6944 }
6945 else
6946 {
6947 /* The register or float register operand is in operand
6948 0 or 1. */
6949 unsigned int op;
6950
6951 if ((i.types[0].bitfield.reg && i.types[0].bitfield.tbyte)
6952 || operand_type_check (i.types[0], reg))
6953 op = 0;
6954 else
6955 op = 1;
6956 /* Register goes in low 3 bits of opcode. */
6957 i.tm.base_opcode |= i.op[op].regs->reg_num;
6958 if ((i.op[op].regs->reg_flags & RegRex) != 0)
6959 i.rex |= REX_B;
6960 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
6961 {
6962 /* Warn about some common errors, but press on regardless.
6963 The first case can be generated by gcc (<= 2.8.1). */
6964 if (i.operands == 2)
6965 {
6966 /* Reversed arguments on faddp, fsubp, etc. */
6967 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
6968 register_prefix, i.op[!intel_syntax].regs->reg_name,
6969 register_prefix, i.op[intel_syntax].regs->reg_name);
6970 }
6971 else
6972 {
6973 /* Extraneous `l' suffix on fp insn. */
6974 as_warn (_("translating to `%s %s%s'"), i.tm.name,
6975 register_prefix, i.op[0].regs->reg_name);
6976 }
6977 }
6978 }
6979 }
6980 else if (i.tm.opcode_modifier.modrm)
6981 {
6982 /* The opcode is completed (modulo i.tm.extension_opcode which
6983 must be put into the modrm byte). Now, we make the modrm and
6984 index base bytes based on all the info we've collected. */
6985
6986 default_seg = build_modrm_byte ();
6987 }
6988 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
6989 {
6990 default_seg = &ds;
6991 }
6992 else if (i.tm.opcode_modifier.isstring)
6993 {
6994 /* For the string instructions that allow a segment override
6995 on one of their operands, the default segment is ds. */
6996 default_seg = &ds;
6997 }
6998
6999 if (i.tm.base_opcode == 0x8d /* lea */
7000 && i.seg[0]
7001 && !quiet_warnings)
7002 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7003
7004 /* If a segment was explicitly specified, and the specified segment
7005 is not the default, use an opcode prefix to select it. If we
7006 never figured out what the default segment is, then default_seg
7007 will be zero at this point, and the specified segment prefix will
7008 always be used. */
7009 if ((i.seg[0]) && (i.seg[0] != default_seg))
7010 {
7011 if (!add_prefix (i.seg[0]->seg_prefix))
7012 return 0;
7013 }
7014 return 1;
7015 }
7016
7017 static const seg_entry *
7018 build_modrm_byte (void)
7019 {
7020 const seg_entry *default_seg = 0;
7021 unsigned int source, dest;
7022 int vex_3_sources;
7023
7024 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7025 if (vex_3_sources)
7026 {
7027 unsigned int nds, reg_slot;
7028 expressionS *exp;
7029
7030 dest = i.operands - 1;
7031 nds = dest - 1;
7032
7033 /* There are 2 kinds of instructions:
7034 1. 5 operands: 4 register operands or 3 register operands
7035 plus 1 memory operand plus one Vec_Imm4 operand, VexXDS, and
7036 VexW0 or VexW1. The destination must be either XMM, YMM or
7037 ZMM register.
7038 2. 4 operands: 4 register operands or 3 register operands
7039 plus 1 memory operand, with VexXDS. */
7040 gas_assert ((i.reg_operands == 4
7041 || (i.reg_operands == 3 && i.mem_operands == 1))
7042 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7043 && i.tm.opcode_modifier.vexw
7044 && i.tm.operand_types[dest].bitfield.regsimd);
7045
7046 /* If VexW1 is set, the first non-immediate operand is the source and
7047 the second non-immediate one is encoded in the immediate operand. */
7048 if (i.tm.opcode_modifier.vexw == VEXW1)
7049 {
7050 source = i.imm_operands;
7051 reg_slot = i.imm_operands + 1;
7052 }
7053 else
7054 {
7055 source = i.imm_operands + 1;
7056 reg_slot = i.imm_operands;
7057 }
7058
7059 if (i.imm_operands == 0)
7060 {
7061 /* When there is no immediate operand, generate an 8bit
7062 immediate operand to encode the first operand. */
7063 exp = &im_expressions[i.imm_operands++];
7064 i.op[i.operands].imms = exp;
7065 i.types[i.operands] = imm8;
7066 i.operands++;
7067
7068 gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
7069 exp->X_op = O_constant;
7070 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7071 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7072 }
7073 else
7074 {
7075 unsigned int imm_slot;
7076
7077 gas_assert (i.imm_operands == 1 && i.types[0].bitfield.vec_imm4);
7078
7079 if (i.tm.opcode_modifier.immext)
7080 {
7081 /* When ImmExt is set, the immediate byte is the last
7082 operand. */
7083 imm_slot = i.operands - 1;
7084 source--;
7085 reg_slot--;
7086 }
7087 else
7088 {
7089 imm_slot = 0;
7090
7091 /* Turn on Imm8 so that output_imm will generate it. */
7092 i.types[imm_slot].bitfield.imm8 = 1;
7093 }
7094
7095 gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
7096 i.op[imm_slot].imms->X_add_number
7097 |= register_number (i.op[reg_slot].regs) << 4;
7098 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7099 }
7100
7101 gas_assert (i.tm.operand_types[nds].bitfield.regsimd);
7102 i.vex.register_specifier = i.op[nds].regs;
7103 }
7104 else
7105 source = dest = 0;
7106
7107 /* i.reg_operands MUST be the number of real register operands;
7108 implicit registers do not count. If there are 3 register
7109 operands, it must be a instruction with VexNDS. For a
7110 instruction with VexNDD, the destination register is encoded
7111 in VEX prefix. If there are 4 register operands, it must be
7112 a instruction with VEX prefix and 3 sources. */
7113 if (i.mem_operands == 0
7114 && ((i.reg_operands == 2
7115 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7116 || (i.reg_operands == 3
7117 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7118 || (i.reg_operands == 4 && vex_3_sources)))
7119 {
7120 switch (i.operands)
7121 {
7122 case 2:
7123 source = 0;
7124 break;
7125 case 3:
7126 /* When there are 3 operands, one of them may be immediate,
7127 which may be the first or the last operand. Otherwise,
7128 the first operand must be shift count register (cl) or it
7129 is an instruction with VexNDS. */
7130 gas_assert (i.imm_operands == 1
7131 || (i.imm_operands == 0
7132 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7133 || i.types[0].bitfield.shiftcount)));
7134 if (operand_type_check (i.types[0], imm)
7135 || i.types[0].bitfield.shiftcount)
7136 source = 1;
7137 else
7138 source = 0;
7139 break;
7140 case 4:
7141 /* When there are 4 operands, the first two must be 8bit
7142 immediate operands. The source operand will be the 3rd
7143 one.
7144
7145 For instructions with VexNDS, if the first operand
7146 an imm8, the source operand is the 2nd one. If the last
7147 operand is imm8, the source operand is the first one. */
7148 gas_assert ((i.imm_operands == 2
7149 && i.types[0].bitfield.imm8
7150 && i.types[1].bitfield.imm8)
7151 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7152 && i.imm_operands == 1
7153 && (i.types[0].bitfield.imm8
7154 || i.types[i.operands - 1].bitfield.imm8
7155 || i.rounding)));
7156 if (i.imm_operands == 2)
7157 source = 2;
7158 else
7159 {
7160 if (i.types[0].bitfield.imm8)
7161 source = 1;
7162 else
7163 source = 0;
7164 }
7165 break;
7166 case 5:
7167 if (is_evex_encoding (&i.tm))
7168 {
7169 /* For EVEX instructions, when there are 5 operands, the
7170 first one must be immediate operand. If the second one
7171 is immediate operand, the source operand is the 3th
7172 one. If the last one is immediate operand, the source
7173 operand is the 2nd one. */
7174 gas_assert (i.imm_operands == 2
7175 && i.tm.opcode_modifier.sae
7176 && operand_type_check (i.types[0], imm));
7177 if (operand_type_check (i.types[1], imm))
7178 source = 2;
7179 else if (operand_type_check (i.types[4], imm))
7180 source = 1;
7181 else
7182 abort ();
7183 }
7184 break;
7185 default:
7186 abort ();
7187 }
7188
7189 if (!vex_3_sources)
7190 {
7191 dest = source + 1;
7192
7193 /* RC/SAE operand could be between DEST and SRC. That happens
7194 when one operand is GPR and the other one is XMM/YMM/ZMM
7195 register. */
7196 if (i.rounding && i.rounding->operand == (int) dest)
7197 dest++;
7198
7199 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7200 {
7201 /* For instructions with VexNDS, the register-only source
7202 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7203 register. It is encoded in VEX prefix. We need to
7204 clear RegMem bit before calling operand_type_equal. */
7205
7206 i386_operand_type op;
7207 unsigned int vvvv;
7208
7209 /* Check register-only source operand when two source
7210 operands are swapped. */
7211 if (!i.tm.operand_types[source].bitfield.baseindex
7212 && i.tm.operand_types[dest].bitfield.baseindex)
7213 {
7214 vvvv = source;
7215 source = dest;
7216 }
7217 else
7218 vvvv = dest;
7219
7220 op = i.tm.operand_types[vvvv];
7221 op.bitfield.regmem = 0;
7222 if ((dest + 1) >= i.operands
7223 || ((!op.bitfield.reg
7224 || (!op.bitfield.dword && !op.bitfield.qword))
7225 && !op.bitfield.regsimd
7226 && !operand_type_equal (&op, &regmask)))
7227 abort ();
7228 i.vex.register_specifier = i.op[vvvv].regs;
7229 dest++;
7230 }
7231 }
7232
7233 i.rm.mode = 3;
7234 /* One of the register operands will be encoded in the i.tm.reg
7235 field, the other in the combined i.tm.mode and i.tm.regmem
7236 fields. If no form of this instruction supports a memory
7237 destination operand, then we assume the source operand may
7238 sometimes be a memory operand and so we need to store the
7239 destination in the i.rm.reg field. */
7240 if (!i.tm.operand_types[dest].bitfield.regmem
7241 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7242 {
7243 i.rm.reg = i.op[dest].regs->reg_num;
7244 i.rm.regmem = i.op[source].regs->reg_num;
7245 if (i.op[dest].regs->reg_type.bitfield.regmmx
7246 || i.op[source].regs->reg_type.bitfield.regmmx)
7247 i.has_regmmx = TRUE;
7248 else if (i.op[dest].regs->reg_type.bitfield.regsimd
7249 || i.op[source].regs->reg_type.bitfield.regsimd)
7250 {
7251 if (i.types[dest].bitfield.zmmword
7252 || i.types[source].bitfield.zmmword)
7253 i.has_regzmm = TRUE;
7254 else if (i.types[dest].bitfield.ymmword
7255 || i.types[source].bitfield.ymmword)
7256 i.has_regymm = TRUE;
7257 else
7258 i.has_regxmm = TRUE;
7259 }
7260 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7261 i.rex |= REX_R;
7262 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7263 i.vrex |= REX_R;
7264 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7265 i.rex |= REX_B;
7266 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7267 i.vrex |= REX_B;
7268 }
7269 else
7270 {
7271 i.rm.reg = i.op[source].regs->reg_num;
7272 i.rm.regmem = i.op[dest].regs->reg_num;
7273 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7274 i.rex |= REX_B;
7275 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7276 i.vrex |= REX_B;
7277 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7278 i.rex |= REX_R;
7279 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7280 i.vrex |= REX_R;
7281 }
7282 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7283 {
7284 if (!i.types[i.tm.operand_types[0].bitfield.regmem].bitfield.control)
7285 abort ();
7286 i.rex &= ~REX_R;
7287 add_prefix (LOCK_PREFIX_OPCODE);
7288 }
7289 }
7290 else
7291 { /* If it's not 2 reg operands... */
7292 unsigned int mem;
7293
7294 if (i.mem_operands)
7295 {
7296 unsigned int fake_zero_displacement = 0;
7297 unsigned int op;
7298
7299 for (op = 0; op < i.operands; op++)
7300 if (operand_type_check (i.types[op], anymem))
7301 break;
7302 gas_assert (op < i.operands);
7303
7304 if (i.tm.opcode_modifier.vecsib)
7305 {
7306 if (i.index_reg->reg_num == RegIZ)
7307 abort ();
7308
7309 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7310 if (!i.base_reg)
7311 {
7312 i.sib.base = NO_BASE_REGISTER;
7313 i.sib.scale = i.log2_scale_factor;
7314 i.types[op].bitfield.disp8 = 0;
7315 i.types[op].bitfield.disp16 = 0;
7316 i.types[op].bitfield.disp64 = 0;
7317 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7318 {
7319 /* Must be 32 bit */
7320 i.types[op].bitfield.disp32 = 1;
7321 i.types[op].bitfield.disp32s = 0;
7322 }
7323 else
7324 {
7325 i.types[op].bitfield.disp32 = 0;
7326 i.types[op].bitfield.disp32s = 1;
7327 }
7328 }
7329 i.sib.index = i.index_reg->reg_num;
7330 if ((i.index_reg->reg_flags & RegRex) != 0)
7331 i.rex |= REX_X;
7332 if ((i.index_reg->reg_flags & RegVRex) != 0)
7333 i.vrex |= REX_X;
7334 }
7335
7336 default_seg = &ds;
7337
7338 if (i.base_reg == 0)
7339 {
7340 i.rm.mode = 0;
7341 if (!i.disp_operands)
7342 fake_zero_displacement = 1;
7343 if (i.index_reg == 0)
7344 {
7345 i386_operand_type newdisp;
7346
7347 gas_assert (!i.tm.opcode_modifier.vecsib);
7348 /* Operand is just <disp> */
7349 if (flag_code == CODE_64BIT)
7350 {
7351 /* 64bit mode overwrites the 32bit absolute
7352 addressing by RIP relative addressing and
7353 absolute addressing is encoded by one of the
7354 redundant SIB forms. */
7355 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7356 i.sib.base = NO_BASE_REGISTER;
7357 i.sib.index = NO_INDEX_REGISTER;
7358 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7359 }
7360 else if ((flag_code == CODE_16BIT)
7361 ^ (i.prefix[ADDR_PREFIX] != 0))
7362 {
7363 i.rm.regmem = NO_BASE_REGISTER_16;
7364 newdisp = disp16;
7365 }
7366 else
7367 {
7368 i.rm.regmem = NO_BASE_REGISTER;
7369 newdisp = disp32;
7370 }
7371 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7372 i.types[op] = operand_type_or (i.types[op], newdisp);
7373 }
7374 else if (!i.tm.opcode_modifier.vecsib)
7375 {
7376 /* !i.base_reg && i.index_reg */
7377 if (i.index_reg->reg_num == RegIZ)
7378 i.sib.index = NO_INDEX_REGISTER;
7379 else
7380 i.sib.index = i.index_reg->reg_num;
7381 i.sib.base = NO_BASE_REGISTER;
7382 i.sib.scale = i.log2_scale_factor;
7383 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7384 i.types[op].bitfield.disp8 = 0;
7385 i.types[op].bitfield.disp16 = 0;
7386 i.types[op].bitfield.disp64 = 0;
7387 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7388 {
7389 /* Must be 32 bit */
7390 i.types[op].bitfield.disp32 = 1;
7391 i.types[op].bitfield.disp32s = 0;
7392 }
7393 else
7394 {
7395 i.types[op].bitfield.disp32 = 0;
7396 i.types[op].bitfield.disp32s = 1;
7397 }
7398 if ((i.index_reg->reg_flags & RegRex) != 0)
7399 i.rex |= REX_X;
7400 }
7401 }
7402 /* RIP addressing for 64bit mode. */
7403 else if (i.base_reg->reg_num == RegIP)
7404 {
7405 gas_assert (!i.tm.opcode_modifier.vecsib);
7406 i.rm.regmem = NO_BASE_REGISTER;
7407 i.types[op].bitfield.disp8 = 0;
7408 i.types[op].bitfield.disp16 = 0;
7409 i.types[op].bitfield.disp32 = 0;
7410 i.types[op].bitfield.disp32s = 1;
7411 i.types[op].bitfield.disp64 = 0;
7412 i.flags[op] |= Operand_PCrel;
7413 if (! i.disp_operands)
7414 fake_zero_displacement = 1;
7415 }
7416 else if (i.base_reg->reg_type.bitfield.word)
7417 {
7418 gas_assert (!i.tm.opcode_modifier.vecsib);
7419 switch (i.base_reg->reg_num)
7420 {
7421 case 3: /* (%bx) */
7422 if (i.index_reg == 0)
7423 i.rm.regmem = 7;
7424 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7425 i.rm.regmem = i.index_reg->reg_num - 6;
7426 break;
7427 case 5: /* (%bp) */
7428 default_seg = &ss;
7429 if (i.index_reg == 0)
7430 {
7431 i.rm.regmem = 6;
7432 if (operand_type_check (i.types[op], disp) == 0)
7433 {
7434 /* fake (%bp) into 0(%bp) */
7435 i.types[op].bitfield.disp8 = 1;
7436 fake_zero_displacement = 1;
7437 }
7438 }
7439 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7440 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7441 break;
7442 default: /* (%si) -> 4 or (%di) -> 5 */
7443 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7444 }
7445 i.rm.mode = mode_from_disp_size (i.types[op]);
7446 }
7447 else /* i.base_reg and 32/64 bit mode */
7448 {
7449 if (flag_code == CODE_64BIT
7450 && operand_type_check (i.types[op], disp))
7451 {
7452 i.types[op].bitfield.disp16 = 0;
7453 i.types[op].bitfield.disp64 = 0;
7454 if (i.prefix[ADDR_PREFIX] == 0)
7455 {
7456 i.types[op].bitfield.disp32 = 0;
7457 i.types[op].bitfield.disp32s = 1;
7458 }
7459 else
7460 {
7461 i.types[op].bitfield.disp32 = 1;
7462 i.types[op].bitfield.disp32s = 0;
7463 }
7464 }
7465
7466 if (!i.tm.opcode_modifier.vecsib)
7467 i.rm.regmem = i.base_reg->reg_num;
7468 if ((i.base_reg->reg_flags & RegRex) != 0)
7469 i.rex |= REX_B;
7470 i.sib.base = i.base_reg->reg_num;
7471 /* x86-64 ignores REX prefix bit here to avoid decoder
7472 complications. */
7473 if (!(i.base_reg->reg_flags & RegRex)
7474 && (i.base_reg->reg_num == EBP_REG_NUM
7475 || i.base_reg->reg_num == ESP_REG_NUM))
7476 default_seg = &ss;
7477 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7478 {
7479 fake_zero_displacement = 1;
7480 i.types[op].bitfield.disp8 = 1;
7481 }
7482 i.sib.scale = i.log2_scale_factor;
7483 if (i.index_reg == 0)
7484 {
7485 gas_assert (!i.tm.opcode_modifier.vecsib);
7486 /* <disp>(%esp) becomes two byte modrm with no index
7487 register. We've already stored the code for esp
7488 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7489 Any base register besides %esp will not use the
7490 extra modrm byte. */
7491 i.sib.index = NO_INDEX_REGISTER;
7492 }
7493 else if (!i.tm.opcode_modifier.vecsib)
7494 {
7495 if (i.index_reg->reg_num == RegIZ)
7496 i.sib.index = NO_INDEX_REGISTER;
7497 else
7498 i.sib.index = i.index_reg->reg_num;
7499 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7500 if ((i.index_reg->reg_flags & RegRex) != 0)
7501 i.rex |= REX_X;
7502 }
7503
7504 if (i.disp_operands
7505 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7506 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7507 i.rm.mode = 0;
7508 else
7509 {
7510 if (!fake_zero_displacement
7511 && !i.disp_operands
7512 && i.disp_encoding)
7513 {
7514 fake_zero_displacement = 1;
7515 if (i.disp_encoding == disp_encoding_8bit)
7516 i.types[op].bitfield.disp8 = 1;
7517 else
7518 i.types[op].bitfield.disp32 = 1;
7519 }
7520 i.rm.mode = mode_from_disp_size (i.types[op]);
7521 }
7522 }
7523
7524 if (fake_zero_displacement)
7525 {
7526 /* Fakes a zero displacement assuming that i.types[op]
7527 holds the correct displacement size. */
7528 expressionS *exp;
7529
7530 gas_assert (i.op[op].disps == 0);
7531 exp = &disp_expressions[i.disp_operands++];
7532 i.op[op].disps = exp;
7533 exp->X_op = O_constant;
7534 exp->X_add_number = 0;
7535 exp->X_add_symbol = (symbolS *) 0;
7536 exp->X_op_symbol = (symbolS *) 0;
7537 }
7538
7539 mem = op;
7540 }
7541 else
7542 mem = ~0;
7543
7544 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7545 {
7546 if (operand_type_check (i.types[0], imm))
7547 i.vex.register_specifier = NULL;
7548 else
7549 {
7550 /* VEX.vvvv encodes one of the sources when the first
7551 operand is not an immediate. */
7552 if (i.tm.opcode_modifier.vexw == VEXW0)
7553 i.vex.register_specifier = i.op[0].regs;
7554 else
7555 i.vex.register_specifier = i.op[1].regs;
7556 }
7557
7558 /* Destination is a XMM register encoded in the ModRM.reg
7559 and VEX.R bit. */
7560 i.rm.reg = i.op[2].regs->reg_num;
7561 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7562 i.rex |= REX_R;
7563
7564 /* ModRM.rm and VEX.B encodes the other source. */
7565 if (!i.mem_operands)
7566 {
7567 i.rm.mode = 3;
7568
7569 if (i.tm.opcode_modifier.vexw == VEXW0)
7570 i.rm.regmem = i.op[1].regs->reg_num;
7571 else
7572 i.rm.regmem = i.op[0].regs->reg_num;
7573
7574 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7575 i.rex |= REX_B;
7576 }
7577 }
7578 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7579 {
7580 i.vex.register_specifier = i.op[2].regs;
7581 if (!i.mem_operands)
7582 {
7583 i.rm.mode = 3;
7584 i.rm.regmem = i.op[1].regs->reg_num;
7585 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7586 i.rex |= REX_B;
7587 }
7588 }
7589 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7590 (if any) based on i.tm.extension_opcode. Again, we must be
7591 careful to make sure that segment/control/debug/test/MMX
7592 registers are coded into the i.rm.reg field. */
7593 else if (i.reg_operands)
7594 {
7595 unsigned int op;
7596 unsigned int vex_reg = ~0;
7597
7598 for (op = 0; op < i.operands; op++)
7599 {
7600 if (i.types[op].bitfield.reg
7601 || i.types[op].bitfield.regbnd
7602 || i.types[op].bitfield.regmask
7603 || i.types[op].bitfield.sreg2
7604 || i.types[op].bitfield.sreg3
7605 || i.types[op].bitfield.control
7606 || i.types[op].bitfield.debug
7607 || i.types[op].bitfield.test)
7608 break;
7609 if (i.types[op].bitfield.regsimd)
7610 {
7611 if (i.types[op].bitfield.zmmword)
7612 i.has_regzmm = TRUE;
7613 else if (i.types[op].bitfield.ymmword)
7614 i.has_regymm = TRUE;
7615 else
7616 i.has_regxmm = TRUE;
7617 break;
7618 }
7619 if (i.types[op].bitfield.regmmx)
7620 {
7621 i.has_regmmx = TRUE;
7622 break;
7623 }
7624 }
7625
7626 if (vex_3_sources)
7627 op = dest;
7628 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7629 {
7630 /* For instructions with VexNDS, the register-only
7631 source operand is encoded in VEX prefix. */
7632 gas_assert (mem != (unsigned int) ~0);
7633
7634 if (op > mem)
7635 {
7636 vex_reg = op++;
7637 gas_assert (op < i.operands);
7638 }
7639 else
7640 {
7641 /* Check register-only source operand when two source
7642 operands are swapped. */
7643 if (!i.tm.operand_types[op].bitfield.baseindex
7644 && i.tm.operand_types[op + 1].bitfield.baseindex)
7645 {
7646 vex_reg = op;
7647 op += 2;
7648 gas_assert (mem == (vex_reg + 1)
7649 && op < i.operands);
7650 }
7651 else
7652 {
7653 vex_reg = op + 1;
7654 gas_assert (vex_reg < i.operands);
7655 }
7656 }
7657 }
7658 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7659 {
7660 /* For instructions with VexNDD, the register destination
7661 is encoded in VEX prefix. */
7662 if (i.mem_operands == 0)
7663 {
7664 /* There is no memory operand. */
7665 gas_assert ((op + 2) == i.operands);
7666 vex_reg = op + 1;
7667 }
7668 else
7669 {
7670 /* There are only 2 non-immediate operands. */
7671 gas_assert (op < i.imm_operands + 2
7672 && i.operands == i.imm_operands + 2);
7673 vex_reg = i.imm_operands + 1;
7674 }
7675 }
7676 else
7677 gas_assert (op < i.operands);
7678
7679 if (vex_reg != (unsigned int) ~0)
7680 {
7681 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7682
7683 if ((!type->bitfield.reg
7684 || (!type->bitfield.dword && !type->bitfield.qword))
7685 && !type->bitfield.regsimd
7686 && !operand_type_equal (type, &regmask))
7687 abort ();
7688
7689 i.vex.register_specifier = i.op[vex_reg].regs;
7690 }
7691
7692 /* Don't set OP operand twice. */
7693 if (vex_reg != op)
7694 {
7695 /* If there is an extension opcode to put here, the
7696 register number must be put into the regmem field. */
7697 if (i.tm.extension_opcode != None)
7698 {
7699 i.rm.regmem = i.op[op].regs->reg_num;
7700 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7701 i.rex |= REX_B;
7702 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7703 i.vrex |= REX_B;
7704 }
7705 else
7706 {
7707 i.rm.reg = i.op[op].regs->reg_num;
7708 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7709 i.rex |= REX_R;
7710 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7711 i.vrex |= REX_R;
7712 }
7713 }
7714
7715 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7716 must set it to 3 to indicate this is a register operand
7717 in the regmem field. */
7718 if (!i.mem_operands)
7719 i.rm.mode = 3;
7720 }
7721
7722 /* Fill in i.rm.reg field with extension opcode (if any). */
7723 if (i.tm.extension_opcode != None)
7724 i.rm.reg = i.tm.extension_opcode;
7725 }
7726 return default_seg;
7727 }
7728
7729 static void
7730 output_branch (void)
7731 {
7732 char *p;
7733 int size;
7734 int code16;
7735 int prefix;
7736 relax_substateT subtype;
7737 symbolS *sym;
7738 offsetT off;
7739
7740 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7741 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7742
7743 prefix = 0;
7744 if (i.prefix[DATA_PREFIX] != 0)
7745 {
7746 prefix = 1;
7747 i.prefixes -= 1;
7748 code16 ^= CODE16;
7749 }
7750 /* Pentium4 branch hints. */
7751 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7752 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7753 {
7754 prefix++;
7755 i.prefixes--;
7756 }
7757 if (i.prefix[REX_PREFIX] != 0)
7758 {
7759 prefix++;
7760 i.prefixes--;
7761 }
7762
7763 /* BND prefixed jump. */
7764 if (i.prefix[BND_PREFIX] != 0)
7765 {
7766 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7767 i.prefixes -= 1;
7768 }
7769
7770 if (i.prefixes != 0 && !intel_syntax)
7771 as_warn (_("skipping prefixes on this instruction"));
7772
7773 /* It's always a symbol; End frag & setup for relax.
7774 Make sure there is enough room in this frag for the largest
7775 instruction we may generate in md_convert_frag. This is 2
7776 bytes for the opcode and room for the prefix and largest
7777 displacement. */
7778 frag_grow (prefix + 2 + 4);
7779 /* Prefix and 1 opcode byte go in fr_fix. */
7780 p = frag_more (prefix + 1);
7781 if (i.prefix[DATA_PREFIX] != 0)
7782 *p++ = DATA_PREFIX_OPCODE;
7783 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7784 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7785 *p++ = i.prefix[SEG_PREFIX];
7786 if (i.prefix[REX_PREFIX] != 0)
7787 *p++ = i.prefix[REX_PREFIX];
7788 *p = i.tm.base_opcode;
7789
7790 if ((unsigned char) *p == JUMP_PC_RELATIVE)
7791 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7792 else if (cpu_arch_flags.bitfield.cpui386)
7793 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7794 else
7795 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7796 subtype |= code16;
7797
7798 sym = i.op[0].disps->X_add_symbol;
7799 off = i.op[0].disps->X_add_number;
7800
7801 if (i.op[0].disps->X_op != O_constant
7802 && i.op[0].disps->X_op != O_symbol)
7803 {
7804 /* Handle complex expressions. */
7805 sym = make_expr_symbol (i.op[0].disps);
7806 off = 0;
7807 }
7808
7809 /* 1 possible extra opcode + 4 byte displacement go in var part.
7810 Pass reloc in fr_var. */
7811 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7812 }
7813
7814 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7815 /* Return TRUE iff PLT32 relocation should be used for branching to
7816 symbol S. */
7817
7818 static bfd_boolean
7819 need_plt32_p (symbolS *s)
7820 {
7821 /* PLT32 relocation is ELF only. */
7822 if (!IS_ELF)
7823 return FALSE;
7824
7825 #ifdef TE_SOLARIS
7826 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
7827 krtld support it. */
7828 return FALSE;
7829 #endif
7830
7831 /* Since there is no need to prepare for PLT branch on x86-64, we
7832 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7833 be used as a marker for 32-bit PC-relative branches. */
7834 if (!object_64bit)
7835 return FALSE;
7836
7837 /* Weak or undefined symbol need PLT32 relocation. */
7838 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7839 return TRUE;
7840
7841 /* Non-global symbol doesn't need PLT32 relocation. */
7842 if (! S_IS_EXTERNAL (s))
7843 return FALSE;
7844
7845 /* Other global symbols need PLT32 relocation. NB: Symbol with
7846 non-default visibilities are treated as normal global symbol
7847 so that PLT32 relocation can be used as a marker for 32-bit
7848 PC-relative branches. It is useful for linker relaxation. */
7849 return TRUE;
7850 }
7851 #endif
7852
7853 static void
7854 output_jump (void)
7855 {
7856 char *p;
7857 int size;
7858 fixS *fixP;
7859 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
7860
7861 if (i.tm.opcode_modifier.jumpbyte)
7862 {
7863 /* This is a loop or jecxz type instruction. */
7864 size = 1;
7865 if (i.prefix[ADDR_PREFIX] != 0)
7866 {
7867 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
7868 i.prefixes -= 1;
7869 }
7870 /* Pentium4 branch hints. */
7871 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7872 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7873 {
7874 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
7875 i.prefixes--;
7876 }
7877 }
7878 else
7879 {
7880 int code16;
7881
7882 code16 = 0;
7883 if (flag_code == CODE_16BIT)
7884 code16 = CODE16;
7885
7886 if (i.prefix[DATA_PREFIX] != 0)
7887 {
7888 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
7889 i.prefixes -= 1;
7890 code16 ^= CODE16;
7891 }
7892
7893 size = 4;
7894 if (code16)
7895 size = 2;
7896 }
7897
7898 if (i.prefix[REX_PREFIX] != 0)
7899 {
7900 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7901 i.prefixes -= 1;
7902 }
7903
7904 /* BND prefixed jump. */
7905 if (i.prefix[BND_PREFIX] != 0)
7906 {
7907 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7908 i.prefixes -= 1;
7909 }
7910
7911 if (i.prefixes != 0 && !intel_syntax)
7912 as_warn (_("skipping prefixes on this instruction"));
7913
7914 p = frag_more (i.tm.opcode_length + size);
7915 switch (i.tm.opcode_length)
7916 {
7917 case 2:
7918 *p++ = i.tm.base_opcode >> 8;
7919 /* Fall through. */
7920 case 1:
7921 *p++ = i.tm.base_opcode;
7922 break;
7923 default:
7924 abort ();
7925 }
7926
7927 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7928 if (size == 4
7929 && jump_reloc == NO_RELOC
7930 && need_plt32_p (i.op[0].disps->X_add_symbol))
7931 jump_reloc = BFD_RELOC_X86_64_PLT32;
7932 #endif
7933
7934 jump_reloc = reloc (size, 1, 1, jump_reloc);
7935
7936 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7937 i.op[0].disps, 1, jump_reloc);
7938
7939 /* All jumps handled here are signed, but don't use a signed limit
7940 check for 32 and 16 bit jumps as we want to allow wrap around at
7941 4G and 64k respectively. */
7942 if (size == 1)
7943 fixP->fx_signed = 1;
7944 }
7945
7946 static void
7947 output_interseg_jump (void)
7948 {
7949 char *p;
7950 int size;
7951 int prefix;
7952 int code16;
7953
7954 code16 = 0;
7955 if (flag_code == CODE_16BIT)
7956 code16 = CODE16;
7957
7958 prefix = 0;
7959 if (i.prefix[DATA_PREFIX] != 0)
7960 {
7961 prefix = 1;
7962 i.prefixes -= 1;
7963 code16 ^= CODE16;
7964 }
7965 if (i.prefix[REX_PREFIX] != 0)
7966 {
7967 prefix++;
7968 i.prefixes -= 1;
7969 }
7970
7971 size = 4;
7972 if (code16)
7973 size = 2;
7974
7975 if (i.prefixes != 0 && !intel_syntax)
7976 as_warn (_("skipping prefixes on this instruction"));
7977
7978 /* 1 opcode; 2 segment; offset */
7979 p = frag_more (prefix + 1 + 2 + size);
7980
7981 if (i.prefix[DATA_PREFIX] != 0)
7982 *p++ = DATA_PREFIX_OPCODE;
7983
7984 if (i.prefix[REX_PREFIX] != 0)
7985 *p++ = i.prefix[REX_PREFIX];
7986
7987 *p++ = i.tm.base_opcode;
7988 if (i.op[1].imms->X_op == O_constant)
7989 {
7990 offsetT n = i.op[1].imms->X_add_number;
7991
7992 if (size == 2
7993 && !fits_in_unsigned_word (n)
7994 && !fits_in_signed_word (n))
7995 {
7996 as_bad (_("16-bit jump out of range"));
7997 return;
7998 }
7999 md_number_to_chars (p, n, size);
8000 }
8001 else
8002 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8003 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8004 if (i.op[0].imms->X_op != O_constant)
8005 as_bad (_("can't handle non absolute segment in `%s'"),
8006 i.tm.name);
8007 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8008 }
8009
8010 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8011 void
8012 x86_cleanup (void)
8013 {
8014 char *p;
8015 asection *seg = now_seg;
8016 subsegT subseg = now_subseg;
8017 asection *sec;
8018 unsigned int alignment, align_size_1;
8019 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8020 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8021 unsigned int padding;
8022
8023 if (!IS_ELF || !x86_used_note)
8024 return;
8025
8026 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8027
8028 /* The .note.gnu.property section layout:
8029
8030 Field Length Contents
8031 ---- ---- ----
8032 n_namsz 4 4
8033 n_descsz 4 The note descriptor size
8034 n_type 4 NT_GNU_PROPERTY_TYPE_0
8035 n_name 4 "GNU"
8036 n_desc n_descsz The program property array
8037 .... .... ....
8038 */
8039
8040 /* Create the .note.gnu.property section. */
8041 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8042 bfd_set_section_flags (stdoutput, sec,
8043 (SEC_ALLOC
8044 | SEC_LOAD
8045 | SEC_DATA
8046 | SEC_HAS_CONTENTS
8047 | SEC_READONLY));
8048
8049 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8050 {
8051 align_size_1 = 7;
8052 alignment = 3;
8053 }
8054 else
8055 {
8056 align_size_1 = 3;
8057 alignment = 2;
8058 }
8059
8060 bfd_set_section_alignment (stdoutput, sec, alignment);
8061 elf_section_type (sec) = SHT_NOTE;
8062
8063 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8064 + 4-byte data */
8065 isa_1_descsz_raw = 4 + 4 + 4;
8066 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8067 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8068
8069 feature_2_descsz_raw = isa_1_descsz;
8070 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8071 + 4-byte data */
8072 feature_2_descsz_raw += 4 + 4 + 4;
8073 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8074 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8075 & ~align_size_1);
8076
8077 descsz = feature_2_descsz;
8078 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8079 p = frag_more (4 + 4 + 4 + 4 + descsz);
8080
8081 /* Write n_namsz. */
8082 md_number_to_chars (p, (valueT) 4, 4);
8083
8084 /* Write n_descsz. */
8085 md_number_to_chars (p + 4, (valueT) descsz, 4);
8086
8087 /* Write n_type. */
8088 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8089
8090 /* Write n_name. */
8091 memcpy (p + 4 * 3, "GNU", 4);
8092
8093 /* Write 4-byte type. */
8094 md_number_to_chars (p + 4 * 4,
8095 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8096
8097 /* Write 4-byte data size. */
8098 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8099
8100 /* Write 4-byte data. */
8101 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8102
8103 /* Zero out paddings. */
8104 padding = isa_1_descsz - isa_1_descsz_raw;
8105 if (padding)
8106 memset (p + 4 * 7, 0, padding);
8107
8108 /* Write 4-byte type. */
8109 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8110 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8111
8112 /* Write 4-byte data size. */
8113 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8114
8115 /* Write 4-byte data. */
8116 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8117 (valueT) x86_feature_2_used, 4);
8118
8119 /* Zero out paddings. */
8120 padding = feature_2_descsz - feature_2_descsz_raw;
8121 if (padding)
8122 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8123
8124 /* We probably can't restore the current segment, for there likely
8125 isn't one yet... */
8126 if (seg && subseg)
8127 subseg_set (seg, subseg);
8128 }
8129 #endif
8130
8131 static unsigned int
8132 encoding_length (const fragS *start_frag, offsetT start_off,
8133 const char *frag_now_ptr)
8134 {
8135 unsigned int len = 0;
8136
8137 if (start_frag != frag_now)
8138 {
8139 const fragS *fr = start_frag;
8140
8141 do {
8142 len += fr->fr_fix;
8143 fr = fr->fr_next;
8144 } while (fr && fr != frag_now);
8145 }
8146
8147 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8148 }
8149
8150 static void
8151 output_insn (void)
8152 {
8153 fragS *insn_start_frag;
8154 offsetT insn_start_off;
8155
8156 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8157 if (IS_ELF && x86_used_note)
8158 {
8159 if (i.tm.cpu_flags.bitfield.cpucmov)
8160 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8161 if (i.tm.cpu_flags.bitfield.cpusse)
8162 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8163 if (i.tm.cpu_flags.bitfield.cpusse2)
8164 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8165 if (i.tm.cpu_flags.bitfield.cpusse3)
8166 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8167 if (i.tm.cpu_flags.bitfield.cpussse3)
8168 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8169 if (i.tm.cpu_flags.bitfield.cpusse4_1)
8170 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8171 if (i.tm.cpu_flags.bitfield.cpusse4_2)
8172 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8173 if (i.tm.cpu_flags.bitfield.cpuavx)
8174 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8175 if (i.tm.cpu_flags.bitfield.cpuavx2)
8176 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8177 if (i.tm.cpu_flags.bitfield.cpufma)
8178 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8179 if (i.tm.cpu_flags.bitfield.cpuavx512f)
8180 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8181 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8182 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8183 if (i.tm.cpu_flags.bitfield.cpuavx512er)
8184 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8185 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8186 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8187 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8188 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8189 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8190 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8191 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8192 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8193 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8194 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8195 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8196 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8197 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8198 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8199 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8200 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8201 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8202 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8203 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8204 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8205 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8206 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8207 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8208 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8209
8210 if (i.tm.cpu_flags.bitfield.cpu8087
8211 || i.tm.cpu_flags.bitfield.cpu287
8212 || i.tm.cpu_flags.bitfield.cpu387
8213 || i.tm.cpu_flags.bitfield.cpu687
8214 || i.tm.cpu_flags.bitfield.cpufisttp)
8215 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8216 /* Don't set GNU_PROPERTY_X86_FEATURE_2_MMX for prefetchtXXX nor
8217 Xfence instructions. */
8218 if (i.tm.base_opcode != 0xf18
8219 && i.tm.base_opcode != 0xf0d
8220 && i.tm.base_opcode != 0xfae
8221 && (i.has_regmmx
8222 || i.tm.cpu_flags.bitfield.cpummx
8223 || i.tm.cpu_flags.bitfield.cpua3dnow
8224 || i.tm.cpu_flags.bitfield.cpua3dnowa))
8225 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8226 if (i.has_regxmm)
8227 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8228 if (i.has_regymm)
8229 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8230 if (i.has_regzmm)
8231 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8232 if (i.tm.cpu_flags.bitfield.cpufxsr)
8233 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8234 if (i.tm.cpu_flags.bitfield.cpuxsave)
8235 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8236 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8237 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8238 if (i.tm.cpu_flags.bitfield.cpuxsavec)
8239 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8240 }
8241 #endif
8242
8243 /* Tie dwarf2 debug info to the address at the start of the insn.
8244 We can't do this after the insn has been output as the current
8245 frag may have been closed off. eg. by frag_var. */
8246 dwarf2_emit_insn (0);
8247
8248 insn_start_frag = frag_now;
8249 insn_start_off = frag_now_fix ();
8250
8251 /* Output jumps. */
8252 if (i.tm.opcode_modifier.jump)
8253 output_branch ();
8254 else if (i.tm.opcode_modifier.jumpbyte
8255 || i.tm.opcode_modifier.jumpdword)
8256 output_jump ();
8257 else if (i.tm.opcode_modifier.jumpintersegment)
8258 output_interseg_jump ();
8259 else
8260 {
8261 /* Output normal instructions here. */
8262 char *p;
8263 unsigned char *q;
8264 unsigned int j;
8265 unsigned int prefix;
8266
8267 if (avoid_fence
8268 && i.tm.base_opcode == 0xfae
8269 && i.operands == 1
8270 && i.imm_operands == 1
8271 && (i.op[0].imms->X_add_number == 0xe8
8272 || i.op[0].imms->X_add_number == 0xf0
8273 || i.op[0].imms->X_add_number == 0xf8))
8274 {
8275 /* Encode lfence, mfence, and sfence as
8276 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
8277 offsetT val = 0x240483f0ULL;
8278 p = frag_more (5);
8279 md_number_to_chars (p, val, 5);
8280 return;
8281 }
8282
8283 /* Some processors fail on LOCK prefix. This options makes
8284 assembler ignore LOCK prefix and serves as a workaround. */
8285 if (omit_lock_prefix)
8286 {
8287 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8288 return;
8289 i.prefix[LOCK_PREFIX] = 0;
8290 }
8291
8292 /* Since the VEX/EVEX prefix contains the implicit prefix, we
8293 don't need the explicit prefix. */
8294 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8295 {
8296 switch (i.tm.opcode_length)
8297 {
8298 case 3:
8299 if (i.tm.base_opcode & 0xff000000)
8300 {
8301 prefix = (i.tm.base_opcode >> 24) & 0xff;
8302 add_prefix (prefix);
8303 }
8304 break;
8305 case 2:
8306 if ((i.tm.base_opcode & 0xff0000) != 0)
8307 {
8308 prefix = (i.tm.base_opcode >> 16) & 0xff;
8309 if (!i.tm.cpu_flags.bitfield.cpupadlock
8310 || prefix != REPE_PREFIX_OPCODE
8311 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8312 add_prefix (prefix);
8313 }
8314 break;
8315 case 1:
8316 break;
8317 case 0:
8318 /* Check for pseudo prefixes. */
8319 as_bad_where (insn_start_frag->fr_file,
8320 insn_start_frag->fr_line,
8321 _("pseudo prefix without instruction"));
8322 return;
8323 default:
8324 abort ();
8325 }
8326
8327 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8328 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8329 R_X86_64_GOTTPOFF relocation so that linker can safely
8330 perform IE->LE optimization. */
8331 if (x86_elf_abi == X86_64_X32_ABI
8332 && i.operands == 2
8333 && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8334 && i.prefix[REX_PREFIX] == 0)
8335 add_prefix (REX_OPCODE);
8336 #endif
8337
8338 /* The prefix bytes. */
8339 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8340 if (*q)
8341 FRAG_APPEND_1_CHAR (*q);
8342 }
8343 else
8344 {
8345 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8346 if (*q)
8347 switch (j)
8348 {
8349 case REX_PREFIX:
8350 /* REX byte is encoded in VEX prefix. */
8351 break;
8352 case SEG_PREFIX:
8353 case ADDR_PREFIX:
8354 FRAG_APPEND_1_CHAR (*q);
8355 break;
8356 default:
8357 /* There should be no other prefixes for instructions
8358 with VEX prefix. */
8359 abort ();
8360 }
8361
8362 /* For EVEX instructions i.vrex should become 0 after
8363 build_evex_prefix. For VEX instructions upper 16 registers
8364 aren't available, so VREX should be 0. */
8365 if (i.vrex)
8366 abort ();
8367 /* Now the VEX prefix. */
8368 p = frag_more (i.vex.length);
8369 for (j = 0; j < i.vex.length; j++)
8370 p[j] = i.vex.bytes[j];
8371 }
8372
8373 /* Now the opcode; be careful about word order here! */
8374 if (i.tm.opcode_length == 1)
8375 {
8376 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8377 }
8378 else
8379 {
8380 switch (i.tm.opcode_length)
8381 {
8382 case 4:
8383 p = frag_more (4);
8384 *p++ = (i.tm.base_opcode >> 24) & 0xff;
8385 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8386 break;
8387 case 3:
8388 p = frag_more (3);
8389 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8390 break;
8391 case 2:
8392 p = frag_more (2);
8393 break;
8394 default:
8395 abort ();
8396 break;
8397 }
8398
8399 /* Put out high byte first: can't use md_number_to_chars! */
8400 *p++ = (i.tm.base_opcode >> 8) & 0xff;
8401 *p = i.tm.base_opcode & 0xff;
8402 }
8403
8404 /* Now the modrm byte and sib byte (if present). */
8405 if (i.tm.opcode_modifier.modrm)
8406 {
8407 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8408 | i.rm.reg << 3
8409 | i.rm.mode << 6));
8410 /* If i.rm.regmem == ESP (4)
8411 && i.rm.mode != (Register mode)
8412 && not 16 bit
8413 ==> need second modrm byte. */
8414 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8415 && i.rm.mode != 3
8416 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8417 FRAG_APPEND_1_CHAR ((i.sib.base << 0
8418 | i.sib.index << 3
8419 | i.sib.scale << 6));
8420 }
8421
8422 if (i.disp_operands)
8423 output_disp (insn_start_frag, insn_start_off);
8424
8425 if (i.imm_operands)
8426 output_imm (insn_start_frag, insn_start_off);
8427
8428 /*
8429 * frag_now_fix () returning plain abs_section_offset when we're in the
8430 * absolute section, and abs_section_offset not getting updated as data
8431 * gets added to the frag breaks the logic below.
8432 */
8433 if (now_seg != absolute_section)
8434 {
8435 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8436 if (j > 15)
8437 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8438 j);
8439 }
8440 }
8441
8442 #ifdef DEBUG386
8443 if (flag_debug)
8444 {
8445 pi ("" /*line*/, &i);
8446 }
8447 #endif /* DEBUG386 */
8448 }
8449
8450 /* Return the size of the displacement operand N. */
8451
8452 static int
8453 disp_size (unsigned int n)
8454 {
8455 int size = 4;
8456
8457 if (i.types[n].bitfield.disp64)
8458 size = 8;
8459 else if (i.types[n].bitfield.disp8)
8460 size = 1;
8461 else if (i.types[n].bitfield.disp16)
8462 size = 2;
8463 return size;
8464 }
8465
8466 /* Return the size of the immediate operand N. */
8467
8468 static int
8469 imm_size (unsigned int n)
8470 {
8471 int size = 4;
8472 if (i.types[n].bitfield.imm64)
8473 size = 8;
8474 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8475 size = 1;
8476 else if (i.types[n].bitfield.imm16)
8477 size = 2;
8478 return size;
8479 }
8480
8481 static void
8482 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8483 {
8484 char *p;
8485 unsigned int n;
8486
8487 for (n = 0; n < i.operands; n++)
8488 {
8489 if (operand_type_check (i.types[n], disp))
8490 {
8491 if (i.op[n].disps->X_op == O_constant)
8492 {
8493 int size = disp_size (n);
8494 offsetT val = i.op[n].disps->X_add_number;
8495
8496 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8497 size);
8498 p = frag_more (size);
8499 md_number_to_chars (p, val, size);
8500 }
8501 else
8502 {
8503 enum bfd_reloc_code_real reloc_type;
8504 int size = disp_size (n);
8505 int sign = i.types[n].bitfield.disp32s;
8506 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8507 fixS *fixP;
8508
8509 /* We can't have 8 bit displacement here. */
8510 gas_assert (!i.types[n].bitfield.disp8);
8511
8512 /* The PC relative address is computed relative
8513 to the instruction boundary, so in case immediate
8514 fields follows, we need to adjust the value. */
8515 if (pcrel && i.imm_operands)
8516 {
8517 unsigned int n1;
8518 int sz = 0;
8519
8520 for (n1 = 0; n1 < i.operands; n1++)
8521 if (operand_type_check (i.types[n1], imm))
8522 {
8523 /* Only one immediate is allowed for PC
8524 relative address. */
8525 gas_assert (sz == 0);
8526 sz = imm_size (n1);
8527 i.op[n].disps->X_add_number -= sz;
8528 }
8529 /* We should find the immediate. */
8530 gas_assert (sz != 0);
8531 }
8532
8533 p = frag_more (size);
8534 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
8535 if (GOT_symbol
8536 && GOT_symbol == i.op[n].disps->X_add_symbol
8537 && (((reloc_type == BFD_RELOC_32
8538 || reloc_type == BFD_RELOC_X86_64_32S
8539 || (reloc_type == BFD_RELOC_64
8540 && object_64bit))
8541 && (i.op[n].disps->X_op == O_symbol
8542 || (i.op[n].disps->X_op == O_add
8543 && ((symbol_get_value_expression
8544 (i.op[n].disps->X_op_symbol)->X_op)
8545 == O_subtract))))
8546 || reloc_type == BFD_RELOC_32_PCREL))
8547 {
8548 if (!object_64bit)
8549 {
8550 reloc_type = BFD_RELOC_386_GOTPC;
8551 i.op[n].imms->X_add_number +=
8552 encoding_length (insn_start_frag, insn_start_off, p);
8553 }
8554 else if (reloc_type == BFD_RELOC_64)
8555 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8556 else
8557 /* Don't do the adjustment for x86-64, as there
8558 the pcrel addressing is relative to the _next_
8559 insn, and that is taken care of in other code. */
8560 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8561 }
8562 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
8563 size, i.op[n].disps, pcrel,
8564 reloc_type);
8565 /* Check for "call/jmp *mem", "mov mem, %reg",
8566 "test %reg, mem" and "binop mem, %reg" where binop
8567 is one of adc, add, and, cmp, or, sbb, sub, xor
8568 instructions without data prefix. Always generate
8569 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
8570 if (i.prefix[DATA_PREFIX] == 0
8571 && (generate_relax_relocations
8572 || (!object_64bit
8573 && i.rm.mode == 0
8574 && i.rm.regmem == 5))
8575 && (i.rm.mode == 2
8576 || (i.rm.mode == 0 && i.rm.regmem == 5))
8577 && ((i.operands == 1
8578 && i.tm.base_opcode == 0xff
8579 && (i.rm.reg == 2 || i.rm.reg == 4))
8580 || (i.operands == 2
8581 && (i.tm.base_opcode == 0x8b
8582 || i.tm.base_opcode == 0x85
8583 || (i.tm.base_opcode & 0xc7) == 0x03))))
8584 {
8585 if (object_64bit)
8586 {
8587 fixP->fx_tcbit = i.rex != 0;
8588 if (i.base_reg
8589 && (i.base_reg->reg_num == RegIP))
8590 fixP->fx_tcbit2 = 1;
8591 }
8592 else
8593 fixP->fx_tcbit2 = 1;
8594 }
8595 }
8596 }
8597 }
8598 }
8599
8600 static void
8601 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
8602 {
8603 char *p;
8604 unsigned int n;
8605
8606 for (n = 0; n < i.operands; n++)
8607 {
8608 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
8609 if (i.rounding && (int) n == i.rounding->operand)
8610 continue;
8611
8612 if (operand_type_check (i.types[n], imm))
8613 {
8614 if (i.op[n].imms->X_op == O_constant)
8615 {
8616 int size = imm_size (n);
8617 offsetT val;
8618
8619 val = offset_in_range (i.op[n].imms->X_add_number,
8620 size);
8621 p = frag_more (size);
8622 md_number_to_chars (p, val, size);
8623 }
8624 else
8625 {
8626 /* Not absolute_section.
8627 Need a 32-bit fixup (don't support 8bit
8628 non-absolute imms). Try to support other
8629 sizes ... */
8630 enum bfd_reloc_code_real reloc_type;
8631 int size = imm_size (n);
8632 int sign;
8633
8634 if (i.types[n].bitfield.imm32s
8635 && (i.suffix == QWORD_MNEM_SUFFIX
8636 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
8637 sign = 1;
8638 else
8639 sign = 0;
8640
8641 p = frag_more (size);
8642 reloc_type = reloc (size, 0, sign, i.reloc[n]);
8643
8644 /* This is tough to explain. We end up with this one if we
8645 * have operands that look like
8646 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
8647 * obtain the absolute address of the GOT, and it is strongly
8648 * preferable from a performance point of view to avoid using
8649 * a runtime relocation for this. The actual sequence of
8650 * instructions often look something like:
8651 *
8652 * call .L66
8653 * .L66:
8654 * popl %ebx
8655 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
8656 *
8657 * The call and pop essentially return the absolute address
8658 * of the label .L66 and store it in %ebx. The linker itself
8659 * will ultimately change the first operand of the addl so
8660 * that %ebx points to the GOT, but to keep things simple, the
8661 * .o file must have this operand set so that it generates not
8662 * the absolute address of .L66, but the absolute address of
8663 * itself. This allows the linker itself simply treat a GOTPC
8664 * relocation as asking for a pcrel offset to the GOT to be
8665 * added in, and the addend of the relocation is stored in the
8666 * operand field for the instruction itself.
8667 *
8668 * Our job here is to fix the operand so that it would add
8669 * the correct offset so that %ebx would point to itself. The
8670 * thing that is tricky is that .-.L66 will point to the
8671 * beginning of the instruction, so we need to further modify
8672 * the operand so that it will point to itself. There are
8673 * other cases where you have something like:
8674 *
8675 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
8676 *
8677 * and here no correction would be required. Internally in
8678 * the assembler we treat operands of this form as not being
8679 * pcrel since the '.' is explicitly mentioned, and I wonder
8680 * whether it would simplify matters to do it this way. Who
8681 * knows. In earlier versions of the PIC patches, the
8682 * pcrel_adjust field was used to store the correction, but
8683 * since the expression is not pcrel, I felt it would be
8684 * confusing to do it this way. */
8685
8686 if ((reloc_type == BFD_RELOC_32
8687 || reloc_type == BFD_RELOC_X86_64_32S
8688 || reloc_type == BFD_RELOC_64)
8689 && GOT_symbol
8690 && GOT_symbol == i.op[n].imms->X_add_symbol
8691 && (i.op[n].imms->X_op == O_symbol
8692 || (i.op[n].imms->X_op == O_add
8693 && ((symbol_get_value_expression
8694 (i.op[n].imms->X_op_symbol)->X_op)
8695 == O_subtract))))
8696 {
8697 if (!object_64bit)
8698 reloc_type = BFD_RELOC_386_GOTPC;
8699 else if (size == 4)
8700 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8701 else if (size == 8)
8702 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8703 i.op[n].imms->X_add_number +=
8704 encoding_length (insn_start_frag, insn_start_off, p);
8705 }
8706 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8707 i.op[n].imms, 0, reloc_type);
8708 }
8709 }
8710 }
8711 }
8712 \f
8713 /* x86_cons_fix_new is called via the expression parsing code when a
8714 reloc is needed. We use this hook to get the correct .got reloc. */
8715 static int cons_sign = -1;
8716
8717 void
8718 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
8719 expressionS *exp, bfd_reloc_code_real_type r)
8720 {
8721 r = reloc (len, 0, cons_sign, r);
8722
8723 #ifdef TE_PE
8724 if (exp->X_op == O_secrel)
8725 {
8726 exp->X_op = O_symbol;
8727 r = BFD_RELOC_32_SECREL;
8728 }
8729 #endif
8730
8731 fix_new_exp (frag, off, len, exp, 0, r);
8732 }
8733
8734 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
8735 purpose of the `.dc.a' internal pseudo-op. */
8736
8737 int
8738 x86_address_bytes (void)
8739 {
8740 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
8741 return 4;
8742 return stdoutput->arch_info->bits_per_address / 8;
8743 }
8744
8745 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
8746 || defined (LEX_AT)
8747 # define lex_got(reloc, adjust, types) NULL
8748 #else
8749 /* Parse operands of the form
8750 <symbol>@GOTOFF+<nnn>
8751 and similar .plt or .got references.
8752
8753 If we find one, set up the correct relocation in RELOC and copy the
8754 input string, minus the `@GOTOFF' into a malloc'd buffer for
8755 parsing by the calling routine. Return this buffer, and if ADJUST
8756 is non-null set it to the length of the string we removed from the
8757 input line. Otherwise return NULL. */
8758 static char *
8759 lex_got (enum bfd_reloc_code_real *rel,
8760 int *adjust,
8761 i386_operand_type *types)
8762 {
8763 /* Some of the relocations depend on the size of what field is to
8764 be relocated. But in our callers i386_immediate and i386_displacement
8765 we don't yet know the operand size (this will be set by insn
8766 matching). Hence we record the word32 relocation here,
8767 and adjust the reloc according to the real size in reloc(). */
8768 static const struct {
8769 const char *str;
8770 int len;
8771 const enum bfd_reloc_code_real rel[2];
8772 const i386_operand_type types64;
8773 } gotrel[] = {
8774 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8775 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
8776 BFD_RELOC_SIZE32 },
8777 OPERAND_TYPE_IMM32_64 },
8778 #endif
8779 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
8780 BFD_RELOC_X86_64_PLTOFF64 },
8781 OPERAND_TYPE_IMM64 },
8782 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
8783 BFD_RELOC_X86_64_PLT32 },
8784 OPERAND_TYPE_IMM32_32S_DISP32 },
8785 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
8786 BFD_RELOC_X86_64_GOTPLT64 },
8787 OPERAND_TYPE_IMM64_DISP64 },
8788 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
8789 BFD_RELOC_X86_64_GOTOFF64 },
8790 OPERAND_TYPE_IMM64_DISP64 },
8791 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
8792 BFD_RELOC_X86_64_GOTPCREL },
8793 OPERAND_TYPE_IMM32_32S_DISP32 },
8794 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
8795 BFD_RELOC_X86_64_TLSGD },
8796 OPERAND_TYPE_IMM32_32S_DISP32 },
8797 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
8798 _dummy_first_bfd_reloc_code_real },
8799 OPERAND_TYPE_NONE },
8800 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
8801 BFD_RELOC_X86_64_TLSLD },
8802 OPERAND_TYPE_IMM32_32S_DISP32 },
8803 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
8804 BFD_RELOC_X86_64_GOTTPOFF },
8805 OPERAND_TYPE_IMM32_32S_DISP32 },
8806 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
8807 BFD_RELOC_X86_64_TPOFF32 },
8808 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8809 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
8810 _dummy_first_bfd_reloc_code_real },
8811 OPERAND_TYPE_NONE },
8812 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
8813 BFD_RELOC_X86_64_DTPOFF32 },
8814 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8815 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
8816 _dummy_first_bfd_reloc_code_real },
8817 OPERAND_TYPE_NONE },
8818 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
8819 _dummy_first_bfd_reloc_code_real },
8820 OPERAND_TYPE_NONE },
8821 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
8822 BFD_RELOC_X86_64_GOT32 },
8823 OPERAND_TYPE_IMM32_32S_64_DISP32 },
8824 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
8825 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
8826 OPERAND_TYPE_IMM32_32S_DISP32 },
8827 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
8828 BFD_RELOC_X86_64_TLSDESC_CALL },
8829 OPERAND_TYPE_IMM32_32S_DISP32 },
8830 };
8831 char *cp;
8832 unsigned int j;
8833
8834 #if defined (OBJ_MAYBE_ELF)
8835 if (!IS_ELF)
8836 return NULL;
8837 #endif
8838
8839 for (cp = input_line_pointer; *cp != '@'; cp++)
8840 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
8841 return NULL;
8842
8843 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
8844 {
8845 int len = gotrel[j].len;
8846 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
8847 {
8848 if (gotrel[j].rel[object_64bit] != 0)
8849 {
8850 int first, second;
8851 char *tmpbuf, *past_reloc;
8852
8853 *rel = gotrel[j].rel[object_64bit];
8854
8855 if (types)
8856 {
8857 if (flag_code != CODE_64BIT)
8858 {
8859 types->bitfield.imm32 = 1;
8860 types->bitfield.disp32 = 1;
8861 }
8862 else
8863 *types = gotrel[j].types64;
8864 }
8865
8866 if (j != 0 && GOT_symbol == NULL)
8867 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
8868
8869 /* The length of the first part of our input line. */
8870 first = cp - input_line_pointer;
8871
8872 /* The second part goes from after the reloc token until
8873 (and including) an end_of_line char or comma. */
8874 past_reloc = cp + 1 + len;
8875 cp = past_reloc;
8876 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
8877 ++cp;
8878 second = cp + 1 - past_reloc;
8879
8880 /* Allocate and copy string. The trailing NUL shouldn't
8881 be necessary, but be safe. */
8882 tmpbuf = XNEWVEC (char, first + second + 2);
8883 memcpy (tmpbuf, input_line_pointer, first);
8884 if (second != 0 && *past_reloc != ' ')
8885 /* Replace the relocation token with ' ', so that
8886 errors like foo@GOTOFF1 will be detected. */
8887 tmpbuf[first++] = ' ';
8888 else
8889 /* Increment length by 1 if the relocation token is
8890 removed. */
8891 len++;
8892 if (adjust)
8893 *adjust = len;
8894 memcpy (tmpbuf + first, past_reloc, second);
8895 tmpbuf[first + second] = '\0';
8896 return tmpbuf;
8897 }
8898
8899 as_bad (_("@%s reloc is not supported with %d-bit output format"),
8900 gotrel[j].str, 1 << (5 + object_64bit));
8901 return NULL;
8902 }
8903 }
8904
8905 /* Might be a symbol version string. Don't as_bad here. */
8906 return NULL;
8907 }
8908 #endif
8909
8910 #ifdef TE_PE
8911 #ifdef lex_got
8912 #undef lex_got
8913 #endif
8914 /* Parse operands of the form
8915 <symbol>@SECREL32+<nnn>
8916
8917 If we find one, set up the correct relocation in RELOC and copy the
8918 input string, minus the `@SECREL32' into a malloc'd buffer for
8919 parsing by the calling routine. Return this buffer, and if ADJUST
8920 is non-null set it to the length of the string we removed from the
8921 input line. Otherwise return NULL.
8922
8923 This function is copied from the ELF version above adjusted for PE targets. */
8924
8925 static char *
8926 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
8927 int *adjust ATTRIBUTE_UNUSED,
8928 i386_operand_type *types)
8929 {
8930 static const struct
8931 {
8932 const char *str;
8933 int len;
8934 const enum bfd_reloc_code_real rel[2];
8935 const i386_operand_type types64;
8936 }
8937 gotrel[] =
8938 {
8939 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
8940 BFD_RELOC_32_SECREL },
8941 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8942 };
8943
8944 char *cp;
8945 unsigned j;
8946
8947 for (cp = input_line_pointer; *cp != '@'; cp++)
8948 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
8949 return NULL;
8950
8951 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
8952 {
8953 int len = gotrel[j].len;
8954
8955 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
8956 {
8957 if (gotrel[j].rel[object_64bit] != 0)
8958 {
8959 int first, second;
8960 char *tmpbuf, *past_reloc;
8961
8962 *rel = gotrel[j].rel[object_64bit];
8963 if (adjust)
8964 *adjust = len;
8965
8966 if (types)
8967 {
8968 if (flag_code != CODE_64BIT)
8969 {
8970 types->bitfield.imm32 = 1;
8971 types->bitfield.disp32 = 1;
8972 }
8973 else
8974 *types = gotrel[j].types64;
8975 }
8976
8977 /* The length of the first part of our input line. */
8978 first = cp - input_line_pointer;
8979
8980 /* The second part goes from after the reloc token until
8981 (and including) an end_of_line char or comma. */
8982 past_reloc = cp + 1 + len;
8983 cp = past_reloc;
8984 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
8985 ++cp;
8986 second = cp + 1 - past_reloc;
8987
8988 /* Allocate and copy string. The trailing NUL shouldn't
8989 be necessary, but be safe. */
8990 tmpbuf = XNEWVEC (char, first + second + 2);
8991 memcpy (tmpbuf, input_line_pointer, first);
8992 if (second != 0 && *past_reloc != ' ')
8993 /* Replace the relocation token with ' ', so that
8994 errors like foo@SECLREL321 will be detected. */
8995 tmpbuf[first++] = ' ';
8996 memcpy (tmpbuf + first, past_reloc, second);
8997 tmpbuf[first + second] = '\0';
8998 return tmpbuf;
8999 }
9000
9001 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9002 gotrel[j].str, 1 << (5 + object_64bit));
9003 return NULL;
9004 }
9005 }
9006
9007 /* Might be a symbol version string. Don't as_bad here. */
9008 return NULL;
9009 }
9010
9011 #endif /* TE_PE */
9012
9013 bfd_reloc_code_real_type
9014 x86_cons (expressionS *exp, int size)
9015 {
9016 bfd_reloc_code_real_type got_reloc = NO_RELOC;
9017
9018 intel_syntax = -intel_syntax;
9019
9020 exp->X_md = 0;
9021 if (size == 4 || (object_64bit && size == 8))
9022 {
9023 /* Handle @GOTOFF and the like in an expression. */
9024 char *save;
9025 char *gotfree_input_line;
9026 int adjust = 0;
9027
9028 save = input_line_pointer;
9029 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9030 if (gotfree_input_line)
9031 input_line_pointer = gotfree_input_line;
9032
9033 expression (exp);
9034
9035 if (gotfree_input_line)
9036 {
9037 /* expression () has merrily parsed up to the end of line,
9038 or a comma - in the wrong buffer. Transfer how far
9039 input_line_pointer has moved to the right buffer. */
9040 input_line_pointer = (save
9041 + (input_line_pointer - gotfree_input_line)
9042 + adjust);
9043 free (gotfree_input_line);
9044 if (exp->X_op == O_constant
9045 || exp->X_op == O_absent
9046 || exp->X_op == O_illegal
9047 || exp->X_op == O_register
9048 || exp->X_op == O_big)
9049 {
9050 char c = *input_line_pointer;
9051 *input_line_pointer = 0;
9052 as_bad (_("missing or invalid expression `%s'"), save);
9053 *input_line_pointer = c;
9054 }
9055 else if ((got_reloc == BFD_RELOC_386_PLT32
9056 || got_reloc == BFD_RELOC_X86_64_PLT32)
9057 && exp->X_op != O_symbol)
9058 {
9059 char c = *input_line_pointer;
9060 *input_line_pointer = 0;
9061 as_bad (_("invalid PLT expression `%s'"), save);
9062 *input_line_pointer = c;
9063 }
9064 }
9065 }
9066 else
9067 expression (exp);
9068
9069 intel_syntax = -intel_syntax;
9070
9071 if (intel_syntax)
9072 i386_intel_simplify (exp);
9073
9074 return got_reloc;
9075 }
9076
9077 static void
9078 signed_cons (int size)
9079 {
9080 if (flag_code == CODE_64BIT)
9081 cons_sign = 1;
9082 cons (size);
9083 cons_sign = -1;
9084 }
9085
9086 #ifdef TE_PE
9087 static void
9088 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9089 {
9090 expressionS exp;
9091
9092 do
9093 {
9094 expression (&exp);
9095 if (exp.X_op == O_symbol)
9096 exp.X_op = O_secrel;
9097
9098 emit_expr (&exp, 4);
9099 }
9100 while (*input_line_pointer++ == ',');
9101
9102 input_line_pointer--;
9103 demand_empty_rest_of_line ();
9104 }
9105 #endif
9106
9107 /* Handle Vector operations. */
9108
9109 static char *
9110 check_VecOperations (char *op_string, char *op_end)
9111 {
9112 const reg_entry *mask;
9113 const char *saved;
9114 char *end_op;
9115
9116 while (*op_string
9117 && (op_end == NULL || op_string < op_end))
9118 {
9119 saved = op_string;
9120 if (*op_string == '{')
9121 {
9122 op_string++;
9123
9124 /* Check broadcasts. */
9125 if (strncmp (op_string, "1to", 3) == 0)
9126 {
9127 int bcst_type;
9128
9129 if (i.broadcast)
9130 goto duplicated_vec_op;
9131
9132 op_string += 3;
9133 if (*op_string == '8')
9134 bcst_type = 8;
9135 else if (*op_string == '4')
9136 bcst_type = 4;
9137 else if (*op_string == '2')
9138 bcst_type = 2;
9139 else if (*op_string == '1'
9140 && *(op_string+1) == '6')
9141 {
9142 bcst_type = 16;
9143 op_string++;
9144 }
9145 else
9146 {
9147 as_bad (_("Unsupported broadcast: `%s'"), saved);
9148 return NULL;
9149 }
9150 op_string++;
9151
9152 broadcast_op.type = bcst_type;
9153 broadcast_op.operand = this_operand;
9154 broadcast_op.bytes = 0;
9155 i.broadcast = &broadcast_op;
9156 }
9157 /* Check masking operation. */
9158 else if ((mask = parse_register (op_string, &end_op)) != NULL)
9159 {
9160 /* k0 can't be used for write mask. */
9161 if (!mask->reg_type.bitfield.regmask || mask->reg_num == 0)
9162 {
9163 as_bad (_("`%s%s' can't be used for write mask"),
9164 register_prefix, mask->reg_name);
9165 return NULL;
9166 }
9167
9168 if (!i.mask)
9169 {
9170 mask_op.mask = mask;
9171 mask_op.zeroing = 0;
9172 mask_op.operand = this_operand;
9173 i.mask = &mask_op;
9174 }
9175 else
9176 {
9177 if (i.mask->mask)
9178 goto duplicated_vec_op;
9179
9180 i.mask->mask = mask;
9181
9182 /* Only "{z}" is allowed here. No need to check
9183 zeroing mask explicitly. */
9184 if (i.mask->operand != this_operand)
9185 {
9186 as_bad (_("invalid write mask `%s'"), saved);
9187 return NULL;
9188 }
9189 }
9190
9191 op_string = end_op;
9192 }
9193 /* Check zeroing-flag for masking operation. */
9194 else if (*op_string == 'z')
9195 {
9196 if (!i.mask)
9197 {
9198 mask_op.mask = NULL;
9199 mask_op.zeroing = 1;
9200 mask_op.operand = this_operand;
9201 i.mask = &mask_op;
9202 }
9203 else
9204 {
9205 if (i.mask->zeroing)
9206 {
9207 duplicated_vec_op:
9208 as_bad (_("duplicated `%s'"), saved);
9209 return NULL;
9210 }
9211
9212 i.mask->zeroing = 1;
9213
9214 /* Only "{%k}" is allowed here. No need to check mask
9215 register explicitly. */
9216 if (i.mask->operand != this_operand)
9217 {
9218 as_bad (_("invalid zeroing-masking `%s'"),
9219 saved);
9220 return NULL;
9221 }
9222 }
9223
9224 op_string++;
9225 }
9226 else
9227 goto unknown_vec_op;
9228
9229 if (*op_string != '}')
9230 {
9231 as_bad (_("missing `}' in `%s'"), saved);
9232 return NULL;
9233 }
9234 op_string++;
9235
9236 /* Strip whitespace since the addition of pseudo prefixes
9237 changed how the scrubber treats '{'. */
9238 if (is_space_char (*op_string))
9239 ++op_string;
9240
9241 continue;
9242 }
9243 unknown_vec_op:
9244 /* We don't know this one. */
9245 as_bad (_("unknown vector operation: `%s'"), saved);
9246 return NULL;
9247 }
9248
9249 if (i.mask && i.mask->zeroing && !i.mask->mask)
9250 {
9251 as_bad (_("zeroing-masking only allowed with write mask"));
9252 return NULL;
9253 }
9254
9255 return op_string;
9256 }
9257
9258 static int
9259 i386_immediate (char *imm_start)
9260 {
9261 char *save_input_line_pointer;
9262 char *gotfree_input_line;
9263 segT exp_seg = 0;
9264 expressionS *exp;
9265 i386_operand_type types;
9266
9267 operand_type_set (&types, ~0);
9268
9269 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9270 {
9271 as_bad (_("at most %d immediate operands are allowed"),
9272 MAX_IMMEDIATE_OPERANDS);
9273 return 0;
9274 }
9275
9276 exp = &im_expressions[i.imm_operands++];
9277 i.op[this_operand].imms = exp;
9278
9279 if (is_space_char (*imm_start))
9280 ++imm_start;
9281
9282 save_input_line_pointer = input_line_pointer;
9283 input_line_pointer = imm_start;
9284
9285 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9286 if (gotfree_input_line)
9287 input_line_pointer = gotfree_input_line;
9288
9289 exp_seg = expression (exp);
9290
9291 SKIP_WHITESPACE ();
9292
9293 /* Handle vector operations. */
9294 if (*input_line_pointer == '{')
9295 {
9296 input_line_pointer = check_VecOperations (input_line_pointer,
9297 NULL);
9298 if (input_line_pointer == NULL)
9299 return 0;
9300 }
9301
9302 if (*input_line_pointer)
9303 as_bad (_("junk `%s' after expression"), input_line_pointer);
9304
9305 input_line_pointer = save_input_line_pointer;
9306 if (gotfree_input_line)
9307 {
9308 free (gotfree_input_line);
9309
9310 if (exp->X_op == O_constant || exp->X_op == O_register)
9311 exp->X_op = O_illegal;
9312 }
9313
9314 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9315 }
9316
9317 static int
9318 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9319 i386_operand_type types, const char *imm_start)
9320 {
9321 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9322 {
9323 if (imm_start)
9324 as_bad (_("missing or invalid immediate expression `%s'"),
9325 imm_start);
9326 return 0;
9327 }
9328 else if (exp->X_op == O_constant)
9329 {
9330 /* Size it properly later. */
9331 i.types[this_operand].bitfield.imm64 = 1;
9332 /* If not 64bit, sign extend val. */
9333 if (flag_code != CODE_64BIT
9334 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9335 exp->X_add_number
9336 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9337 }
9338 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9339 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9340 && exp_seg != absolute_section
9341 && exp_seg != text_section
9342 && exp_seg != data_section
9343 && exp_seg != bss_section
9344 && exp_seg != undefined_section
9345 && !bfd_is_com_section (exp_seg))
9346 {
9347 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9348 return 0;
9349 }
9350 #endif
9351 else if (!intel_syntax && exp_seg == reg_section)
9352 {
9353 if (imm_start)
9354 as_bad (_("illegal immediate register operand %s"), imm_start);
9355 return 0;
9356 }
9357 else
9358 {
9359 /* This is an address. The size of the address will be
9360 determined later, depending on destination register,
9361 suffix, or the default for the section. */
9362 i.types[this_operand].bitfield.imm8 = 1;
9363 i.types[this_operand].bitfield.imm16 = 1;
9364 i.types[this_operand].bitfield.imm32 = 1;
9365 i.types[this_operand].bitfield.imm32s = 1;
9366 i.types[this_operand].bitfield.imm64 = 1;
9367 i.types[this_operand] = operand_type_and (i.types[this_operand],
9368 types);
9369 }
9370
9371 return 1;
9372 }
9373
9374 static char *
9375 i386_scale (char *scale)
9376 {
9377 offsetT val;
9378 char *save = input_line_pointer;
9379
9380 input_line_pointer = scale;
9381 val = get_absolute_expression ();
9382
9383 switch (val)
9384 {
9385 case 1:
9386 i.log2_scale_factor = 0;
9387 break;
9388 case 2:
9389 i.log2_scale_factor = 1;
9390 break;
9391 case 4:
9392 i.log2_scale_factor = 2;
9393 break;
9394 case 8:
9395 i.log2_scale_factor = 3;
9396 break;
9397 default:
9398 {
9399 char sep = *input_line_pointer;
9400
9401 *input_line_pointer = '\0';
9402 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9403 scale);
9404 *input_line_pointer = sep;
9405 input_line_pointer = save;
9406 return NULL;
9407 }
9408 }
9409 if (i.log2_scale_factor != 0 && i.index_reg == 0)
9410 {
9411 as_warn (_("scale factor of %d without an index register"),
9412 1 << i.log2_scale_factor);
9413 i.log2_scale_factor = 0;
9414 }
9415 scale = input_line_pointer;
9416 input_line_pointer = save;
9417 return scale;
9418 }
9419
9420 static int
9421 i386_displacement (char *disp_start, char *disp_end)
9422 {
9423 expressionS *exp;
9424 segT exp_seg = 0;
9425 char *save_input_line_pointer;
9426 char *gotfree_input_line;
9427 int override;
9428 i386_operand_type bigdisp, types = anydisp;
9429 int ret;
9430
9431 if (i.disp_operands == MAX_MEMORY_OPERANDS)
9432 {
9433 as_bad (_("at most %d displacement operands are allowed"),
9434 MAX_MEMORY_OPERANDS);
9435 return 0;
9436 }
9437
9438 operand_type_set (&bigdisp, 0);
9439 if ((i.types[this_operand].bitfield.jumpabsolute)
9440 || (!current_templates->start->opcode_modifier.jump
9441 && !current_templates->start->opcode_modifier.jumpdword))
9442 {
9443 bigdisp.bitfield.disp32 = 1;
9444 override = (i.prefix[ADDR_PREFIX] != 0);
9445 if (flag_code == CODE_64BIT)
9446 {
9447 if (!override)
9448 {
9449 bigdisp.bitfield.disp32s = 1;
9450 bigdisp.bitfield.disp64 = 1;
9451 }
9452 }
9453 else if ((flag_code == CODE_16BIT) ^ override)
9454 {
9455 bigdisp.bitfield.disp32 = 0;
9456 bigdisp.bitfield.disp16 = 1;
9457 }
9458 }
9459 else
9460 {
9461 /* For PC-relative branches, the width of the displacement
9462 is dependent upon data size, not address size. */
9463 override = (i.prefix[DATA_PREFIX] != 0);
9464 if (flag_code == CODE_64BIT)
9465 {
9466 if (override || i.suffix == WORD_MNEM_SUFFIX)
9467 bigdisp.bitfield.disp16 = 1;
9468 else
9469 {
9470 bigdisp.bitfield.disp32 = 1;
9471 bigdisp.bitfield.disp32s = 1;
9472 }
9473 }
9474 else
9475 {
9476 if (!override)
9477 override = (i.suffix == (flag_code != CODE_16BIT
9478 ? WORD_MNEM_SUFFIX
9479 : LONG_MNEM_SUFFIX));
9480 bigdisp.bitfield.disp32 = 1;
9481 if ((flag_code == CODE_16BIT) ^ override)
9482 {
9483 bigdisp.bitfield.disp32 = 0;
9484 bigdisp.bitfield.disp16 = 1;
9485 }
9486 }
9487 }
9488 i.types[this_operand] = operand_type_or (i.types[this_operand],
9489 bigdisp);
9490
9491 exp = &disp_expressions[i.disp_operands];
9492 i.op[this_operand].disps = exp;
9493 i.disp_operands++;
9494 save_input_line_pointer = input_line_pointer;
9495 input_line_pointer = disp_start;
9496 END_STRING_AND_SAVE (disp_end);
9497
9498 #ifndef GCC_ASM_O_HACK
9499 #define GCC_ASM_O_HACK 0
9500 #endif
9501 #if GCC_ASM_O_HACK
9502 END_STRING_AND_SAVE (disp_end + 1);
9503 if (i.types[this_operand].bitfield.baseIndex
9504 && displacement_string_end[-1] == '+')
9505 {
9506 /* This hack is to avoid a warning when using the "o"
9507 constraint within gcc asm statements.
9508 For instance:
9509
9510 #define _set_tssldt_desc(n,addr,limit,type) \
9511 __asm__ __volatile__ ( \
9512 "movw %w2,%0\n\t" \
9513 "movw %w1,2+%0\n\t" \
9514 "rorl $16,%1\n\t" \
9515 "movb %b1,4+%0\n\t" \
9516 "movb %4,5+%0\n\t" \
9517 "movb $0,6+%0\n\t" \
9518 "movb %h1,7+%0\n\t" \
9519 "rorl $16,%1" \
9520 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
9521
9522 This works great except that the output assembler ends
9523 up looking a bit weird if it turns out that there is
9524 no offset. You end up producing code that looks like:
9525
9526 #APP
9527 movw $235,(%eax)
9528 movw %dx,2+(%eax)
9529 rorl $16,%edx
9530 movb %dl,4+(%eax)
9531 movb $137,5+(%eax)
9532 movb $0,6+(%eax)
9533 movb %dh,7+(%eax)
9534 rorl $16,%edx
9535 #NO_APP
9536
9537 So here we provide the missing zero. */
9538
9539 *displacement_string_end = '0';
9540 }
9541 #endif
9542 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9543 if (gotfree_input_line)
9544 input_line_pointer = gotfree_input_line;
9545
9546 exp_seg = expression (exp);
9547
9548 SKIP_WHITESPACE ();
9549 if (*input_line_pointer)
9550 as_bad (_("junk `%s' after expression"), input_line_pointer);
9551 #if GCC_ASM_O_HACK
9552 RESTORE_END_STRING (disp_end + 1);
9553 #endif
9554 input_line_pointer = save_input_line_pointer;
9555 if (gotfree_input_line)
9556 {
9557 free (gotfree_input_line);
9558
9559 if (exp->X_op == O_constant || exp->X_op == O_register)
9560 exp->X_op = O_illegal;
9561 }
9562
9563 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
9564
9565 RESTORE_END_STRING (disp_end);
9566
9567 return ret;
9568 }
9569
9570 static int
9571 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9572 i386_operand_type types, const char *disp_start)
9573 {
9574 i386_operand_type bigdisp;
9575 int ret = 1;
9576
9577 /* We do this to make sure that the section symbol is in
9578 the symbol table. We will ultimately change the relocation
9579 to be relative to the beginning of the section. */
9580 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
9581 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
9582 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9583 {
9584 if (exp->X_op != O_symbol)
9585 goto inv_disp;
9586
9587 if (S_IS_LOCAL (exp->X_add_symbol)
9588 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
9589 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
9590 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
9591 exp->X_op = O_subtract;
9592 exp->X_op_symbol = GOT_symbol;
9593 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
9594 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
9595 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9596 i.reloc[this_operand] = BFD_RELOC_64;
9597 else
9598 i.reloc[this_operand] = BFD_RELOC_32;
9599 }
9600
9601 else if (exp->X_op == O_absent
9602 || exp->X_op == O_illegal
9603 || exp->X_op == O_big)
9604 {
9605 inv_disp:
9606 as_bad (_("missing or invalid displacement expression `%s'"),
9607 disp_start);
9608 ret = 0;
9609 }
9610
9611 else if (flag_code == CODE_64BIT
9612 && !i.prefix[ADDR_PREFIX]
9613 && exp->X_op == O_constant)
9614 {
9615 /* Since displacement is signed extended to 64bit, don't allow
9616 disp32 and turn off disp32s if they are out of range. */
9617 i.types[this_operand].bitfield.disp32 = 0;
9618 if (!fits_in_signed_long (exp->X_add_number))
9619 {
9620 i.types[this_operand].bitfield.disp32s = 0;
9621 if (i.types[this_operand].bitfield.baseindex)
9622 {
9623 as_bad (_("0x%lx out range of signed 32bit displacement"),
9624 (long) exp->X_add_number);
9625 ret = 0;
9626 }
9627 }
9628 }
9629
9630 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9631 else if (exp->X_op != O_constant
9632 && OUTPUT_FLAVOR == bfd_target_aout_flavour
9633 && exp_seg != absolute_section
9634 && exp_seg != text_section
9635 && exp_seg != data_section
9636 && exp_seg != bss_section
9637 && exp_seg != undefined_section
9638 && !bfd_is_com_section (exp_seg))
9639 {
9640 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9641 ret = 0;
9642 }
9643 #endif
9644
9645 /* Check if this is a displacement only operand. */
9646 bigdisp = i.types[this_operand];
9647 bigdisp.bitfield.disp8 = 0;
9648 bigdisp.bitfield.disp16 = 0;
9649 bigdisp.bitfield.disp32 = 0;
9650 bigdisp.bitfield.disp32s = 0;
9651 bigdisp.bitfield.disp64 = 0;
9652 if (operand_type_all_zero (&bigdisp))
9653 i.types[this_operand] = operand_type_and (i.types[this_operand],
9654 types);
9655
9656 return ret;
9657 }
9658
9659 /* Return the active addressing mode, taking address override and
9660 registers forming the address into consideration. Update the
9661 address override prefix if necessary. */
9662
9663 static enum flag_code
9664 i386_addressing_mode (void)
9665 {
9666 enum flag_code addr_mode;
9667
9668 if (i.prefix[ADDR_PREFIX])
9669 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
9670 else
9671 {
9672 addr_mode = flag_code;
9673
9674 #if INFER_ADDR_PREFIX
9675 if (i.mem_operands == 0)
9676 {
9677 /* Infer address prefix from the first memory operand. */
9678 const reg_entry *addr_reg = i.base_reg;
9679
9680 if (addr_reg == NULL)
9681 addr_reg = i.index_reg;
9682
9683 if (addr_reg)
9684 {
9685 if (addr_reg->reg_type.bitfield.dword)
9686 addr_mode = CODE_32BIT;
9687 else if (flag_code != CODE_64BIT
9688 && addr_reg->reg_type.bitfield.word)
9689 addr_mode = CODE_16BIT;
9690
9691 if (addr_mode != flag_code)
9692 {
9693 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
9694 i.prefixes += 1;
9695 /* Change the size of any displacement too. At most one
9696 of Disp16 or Disp32 is set.
9697 FIXME. There doesn't seem to be any real need for
9698 separate Disp16 and Disp32 flags. The same goes for
9699 Imm16 and Imm32. Removing them would probably clean
9700 up the code quite a lot. */
9701 if (flag_code != CODE_64BIT
9702 && (i.types[this_operand].bitfield.disp16
9703 || i.types[this_operand].bitfield.disp32))
9704 i.types[this_operand]
9705 = operand_type_xor (i.types[this_operand], disp16_32);
9706 }
9707 }
9708 }
9709 #endif
9710 }
9711
9712 return addr_mode;
9713 }
9714
9715 /* Make sure the memory operand we've been dealt is valid.
9716 Return 1 on success, 0 on a failure. */
9717
9718 static int
9719 i386_index_check (const char *operand_string)
9720 {
9721 const char *kind = "base/index";
9722 enum flag_code addr_mode = i386_addressing_mode ();
9723
9724 if (current_templates->start->opcode_modifier.isstring
9725 && !current_templates->start->opcode_modifier.immext
9726 && (current_templates->end[-1].opcode_modifier.isstring
9727 || i.mem_operands))
9728 {
9729 /* Memory operands of string insns are special in that they only allow
9730 a single register (rDI, rSI, or rBX) as their memory address. */
9731 const reg_entry *expected_reg;
9732 static const char *di_si[][2] =
9733 {
9734 { "esi", "edi" },
9735 { "si", "di" },
9736 { "rsi", "rdi" }
9737 };
9738 static const char *bx[] = { "ebx", "bx", "rbx" };
9739
9740 kind = "string address";
9741
9742 if (current_templates->start->opcode_modifier.repprefixok)
9743 {
9744 i386_operand_type type = current_templates->end[-1].operand_types[0];
9745
9746 if (!type.bitfield.baseindex
9747 || ((!i.mem_operands != !intel_syntax)
9748 && current_templates->end[-1].operand_types[1]
9749 .bitfield.baseindex))
9750 type = current_templates->end[-1].operand_types[1];
9751 expected_reg = hash_find (reg_hash,
9752 di_si[addr_mode][type.bitfield.esseg]);
9753
9754 }
9755 else
9756 expected_reg = hash_find (reg_hash, bx[addr_mode]);
9757
9758 if (i.base_reg != expected_reg
9759 || i.index_reg
9760 || operand_type_check (i.types[this_operand], disp))
9761 {
9762 /* The second memory operand must have the same size as
9763 the first one. */
9764 if (i.mem_operands
9765 && i.base_reg
9766 && !((addr_mode == CODE_64BIT
9767 && i.base_reg->reg_type.bitfield.qword)
9768 || (addr_mode == CODE_32BIT
9769 ? i.base_reg->reg_type.bitfield.dword
9770 : i.base_reg->reg_type.bitfield.word)))
9771 goto bad_address;
9772
9773 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
9774 operand_string,
9775 intel_syntax ? '[' : '(',
9776 register_prefix,
9777 expected_reg->reg_name,
9778 intel_syntax ? ']' : ')');
9779 return 1;
9780 }
9781 else
9782 return 1;
9783
9784 bad_address:
9785 as_bad (_("`%s' is not a valid %s expression"),
9786 operand_string, kind);
9787 return 0;
9788 }
9789 else
9790 {
9791 if (addr_mode != CODE_16BIT)
9792 {
9793 /* 32-bit/64-bit checks. */
9794 if ((i.base_reg
9795 && ((addr_mode == CODE_64BIT
9796 ? !i.base_reg->reg_type.bitfield.qword
9797 : !i.base_reg->reg_type.bitfield.dword)
9798 || (i.index_reg && i.base_reg->reg_num == RegIP)
9799 || i.base_reg->reg_num == RegIZ))
9800 || (i.index_reg
9801 && !i.index_reg->reg_type.bitfield.xmmword
9802 && !i.index_reg->reg_type.bitfield.ymmword
9803 && !i.index_reg->reg_type.bitfield.zmmword
9804 && ((addr_mode == CODE_64BIT
9805 ? !i.index_reg->reg_type.bitfield.qword
9806 : !i.index_reg->reg_type.bitfield.dword)
9807 || !i.index_reg->reg_type.bitfield.baseindex)))
9808 goto bad_address;
9809
9810 /* bndmk, bndldx, and bndstx have special restrictions. */
9811 if (current_templates->start->base_opcode == 0xf30f1b
9812 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
9813 {
9814 /* They cannot use RIP-relative addressing. */
9815 if (i.base_reg && i.base_reg->reg_num == RegIP)
9816 {
9817 as_bad (_("`%s' cannot be used here"), operand_string);
9818 return 0;
9819 }
9820
9821 /* bndldx and bndstx ignore their scale factor. */
9822 if (current_templates->start->base_opcode != 0xf30f1b
9823 && i.log2_scale_factor)
9824 as_warn (_("register scaling is being ignored here"));
9825 }
9826 }
9827 else
9828 {
9829 /* 16-bit checks. */
9830 if ((i.base_reg
9831 && (!i.base_reg->reg_type.bitfield.word
9832 || !i.base_reg->reg_type.bitfield.baseindex))
9833 || (i.index_reg
9834 && (!i.index_reg->reg_type.bitfield.word
9835 || !i.index_reg->reg_type.bitfield.baseindex
9836 || !(i.base_reg
9837 && i.base_reg->reg_num < 6
9838 && i.index_reg->reg_num >= 6
9839 && i.log2_scale_factor == 0))))
9840 goto bad_address;
9841 }
9842 }
9843 return 1;
9844 }
9845
9846 /* Handle vector immediates. */
9847
9848 static int
9849 RC_SAE_immediate (const char *imm_start)
9850 {
9851 unsigned int match_found, j;
9852 const char *pstr = imm_start;
9853 expressionS *exp;
9854
9855 if (*pstr != '{')
9856 return 0;
9857
9858 pstr++;
9859 match_found = 0;
9860 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
9861 {
9862 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
9863 {
9864 if (!i.rounding)
9865 {
9866 rc_op.type = RC_NamesTable[j].type;
9867 rc_op.operand = this_operand;
9868 i.rounding = &rc_op;
9869 }
9870 else
9871 {
9872 as_bad (_("duplicated `%s'"), imm_start);
9873 return 0;
9874 }
9875 pstr += RC_NamesTable[j].len;
9876 match_found = 1;
9877 break;
9878 }
9879 }
9880 if (!match_found)
9881 return 0;
9882
9883 if (*pstr++ != '}')
9884 {
9885 as_bad (_("Missing '}': '%s'"), imm_start);
9886 return 0;
9887 }
9888 /* RC/SAE immediate string should contain nothing more. */;
9889 if (*pstr != 0)
9890 {
9891 as_bad (_("Junk after '}': '%s'"), imm_start);
9892 return 0;
9893 }
9894
9895 exp = &im_expressions[i.imm_operands++];
9896 i.op[this_operand].imms = exp;
9897
9898 exp->X_op = O_constant;
9899 exp->X_add_number = 0;
9900 exp->X_add_symbol = (symbolS *) 0;
9901 exp->X_op_symbol = (symbolS *) 0;
9902
9903 i.types[this_operand].bitfield.imm8 = 1;
9904 return 1;
9905 }
9906
9907 /* Only string instructions can have a second memory operand, so
9908 reduce current_templates to just those if it contains any. */
9909 static int
9910 maybe_adjust_templates (void)
9911 {
9912 const insn_template *t;
9913
9914 gas_assert (i.mem_operands == 1);
9915
9916 for (t = current_templates->start; t < current_templates->end; ++t)
9917 if (t->opcode_modifier.isstring)
9918 break;
9919
9920 if (t < current_templates->end)
9921 {
9922 static templates aux_templates;
9923 bfd_boolean recheck;
9924
9925 aux_templates.start = t;
9926 for (; t < current_templates->end; ++t)
9927 if (!t->opcode_modifier.isstring)
9928 break;
9929 aux_templates.end = t;
9930
9931 /* Determine whether to re-check the first memory operand. */
9932 recheck = (aux_templates.start != current_templates->start
9933 || t != current_templates->end);
9934
9935 current_templates = &aux_templates;
9936
9937 if (recheck)
9938 {
9939 i.mem_operands = 0;
9940 if (i.memop1_string != NULL
9941 && i386_index_check (i.memop1_string) == 0)
9942 return 0;
9943 i.mem_operands = 1;
9944 }
9945 }
9946
9947 return 1;
9948 }
9949
9950 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
9951 on error. */
9952
9953 static int
9954 i386_att_operand (char *operand_string)
9955 {
9956 const reg_entry *r;
9957 char *end_op;
9958 char *op_string = operand_string;
9959
9960 if (is_space_char (*op_string))
9961 ++op_string;
9962
9963 /* We check for an absolute prefix (differentiating,
9964 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
9965 if (*op_string == ABSOLUTE_PREFIX)
9966 {
9967 ++op_string;
9968 if (is_space_char (*op_string))
9969 ++op_string;
9970 i.types[this_operand].bitfield.jumpabsolute = 1;
9971 }
9972
9973 /* Check if operand is a register. */
9974 if ((r = parse_register (op_string, &end_op)) != NULL)
9975 {
9976 i386_operand_type temp;
9977
9978 /* Check for a segment override by searching for ':' after a
9979 segment register. */
9980 op_string = end_op;
9981 if (is_space_char (*op_string))
9982 ++op_string;
9983 if (*op_string == ':'
9984 && (r->reg_type.bitfield.sreg2
9985 || r->reg_type.bitfield.sreg3))
9986 {
9987 switch (r->reg_num)
9988 {
9989 case 0:
9990 i.seg[i.mem_operands] = &es;
9991 break;
9992 case 1:
9993 i.seg[i.mem_operands] = &cs;
9994 break;
9995 case 2:
9996 i.seg[i.mem_operands] = &ss;
9997 break;
9998 case 3:
9999 i.seg[i.mem_operands] = &ds;
10000 break;
10001 case 4:
10002 i.seg[i.mem_operands] = &fs;
10003 break;
10004 case 5:
10005 i.seg[i.mem_operands] = &gs;
10006 break;
10007 }
10008
10009 /* Skip the ':' and whitespace. */
10010 ++op_string;
10011 if (is_space_char (*op_string))
10012 ++op_string;
10013
10014 if (!is_digit_char (*op_string)
10015 && !is_identifier_char (*op_string)
10016 && *op_string != '('
10017 && *op_string != ABSOLUTE_PREFIX)
10018 {
10019 as_bad (_("bad memory operand `%s'"), op_string);
10020 return 0;
10021 }
10022 /* Handle case of %es:*foo. */
10023 if (*op_string == ABSOLUTE_PREFIX)
10024 {
10025 ++op_string;
10026 if (is_space_char (*op_string))
10027 ++op_string;
10028 i.types[this_operand].bitfield.jumpabsolute = 1;
10029 }
10030 goto do_memory_reference;
10031 }
10032
10033 /* Handle vector operations. */
10034 if (*op_string == '{')
10035 {
10036 op_string = check_VecOperations (op_string, NULL);
10037 if (op_string == NULL)
10038 return 0;
10039 }
10040
10041 if (*op_string)
10042 {
10043 as_bad (_("junk `%s' after register"), op_string);
10044 return 0;
10045 }
10046 temp = r->reg_type;
10047 temp.bitfield.baseindex = 0;
10048 i.types[this_operand] = operand_type_or (i.types[this_operand],
10049 temp);
10050 i.types[this_operand].bitfield.unspecified = 0;
10051 i.op[this_operand].regs = r;
10052 i.reg_operands++;
10053 }
10054 else if (*op_string == REGISTER_PREFIX)
10055 {
10056 as_bad (_("bad register name `%s'"), op_string);
10057 return 0;
10058 }
10059 else if (*op_string == IMMEDIATE_PREFIX)
10060 {
10061 ++op_string;
10062 if (i.types[this_operand].bitfield.jumpabsolute)
10063 {
10064 as_bad (_("immediate operand illegal with absolute jump"));
10065 return 0;
10066 }
10067 if (!i386_immediate (op_string))
10068 return 0;
10069 }
10070 else if (RC_SAE_immediate (operand_string))
10071 {
10072 /* If it is a RC or SAE immediate, do nothing. */
10073 ;
10074 }
10075 else if (is_digit_char (*op_string)
10076 || is_identifier_char (*op_string)
10077 || *op_string == '"'
10078 || *op_string == '(')
10079 {
10080 /* This is a memory reference of some sort. */
10081 char *base_string;
10082
10083 /* Start and end of displacement string expression (if found). */
10084 char *displacement_string_start;
10085 char *displacement_string_end;
10086 char *vop_start;
10087
10088 do_memory_reference:
10089 if (i.mem_operands == 1 && !maybe_adjust_templates ())
10090 return 0;
10091 if ((i.mem_operands == 1
10092 && !current_templates->start->opcode_modifier.isstring)
10093 || i.mem_operands == 2)
10094 {
10095 as_bad (_("too many memory references for `%s'"),
10096 current_templates->start->name);
10097 return 0;
10098 }
10099
10100 /* Check for base index form. We detect the base index form by
10101 looking for an ')' at the end of the operand, searching
10102 for the '(' matching it, and finding a REGISTER_PREFIX or ','
10103 after the '('. */
10104 base_string = op_string + strlen (op_string);
10105
10106 /* Handle vector operations. */
10107 vop_start = strchr (op_string, '{');
10108 if (vop_start && vop_start < base_string)
10109 {
10110 if (check_VecOperations (vop_start, base_string) == NULL)
10111 return 0;
10112 base_string = vop_start;
10113 }
10114
10115 --base_string;
10116 if (is_space_char (*base_string))
10117 --base_string;
10118
10119 /* If we only have a displacement, set-up for it to be parsed later. */
10120 displacement_string_start = op_string;
10121 displacement_string_end = base_string + 1;
10122
10123 if (*base_string == ')')
10124 {
10125 char *temp_string;
10126 unsigned int parens_balanced = 1;
10127 /* We've already checked that the number of left & right ()'s are
10128 equal, so this loop will not be infinite. */
10129 do
10130 {
10131 base_string--;
10132 if (*base_string == ')')
10133 parens_balanced++;
10134 if (*base_string == '(')
10135 parens_balanced--;
10136 }
10137 while (parens_balanced);
10138
10139 temp_string = base_string;
10140
10141 /* Skip past '(' and whitespace. */
10142 ++base_string;
10143 if (is_space_char (*base_string))
10144 ++base_string;
10145
10146 if (*base_string == ','
10147 || ((i.base_reg = parse_register (base_string, &end_op))
10148 != NULL))
10149 {
10150 displacement_string_end = temp_string;
10151
10152 i.types[this_operand].bitfield.baseindex = 1;
10153
10154 if (i.base_reg)
10155 {
10156 base_string = end_op;
10157 if (is_space_char (*base_string))
10158 ++base_string;
10159 }
10160
10161 /* There may be an index reg or scale factor here. */
10162 if (*base_string == ',')
10163 {
10164 ++base_string;
10165 if (is_space_char (*base_string))
10166 ++base_string;
10167
10168 if ((i.index_reg = parse_register (base_string, &end_op))
10169 != NULL)
10170 {
10171 base_string = end_op;
10172 if (is_space_char (*base_string))
10173 ++base_string;
10174 if (*base_string == ',')
10175 {
10176 ++base_string;
10177 if (is_space_char (*base_string))
10178 ++base_string;
10179 }
10180 else if (*base_string != ')')
10181 {
10182 as_bad (_("expecting `,' or `)' "
10183 "after index register in `%s'"),
10184 operand_string);
10185 return 0;
10186 }
10187 }
10188 else if (*base_string == REGISTER_PREFIX)
10189 {
10190 end_op = strchr (base_string, ',');
10191 if (end_op)
10192 *end_op = '\0';
10193 as_bad (_("bad register name `%s'"), base_string);
10194 return 0;
10195 }
10196
10197 /* Check for scale factor. */
10198 if (*base_string != ')')
10199 {
10200 char *end_scale = i386_scale (base_string);
10201
10202 if (!end_scale)
10203 return 0;
10204
10205 base_string = end_scale;
10206 if (is_space_char (*base_string))
10207 ++base_string;
10208 if (*base_string != ')')
10209 {
10210 as_bad (_("expecting `)' "
10211 "after scale factor in `%s'"),
10212 operand_string);
10213 return 0;
10214 }
10215 }
10216 else if (!i.index_reg)
10217 {
10218 as_bad (_("expecting index register or scale factor "
10219 "after `,'; got '%c'"),
10220 *base_string);
10221 return 0;
10222 }
10223 }
10224 else if (*base_string != ')')
10225 {
10226 as_bad (_("expecting `,' or `)' "
10227 "after base register in `%s'"),
10228 operand_string);
10229 return 0;
10230 }
10231 }
10232 else if (*base_string == REGISTER_PREFIX)
10233 {
10234 end_op = strchr (base_string, ',');
10235 if (end_op)
10236 *end_op = '\0';
10237 as_bad (_("bad register name `%s'"), base_string);
10238 return 0;
10239 }
10240 }
10241
10242 /* If there's an expression beginning the operand, parse it,
10243 assuming displacement_string_start and
10244 displacement_string_end are meaningful. */
10245 if (displacement_string_start != displacement_string_end)
10246 {
10247 if (!i386_displacement (displacement_string_start,
10248 displacement_string_end))
10249 return 0;
10250 }
10251
10252 /* Special case for (%dx) while doing input/output op. */
10253 if (i.base_reg
10254 && i.base_reg->reg_type.bitfield.inoutportreg
10255 && i.index_reg == 0
10256 && i.log2_scale_factor == 0
10257 && i.seg[i.mem_operands] == 0
10258 && !operand_type_check (i.types[this_operand], disp))
10259 {
10260 i.types[this_operand] = i.base_reg->reg_type;
10261 return 1;
10262 }
10263
10264 if (i386_index_check (operand_string) == 0)
10265 return 0;
10266 i.flags[this_operand] |= Operand_Mem;
10267 if (i.mem_operands == 0)
10268 i.memop1_string = xstrdup (operand_string);
10269 i.mem_operands++;
10270 }
10271 else
10272 {
10273 /* It's not a memory operand; argh! */
10274 as_bad (_("invalid char %s beginning operand %d `%s'"),
10275 output_invalid (*op_string),
10276 this_operand + 1,
10277 op_string);
10278 return 0;
10279 }
10280 return 1; /* Normal return. */
10281 }
10282 \f
10283 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10284 that an rs_machine_dependent frag may reach. */
10285
10286 unsigned int
10287 i386_frag_max_var (fragS *frag)
10288 {
10289 /* The only relaxable frags are for jumps.
10290 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
10291 gas_assert (frag->fr_type == rs_machine_dependent);
10292 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10293 }
10294
10295 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10296 static int
10297 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10298 {
10299 /* STT_GNU_IFUNC symbol must go through PLT. */
10300 if ((symbol_get_bfdsym (fr_symbol)->flags
10301 & BSF_GNU_INDIRECT_FUNCTION) != 0)
10302 return 0;
10303
10304 if (!S_IS_EXTERNAL (fr_symbol))
10305 /* Symbol may be weak or local. */
10306 return !S_IS_WEAK (fr_symbol);
10307
10308 /* Global symbols with non-default visibility can't be preempted. */
10309 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10310 return 1;
10311
10312 if (fr_var != NO_RELOC)
10313 switch ((enum bfd_reloc_code_real) fr_var)
10314 {
10315 case BFD_RELOC_386_PLT32:
10316 case BFD_RELOC_X86_64_PLT32:
10317 /* Symbol with PLT relocation may be preempted. */
10318 return 0;
10319 default:
10320 abort ();
10321 }
10322
10323 /* Global symbols with default visibility in a shared library may be
10324 preempted by another definition. */
10325 return !shared;
10326 }
10327 #endif
10328
10329 /* md_estimate_size_before_relax()
10330
10331 Called just before relax() for rs_machine_dependent frags. The x86
10332 assembler uses these frags to handle variable size jump
10333 instructions.
10334
10335 Any symbol that is now undefined will not become defined.
10336 Return the correct fr_subtype in the frag.
10337 Return the initial "guess for variable size of frag" to caller.
10338 The guess is actually the growth beyond the fixed part. Whatever
10339 we do to grow the fixed or variable part contributes to our
10340 returned value. */
10341
10342 int
10343 md_estimate_size_before_relax (fragS *fragP, segT segment)
10344 {
10345 /* We've already got fragP->fr_subtype right; all we have to do is
10346 check for un-relaxable symbols. On an ELF system, we can't relax
10347 an externally visible symbol, because it may be overridden by a
10348 shared library. */
10349 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
10350 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10351 || (IS_ELF
10352 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
10353 fragP->fr_var))
10354 #endif
10355 #if defined (OBJ_COFF) && defined (TE_PE)
10356 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
10357 && S_IS_WEAK (fragP->fr_symbol))
10358 #endif
10359 )
10360 {
10361 /* Symbol is undefined in this segment, or we need to keep a
10362 reloc so that weak symbols can be overridden. */
10363 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
10364 enum bfd_reloc_code_real reloc_type;
10365 unsigned char *opcode;
10366 int old_fr_fix;
10367
10368 if (fragP->fr_var != NO_RELOC)
10369 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
10370 else if (size == 2)
10371 reloc_type = BFD_RELOC_16_PCREL;
10372 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10373 else if (need_plt32_p (fragP->fr_symbol))
10374 reloc_type = BFD_RELOC_X86_64_PLT32;
10375 #endif
10376 else
10377 reloc_type = BFD_RELOC_32_PCREL;
10378
10379 old_fr_fix = fragP->fr_fix;
10380 opcode = (unsigned char *) fragP->fr_opcode;
10381
10382 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
10383 {
10384 case UNCOND_JUMP:
10385 /* Make jmp (0xeb) a (d)word displacement jump. */
10386 opcode[0] = 0xe9;
10387 fragP->fr_fix += size;
10388 fix_new (fragP, old_fr_fix, size,
10389 fragP->fr_symbol,
10390 fragP->fr_offset, 1,
10391 reloc_type);
10392 break;
10393
10394 case COND_JUMP86:
10395 if (size == 2
10396 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
10397 {
10398 /* Negate the condition, and branch past an
10399 unconditional jump. */
10400 opcode[0] ^= 1;
10401 opcode[1] = 3;
10402 /* Insert an unconditional jump. */
10403 opcode[2] = 0xe9;
10404 /* We added two extra opcode bytes, and have a two byte
10405 offset. */
10406 fragP->fr_fix += 2 + 2;
10407 fix_new (fragP, old_fr_fix + 2, 2,
10408 fragP->fr_symbol,
10409 fragP->fr_offset, 1,
10410 reloc_type);
10411 break;
10412 }
10413 /* Fall through. */
10414
10415 case COND_JUMP:
10416 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
10417 {
10418 fixS *fixP;
10419
10420 fragP->fr_fix += 1;
10421 fixP = fix_new (fragP, old_fr_fix, 1,
10422 fragP->fr_symbol,
10423 fragP->fr_offset, 1,
10424 BFD_RELOC_8_PCREL);
10425 fixP->fx_signed = 1;
10426 break;
10427 }
10428
10429 /* This changes the byte-displacement jump 0x7N
10430 to the (d)word-displacement jump 0x0f,0x8N. */
10431 opcode[1] = opcode[0] + 0x10;
10432 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10433 /* We've added an opcode byte. */
10434 fragP->fr_fix += 1 + size;
10435 fix_new (fragP, old_fr_fix + 1, size,
10436 fragP->fr_symbol,
10437 fragP->fr_offset, 1,
10438 reloc_type);
10439 break;
10440
10441 default:
10442 BAD_CASE (fragP->fr_subtype);
10443 break;
10444 }
10445 frag_wane (fragP);
10446 return fragP->fr_fix - old_fr_fix;
10447 }
10448
10449 /* Guess size depending on current relax state. Initially the relax
10450 state will correspond to a short jump and we return 1, because
10451 the variable part of the frag (the branch offset) is one byte
10452 long. However, we can relax a section more than once and in that
10453 case we must either set fr_subtype back to the unrelaxed state,
10454 or return the value for the appropriate branch. */
10455 return md_relax_table[fragP->fr_subtype].rlx_length;
10456 }
10457
10458 /* Called after relax() is finished.
10459
10460 In: Address of frag.
10461 fr_type == rs_machine_dependent.
10462 fr_subtype is what the address relaxed to.
10463
10464 Out: Any fixSs and constants are set up.
10465 Caller will turn frag into a ".space 0". */
10466
10467 void
10468 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
10469 fragS *fragP)
10470 {
10471 unsigned char *opcode;
10472 unsigned char *where_to_put_displacement = NULL;
10473 offsetT target_address;
10474 offsetT opcode_address;
10475 unsigned int extension = 0;
10476 offsetT displacement_from_opcode_start;
10477
10478 opcode = (unsigned char *) fragP->fr_opcode;
10479
10480 /* Address we want to reach in file space. */
10481 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
10482
10483 /* Address opcode resides at in file space. */
10484 opcode_address = fragP->fr_address + fragP->fr_fix;
10485
10486 /* Displacement from opcode start to fill into instruction. */
10487 displacement_from_opcode_start = target_address - opcode_address;
10488
10489 if ((fragP->fr_subtype & BIG) == 0)
10490 {
10491 /* Don't have to change opcode. */
10492 extension = 1; /* 1 opcode + 1 displacement */
10493 where_to_put_displacement = &opcode[1];
10494 }
10495 else
10496 {
10497 if (no_cond_jump_promotion
10498 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
10499 as_warn_where (fragP->fr_file, fragP->fr_line,
10500 _("long jump required"));
10501
10502 switch (fragP->fr_subtype)
10503 {
10504 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
10505 extension = 4; /* 1 opcode + 4 displacement */
10506 opcode[0] = 0xe9;
10507 where_to_put_displacement = &opcode[1];
10508 break;
10509
10510 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
10511 extension = 2; /* 1 opcode + 2 displacement */
10512 opcode[0] = 0xe9;
10513 where_to_put_displacement = &opcode[1];
10514 break;
10515
10516 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
10517 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
10518 extension = 5; /* 2 opcode + 4 displacement */
10519 opcode[1] = opcode[0] + 0x10;
10520 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10521 where_to_put_displacement = &opcode[2];
10522 break;
10523
10524 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
10525 extension = 3; /* 2 opcode + 2 displacement */
10526 opcode[1] = opcode[0] + 0x10;
10527 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10528 where_to_put_displacement = &opcode[2];
10529 break;
10530
10531 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
10532 extension = 4;
10533 opcode[0] ^= 1;
10534 opcode[1] = 3;
10535 opcode[2] = 0xe9;
10536 where_to_put_displacement = &opcode[3];
10537 break;
10538
10539 default:
10540 BAD_CASE (fragP->fr_subtype);
10541 break;
10542 }
10543 }
10544
10545 /* If size if less then four we are sure that the operand fits,
10546 but if it's 4, then it could be that the displacement is larger
10547 then -/+ 2GB. */
10548 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
10549 && object_64bit
10550 && ((addressT) (displacement_from_opcode_start - extension
10551 + ((addressT) 1 << 31))
10552 > (((addressT) 2 << 31) - 1)))
10553 {
10554 as_bad_where (fragP->fr_file, fragP->fr_line,
10555 _("jump target out of range"));
10556 /* Make us emit 0. */
10557 displacement_from_opcode_start = extension;
10558 }
10559 /* Now put displacement after opcode. */
10560 md_number_to_chars ((char *) where_to_put_displacement,
10561 (valueT) (displacement_from_opcode_start - extension),
10562 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
10563 fragP->fr_fix += extension;
10564 }
10565 \f
10566 /* Apply a fixup (fixP) to segment data, once it has been determined
10567 by our caller that we have all the info we need to fix it up.
10568
10569 Parameter valP is the pointer to the value of the bits.
10570
10571 On the 386, immediates, displacements, and data pointers are all in
10572 the same (little-endian) format, so we don't need to care about which
10573 we are handling. */
10574
10575 void
10576 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
10577 {
10578 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
10579 valueT value = *valP;
10580
10581 #if !defined (TE_Mach)
10582 if (fixP->fx_pcrel)
10583 {
10584 switch (fixP->fx_r_type)
10585 {
10586 default:
10587 break;
10588
10589 case BFD_RELOC_64:
10590 fixP->fx_r_type = BFD_RELOC_64_PCREL;
10591 break;
10592 case BFD_RELOC_32:
10593 case BFD_RELOC_X86_64_32S:
10594 fixP->fx_r_type = BFD_RELOC_32_PCREL;
10595 break;
10596 case BFD_RELOC_16:
10597 fixP->fx_r_type = BFD_RELOC_16_PCREL;
10598 break;
10599 case BFD_RELOC_8:
10600 fixP->fx_r_type = BFD_RELOC_8_PCREL;
10601 break;
10602 }
10603 }
10604
10605 if (fixP->fx_addsy != NULL
10606 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
10607 || fixP->fx_r_type == BFD_RELOC_64_PCREL
10608 || fixP->fx_r_type == BFD_RELOC_16_PCREL
10609 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
10610 && !use_rela_relocations)
10611 {
10612 /* This is a hack. There should be a better way to handle this.
10613 This covers for the fact that bfd_install_relocation will
10614 subtract the current location (for partial_inplace, PC relative
10615 relocations); see more below. */
10616 #ifndef OBJ_AOUT
10617 if (IS_ELF
10618 #ifdef TE_PE
10619 || OUTPUT_FLAVOR == bfd_target_coff_flavour
10620 #endif
10621 )
10622 value += fixP->fx_where + fixP->fx_frag->fr_address;
10623 #endif
10624 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10625 if (IS_ELF)
10626 {
10627 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
10628
10629 if ((sym_seg == seg
10630 || (symbol_section_p (fixP->fx_addsy)
10631 && sym_seg != absolute_section))
10632 && !generic_force_reloc (fixP))
10633 {
10634 /* Yes, we add the values in twice. This is because
10635 bfd_install_relocation subtracts them out again. I think
10636 bfd_install_relocation is broken, but I don't dare change
10637 it. FIXME. */
10638 value += fixP->fx_where + fixP->fx_frag->fr_address;
10639 }
10640 }
10641 #endif
10642 #if defined (OBJ_COFF) && defined (TE_PE)
10643 /* For some reason, the PE format does not store a
10644 section address offset for a PC relative symbol. */
10645 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
10646 || S_IS_WEAK (fixP->fx_addsy))
10647 value += md_pcrel_from (fixP);
10648 #endif
10649 }
10650 #if defined (OBJ_COFF) && defined (TE_PE)
10651 if (fixP->fx_addsy != NULL
10652 && S_IS_WEAK (fixP->fx_addsy)
10653 /* PR 16858: Do not modify weak function references. */
10654 && ! fixP->fx_pcrel)
10655 {
10656 #if !defined (TE_PEP)
10657 /* For x86 PE weak function symbols are neither PC-relative
10658 nor do they set S_IS_FUNCTION. So the only reliable way
10659 to detect them is to check the flags of their containing
10660 section. */
10661 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
10662 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
10663 ;
10664 else
10665 #endif
10666 value -= S_GET_VALUE (fixP->fx_addsy);
10667 }
10668 #endif
10669
10670 /* Fix a few things - the dynamic linker expects certain values here,
10671 and we must not disappoint it. */
10672 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10673 if (IS_ELF && fixP->fx_addsy)
10674 switch (fixP->fx_r_type)
10675 {
10676 case BFD_RELOC_386_PLT32:
10677 case BFD_RELOC_X86_64_PLT32:
10678 /* Make the jump instruction point to the address of the operand.
10679 At runtime we merely add the offset to the actual PLT entry.
10680 NB: Subtract the offset size only for jump instructions. */
10681 if (fixP->fx_pcrel)
10682 value = -4;
10683 break;
10684
10685 case BFD_RELOC_386_TLS_GD:
10686 case BFD_RELOC_386_TLS_LDM:
10687 case BFD_RELOC_386_TLS_IE_32:
10688 case BFD_RELOC_386_TLS_IE:
10689 case BFD_RELOC_386_TLS_GOTIE:
10690 case BFD_RELOC_386_TLS_GOTDESC:
10691 case BFD_RELOC_X86_64_TLSGD:
10692 case BFD_RELOC_X86_64_TLSLD:
10693 case BFD_RELOC_X86_64_GOTTPOFF:
10694 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10695 value = 0; /* Fully resolved at runtime. No addend. */
10696 /* Fallthrough */
10697 case BFD_RELOC_386_TLS_LE:
10698 case BFD_RELOC_386_TLS_LDO_32:
10699 case BFD_RELOC_386_TLS_LE_32:
10700 case BFD_RELOC_X86_64_DTPOFF32:
10701 case BFD_RELOC_X86_64_DTPOFF64:
10702 case BFD_RELOC_X86_64_TPOFF32:
10703 case BFD_RELOC_X86_64_TPOFF64:
10704 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10705 break;
10706
10707 case BFD_RELOC_386_TLS_DESC_CALL:
10708 case BFD_RELOC_X86_64_TLSDESC_CALL:
10709 value = 0; /* Fully resolved at runtime. No addend. */
10710 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10711 fixP->fx_done = 0;
10712 return;
10713
10714 case BFD_RELOC_VTABLE_INHERIT:
10715 case BFD_RELOC_VTABLE_ENTRY:
10716 fixP->fx_done = 0;
10717 return;
10718
10719 default:
10720 break;
10721 }
10722 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
10723 *valP = value;
10724 #endif /* !defined (TE_Mach) */
10725
10726 /* Are we finished with this relocation now? */
10727 if (fixP->fx_addsy == NULL)
10728 fixP->fx_done = 1;
10729 #if defined (OBJ_COFF) && defined (TE_PE)
10730 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
10731 {
10732 fixP->fx_done = 0;
10733 /* Remember value for tc_gen_reloc. */
10734 fixP->fx_addnumber = value;
10735 /* Clear out the frag for now. */
10736 value = 0;
10737 }
10738 #endif
10739 else if (use_rela_relocations)
10740 {
10741 fixP->fx_no_overflow = 1;
10742 /* Remember value for tc_gen_reloc. */
10743 fixP->fx_addnumber = value;
10744 value = 0;
10745 }
10746
10747 md_number_to_chars (p, value, fixP->fx_size);
10748 }
10749 \f
10750 const char *
10751 md_atof (int type, char *litP, int *sizeP)
10752 {
10753 /* This outputs the LITTLENUMs in REVERSE order;
10754 in accord with the bigendian 386. */
10755 return ieee_md_atof (type, litP, sizeP, FALSE);
10756 }
10757 \f
10758 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
10759
10760 static char *
10761 output_invalid (int c)
10762 {
10763 if (ISPRINT (c))
10764 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
10765 "'%c'", c);
10766 else
10767 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
10768 "(0x%x)", (unsigned char) c);
10769 return output_invalid_buf;
10770 }
10771
10772 /* REG_STRING starts *before* REGISTER_PREFIX. */
10773
10774 static const reg_entry *
10775 parse_real_register (char *reg_string, char **end_op)
10776 {
10777 char *s = reg_string;
10778 char *p;
10779 char reg_name_given[MAX_REG_NAME_SIZE + 1];
10780 const reg_entry *r;
10781
10782 /* Skip possible REGISTER_PREFIX and possible whitespace. */
10783 if (*s == REGISTER_PREFIX)
10784 ++s;
10785
10786 if (is_space_char (*s))
10787 ++s;
10788
10789 p = reg_name_given;
10790 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
10791 {
10792 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
10793 return (const reg_entry *) NULL;
10794 s++;
10795 }
10796
10797 /* For naked regs, make sure that we are not dealing with an identifier.
10798 This prevents confusing an identifier like `eax_var' with register
10799 `eax'. */
10800 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
10801 return (const reg_entry *) NULL;
10802
10803 *end_op = s;
10804
10805 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
10806
10807 /* Handle floating point regs, allowing spaces in the (i) part. */
10808 if (r == i386_regtab /* %st is first entry of table */)
10809 {
10810 if (!cpu_arch_flags.bitfield.cpu8087
10811 && !cpu_arch_flags.bitfield.cpu287
10812 && !cpu_arch_flags.bitfield.cpu387)
10813 return (const reg_entry *) NULL;
10814
10815 if (is_space_char (*s))
10816 ++s;
10817 if (*s == '(')
10818 {
10819 ++s;
10820 if (is_space_char (*s))
10821 ++s;
10822 if (*s >= '0' && *s <= '7')
10823 {
10824 int fpr = *s - '0';
10825 ++s;
10826 if (is_space_char (*s))
10827 ++s;
10828 if (*s == ')')
10829 {
10830 *end_op = s + 1;
10831 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
10832 know (r);
10833 return r + fpr;
10834 }
10835 }
10836 /* We have "%st(" then garbage. */
10837 return (const reg_entry *) NULL;
10838 }
10839 }
10840
10841 if (r == NULL || allow_pseudo_reg)
10842 return r;
10843
10844 if (operand_type_all_zero (&r->reg_type))
10845 return (const reg_entry *) NULL;
10846
10847 if ((r->reg_type.bitfield.dword
10848 || r->reg_type.bitfield.sreg3
10849 || r->reg_type.bitfield.control
10850 || r->reg_type.bitfield.debug
10851 || r->reg_type.bitfield.test)
10852 && !cpu_arch_flags.bitfield.cpui386)
10853 return (const reg_entry *) NULL;
10854
10855 if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
10856 return (const reg_entry *) NULL;
10857
10858 if (!cpu_arch_flags.bitfield.cpuavx512f)
10859 {
10860 if (r->reg_type.bitfield.zmmword || r->reg_type.bitfield.regmask)
10861 return (const reg_entry *) NULL;
10862
10863 if (!cpu_arch_flags.bitfield.cpuavx)
10864 {
10865 if (r->reg_type.bitfield.ymmword)
10866 return (const reg_entry *) NULL;
10867
10868 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
10869 return (const reg_entry *) NULL;
10870 }
10871 }
10872
10873 if (r->reg_type.bitfield.regbnd && !cpu_arch_flags.bitfield.cpumpx)
10874 return (const reg_entry *) NULL;
10875
10876 /* Don't allow fake index register unless allow_index_reg isn't 0. */
10877 if (!allow_index_reg && r->reg_num == RegIZ)
10878 return (const reg_entry *) NULL;
10879
10880 /* Upper 16 vector registers are only available with VREX in 64bit
10881 mode, and require EVEX encoding. */
10882 if (r->reg_flags & RegVRex)
10883 {
10884 if (!cpu_arch_flags.bitfield.cpuavx512f
10885 || flag_code != CODE_64BIT)
10886 return (const reg_entry *) NULL;
10887
10888 i.vec_encoding = vex_encoding_evex;
10889 }
10890
10891 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
10892 && (!cpu_arch_flags.bitfield.cpulm || !r->reg_type.bitfield.control)
10893 && flag_code != CODE_64BIT)
10894 return (const reg_entry *) NULL;
10895
10896 if (r->reg_type.bitfield.sreg3 && r->reg_num == RegFlat && !intel_syntax)
10897 return (const reg_entry *) NULL;
10898
10899 return r;
10900 }
10901
10902 /* REG_STRING starts *before* REGISTER_PREFIX. */
10903
10904 static const reg_entry *
10905 parse_register (char *reg_string, char **end_op)
10906 {
10907 const reg_entry *r;
10908
10909 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
10910 r = parse_real_register (reg_string, end_op);
10911 else
10912 r = NULL;
10913 if (!r)
10914 {
10915 char *save = input_line_pointer;
10916 char c;
10917 symbolS *symbolP;
10918
10919 input_line_pointer = reg_string;
10920 c = get_symbol_name (&reg_string);
10921 symbolP = symbol_find (reg_string);
10922 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
10923 {
10924 const expressionS *e = symbol_get_value_expression (symbolP);
10925
10926 know (e->X_op == O_register);
10927 know (e->X_add_number >= 0
10928 && (valueT) e->X_add_number < i386_regtab_size);
10929 r = i386_regtab + e->X_add_number;
10930 if ((r->reg_flags & RegVRex))
10931 i.vec_encoding = vex_encoding_evex;
10932 *end_op = input_line_pointer;
10933 }
10934 *input_line_pointer = c;
10935 input_line_pointer = save;
10936 }
10937 return r;
10938 }
10939
10940 int
10941 i386_parse_name (char *name, expressionS *e, char *nextcharP)
10942 {
10943 const reg_entry *r;
10944 char *end = input_line_pointer;
10945
10946 *end = *nextcharP;
10947 r = parse_register (name, &input_line_pointer);
10948 if (r && end <= input_line_pointer)
10949 {
10950 *nextcharP = *input_line_pointer;
10951 *input_line_pointer = 0;
10952 e->X_op = O_register;
10953 e->X_add_number = r - i386_regtab;
10954 return 1;
10955 }
10956 input_line_pointer = end;
10957 *end = 0;
10958 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
10959 }
10960
10961 void
10962 md_operand (expressionS *e)
10963 {
10964 char *end;
10965 const reg_entry *r;
10966
10967 switch (*input_line_pointer)
10968 {
10969 case REGISTER_PREFIX:
10970 r = parse_real_register (input_line_pointer, &end);
10971 if (r)
10972 {
10973 e->X_op = O_register;
10974 e->X_add_number = r - i386_regtab;
10975 input_line_pointer = end;
10976 }
10977 break;
10978
10979 case '[':
10980 gas_assert (intel_syntax);
10981 end = input_line_pointer++;
10982 expression (e);
10983 if (*input_line_pointer == ']')
10984 {
10985 ++input_line_pointer;
10986 e->X_op_symbol = make_expr_symbol (e);
10987 e->X_add_symbol = NULL;
10988 e->X_add_number = 0;
10989 e->X_op = O_index;
10990 }
10991 else
10992 {
10993 e->X_op = O_absent;
10994 input_line_pointer = end;
10995 }
10996 break;
10997 }
10998 }
10999
11000 \f
11001 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11002 const char *md_shortopts = "kVQ:sqnO::";
11003 #else
11004 const char *md_shortopts = "qnO::";
11005 #endif
11006
11007 #define OPTION_32 (OPTION_MD_BASE + 0)
11008 #define OPTION_64 (OPTION_MD_BASE + 1)
11009 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
11010 #define OPTION_MARCH (OPTION_MD_BASE + 3)
11011 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
11012 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
11013 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
11014 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
11015 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
11016 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
11017 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
11018 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
11019 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
11020 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
11021 #define OPTION_X32 (OPTION_MD_BASE + 14)
11022 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
11023 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
11024 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
11025 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
11026 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
11027 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
11028 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
11029 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
11030 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
11031 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
11032 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
11033 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
11034
11035 struct option md_longopts[] =
11036 {
11037 {"32", no_argument, NULL, OPTION_32},
11038 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11039 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11040 {"64", no_argument, NULL, OPTION_64},
11041 #endif
11042 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11043 {"x32", no_argument, NULL, OPTION_X32},
11044 {"mshared", no_argument, NULL, OPTION_MSHARED},
11045 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
11046 #endif
11047 {"divide", no_argument, NULL, OPTION_DIVIDE},
11048 {"march", required_argument, NULL, OPTION_MARCH},
11049 {"mtune", required_argument, NULL, OPTION_MTUNE},
11050 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
11051 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
11052 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
11053 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
11054 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
11055 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
11056 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
11057 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
11058 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
11059 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
11060 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
11061 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
11062 # if defined (TE_PE) || defined (TE_PEP)
11063 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
11064 #endif
11065 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
11066 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
11067 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
11068 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
11069 {"mamd64", no_argument, NULL, OPTION_MAMD64},
11070 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
11071 {NULL, no_argument, NULL, 0}
11072 };
11073 size_t md_longopts_size = sizeof (md_longopts);
11074
11075 int
11076 md_parse_option (int c, const char *arg)
11077 {
11078 unsigned int j;
11079 char *arch, *next, *saved;
11080
11081 switch (c)
11082 {
11083 case 'n':
11084 optimize_align_code = 0;
11085 break;
11086
11087 case 'q':
11088 quiet_warnings = 1;
11089 break;
11090
11091 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11092 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
11093 should be emitted or not. FIXME: Not implemented. */
11094 case 'Q':
11095 break;
11096
11097 /* -V: SVR4 argument to print version ID. */
11098 case 'V':
11099 print_version_id ();
11100 break;
11101
11102 /* -k: Ignore for FreeBSD compatibility. */
11103 case 'k':
11104 break;
11105
11106 case 's':
11107 /* -s: On i386 Solaris, this tells the native assembler to use
11108 .stab instead of .stab.excl. We always use .stab anyhow. */
11109 break;
11110
11111 case OPTION_MSHARED:
11112 shared = 1;
11113 break;
11114
11115 case OPTION_X86_USED_NOTE:
11116 if (strcasecmp (arg, "yes") == 0)
11117 x86_used_note = 1;
11118 else if (strcasecmp (arg, "no") == 0)
11119 x86_used_note = 0;
11120 else
11121 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
11122 break;
11123
11124
11125 #endif
11126 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11127 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11128 case OPTION_64:
11129 {
11130 const char **list, **l;
11131
11132 list = bfd_target_list ();
11133 for (l = list; *l != NULL; l++)
11134 if (CONST_STRNEQ (*l, "elf64-x86-64")
11135 || strcmp (*l, "coff-x86-64") == 0
11136 || strcmp (*l, "pe-x86-64") == 0
11137 || strcmp (*l, "pei-x86-64") == 0
11138 || strcmp (*l, "mach-o-x86-64") == 0)
11139 {
11140 default_arch = "x86_64";
11141 break;
11142 }
11143 if (*l == NULL)
11144 as_fatal (_("no compiled in support for x86_64"));
11145 free (list);
11146 }
11147 break;
11148 #endif
11149
11150 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11151 case OPTION_X32:
11152 if (IS_ELF)
11153 {
11154 const char **list, **l;
11155
11156 list = bfd_target_list ();
11157 for (l = list; *l != NULL; l++)
11158 if (CONST_STRNEQ (*l, "elf32-x86-64"))
11159 {
11160 default_arch = "x86_64:32";
11161 break;
11162 }
11163 if (*l == NULL)
11164 as_fatal (_("no compiled in support for 32bit x86_64"));
11165 free (list);
11166 }
11167 else
11168 as_fatal (_("32bit x86_64 is only supported for ELF"));
11169 break;
11170 #endif
11171
11172 case OPTION_32:
11173 default_arch = "i386";
11174 break;
11175
11176 case OPTION_DIVIDE:
11177 #ifdef SVR4_COMMENT_CHARS
11178 {
11179 char *n, *t;
11180 const char *s;
11181
11182 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
11183 t = n;
11184 for (s = i386_comment_chars; *s != '\0'; s++)
11185 if (*s != '/')
11186 *t++ = *s;
11187 *t = '\0';
11188 i386_comment_chars = n;
11189 }
11190 #endif
11191 break;
11192
11193 case OPTION_MARCH:
11194 saved = xstrdup (arg);
11195 arch = saved;
11196 /* Allow -march=+nosse. */
11197 if (*arch == '+')
11198 arch++;
11199 do
11200 {
11201 if (*arch == '.')
11202 as_fatal (_("invalid -march= option: `%s'"), arg);
11203 next = strchr (arch, '+');
11204 if (next)
11205 *next++ = '\0';
11206 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11207 {
11208 if (strcmp (arch, cpu_arch [j].name) == 0)
11209 {
11210 /* Processor. */
11211 if (! cpu_arch[j].flags.bitfield.cpui386)
11212 continue;
11213
11214 cpu_arch_name = cpu_arch[j].name;
11215 cpu_sub_arch_name = NULL;
11216 cpu_arch_flags = cpu_arch[j].flags;
11217 cpu_arch_isa = cpu_arch[j].type;
11218 cpu_arch_isa_flags = cpu_arch[j].flags;
11219 if (!cpu_arch_tune_set)
11220 {
11221 cpu_arch_tune = cpu_arch_isa;
11222 cpu_arch_tune_flags = cpu_arch_isa_flags;
11223 }
11224 break;
11225 }
11226 else if (*cpu_arch [j].name == '.'
11227 && strcmp (arch, cpu_arch [j].name + 1) == 0)
11228 {
11229 /* ISA extension. */
11230 i386_cpu_flags flags;
11231
11232 flags = cpu_flags_or (cpu_arch_flags,
11233 cpu_arch[j].flags);
11234
11235 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
11236 {
11237 if (cpu_sub_arch_name)
11238 {
11239 char *name = cpu_sub_arch_name;
11240 cpu_sub_arch_name = concat (name,
11241 cpu_arch[j].name,
11242 (const char *) NULL);
11243 free (name);
11244 }
11245 else
11246 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
11247 cpu_arch_flags = flags;
11248 cpu_arch_isa_flags = flags;
11249 }
11250 else
11251 cpu_arch_isa_flags
11252 = cpu_flags_or (cpu_arch_isa_flags,
11253 cpu_arch[j].flags);
11254 break;
11255 }
11256 }
11257
11258 if (j >= ARRAY_SIZE (cpu_arch))
11259 {
11260 /* Disable an ISA extension. */
11261 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11262 if (strcmp (arch, cpu_noarch [j].name) == 0)
11263 {
11264 i386_cpu_flags flags;
11265
11266 flags = cpu_flags_and_not (cpu_arch_flags,
11267 cpu_noarch[j].flags);
11268 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
11269 {
11270 if (cpu_sub_arch_name)
11271 {
11272 char *name = cpu_sub_arch_name;
11273 cpu_sub_arch_name = concat (arch,
11274 (const char *) NULL);
11275 free (name);
11276 }
11277 else
11278 cpu_sub_arch_name = xstrdup (arch);
11279 cpu_arch_flags = flags;
11280 cpu_arch_isa_flags = flags;
11281 }
11282 break;
11283 }
11284
11285 if (j >= ARRAY_SIZE (cpu_noarch))
11286 j = ARRAY_SIZE (cpu_arch);
11287 }
11288
11289 if (j >= ARRAY_SIZE (cpu_arch))
11290 as_fatal (_("invalid -march= option: `%s'"), arg);
11291
11292 arch = next;
11293 }
11294 while (next != NULL);
11295 free (saved);
11296 break;
11297
11298 case OPTION_MTUNE:
11299 if (*arg == '.')
11300 as_fatal (_("invalid -mtune= option: `%s'"), arg);
11301 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11302 {
11303 if (strcmp (arg, cpu_arch [j].name) == 0)
11304 {
11305 cpu_arch_tune_set = 1;
11306 cpu_arch_tune = cpu_arch [j].type;
11307 cpu_arch_tune_flags = cpu_arch[j].flags;
11308 break;
11309 }
11310 }
11311 if (j >= ARRAY_SIZE (cpu_arch))
11312 as_fatal (_("invalid -mtune= option: `%s'"), arg);
11313 break;
11314
11315 case OPTION_MMNEMONIC:
11316 if (strcasecmp (arg, "att") == 0)
11317 intel_mnemonic = 0;
11318 else if (strcasecmp (arg, "intel") == 0)
11319 intel_mnemonic = 1;
11320 else
11321 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
11322 break;
11323
11324 case OPTION_MSYNTAX:
11325 if (strcasecmp (arg, "att") == 0)
11326 intel_syntax = 0;
11327 else if (strcasecmp (arg, "intel") == 0)
11328 intel_syntax = 1;
11329 else
11330 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
11331 break;
11332
11333 case OPTION_MINDEX_REG:
11334 allow_index_reg = 1;
11335 break;
11336
11337 case OPTION_MNAKED_REG:
11338 allow_naked_reg = 1;
11339 break;
11340
11341 case OPTION_MSSE2AVX:
11342 sse2avx = 1;
11343 break;
11344
11345 case OPTION_MSSE_CHECK:
11346 if (strcasecmp (arg, "error") == 0)
11347 sse_check = check_error;
11348 else if (strcasecmp (arg, "warning") == 0)
11349 sse_check = check_warning;
11350 else if (strcasecmp (arg, "none") == 0)
11351 sse_check = check_none;
11352 else
11353 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
11354 break;
11355
11356 case OPTION_MOPERAND_CHECK:
11357 if (strcasecmp (arg, "error") == 0)
11358 operand_check = check_error;
11359 else if (strcasecmp (arg, "warning") == 0)
11360 operand_check = check_warning;
11361 else if (strcasecmp (arg, "none") == 0)
11362 operand_check = check_none;
11363 else
11364 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
11365 break;
11366
11367 case OPTION_MAVXSCALAR:
11368 if (strcasecmp (arg, "128") == 0)
11369 avxscalar = vex128;
11370 else if (strcasecmp (arg, "256") == 0)
11371 avxscalar = vex256;
11372 else
11373 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
11374 break;
11375
11376 case OPTION_MVEXWIG:
11377 if (strcmp (arg, "0") == 0)
11378 vexwig = evexw0;
11379 else if (strcmp (arg, "1") == 0)
11380 vexwig = evexw1;
11381 else
11382 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
11383 break;
11384
11385 case OPTION_MADD_BND_PREFIX:
11386 add_bnd_prefix = 1;
11387 break;
11388
11389 case OPTION_MEVEXLIG:
11390 if (strcmp (arg, "128") == 0)
11391 evexlig = evexl128;
11392 else if (strcmp (arg, "256") == 0)
11393 evexlig = evexl256;
11394 else if (strcmp (arg, "512") == 0)
11395 evexlig = evexl512;
11396 else
11397 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
11398 break;
11399
11400 case OPTION_MEVEXRCIG:
11401 if (strcmp (arg, "rne") == 0)
11402 evexrcig = rne;
11403 else if (strcmp (arg, "rd") == 0)
11404 evexrcig = rd;
11405 else if (strcmp (arg, "ru") == 0)
11406 evexrcig = ru;
11407 else if (strcmp (arg, "rz") == 0)
11408 evexrcig = rz;
11409 else
11410 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
11411 break;
11412
11413 case OPTION_MEVEXWIG:
11414 if (strcmp (arg, "0") == 0)
11415 evexwig = evexw0;
11416 else if (strcmp (arg, "1") == 0)
11417 evexwig = evexw1;
11418 else
11419 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
11420 break;
11421
11422 # if defined (TE_PE) || defined (TE_PEP)
11423 case OPTION_MBIG_OBJ:
11424 use_big_obj = 1;
11425 break;
11426 #endif
11427
11428 case OPTION_MOMIT_LOCK_PREFIX:
11429 if (strcasecmp (arg, "yes") == 0)
11430 omit_lock_prefix = 1;
11431 else if (strcasecmp (arg, "no") == 0)
11432 omit_lock_prefix = 0;
11433 else
11434 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
11435 break;
11436
11437 case OPTION_MFENCE_AS_LOCK_ADD:
11438 if (strcasecmp (arg, "yes") == 0)
11439 avoid_fence = 1;
11440 else if (strcasecmp (arg, "no") == 0)
11441 avoid_fence = 0;
11442 else
11443 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
11444 break;
11445
11446 case OPTION_MRELAX_RELOCATIONS:
11447 if (strcasecmp (arg, "yes") == 0)
11448 generate_relax_relocations = 1;
11449 else if (strcasecmp (arg, "no") == 0)
11450 generate_relax_relocations = 0;
11451 else
11452 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
11453 break;
11454
11455 case OPTION_MAMD64:
11456 intel64 = 0;
11457 break;
11458
11459 case OPTION_MINTEL64:
11460 intel64 = 1;
11461 break;
11462
11463 case 'O':
11464 if (arg == NULL)
11465 {
11466 optimize = 1;
11467 /* Turn off -Os. */
11468 optimize_for_space = 0;
11469 }
11470 else if (*arg == 's')
11471 {
11472 optimize_for_space = 1;
11473 /* Turn on all encoding optimizations. */
11474 optimize = INT_MAX;
11475 }
11476 else
11477 {
11478 optimize = atoi (arg);
11479 /* Turn off -Os. */
11480 optimize_for_space = 0;
11481 }
11482 break;
11483
11484 default:
11485 return 0;
11486 }
11487 return 1;
11488 }
11489
11490 #define MESSAGE_TEMPLATE \
11491 " "
11492
11493 static char *
11494 output_message (FILE *stream, char *p, char *message, char *start,
11495 int *left_p, const char *name, int len)
11496 {
11497 int size = sizeof (MESSAGE_TEMPLATE);
11498 int left = *left_p;
11499
11500 /* Reserve 2 spaces for ", " or ",\0" */
11501 left -= len + 2;
11502
11503 /* Check if there is any room. */
11504 if (left >= 0)
11505 {
11506 if (p != start)
11507 {
11508 *p++ = ',';
11509 *p++ = ' ';
11510 }
11511 p = mempcpy (p, name, len);
11512 }
11513 else
11514 {
11515 /* Output the current message now and start a new one. */
11516 *p++ = ',';
11517 *p = '\0';
11518 fprintf (stream, "%s\n", message);
11519 p = start;
11520 left = size - (start - message) - len - 2;
11521
11522 gas_assert (left >= 0);
11523
11524 p = mempcpy (p, name, len);
11525 }
11526
11527 *left_p = left;
11528 return p;
11529 }
11530
11531 static void
11532 show_arch (FILE *stream, int ext, int check)
11533 {
11534 static char message[] = MESSAGE_TEMPLATE;
11535 char *start = message + 27;
11536 char *p;
11537 int size = sizeof (MESSAGE_TEMPLATE);
11538 int left;
11539 const char *name;
11540 int len;
11541 unsigned int j;
11542
11543 p = start;
11544 left = size - (start - message);
11545 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11546 {
11547 /* Should it be skipped? */
11548 if (cpu_arch [j].skip)
11549 continue;
11550
11551 name = cpu_arch [j].name;
11552 len = cpu_arch [j].len;
11553 if (*name == '.')
11554 {
11555 /* It is an extension. Skip if we aren't asked to show it. */
11556 if (ext)
11557 {
11558 name++;
11559 len--;
11560 }
11561 else
11562 continue;
11563 }
11564 else if (ext)
11565 {
11566 /* It is an processor. Skip if we show only extension. */
11567 continue;
11568 }
11569 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
11570 {
11571 /* It is an impossible processor - skip. */
11572 continue;
11573 }
11574
11575 p = output_message (stream, p, message, start, &left, name, len);
11576 }
11577
11578 /* Display disabled extensions. */
11579 if (ext)
11580 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11581 {
11582 name = cpu_noarch [j].name;
11583 len = cpu_noarch [j].len;
11584 p = output_message (stream, p, message, start, &left, name,
11585 len);
11586 }
11587
11588 *p = '\0';
11589 fprintf (stream, "%s\n", message);
11590 }
11591
11592 void
11593 md_show_usage (FILE *stream)
11594 {
11595 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11596 fprintf (stream, _("\
11597 -Q ignored\n\
11598 -V print assembler version number\n\
11599 -k ignored\n"));
11600 #endif
11601 fprintf (stream, _("\
11602 -n Do not optimize code alignment\n\
11603 -q quieten some warnings\n"));
11604 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11605 fprintf (stream, _("\
11606 -s ignored\n"));
11607 #endif
11608 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11609 || defined (TE_PE) || defined (TE_PEP))
11610 fprintf (stream, _("\
11611 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
11612 #endif
11613 #ifdef SVR4_COMMENT_CHARS
11614 fprintf (stream, _("\
11615 --divide do not treat `/' as a comment character\n"));
11616 #else
11617 fprintf (stream, _("\
11618 --divide ignored\n"));
11619 #endif
11620 fprintf (stream, _("\
11621 -march=CPU[,+EXTENSION...]\n\
11622 generate code for CPU and EXTENSION, CPU is one of:\n"));
11623 show_arch (stream, 0, 1);
11624 fprintf (stream, _("\
11625 EXTENSION is combination of:\n"));
11626 show_arch (stream, 1, 0);
11627 fprintf (stream, _("\
11628 -mtune=CPU optimize for CPU, CPU is one of:\n"));
11629 show_arch (stream, 0, 0);
11630 fprintf (stream, _("\
11631 -msse2avx encode SSE instructions with VEX prefix\n"));
11632 fprintf (stream, _("\
11633 -msse-check=[none|error|warning] (default: warning)\n\
11634 check SSE instructions\n"));
11635 fprintf (stream, _("\
11636 -moperand-check=[none|error|warning] (default: warning)\n\
11637 check operand combinations for validity\n"));
11638 fprintf (stream, _("\
11639 -mavxscalar=[128|256] (default: 128)\n\
11640 encode scalar AVX instructions with specific vector\n\
11641 length\n"));
11642 fprintf (stream, _("\
11643 -mvexwig=[0|1] (default: 0)\n\
11644 encode VEX instructions with specific VEX.W value\n\
11645 for VEX.W bit ignored instructions\n"));
11646 fprintf (stream, _("\
11647 -mevexlig=[128|256|512] (default: 128)\n\
11648 encode scalar EVEX instructions with specific vector\n\
11649 length\n"));
11650 fprintf (stream, _("\
11651 -mevexwig=[0|1] (default: 0)\n\
11652 encode EVEX instructions with specific EVEX.W value\n\
11653 for EVEX.W bit ignored instructions\n"));
11654 fprintf (stream, _("\
11655 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
11656 encode EVEX instructions with specific EVEX.RC value\n\
11657 for SAE-only ignored instructions\n"));
11658 fprintf (stream, _("\
11659 -mmnemonic=[att|intel] "));
11660 if (SYSV386_COMPAT)
11661 fprintf (stream, _("(default: att)\n"));
11662 else
11663 fprintf (stream, _("(default: intel)\n"));
11664 fprintf (stream, _("\
11665 use AT&T/Intel mnemonic\n"));
11666 fprintf (stream, _("\
11667 -msyntax=[att|intel] (default: att)\n\
11668 use AT&T/Intel syntax\n"));
11669 fprintf (stream, _("\
11670 -mindex-reg support pseudo index registers\n"));
11671 fprintf (stream, _("\
11672 -mnaked-reg don't require `%%' prefix for registers\n"));
11673 fprintf (stream, _("\
11674 -madd-bnd-prefix add BND prefix for all valid branches\n"));
11675 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11676 fprintf (stream, _("\
11677 -mshared disable branch optimization for shared code\n"));
11678 fprintf (stream, _("\
11679 -mx86-used-note=[no|yes] "));
11680 if (DEFAULT_X86_USED_NOTE)
11681 fprintf (stream, _("(default: yes)\n"));
11682 else
11683 fprintf (stream, _("(default: no)\n"));
11684 fprintf (stream, _("\
11685 generate x86 used ISA and feature properties\n"));
11686 #endif
11687 #if defined (TE_PE) || defined (TE_PEP)
11688 fprintf (stream, _("\
11689 -mbig-obj generate big object files\n"));
11690 #endif
11691 fprintf (stream, _("\
11692 -momit-lock-prefix=[no|yes] (default: no)\n\
11693 strip all lock prefixes\n"));
11694 fprintf (stream, _("\
11695 -mfence-as-lock-add=[no|yes] (default: no)\n\
11696 encode lfence, mfence and sfence as\n\
11697 lock addl $0x0, (%%{re}sp)\n"));
11698 fprintf (stream, _("\
11699 -mrelax-relocations=[no|yes] "));
11700 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
11701 fprintf (stream, _("(default: yes)\n"));
11702 else
11703 fprintf (stream, _("(default: no)\n"));
11704 fprintf (stream, _("\
11705 generate relax relocations\n"));
11706 fprintf (stream, _("\
11707 -mamd64 accept only AMD64 ISA [default]\n"));
11708 fprintf (stream, _("\
11709 -mintel64 accept only Intel64 ISA\n"));
11710 }
11711
11712 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
11713 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11714 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11715
11716 /* Pick the target format to use. */
11717
11718 const char *
11719 i386_target_format (void)
11720 {
11721 if (!strncmp (default_arch, "x86_64", 6))
11722 {
11723 update_code_flag (CODE_64BIT, 1);
11724 if (default_arch[6] == '\0')
11725 x86_elf_abi = X86_64_ABI;
11726 else
11727 x86_elf_abi = X86_64_X32_ABI;
11728 }
11729 else if (!strcmp (default_arch, "i386"))
11730 update_code_flag (CODE_32BIT, 1);
11731 else if (!strcmp (default_arch, "iamcu"))
11732 {
11733 update_code_flag (CODE_32BIT, 1);
11734 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
11735 {
11736 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
11737 cpu_arch_name = "iamcu";
11738 cpu_sub_arch_name = NULL;
11739 cpu_arch_flags = iamcu_flags;
11740 cpu_arch_isa = PROCESSOR_IAMCU;
11741 cpu_arch_isa_flags = iamcu_flags;
11742 if (!cpu_arch_tune_set)
11743 {
11744 cpu_arch_tune = cpu_arch_isa;
11745 cpu_arch_tune_flags = cpu_arch_isa_flags;
11746 }
11747 }
11748 else if (cpu_arch_isa != PROCESSOR_IAMCU)
11749 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
11750 cpu_arch_name);
11751 }
11752 else
11753 as_fatal (_("unknown architecture"));
11754
11755 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
11756 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11757 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
11758 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11759
11760 switch (OUTPUT_FLAVOR)
11761 {
11762 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
11763 case bfd_target_aout_flavour:
11764 return AOUT_TARGET_FORMAT;
11765 #endif
11766 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
11767 # if defined (TE_PE) || defined (TE_PEP)
11768 case bfd_target_coff_flavour:
11769 if (flag_code == CODE_64BIT)
11770 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
11771 else
11772 return "pe-i386";
11773 # elif defined (TE_GO32)
11774 case bfd_target_coff_flavour:
11775 return "coff-go32";
11776 # else
11777 case bfd_target_coff_flavour:
11778 return "coff-i386";
11779 # endif
11780 #endif
11781 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
11782 case bfd_target_elf_flavour:
11783 {
11784 const char *format;
11785
11786 switch (x86_elf_abi)
11787 {
11788 default:
11789 format = ELF_TARGET_FORMAT;
11790 break;
11791 case X86_64_ABI:
11792 use_rela_relocations = 1;
11793 object_64bit = 1;
11794 format = ELF_TARGET_FORMAT64;
11795 break;
11796 case X86_64_X32_ABI:
11797 use_rela_relocations = 1;
11798 object_64bit = 1;
11799 disallow_64bit_reloc = 1;
11800 format = ELF_TARGET_FORMAT32;
11801 break;
11802 }
11803 if (cpu_arch_isa == PROCESSOR_L1OM)
11804 {
11805 if (x86_elf_abi != X86_64_ABI)
11806 as_fatal (_("Intel L1OM is 64bit only"));
11807 return ELF_TARGET_L1OM_FORMAT;
11808 }
11809 else if (cpu_arch_isa == PROCESSOR_K1OM)
11810 {
11811 if (x86_elf_abi != X86_64_ABI)
11812 as_fatal (_("Intel K1OM is 64bit only"));
11813 return ELF_TARGET_K1OM_FORMAT;
11814 }
11815 else if (cpu_arch_isa == PROCESSOR_IAMCU)
11816 {
11817 if (x86_elf_abi != I386_ABI)
11818 as_fatal (_("Intel MCU is 32bit only"));
11819 return ELF_TARGET_IAMCU_FORMAT;
11820 }
11821 else
11822 return format;
11823 }
11824 #endif
11825 #if defined (OBJ_MACH_O)
11826 case bfd_target_mach_o_flavour:
11827 if (flag_code == CODE_64BIT)
11828 {
11829 use_rela_relocations = 1;
11830 object_64bit = 1;
11831 return "mach-o-x86-64";
11832 }
11833 else
11834 return "mach-o-i386";
11835 #endif
11836 default:
11837 abort ();
11838 return NULL;
11839 }
11840 }
11841
11842 #endif /* OBJ_MAYBE_ more than one */
11843 \f
11844 symbolS *
11845 md_undefined_symbol (char *name)
11846 {
11847 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
11848 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
11849 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
11850 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
11851 {
11852 if (!GOT_symbol)
11853 {
11854 if (symbol_find (name))
11855 as_bad (_("GOT already in symbol table"));
11856 GOT_symbol = symbol_new (name, undefined_section,
11857 (valueT) 0, &zero_address_frag);
11858 };
11859 return GOT_symbol;
11860 }
11861 return 0;
11862 }
11863
11864 /* Round up a section size to the appropriate boundary. */
11865
11866 valueT
11867 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
11868 {
11869 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
11870 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
11871 {
11872 /* For a.out, force the section size to be aligned. If we don't do
11873 this, BFD will align it for us, but it will not write out the
11874 final bytes of the section. This may be a bug in BFD, but it is
11875 easier to fix it here since that is how the other a.out targets
11876 work. */
11877 int align;
11878
11879 align = bfd_get_section_alignment (stdoutput, segment);
11880 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
11881 }
11882 #endif
11883
11884 return size;
11885 }
11886
11887 /* On the i386, PC-relative offsets are relative to the start of the
11888 next instruction. That is, the address of the offset, plus its
11889 size, since the offset is always the last part of the insn. */
11890
11891 long
11892 md_pcrel_from (fixS *fixP)
11893 {
11894 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
11895 }
11896
11897 #ifndef I386COFF
11898
11899 static void
11900 s_bss (int ignore ATTRIBUTE_UNUSED)
11901 {
11902 int temp;
11903
11904 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11905 if (IS_ELF)
11906 obj_elf_section_change_hook ();
11907 #endif
11908 temp = get_absolute_expression ();
11909 subseg_set (bss_section, (subsegT) temp);
11910 demand_empty_rest_of_line ();
11911 }
11912
11913 #endif
11914
11915 void
11916 i386_validate_fix (fixS *fixp)
11917 {
11918 if (fixp->fx_subsy)
11919 {
11920 if (fixp->fx_subsy == GOT_symbol)
11921 {
11922 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
11923 {
11924 if (!object_64bit)
11925 abort ();
11926 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11927 if (fixp->fx_tcbit2)
11928 fixp->fx_r_type = (fixp->fx_tcbit
11929 ? BFD_RELOC_X86_64_REX_GOTPCRELX
11930 : BFD_RELOC_X86_64_GOTPCRELX);
11931 else
11932 #endif
11933 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
11934 }
11935 else
11936 {
11937 if (!object_64bit)
11938 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
11939 else
11940 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
11941 }
11942 fixp->fx_subsy = 0;
11943 }
11944 }
11945 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11946 else if (!object_64bit)
11947 {
11948 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
11949 && fixp->fx_tcbit2)
11950 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
11951 }
11952 #endif
11953 }
11954
11955 arelent *
11956 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
11957 {
11958 arelent *rel;
11959 bfd_reloc_code_real_type code;
11960
11961 switch (fixp->fx_r_type)
11962 {
11963 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11964 case BFD_RELOC_SIZE32:
11965 case BFD_RELOC_SIZE64:
11966 if (S_IS_DEFINED (fixp->fx_addsy)
11967 && !S_IS_EXTERNAL (fixp->fx_addsy))
11968 {
11969 /* Resolve size relocation against local symbol to size of
11970 the symbol plus addend. */
11971 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
11972 if (fixp->fx_r_type == BFD_RELOC_SIZE32
11973 && !fits_in_unsigned_long (value))
11974 as_bad_where (fixp->fx_file, fixp->fx_line,
11975 _("symbol size computation overflow"));
11976 fixp->fx_addsy = NULL;
11977 fixp->fx_subsy = NULL;
11978 md_apply_fix (fixp, (valueT *) &value, NULL);
11979 return NULL;
11980 }
11981 #endif
11982 /* Fall through. */
11983
11984 case BFD_RELOC_X86_64_PLT32:
11985 case BFD_RELOC_X86_64_GOT32:
11986 case BFD_RELOC_X86_64_GOTPCREL:
11987 case BFD_RELOC_X86_64_GOTPCRELX:
11988 case BFD_RELOC_X86_64_REX_GOTPCRELX:
11989 case BFD_RELOC_386_PLT32:
11990 case BFD_RELOC_386_GOT32:
11991 case BFD_RELOC_386_GOT32X:
11992 case BFD_RELOC_386_GOTOFF:
11993 case BFD_RELOC_386_GOTPC:
11994 case BFD_RELOC_386_TLS_GD:
11995 case BFD_RELOC_386_TLS_LDM:
11996 case BFD_RELOC_386_TLS_LDO_32:
11997 case BFD_RELOC_386_TLS_IE_32:
11998 case BFD_RELOC_386_TLS_IE:
11999 case BFD_RELOC_386_TLS_GOTIE:
12000 case BFD_RELOC_386_TLS_LE_32:
12001 case BFD_RELOC_386_TLS_LE:
12002 case BFD_RELOC_386_TLS_GOTDESC:
12003 case BFD_RELOC_386_TLS_DESC_CALL:
12004 case BFD_RELOC_X86_64_TLSGD:
12005 case BFD_RELOC_X86_64_TLSLD:
12006 case BFD_RELOC_X86_64_DTPOFF32:
12007 case BFD_RELOC_X86_64_DTPOFF64:
12008 case BFD_RELOC_X86_64_GOTTPOFF:
12009 case BFD_RELOC_X86_64_TPOFF32:
12010 case BFD_RELOC_X86_64_TPOFF64:
12011 case BFD_RELOC_X86_64_GOTOFF64:
12012 case BFD_RELOC_X86_64_GOTPC32:
12013 case BFD_RELOC_X86_64_GOT64:
12014 case BFD_RELOC_X86_64_GOTPCREL64:
12015 case BFD_RELOC_X86_64_GOTPC64:
12016 case BFD_RELOC_X86_64_GOTPLT64:
12017 case BFD_RELOC_X86_64_PLTOFF64:
12018 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12019 case BFD_RELOC_X86_64_TLSDESC_CALL:
12020 case BFD_RELOC_RVA:
12021 case BFD_RELOC_VTABLE_ENTRY:
12022 case BFD_RELOC_VTABLE_INHERIT:
12023 #ifdef TE_PE
12024 case BFD_RELOC_32_SECREL:
12025 #endif
12026 code = fixp->fx_r_type;
12027 break;
12028 case BFD_RELOC_X86_64_32S:
12029 if (!fixp->fx_pcrel)
12030 {
12031 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
12032 code = fixp->fx_r_type;
12033 break;
12034 }
12035 /* Fall through. */
12036 default:
12037 if (fixp->fx_pcrel)
12038 {
12039 switch (fixp->fx_size)
12040 {
12041 default:
12042 as_bad_where (fixp->fx_file, fixp->fx_line,
12043 _("can not do %d byte pc-relative relocation"),
12044 fixp->fx_size);
12045 code = BFD_RELOC_32_PCREL;
12046 break;
12047 case 1: code = BFD_RELOC_8_PCREL; break;
12048 case 2: code = BFD_RELOC_16_PCREL; break;
12049 case 4: code = BFD_RELOC_32_PCREL; break;
12050 #ifdef BFD64
12051 case 8: code = BFD_RELOC_64_PCREL; break;
12052 #endif
12053 }
12054 }
12055 else
12056 {
12057 switch (fixp->fx_size)
12058 {
12059 default:
12060 as_bad_where (fixp->fx_file, fixp->fx_line,
12061 _("can not do %d byte relocation"),
12062 fixp->fx_size);
12063 code = BFD_RELOC_32;
12064 break;
12065 case 1: code = BFD_RELOC_8; break;
12066 case 2: code = BFD_RELOC_16; break;
12067 case 4: code = BFD_RELOC_32; break;
12068 #ifdef BFD64
12069 case 8: code = BFD_RELOC_64; break;
12070 #endif
12071 }
12072 }
12073 break;
12074 }
12075
12076 if ((code == BFD_RELOC_32
12077 || code == BFD_RELOC_32_PCREL
12078 || code == BFD_RELOC_X86_64_32S)
12079 && GOT_symbol
12080 && fixp->fx_addsy == GOT_symbol)
12081 {
12082 if (!object_64bit)
12083 code = BFD_RELOC_386_GOTPC;
12084 else
12085 code = BFD_RELOC_X86_64_GOTPC32;
12086 }
12087 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
12088 && GOT_symbol
12089 && fixp->fx_addsy == GOT_symbol)
12090 {
12091 code = BFD_RELOC_X86_64_GOTPC64;
12092 }
12093
12094 rel = XNEW (arelent);
12095 rel->sym_ptr_ptr = XNEW (asymbol *);
12096 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
12097
12098 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
12099
12100 if (!use_rela_relocations)
12101 {
12102 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
12103 vtable entry to be used in the relocation's section offset. */
12104 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
12105 rel->address = fixp->fx_offset;
12106 #if defined (OBJ_COFF) && defined (TE_PE)
12107 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
12108 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
12109 else
12110 #endif
12111 rel->addend = 0;
12112 }
12113 /* Use the rela in 64bit mode. */
12114 else
12115 {
12116 if (disallow_64bit_reloc)
12117 switch (code)
12118 {
12119 case BFD_RELOC_X86_64_DTPOFF64:
12120 case BFD_RELOC_X86_64_TPOFF64:
12121 case BFD_RELOC_64_PCREL:
12122 case BFD_RELOC_X86_64_GOTOFF64:
12123 case BFD_RELOC_X86_64_GOT64:
12124 case BFD_RELOC_X86_64_GOTPCREL64:
12125 case BFD_RELOC_X86_64_GOTPC64:
12126 case BFD_RELOC_X86_64_GOTPLT64:
12127 case BFD_RELOC_X86_64_PLTOFF64:
12128 as_bad_where (fixp->fx_file, fixp->fx_line,
12129 _("cannot represent relocation type %s in x32 mode"),
12130 bfd_get_reloc_code_name (code));
12131 break;
12132 default:
12133 break;
12134 }
12135
12136 if (!fixp->fx_pcrel)
12137 rel->addend = fixp->fx_offset;
12138 else
12139 switch (code)
12140 {
12141 case BFD_RELOC_X86_64_PLT32:
12142 case BFD_RELOC_X86_64_GOT32:
12143 case BFD_RELOC_X86_64_GOTPCREL:
12144 case BFD_RELOC_X86_64_GOTPCRELX:
12145 case BFD_RELOC_X86_64_REX_GOTPCRELX:
12146 case BFD_RELOC_X86_64_TLSGD:
12147 case BFD_RELOC_X86_64_TLSLD:
12148 case BFD_RELOC_X86_64_GOTTPOFF:
12149 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12150 case BFD_RELOC_X86_64_TLSDESC_CALL:
12151 rel->addend = fixp->fx_offset - fixp->fx_size;
12152 break;
12153 default:
12154 rel->addend = (section->vma
12155 - fixp->fx_size
12156 + fixp->fx_addnumber
12157 + md_pcrel_from (fixp));
12158 break;
12159 }
12160 }
12161
12162 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
12163 if (rel->howto == NULL)
12164 {
12165 as_bad_where (fixp->fx_file, fixp->fx_line,
12166 _("cannot represent relocation type %s"),
12167 bfd_get_reloc_code_name (code));
12168 /* Set howto to a garbage value so that we can keep going. */
12169 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
12170 gas_assert (rel->howto != NULL);
12171 }
12172
12173 return rel;
12174 }
12175
12176 #include "tc-i386-intel.c"
12177
12178 void
12179 tc_x86_parse_to_dw2regnum (expressionS *exp)
12180 {
12181 int saved_naked_reg;
12182 char saved_register_dot;
12183
12184 saved_naked_reg = allow_naked_reg;
12185 allow_naked_reg = 1;
12186 saved_register_dot = register_chars['.'];
12187 register_chars['.'] = '.';
12188 allow_pseudo_reg = 1;
12189 expression_and_evaluate (exp);
12190 allow_pseudo_reg = 0;
12191 register_chars['.'] = saved_register_dot;
12192 allow_naked_reg = saved_naked_reg;
12193
12194 if (exp->X_op == O_register && exp->X_add_number >= 0)
12195 {
12196 if ((addressT) exp->X_add_number < i386_regtab_size)
12197 {
12198 exp->X_op = O_constant;
12199 exp->X_add_number = i386_regtab[exp->X_add_number]
12200 .dw2_regnum[flag_code >> 1];
12201 }
12202 else
12203 exp->X_op = O_illegal;
12204 }
12205 }
12206
12207 void
12208 tc_x86_frame_initial_instructions (void)
12209 {
12210 static unsigned int sp_regno[2];
12211
12212 if (!sp_regno[flag_code >> 1])
12213 {
12214 char *saved_input = input_line_pointer;
12215 char sp[][4] = {"esp", "rsp"};
12216 expressionS exp;
12217
12218 input_line_pointer = sp[flag_code >> 1];
12219 tc_x86_parse_to_dw2regnum (&exp);
12220 gas_assert (exp.X_op == O_constant);
12221 sp_regno[flag_code >> 1] = exp.X_add_number;
12222 input_line_pointer = saved_input;
12223 }
12224
12225 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
12226 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
12227 }
12228
12229 int
12230 x86_dwarf2_addr_size (void)
12231 {
12232 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12233 if (x86_elf_abi == X86_64_X32_ABI)
12234 return 4;
12235 #endif
12236 return bfd_arch_bits_per_address (stdoutput) / 8;
12237 }
12238
12239 int
12240 i386_elf_section_type (const char *str, size_t len)
12241 {
12242 if (flag_code == CODE_64BIT
12243 && len == sizeof ("unwind") - 1
12244 && strncmp (str, "unwind", 6) == 0)
12245 return SHT_X86_64_UNWIND;
12246
12247 return -1;
12248 }
12249
12250 #ifdef TE_SOLARIS
12251 void
12252 i386_solaris_fix_up_eh_frame (segT sec)
12253 {
12254 if (flag_code == CODE_64BIT)
12255 elf_section_type (sec) = SHT_X86_64_UNWIND;
12256 }
12257 #endif
12258
12259 #ifdef TE_PE
12260 void
12261 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
12262 {
12263 expressionS exp;
12264
12265 exp.X_op = O_secrel;
12266 exp.X_add_symbol = symbol;
12267 exp.X_add_number = 0;
12268 emit_expr (&exp, size);
12269 }
12270 #endif
12271
12272 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12273 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
12274
12275 bfd_vma
12276 x86_64_section_letter (int letter, const char **ptr_msg)
12277 {
12278 if (flag_code == CODE_64BIT)
12279 {
12280 if (letter == 'l')
12281 return SHF_X86_64_LARGE;
12282
12283 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
12284 }
12285 else
12286 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
12287 return -1;
12288 }
12289
12290 bfd_vma
12291 x86_64_section_word (char *str, size_t len)
12292 {
12293 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
12294 return SHF_X86_64_LARGE;
12295
12296 return -1;
12297 }
12298
12299 static void
12300 handle_large_common (int small ATTRIBUTE_UNUSED)
12301 {
12302 if (flag_code != CODE_64BIT)
12303 {
12304 s_comm_internal (0, elf_common_parse);
12305 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
12306 }
12307 else
12308 {
12309 static segT lbss_section;
12310 asection *saved_com_section_ptr = elf_com_section_ptr;
12311 asection *saved_bss_section = bss_section;
12312
12313 if (lbss_section == NULL)
12314 {
12315 flagword applicable;
12316 segT seg = now_seg;
12317 subsegT subseg = now_subseg;
12318
12319 /* The .lbss section is for local .largecomm symbols. */
12320 lbss_section = subseg_new (".lbss", 0);
12321 applicable = bfd_applicable_section_flags (stdoutput);
12322 bfd_set_section_flags (stdoutput, lbss_section,
12323 applicable & SEC_ALLOC);
12324 seg_info (lbss_section)->bss = 1;
12325
12326 subseg_set (seg, subseg);
12327 }
12328
12329 elf_com_section_ptr = &_bfd_elf_large_com_section;
12330 bss_section = lbss_section;
12331
12332 s_comm_internal (0, elf_common_parse);
12333
12334 elf_com_section_ptr = saved_com_section_ptr;
12335 bss_section = saved_bss_section;
12336 }
12337 }
12338 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 0.468526 seconds and 4 git commands to generate.