Automatic date update in version.in
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
CommitLineData
b534c6d3 1/* tc-i386.c -- Assemble code for the Intel 80386
b3adc24a 2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
252b5132
RH
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
ec2655a6 8 the Free Software Foundation; either version 3, or (at your option)
252b5132
RH
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
4b4da160
NC
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
252b5132 20
47926f60
KH
21/* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
3e73aa7c 23 x86_64 support by Jan Hubicka (jh@suse.cz)
0f10071e 24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
47926f60
KH
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
252b5132 27
252b5132 28#include "as.h"
3882b010 29#include "safe-ctype.h"
252b5132 30#include "subsegs.h"
316e2c05 31#include "dwarf2dbg.h"
54cfded0 32#include "dw2gencfi.h"
d2b2c203 33#include "elf/x86-64.h"
40fb9820 34#include "opcodes/i386-init.h"
252b5132 35
41fd2579
L
36#ifdef HAVE_LIMITS_H
37#include <limits.h>
38#else
39#ifdef HAVE_SYS_PARAM_H
40#include <sys/param.h>
41#endif
42#ifndef INT_MAX
43#define INT_MAX (int) (((unsigned) (-1)) >> 1)
44#endif
45#endif
46
c3332e24 47#ifndef INFER_ADDR_PREFIX
eecb386c 48#define INFER_ADDR_PREFIX 1
c3332e24
AM
49#endif
50
29b0f896
AM
51#ifndef DEFAULT_ARCH
52#define DEFAULT_ARCH "i386"
246fcdee 53#endif
252b5132 54
edde18a5
AM
55#ifndef INLINE
56#if __GNUC__ >= 2
57#define INLINE __inline__
58#else
59#define INLINE
60#endif
61#endif
62
6305a203
L
63/* Prefixes will be emitted in the order defined below.
64 WAIT_PREFIX must be the first prefix since FWAIT is really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
42164a71 67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
6305a203
L
68#define WAIT_PREFIX 0
69#define SEG_PREFIX 1
70#define ADDR_PREFIX 2
71#define DATA_PREFIX 3
c32fa91d 72#define REP_PREFIX 4
42164a71 73#define HLE_PREFIX REP_PREFIX
7e8b059b 74#define BND_PREFIX REP_PREFIX
c32fa91d 75#define LOCK_PREFIX 5
4e9ac44a
L
76#define REX_PREFIX 6 /* must come last. */
77#define MAX_PREFIXES 7 /* max prefixes per opcode */
6305a203
L
78
79/* we define the syntax here (modulo base,index,scale syntax) */
80#define REGISTER_PREFIX '%'
81#define IMMEDIATE_PREFIX '$'
82#define ABSOLUTE_PREFIX '*'
83
84/* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86#define WORD_MNEM_SUFFIX 'w'
87#define BYTE_MNEM_SUFFIX 'b'
88#define SHORT_MNEM_SUFFIX 's'
89#define LONG_MNEM_SUFFIX 'l'
90#define QWORD_MNEM_SUFFIX 'q'
6305a203
L
91/* Intel Syntax. Use a non-ascii letter since since it never appears
92 in instructions. */
93#define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95#define END_OF_INSN '\0'
96
79dec6b7
JB
97/* This matches the C -> StaticRounding alias in the opcode table. */
98#define commutative staticrounding
99
6305a203
L
100/*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107typedef struct
108{
d3ce72d0
NC
109 const insn_template *start;
110 const insn_template *end;
6305a203
L
111}
112templates;
113
114/* 386 operand encoding bytes: see 386 book for details of this. */
115typedef struct
116{
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120}
121modrm_byte;
122
123/* x86-64 extension prefix. */
124typedef int rex_byte;
125
6305a203
L
126/* 386 opcode byte to code indirect addressing. */
127typedef struct
128{
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132}
133sib_byte;
134
6305a203
L
135/* x86 arch names, types and features */
136typedef struct
137{
138 const char *name; /* arch name */
8a2c8fef 139 unsigned int len; /* arch string length */
6305a203
L
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
8a2c8fef 142 unsigned int skip; /* show_arch should skip this. */
6305a203
L
143}
144arch_entry;
145
293f5f65
L
146/* Used to turn off indicated flags. */
147typedef struct
148{
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152}
153noarch_entry;
154
78f12dd3 155static void update_code_flag (int, int);
e3bb37b5
L
156static void set_code_flag (int);
157static void set_16bit_gcc_code_flag (int);
158static void set_intel_syntax (int);
1efbbeb4 159static void set_intel_mnemonic (int);
db51cc60 160static void set_allow_index_reg (int);
7bab8ab5 161static void set_check (int);
e3bb37b5 162static void set_cpu_arch (int);
6482c264 163#ifdef TE_PE
e3bb37b5 164static void pe_directive_secrel (int);
6482c264 165#endif
e3bb37b5
L
166static void signed_cons (int);
167static char *output_invalid (int c);
ee86248c
JB
168static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
a7619375 172static int i386_att_operand (char *);
e3bb37b5 173static int i386_intel_operand (char *, int);
ee86248c
JB
174static int i386_intel_simplify (expressionS *);
175static int i386_intel_parse_name (const char *, expressionS *);
e3bb37b5
L
176static const reg_entry *parse_register (char *, char **);
177static char *parse_insn (char *, char *);
178static char *parse_operands (char *, const char *);
179static void swap_operands (void);
4d456e3d 180static void swap_2_operands (int, int);
48bcea9f 181static enum flag_code i386_addressing_mode (void);
e3bb37b5
L
182static void optimize_imm (void);
183static void optimize_disp (void);
83b16ac6 184static const insn_template *match_template (char);
e3bb37b5
L
185static int check_string (void);
186static int process_suffix (void);
187static int check_byte_reg (void);
188static int check_long_reg (void);
189static int check_qword_reg (void);
190static int check_word_reg (void);
191static int finalize_imm (void);
192static int process_operands (void);
193static const seg_entry *build_modrm_byte (void);
194static void output_insn (void);
195static void output_imm (fragS *, offsetT);
196static void output_disp (fragS *, offsetT);
29b0f896 197#ifndef I386COFF
e3bb37b5 198static void s_bss (int);
252b5132 199#endif
17d4e2a2
L
200#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201static void handle_large_common (int small ATTRIBUTE_UNUSED);
b4a3a7b4
L
202
203/* GNU_PROPERTY_X86_ISA_1_USED. */
204static unsigned int x86_isa_1_used;
205/* GNU_PROPERTY_X86_FEATURE_2_USED. */
206static unsigned int x86_feature_2_used;
207/* Generate x86 used ISA and feature properties. */
208static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
17d4e2a2 209#endif
252b5132 210
a847613f 211static const char *default_arch = DEFAULT_ARCH;
3e73aa7c 212
8a6fb3f9
JB
213/* parse_register() returns this when a register alias cannot be used. */
214static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
43234a1e
L
217/* This struct describes rounding control and SAE in the instruction. */
218struct RC_Operation
219{
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229};
230
231static struct RC_Operation rc_op;
232
233/* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235 whether merging or zeroing mask is used. */
236struct Mask_Operation
237{
238 const reg_entry *mask;
239 unsigned int zeroing;
240 /* The operand where this operation is associated. */
241 int operand;
242};
243
244static struct Mask_Operation mask_op;
245
246/* The struct describes broadcasting, applied to OPERAND. FACTOR is
247 broadcast factor. */
248struct Broadcast_Operation
249{
8e6e0792 250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
43234a1e
L
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
4a1b91ea
L
255
256 /* Number of bytes to broadcast. */
257 int bytes;
43234a1e
L
258};
259
260static struct Broadcast_Operation broadcast_op;
261
c0f3af97
L
262/* VEX prefix. */
263typedef struct
264{
43234a1e
L
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
c0f3af97
L
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270} vex_prefix;
271
252b5132 272/* 'md_assemble ()' gathers together information and puts it into a
47926f60 273 i386_insn. */
252b5132 274
520dc8e8
AM
275union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
a65babc9
L
282enum i386_error
283 {
86e026a4 284 operand_size_mismatch,
a65babc9
L
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
a65babc9
L
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
6c30d220 292 unsupported,
260cd341 293 invalid_sib_address,
6c30d220 294 invalid_vsib_address,
7bab8ab5 295 invalid_vector_register_set,
260cd341 296 invalid_tmm_register_set,
43234a1e
L
297 unsupported_vector_index_register,
298 unsupported_broadcast,
43234a1e
L
299 broadcast_needed,
300 unsupported_masking,
301 mask_not_on_destination,
302 no_default_mask,
303 unsupported_rc_sae,
304 rc_sae_operand_not_last_imm,
305 invalid_register_operand,
a65babc9
L
306 };
307
252b5132
RH
308struct _i386_insn
309 {
47926f60 310 /* TM holds the template for the insn were currently assembling. */
d3ce72d0 311 insn_template tm;
252b5132 312
7d5e4556
L
313 /* SUFFIX holds the instruction size suffix for byte, word, dword
314 or qword, if given. */
252b5132
RH
315 char suffix;
316
47926f60 317 /* OPERANDS gives the number of given operands. */
252b5132
RH
318 unsigned int operands;
319
320 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
321 of given register, displacement, memory operands and immediate
47926f60 322 operands. */
252b5132
RH
323 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
324
325 /* TYPES [i] is the type (see above #defines) which tells us how to
520dc8e8 326 use OP[i] for the corresponding operand. */
40fb9820 327 i386_operand_type types[MAX_OPERANDS];
252b5132 328
520dc8e8
AM
329 /* Displacement expression, immediate expression, or register for each
330 operand. */
331 union i386_op op[MAX_OPERANDS];
252b5132 332
3e73aa7c
JH
333 /* Flags for operands. */
334 unsigned int flags[MAX_OPERANDS];
335#define Operand_PCrel 1
c48dadc9 336#define Operand_Mem 2
3e73aa7c 337
252b5132 338 /* Relocation type for operand */
f86103b7 339 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
252b5132 340
252b5132
RH
341 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
342 the base index byte below. */
343 const reg_entry *base_reg;
344 const reg_entry *index_reg;
345 unsigned int log2_scale_factor;
346
347 /* SEG gives the seg_entries of this insn. They are zero unless
47926f60 348 explicit segment overrides are given. */
ce8a8b2f 349 const seg_entry *seg[2];
252b5132 350
8325cc63
JB
351 /* Copied first memory operand string, for re-checking. */
352 char *memop1_string;
353
252b5132
RH
354 /* PREFIX holds all the given prefix opcodes (usually null).
355 PREFIXES is the number of prefix opcodes. */
356 unsigned int prefixes;
357 unsigned char prefix[MAX_PREFIXES];
358
50128d0c
JB
359 /* Register is in low 3 bits of opcode. */
360 bfd_boolean short_form;
361
6f2f06be
JB
362 /* The operand to a branch insn indicates an absolute branch. */
363 bfd_boolean jumpabsolute;
364
921eafea
L
365 /* Extended states. */
366 enum
367 {
368 /* Use MMX state. */
369 xstate_mmx = 1 << 0,
370 /* Use XMM state. */
371 xstate_xmm = 1 << 1,
372 /* Use YMM state. */
373 xstate_ymm = 1 << 2 | xstate_xmm,
374 /* Use ZMM state. */
375 xstate_zmm = 1 << 3 | xstate_ymm,
376 /* Use TMM state. */
377 xstate_tmm = 1 << 4
378 } xstate;
260cd341 379
e379e5f3
L
380 /* Has GOTPC or TLS relocation. */
381 bfd_boolean has_gotpc_tls_reloc;
382
252b5132 383 /* RM and SIB are the modrm byte and the sib byte where the
c1e679ec 384 addressing modes of this insn are encoded. */
252b5132 385 modrm_byte rm;
3e73aa7c 386 rex_byte rex;
43234a1e 387 rex_byte vrex;
252b5132 388 sib_byte sib;
c0f3af97 389 vex_prefix vex;
b6169b20 390
43234a1e
L
391 /* Masking attributes. */
392 struct Mask_Operation *mask;
393
394 /* Rounding control and SAE attributes. */
395 struct RC_Operation *rounding;
396
397 /* Broadcasting attributes. */
398 struct Broadcast_Operation *broadcast;
399
400 /* Compressed disp8*N attribute. */
401 unsigned int memshift;
402
86fa6981
L
403 /* Prefer load or store in encoding. */
404 enum
405 {
406 dir_encoding_default = 0,
407 dir_encoding_load,
64c49ab3
JB
408 dir_encoding_store,
409 dir_encoding_swap
86fa6981 410 } dir_encoding;
891edac4 411
a501d77e
L
412 /* Prefer 8bit or 32bit displacement in encoding. */
413 enum
414 {
415 disp_encoding_default = 0,
416 disp_encoding_8bit,
417 disp_encoding_32bit
418 } disp_encoding;
f8a5c266 419
6b6b6807
L
420 /* Prefer the REX byte in encoding. */
421 bfd_boolean rex_encoding;
422
b6f8c7c4
L
423 /* Disable instruction size optimization. */
424 bfd_boolean no_optimize;
425
86fa6981
L
426 /* How to encode vector instructions. */
427 enum
428 {
429 vex_encoding_default = 0,
42e04b36 430 vex_encoding_vex,
86fa6981 431 vex_encoding_vex3,
da4977e0
JB
432 vex_encoding_evex,
433 vex_encoding_error
86fa6981
L
434 } vec_encoding;
435
d5de92cf
L
436 /* REP prefix. */
437 const char *rep_prefix;
438
165de32a
L
439 /* HLE prefix. */
440 const char *hle_prefix;
42164a71 441
7e8b059b
L
442 /* Have BND prefix. */
443 const char *bnd_prefix;
444
04ef582a
L
445 /* Have NOTRACK prefix. */
446 const char *notrack_prefix;
447
891edac4 448 /* Error message. */
a65babc9 449 enum i386_error error;
252b5132
RH
450 };
451
452typedef struct _i386_insn i386_insn;
453
43234a1e
L
454/* Link RC type with corresponding string, that'll be looked for in
455 asm. */
456struct RC_name
457{
458 enum rc_type type;
459 const char *name;
460 unsigned int len;
461};
462
463static const struct RC_name RC_NamesTable[] =
464{
465 { rne, STRING_COMMA_LEN ("rn-sae") },
466 { rd, STRING_COMMA_LEN ("rd-sae") },
467 { ru, STRING_COMMA_LEN ("ru-sae") },
468 { rz, STRING_COMMA_LEN ("rz-sae") },
469 { saeonly, STRING_COMMA_LEN ("sae") },
470};
471
252b5132
RH
472/* List of chars besides those in app.c:symbol_chars that can start an
473 operand. Used to prevent the scrubber eating vital white-space. */
86fa6981 474const char extra_symbol_chars[] = "*%-([{}"
252b5132 475#ifdef LEX_AT
32137342
NC
476 "@"
477#endif
478#ifdef LEX_QM
479 "?"
252b5132 480#endif
32137342 481 ;
252b5132 482
29b0f896
AM
483#if (defined (TE_I386AIX) \
484 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
3896cfd5 485 && !defined (TE_GNU) \
29b0f896
AM
486 && !defined (TE_LINUX) \
487 && !defined (TE_FreeBSD) \
5b806d27 488 && !defined (TE_DragonFly) \
29b0f896 489 && !defined (TE_NetBSD)))
252b5132 490/* This array holds the chars that always start a comment. If the
b3b91714
AM
491 pre-processor is disabled, these aren't very useful. The option
492 --divide will remove '/' from this list. */
493const char *i386_comment_chars = "#/";
494#define SVR4_COMMENT_CHARS 1
252b5132 495#define PREFIX_SEPARATOR '\\'
252b5132 496
b3b91714
AM
497#else
498const char *i386_comment_chars = "#";
499#define PREFIX_SEPARATOR '/'
500#endif
501
252b5132
RH
502/* This array holds the chars that only start a comment at the beginning of
503 a line. If the line seems to have the form '# 123 filename'
ce8a8b2f
AM
504 .line and .file directives will appear in the pre-processed output.
505 Note that input_file.c hand checks for '#' at the beginning of the
252b5132 506 first line of the input file. This is because the compiler outputs
ce8a8b2f
AM
507 #NO_APP at the beginning of its output.
508 Also note that comments started like this one will always work if
252b5132 509 '/' isn't otherwise defined. */
b3b91714 510const char line_comment_chars[] = "#/";
252b5132 511
63a0b638 512const char line_separator_chars[] = ";";
252b5132 513
ce8a8b2f
AM
514/* Chars that can be used to separate mant from exp in floating point
515 nums. */
252b5132
RH
516const char EXP_CHARS[] = "eE";
517
ce8a8b2f
AM
518/* Chars that mean this number is a floating point constant
519 As in 0f12.456
520 or 0d1.2345e12. */
252b5132
RH
521const char FLT_CHARS[] = "fFdDxX";
522
ce8a8b2f 523/* Tables for lexical analysis. */
252b5132
RH
524static char mnemonic_chars[256];
525static char register_chars[256];
526static char operand_chars[256];
527static char identifier_chars[256];
528static char digit_chars[256];
529
ce8a8b2f 530/* Lexical macros. */
252b5132
RH
531#define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
532#define is_operand_char(x) (operand_chars[(unsigned char) x])
533#define is_register_char(x) (register_chars[(unsigned char) x])
534#define is_space_char(x) ((x) == ' ')
535#define is_identifier_char(x) (identifier_chars[(unsigned char) x])
536#define is_digit_char(x) (digit_chars[(unsigned char) x])
537
0234cb7c 538/* All non-digit non-letter characters that may occur in an operand. */
252b5132
RH
539static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
540
541/* md_assemble() always leaves the strings it's passed unaltered. To
542 effect this we maintain a stack of saved characters that we've smashed
543 with '\0's (indicating end of strings for various sub-fields of the
47926f60 544 assembler instruction). */
252b5132 545static char save_stack[32];
ce8a8b2f 546static char *save_stack_p;
252b5132
RH
547#define END_STRING_AND_SAVE(s) \
548 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
549#define RESTORE_END_STRING(s) \
550 do { *(s) = *--save_stack_p; } while (0)
551
47926f60 552/* The instruction we're assembling. */
252b5132
RH
553static i386_insn i;
554
555/* Possible templates for current insn. */
556static const templates *current_templates;
557
31b2323c
L
558/* Per instruction expressionS buffers: max displacements & immediates. */
559static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
560static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
252b5132 561
47926f60 562/* Current operand we are working on. */
ee86248c 563static int this_operand = -1;
252b5132 564
3e73aa7c
JH
565/* We support four different modes. FLAG_CODE variable is used to distinguish
566 these. */
567
568enum flag_code {
569 CODE_32BIT,
570 CODE_16BIT,
571 CODE_64BIT };
572
573static enum flag_code flag_code;
4fa24527 574static unsigned int object_64bit;
862be3fb 575static unsigned int disallow_64bit_reloc;
3e73aa7c 576static int use_rela_relocations = 0;
e379e5f3
L
577/* __tls_get_addr/___tls_get_addr symbol for TLS. */
578static const char *tls_get_addr;
3e73aa7c 579
7af8ed2d
NC
580#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
581 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
582 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
583
351f65ca
L
584/* The ELF ABI to use. */
585enum x86_elf_abi
586{
587 I386_ABI,
7f56bc95
L
588 X86_64_ABI,
589 X86_64_X32_ABI
351f65ca
L
590};
591
592static enum x86_elf_abi x86_elf_abi = I386_ABI;
7af8ed2d 593#endif
351f65ca 594
167ad85b
TG
595#if defined (TE_PE) || defined (TE_PEP)
596/* Use big object file format. */
597static int use_big_obj = 0;
598#endif
599
8dcea932
L
600#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
601/* 1 if generating code for a shared library. */
602static int shared = 0;
603#endif
604
47926f60
KH
605/* 1 for intel syntax,
606 0 if att syntax. */
607static int intel_syntax = 0;
252b5132 608
4b5aaf5f
L
609static enum x86_64_isa
610{
611 amd64 = 1, /* AMD64 ISA. */
612 intel64 /* Intel64 ISA. */
613} isa64;
e89c5eaa 614
1efbbeb4
L
615/* 1 for intel mnemonic,
616 0 if att mnemonic. */
617static int intel_mnemonic = !SYSV386_COMPAT;
618
a60de03c
JB
619/* 1 if pseudo registers are permitted. */
620static int allow_pseudo_reg = 0;
621
47926f60
KH
622/* 1 if register prefix % not required. */
623static int allow_naked_reg = 0;
252b5132 624
33eaf5de 625/* 1 if the assembler should add BND prefix for all control-transferring
7e8b059b
L
626 instructions supporting it, even if this prefix wasn't specified
627 explicitly. */
628static int add_bnd_prefix = 0;
629
ba104c83 630/* 1 if pseudo index register, eiz/riz, is allowed . */
db51cc60
L
631static int allow_index_reg = 0;
632
d022bddd
IT
633/* 1 if the assembler should ignore LOCK prefix, even if it was
634 specified explicitly. */
635static int omit_lock_prefix = 0;
636
e4e00185
AS
637/* 1 if the assembler should encode lfence, mfence, and sfence as
638 "lock addl $0, (%{re}sp)". */
639static int avoid_fence = 0;
640
ae531041
L
641/* 1 if lfence should be inserted after every load. */
642static int lfence_after_load = 0;
643
644/* Non-zero if lfence should be inserted before indirect branch. */
645static enum lfence_before_indirect_branch_kind
646 {
647 lfence_branch_none = 0,
648 lfence_branch_register,
649 lfence_branch_memory,
650 lfence_branch_all
651 }
652lfence_before_indirect_branch;
653
654/* Non-zero if lfence should be inserted before ret. */
655static enum lfence_before_ret_kind
656 {
657 lfence_before_ret_none = 0,
658 lfence_before_ret_not,
a09f656b 659 lfence_before_ret_or,
660 lfence_before_ret_shl
ae531041
L
661 }
662lfence_before_ret;
663
664/* Types of previous instruction is .byte or prefix. */
e379e5f3
L
665static struct
666 {
667 segT seg;
668 const char *file;
669 const char *name;
670 unsigned int line;
671 enum last_insn_kind
672 {
673 last_insn_other = 0,
674 last_insn_directive,
675 last_insn_prefix
676 } kind;
677 } last_insn;
678
0cb4071e
L
679/* 1 if the assembler should generate relax relocations. */
680
681static int generate_relax_relocations
682 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
683
7bab8ab5 684static enum check_kind
daf50ae7 685 {
7bab8ab5
JB
686 check_none = 0,
687 check_warning,
688 check_error
daf50ae7 689 }
7bab8ab5 690sse_check, operand_check = check_warning;
daf50ae7 691
e379e5f3
L
692/* Non-zero if branches should be aligned within power of 2 boundary. */
693static int align_branch_power = 0;
694
695/* Types of branches to align. */
696enum align_branch_kind
697 {
698 align_branch_none = 0,
699 align_branch_jcc = 1,
700 align_branch_fused = 2,
701 align_branch_jmp = 3,
702 align_branch_call = 4,
703 align_branch_indirect = 5,
704 align_branch_ret = 6
705 };
706
707/* Type bits of branches to align. */
708enum align_branch_bit
709 {
710 align_branch_jcc_bit = 1 << align_branch_jcc,
711 align_branch_fused_bit = 1 << align_branch_fused,
712 align_branch_jmp_bit = 1 << align_branch_jmp,
713 align_branch_call_bit = 1 << align_branch_call,
714 align_branch_indirect_bit = 1 << align_branch_indirect,
715 align_branch_ret_bit = 1 << align_branch_ret
716 };
717
718static unsigned int align_branch = (align_branch_jcc_bit
719 | align_branch_fused_bit
720 | align_branch_jmp_bit);
721
79d72f45
HL
722/* Types of condition jump used by macro-fusion. */
723enum mf_jcc_kind
724 {
725 mf_jcc_jo = 0, /* base opcode 0x70 */
726 mf_jcc_jc, /* base opcode 0x72 */
727 mf_jcc_je, /* base opcode 0x74 */
728 mf_jcc_jna, /* base opcode 0x76 */
729 mf_jcc_js, /* base opcode 0x78 */
730 mf_jcc_jp, /* base opcode 0x7a */
731 mf_jcc_jl, /* base opcode 0x7c */
732 mf_jcc_jle, /* base opcode 0x7e */
733 };
734
735/* Types of compare flag-modifying insntructions used by macro-fusion. */
736enum mf_cmp_kind
737 {
738 mf_cmp_test_and, /* test/cmp */
739 mf_cmp_alu_cmp, /* add/sub/cmp */
740 mf_cmp_incdec /* inc/dec */
741 };
742
e379e5f3
L
743/* The maximum padding size for fused jcc. CMP like instruction can
744 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
745 prefixes. */
746#define MAX_FUSED_JCC_PADDING_SIZE 20
747
748/* The maximum number of prefixes added for an instruction. */
749static unsigned int align_branch_prefix_size = 5;
750
b6f8c7c4
L
751/* Optimization:
752 1. Clear the REX_W bit with register operand if possible.
753 2. Above plus use 128bit vector instruction to clear the full vector
754 register.
755 */
756static int optimize = 0;
757
758/* Optimization:
759 1. Clear the REX_W bit with register operand if possible.
760 2. Above plus use 128bit vector instruction to clear the full vector
761 register.
762 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
763 "testb $imm7,%r8".
764 */
765static int optimize_for_space = 0;
766
2ca3ace5
L
767/* Register prefix used for error message. */
768static const char *register_prefix = "%";
769
47926f60
KH
770/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
771 leave, push, and pop instructions so that gcc has the same stack
772 frame as in 32 bit mode. */
773static char stackop_size = '\0';
eecb386c 774
12b55ccc
L
775/* Non-zero to optimize code alignment. */
776int optimize_align_code = 1;
777
47926f60
KH
778/* Non-zero to quieten some warnings. */
779static int quiet_warnings = 0;
a38cf1db 780
47926f60
KH
781/* CPU name. */
782static const char *cpu_arch_name = NULL;
6305a203 783static char *cpu_sub_arch_name = NULL;
a38cf1db 784
47926f60 785/* CPU feature flags. */
40fb9820
L
786static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
787
ccc9c027
L
788/* If we have selected a cpu we are generating instructions for. */
789static int cpu_arch_tune_set = 0;
790
9103f4f4 791/* Cpu we are generating instructions for. */
fbf3f584 792enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
9103f4f4
L
793
794/* CPU feature flags of cpu we are generating instructions for. */
40fb9820 795static i386_cpu_flags cpu_arch_tune_flags;
9103f4f4 796
ccc9c027 797/* CPU instruction set architecture used. */
fbf3f584 798enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
ccc9c027 799
9103f4f4 800/* CPU feature flags of instruction set architecture used. */
fbf3f584 801i386_cpu_flags cpu_arch_isa_flags;
9103f4f4 802
fddf5b5b
AM
803/* If set, conditional jumps are not automatically promoted to handle
804 larger than a byte offset. */
805static unsigned int no_cond_jump_promotion = 0;
806
c0f3af97
L
807/* Encode SSE instructions with VEX prefix. */
808static unsigned int sse2avx;
809
539f890d
L
810/* Encode scalar AVX instructions with specific vector length. */
811static enum
812 {
813 vex128 = 0,
814 vex256
815 } avxscalar;
816
03751133
L
817/* Encode VEX WIG instructions with specific vex.w. */
818static enum
819 {
820 vexw0 = 0,
821 vexw1
822 } vexwig;
823
43234a1e
L
824/* Encode scalar EVEX LIG instructions with specific vector length. */
825static enum
826 {
827 evexl128 = 0,
828 evexl256,
829 evexl512
830 } evexlig;
831
832/* Encode EVEX WIG instructions with specific evex.w. */
833static enum
834 {
835 evexw0 = 0,
836 evexw1
837 } evexwig;
838
d3d3c6db
IT
839/* Value to encode in EVEX RC bits, for SAE-only instructions. */
840static enum rc_type evexrcig = rne;
841
29b0f896 842/* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
87c245cc 843static symbolS *GOT_symbol;
29b0f896 844
a4447b93
RH
845/* The dwarf2 return column, adjusted for 32 or 64 bit. */
846unsigned int x86_dwarf2_return_column;
847
848/* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
849int x86_cie_data_alignment;
850
252b5132 851/* Interface to relax_segment.
fddf5b5b
AM
852 There are 3 major relax states for 386 jump insns because the
853 different types of jumps add different sizes to frags when we're
e379e5f3
L
854 figuring out what sort of jump to choose to reach a given label.
855
856 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
857 branches which are handled by md_estimate_size_before_relax() and
858 i386_generic_table_relax_frag(). */
252b5132 859
47926f60 860/* Types. */
93c2a809
AM
861#define UNCOND_JUMP 0
862#define COND_JUMP 1
863#define COND_JUMP86 2
e379e5f3
L
864#define BRANCH_PADDING 3
865#define BRANCH_PREFIX 4
866#define FUSED_JCC_PADDING 5
fddf5b5b 867
47926f60 868/* Sizes. */
252b5132
RH
869#define CODE16 1
870#define SMALL 0
29b0f896 871#define SMALL16 (SMALL | CODE16)
252b5132 872#define BIG 2
29b0f896 873#define BIG16 (BIG | CODE16)
252b5132
RH
874
875#ifndef INLINE
876#ifdef __GNUC__
877#define INLINE __inline__
878#else
879#define INLINE
880#endif
881#endif
882
fddf5b5b
AM
883#define ENCODE_RELAX_STATE(type, size) \
884 ((relax_substateT) (((type) << 2) | (size)))
885#define TYPE_FROM_RELAX_STATE(s) \
886 ((s) >> 2)
887#define DISP_SIZE_FROM_RELAX_STATE(s) \
888 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
252b5132
RH
889
890/* This table is used by relax_frag to promote short jumps to long
891 ones where necessary. SMALL (short) jumps may be promoted to BIG
892 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
893 don't allow a short jump in a 32 bit code segment to be promoted to
894 a 16 bit offset jump because it's slower (requires data size
895 prefix), and doesn't work, unless the destination is in the bottom
896 64k of the code segment (The top 16 bits of eip are zeroed). */
897
898const relax_typeS md_relax_table[] =
899{
24eab124
AM
900 /* The fields are:
901 1) most positive reach of this state,
902 2) most negative reach of this state,
93c2a809 903 3) how many bytes this mode will have in the variable part of the frag
ce8a8b2f 904 4) which index into the table to try if we can't fit into this one. */
252b5132 905
fddf5b5b 906 /* UNCOND_JUMP states. */
93c2a809
AM
907 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
908 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
909 /* dword jmp adds 4 bytes to frag:
910 0 extra opcode bytes, 4 displacement bytes. */
252b5132 911 {0, 0, 4, 0},
93c2a809
AM
912 /* word jmp adds 2 byte2 to frag:
913 0 extra opcode bytes, 2 displacement bytes. */
252b5132
RH
914 {0, 0, 2, 0},
915
93c2a809
AM
916 /* COND_JUMP states. */
917 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
918 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
919 /* dword conditionals adds 5 bytes to frag:
920 1 extra opcode byte, 4 displacement bytes. */
921 {0, 0, 5, 0},
fddf5b5b 922 /* word conditionals add 3 bytes to frag:
93c2a809
AM
923 1 extra opcode byte, 2 displacement bytes. */
924 {0, 0, 3, 0},
925
926 /* COND_JUMP86 states. */
927 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
928 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
929 /* dword conditionals adds 5 bytes to frag:
930 1 extra opcode byte, 4 displacement bytes. */
931 {0, 0, 5, 0},
932 /* word conditionals add 4 bytes to frag:
933 1 displacement byte and a 3 byte long branch insn. */
934 {0, 0, 4, 0}
252b5132
RH
935};
936
9103f4f4
L
937static const arch_entry cpu_arch[] =
938{
89507696
JB
939 /* Do not replace the first two entries - i386_target_format()
940 relies on them being there in this order. */
8a2c8fef 941 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
293f5f65 942 CPU_GENERIC32_FLAGS, 0 },
8a2c8fef 943 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
293f5f65 944 CPU_GENERIC64_FLAGS, 0 },
8a2c8fef 945 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
293f5f65 946 CPU_NONE_FLAGS, 0 },
8a2c8fef 947 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
293f5f65 948 CPU_I186_FLAGS, 0 },
8a2c8fef 949 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
293f5f65 950 CPU_I286_FLAGS, 0 },
8a2c8fef 951 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
293f5f65 952 CPU_I386_FLAGS, 0 },
8a2c8fef 953 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
293f5f65 954 CPU_I486_FLAGS, 0 },
8a2c8fef 955 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
293f5f65 956 CPU_I586_FLAGS, 0 },
8a2c8fef 957 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
293f5f65 958 CPU_I686_FLAGS, 0 },
8a2c8fef 959 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
293f5f65 960 CPU_I586_FLAGS, 0 },
8a2c8fef 961 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
293f5f65 962 CPU_PENTIUMPRO_FLAGS, 0 },
8a2c8fef 963 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
293f5f65 964 CPU_P2_FLAGS, 0 },
8a2c8fef 965 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
293f5f65 966 CPU_P3_FLAGS, 0 },
8a2c8fef 967 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
293f5f65 968 CPU_P4_FLAGS, 0 },
8a2c8fef 969 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
293f5f65 970 CPU_CORE_FLAGS, 0 },
8a2c8fef 971 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
293f5f65 972 CPU_NOCONA_FLAGS, 0 },
8a2c8fef 973 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
293f5f65 974 CPU_CORE_FLAGS, 1 },
8a2c8fef 975 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
293f5f65 976 CPU_CORE_FLAGS, 0 },
8a2c8fef 977 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
293f5f65 978 CPU_CORE2_FLAGS, 1 },
8a2c8fef 979 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
293f5f65 980 CPU_CORE2_FLAGS, 0 },
8a2c8fef 981 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
293f5f65 982 CPU_COREI7_FLAGS, 0 },
8a2c8fef 983 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
293f5f65 984 CPU_L1OM_FLAGS, 0 },
7a9068fe 985 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
293f5f65 986 CPU_K1OM_FLAGS, 0 },
81486035 987 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
293f5f65 988 CPU_IAMCU_FLAGS, 0 },
8a2c8fef 989 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
293f5f65 990 CPU_K6_FLAGS, 0 },
8a2c8fef 991 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
293f5f65 992 CPU_K6_2_FLAGS, 0 },
8a2c8fef 993 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
293f5f65 994 CPU_ATHLON_FLAGS, 0 },
8a2c8fef 995 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
293f5f65 996 CPU_K8_FLAGS, 1 },
8a2c8fef 997 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
293f5f65 998 CPU_K8_FLAGS, 0 },
8a2c8fef 999 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
293f5f65 1000 CPU_K8_FLAGS, 0 },
8a2c8fef 1001 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
293f5f65 1002 CPU_AMDFAM10_FLAGS, 0 },
8aedb9fe 1003 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
293f5f65 1004 CPU_BDVER1_FLAGS, 0 },
8aedb9fe 1005 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
293f5f65 1006 CPU_BDVER2_FLAGS, 0 },
5e5c50d3 1007 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
293f5f65 1008 CPU_BDVER3_FLAGS, 0 },
c7b0bd56 1009 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
293f5f65 1010 CPU_BDVER4_FLAGS, 0 },
029f3522 1011 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
293f5f65 1012 CPU_ZNVER1_FLAGS, 0 },
a9660a6f
AP
1013 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1014 CPU_ZNVER2_FLAGS, 0 },
7b458c12 1015 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
293f5f65 1016 CPU_BTVER1_FLAGS, 0 },
7b458c12 1017 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
293f5f65 1018 CPU_BTVER2_FLAGS, 0 },
8a2c8fef 1019 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
293f5f65 1020 CPU_8087_FLAGS, 0 },
8a2c8fef 1021 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
293f5f65 1022 CPU_287_FLAGS, 0 },
8a2c8fef 1023 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
293f5f65 1024 CPU_387_FLAGS, 0 },
1848e567
L
1025 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1026 CPU_687_FLAGS, 0 },
d871f3f4
L
1027 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1028 CPU_CMOV_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1030 CPU_FXSR_FLAGS, 0 },
8a2c8fef 1031 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
293f5f65 1032 CPU_MMX_FLAGS, 0 },
8a2c8fef 1033 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
293f5f65 1034 CPU_SSE_FLAGS, 0 },
8a2c8fef 1035 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
293f5f65 1036 CPU_SSE2_FLAGS, 0 },
8a2c8fef 1037 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
293f5f65 1038 CPU_SSE3_FLAGS, 0 },
af5c13b0
L
1039 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1040 CPU_SSE4A_FLAGS, 0 },
8a2c8fef 1041 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
293f5f65 1042 CPU_SSSE3_FLAGS, 0 },
8a2c8fef 1043 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
293f5f65 1044 CPU_SSE4_1_FLAGS, 0 },
8a2c8fef 1045 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
293f5f65 1046 CPU_SSE4_2_FLAGS, 0 },
8a2c8fef 1047 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
293f5f65 1048 CPU_SSE4_2_FLAGS, 0 },
8a2c8fef 1049 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
293f5f65 1050 CPU_AVX_FLAGS, 0 },
6c30d220 1051 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
293f5f65 1052 CPU_AVX2_FLAGS, 0 },
43234a1e 1053 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
293f5f65 1054 CPU_AVX512F_FLAGS, 0 },
43234a1e 1055 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
293f5f65 1056 CPU_AVX512CD_FLAGS, 0 },
43234a1e 1057 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
293f5f65 1058 CPU_AVX512ER_FLAGS, 0 },
43234a1e 1059 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
293f5f65 1060 CPU_AVX512PF_FLAGS, 0 },
1dfc6506 1061 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
293f5f65 1062 CPU_AVX512DQ_FLAGS, 0 },
1dfc6506 1063 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
293f5f65 1064 CPU_AVX512BW_FLAGS, 0 },
1dfc6506 1065 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
293f5f65 1066 CPU_AVX512VL_FLAGS, 0 },
8a2c8fef 1067 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
293f5f65 1068 CPU_VMX_FLAGS, 0 },
8729a6f6 1069 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
293f5f65 1070 CPU_VMFUNC_FLAGS, 0 },
8a2c8fef 1071 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
293f5f65 1072 CPU_SMX_FLAGS, 0 },
8a2c8fef 1073 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
293f5f65 1074 CPU_XSAVE_FLAGS, 0 },
c7b8aa3a 1075 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
293f5f65 1076 CPU_XSAVEOPT_FLAGS, 0 },
1dfc6506 1077 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
293f5f65 1078 CPU_XSAVEC_FLAGS, 0 },
1dfc6506 1079 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
293f5f65 1080 CPU_XSAVES_FLAGS, 0 },
8a2c8fef 1081 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
293f5f65 1082 CPU_AES_FLAGS, 0 },
8a2c8fef 1083 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
293f5f65 1084 CPU_PCLMUL_FLAGS, 0 },
8a2c8fef 1085 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
293f5f65 1086 CPU_PCLMUL_FLAGS, 1 },
c7b8aa3a 1087 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
293f5f65 1088 CPU_FSGSBASE_FLAGS, 0 },
c7b8aa3a 1089 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
293f5f65 1090 CPU_RDRND_FLAGS, 0 },
c7b8aa3a 1091 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
293f5f65 1092 CPU_F16C_FLAGS, 0 },
6c30d220 1093 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
293f5f65 1094 CPU_BMI2_FLAGS, 0 },
8a2c8fef 1095 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
293f5f65 1096 CPU_FMA_FLAGS, 0 },
8a2c8fef 1097 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
293f5f65 1098 CPU_FMA4_FLAGS, 0 },
8a2c8fef 1099 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
293f5f65 1100 CPU_XOP_FLAGS, 0 },
8a2c8fef 1101 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
293f5f65 1102 CPU_LWP_FLAGS, 0 },
8a2c8fef 1103 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
293f5f65 1104 CPU_MOVBE_FLAGS, 0 },
60aa667e 1105 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
293f5f65 1106 CPU_CX16_FLAGS, 0 },
8a2c8fef 1107 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
293f5f65 1108 CPU_EPT_FLAGS, 0 },
6c30d220 1109 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
293f5f65 1110 CPU_LZCNT_FLAGS, 0 },
272a84b1
L
1111 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1112 CPU_POPCNT_FLAGS, 0 },
42164a71 1113 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
293f5f65 1114 CPU_HLE_FLAGS, 0 },
42164a71 1115 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
293f5f65 1116 CPU_RTM_FLAGS, 0 },
6c30d220 1117 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
293f5f65 1118 CPU_INVPCID_FLAGS, 0 },
8a2c8fef 1119 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
293f5f65 1120 CPU_CLFLUSH_FLAGS, 0 },
22109423 1121 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
293f5f65 1122 CPU_NOP_FLAGS, 0 },
8a2c8fef 1123 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
293f5f65 1124 CPU_SYSCALL_FLAGS, 0 },
8a2c8fef 1125 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
293f5f65 1126 CPU_RDTSCP_FLAGS, 0 },
8a2c8fef 1127 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
293f5f65 1128 CPU_3DNOW_FLAGS, 0 },
8a2c8fef 1129 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
293f5f65 1130 CPU_3DNOWA_FLAGS, 0 },
8a2c8fef 1131 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
293f5f65 1132 CPU_PADLOCK_FLAGS, 0 },
8a2c8fef 1133 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
293f5f65 1134 CPU_SVME_FLAGS, 1 },
8a2c8fef 1135 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
293f5f65 1136 CPU_SVME_FLAGS, 0 },
8a2c8fef 1137 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
293f5f65 1138 CPU_SSE4A_FLAGS, 0 },
8a2c8fef 1139 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
293f5f65 1140 CPU_ABM_FLAGS, 0 },
87973e9f 1141 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
293f5f65 1142 CPU_BMI_FLAGS, 0 },
2a2a0f38 1143 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
293f5f65 1144 CPU_TBM_FLAGS, 0 },
e2e1fcde 1145 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
293f5f65 1146 CPU_ADX_FLAGS, 0 },
e2e1fcde 1147 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
293f5f65 1148 CPU_RDSEED_FLAGS, 0 },
e2e1fcde 1149 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
293f5f65 1150 CPU_PRFCHW_FLAGS, 0 },
5c111e37 1151 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
293f5f65 1152 CPU_SMAP_FLAGS, 0 },
7e8b059b 1153 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
293f5f65 1154 CPU_MPX_FLAGS, 0 },
a0046408 1155 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
293f5f65 1156 CPU_SHA_FLAGS, 0 },
963f3586 1157 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
293f5f65 1158 CPU_CLFLUSHOPT_FLAGS, 0 },
dcf893b5 1159 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
293f5f65 1160 CPU_PREFETCHWT1_FLAGS, 0 },
2cf200a4 1161 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
293f5f65 1162 CPU_SE1_FLAGS, 0 },
c5e7287a 1163 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
293f5f65 1164 CPU_CLWB_FLAGS, 0 },
2cc1b5aa 1165 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
293f5f65 1166 CPU_AVX512IFMA_FLAGS, 0 },
14f195c9 1167 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
293f5f65 1168 CPU_AVX512VBMI_FLAGS, 0 },
920d2ddc
IT
1169 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1170 CPU_AVX512_4FMAPS_FLAGS, 0 },
47acf0bd
IT
1171 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1172 CPU_AVX512_4VNNIW_FLAGS, 0 },
620214f7
IT
1173 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1174 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
53467f57
IT
1175 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1176 CPU_AVX512_VBMI2_FLAGS, 0 },
8cfcb765
IT
1177 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1178 CPU_AVX512_VNNI_FLAGS, 0 },
ee6872be
IT
1179 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1180 CPU_AVX512_BITALG_FLAGS, 0 },
029f3522 1181 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
293f5f65 1182 CPU_CLZERO_FLAGS, 0 },
9916071f 1183 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
293f5f65 1184 CPU_MWAITX_FLAGS, 0 },
8eab4136 1185 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
293f5f65 1186 CPU_OSPKE_FLAGS, 0 },
8bc52696 1187 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
293f5f65 1188 CPU_RDPID_FLAGS, 0 },
6b40c462
L
1189 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1190 CPU_PTWRITE_FLAGS, 0 },
d777820b
IT
1191 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1192 CPU_IBT_FLAGS, 0 },
1193 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1194 CPU_SHSTK_FLAGS, 0 },
48521003
IT
1195 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1196 CPU_GFNI_FLAGS, 0 },
8dcf1fad
IT
1197 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1198 CPU_VAES_FLAGS, 0 },
ff1982d5
IT
1199 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1200 CPU_VPCLMULQDQ_FLAGS, 0 },
3233d7d0
IT
1201 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1202 CPU_WBNOINVD_FLAGS, 0 },
be3a8dca
IT
1203 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1204 CPU_PCONFIG_FLAGS, 0 },
de89d0a3
IT
1205 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1206 CPU_WAITPKG_FLAGS, 0 },
c48935d7
IT
1207 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1208 CPU_CLDEMOTE_FLAGS, 0 },
260cd341
LC
1209 { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
1210 CPU_AMX_INT8_FLAGS, 0 },
1211 { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
1212 CPU_AMX_BF16_FLAGS, 0 },
1213 { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
1214 CPU_AMX_TILE_FLAGS, 0 },
c0a30a9f
L
1215 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1216 CPU_MOVDIRI_FLAGS, 0 },
1217 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1218 CPU_MOVDIR64B_FLAGS, 0 },
d6aab7a1
XG
1219 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1220 CPU_AVX512_BF16_FLAGS, 0 },
9186c494
L
1221 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1222 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
dd455cf5
L
1223 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1224 CPU_ENQCMD_FLAGS, 0 },
4b27d27c
L
1225 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1226 CPU_SERIALIZE_FLAGS, 0 },
142861df
JB
1227 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1228 CPU_RDPRU_FLAGS, 0 },
1229 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1230 CPU_MCOMMIT_FLAGS, 0 },
a847e322
JB
1231 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1232 CPU_SEV_ES_FLAGS, 0 },
bb651e8b
CL
1233 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1234 CPU_TSXLDTRK_FLAGS, 0 },
293f5f65
L
1235};
1236
1237static const noarch_entry cpu_noarch[] =
1238{
1239 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1848e567
L
1240 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1241 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1242 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
d871f3f4
L
1243 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1244 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
293f5f65
L
1245 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1246 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1848e567
L
1247 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1248 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
af5c13b0 1249 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1848e567
L
1250 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1251 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1252 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
af5c13b0 1253 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
293f5f65 1254 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1848e567 1255 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
144b71e2
L
1256 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1257 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1258 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1259 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1260 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1261 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1262 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1263 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1264 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
920d2ddc 1265 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
47acf0bd 1266 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
620214f7 1267 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
53467f57 1268 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
8cfcb765 1269 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
ee6872be 1270 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
d777820b
IT
1271 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1272 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
260cd341
LC
1273 { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
1274 { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
1275 { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
c0a30a9f
L
1276 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1277 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
d6aab7a1 1278 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
708a2fff
CL
1279 { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1280 CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
dd455cf5 1281 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
4b27d27c 1282 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
bb651e8b 1283 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
e413e4e9
AM
1284};
1285
704209c0 1286#ifdef I386COFF
a6c24e68
NC
1287/* Like s_lcomm_internal in gas/read.c but the alignment string
1288 is allowed to be optional. */
1289
1290static symbolS *
1291pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1292{
1293 addressT align = 0;
1294
1295 SKIP_WHITESPACE ();
1296
7ab9ffdd 1297 if (needs_align
a6c24e68
NC
1298 && *input_line_pointer == ',')
1299 {
1300 align = parse_align (needs_align - 1);
7ab9ffdd 1301
a6c24e68
NC
1302 if (align == (addressT) -1)
1303 return NULL;
1304 }
1305 else
1306 {
1307 if (size >= 8)
1308 align = 3;
1309 else if (size >= 4)
1310 align = 2;
1311 else if (size >= 2)
1312 align = 1;
1313 else
1314 align = 0;
1315 }
1316
1317 bss_alloc (symbolP, size, align);
1318 return symbolP;
1319}
1320
704209c0 1321static void
a6c24e68
NC
1322pe_lcomm (int needs_align)
1323{
1324 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1325}
704209c0 1326#endif
a6c24e68 1327
29b0f896
AM
1328const pseudo_typeS md_pseudo_table[] =
1329{
1330#if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1331 {"align", s_align_bytes, 0},
1332#else
1333 {"align", s_align_ptwo, 0},
1334#endif
1335 {"arch", set_cpu_arch, 0},
1336#ifndef I386COFF
1337 {"bss", s_bss, 0},
a6c24e68
NC
1338#else
1339 {"lcomm", pe_lcomm, 1},
29b0f896
AM
1340#endif
1341 {"ffloat", float_cons, 'f'},
1342 {"dfloat", float_cons, 'd'},
1343 {"tfloat", float_cons, 'x'},
1344 {"value", cons, 2},
d182319b 1345 {"slong", signed_cons, 4},
29b0f896
AM
1346 {"noopt", s_ignore, 0},
1347 {"optim", s_ignore, 0},
1348 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1349 {"code16", set_code_flag, CODE_16BIT},
1350 {"code32", set_code_flag, CODE_32BIT},
da5f19a2 1351#ifdef BFD64
29b0f896 1352 {"code64", set_code_flag, CODE_64BIT},
da5f19a2 1353#endif
29b0f896
AM
1354 {"intel_syntax", set_intel_syntax, 1},
1355 {"att_syntax", set_intel_syntax, 0},
1efbbeb4
L
1356 {"intel_mnemonic", set_intel_mnemonic, 1},
1357 {"att_mnemonic", set_intel_mnemonic, 0},
db51cc60
L
1358 {"allow_index_reg", set_allow_index_reg, 1},
1359 {"disallow_index_reg", set_allow_index_reg, 0},
7bab8ab5
JB
1360 {"sse_check", set_check, 0},
1361 {"operand_check", set_check, 1},
3b22753a
L
1362#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1363 {"largecomm", handle_large_common, 0},
07a53e5c 1364#else
68d20676 1365 {"file", dwarf2_directive_file, 0},
07a53e5c
RH
1366 {"loc", dwarf2_directive_loc, 0},
1367 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
3b22753a 1368#endif
6482c264
NC
1369#ifdef TE_PE
1370 {"secrel32", pe_directive_secrel, 0},
1371#endif
29b0f896
AM
1372 {0, 0, 0}
1373};
1374
1375/* For interface with expression (). */
1376extern char *input_line_pointer;
1377
1378/* Hash table for instruction mnemonic lookup. */
1379static struct hash_control *op_hash;
1380
1381/* Hash table for register lookup. */
1382static struct hash_control *reg_hash;
1383\f
ce8a8b2f
AM
1384 /* Various efficient no-op patterns for aligning code labels.
1385 Note: Don't try to assemble the instructions in the comments.
1386 0L and 0w are not legal. */
62a02d25
L
1387static const unsigned char f32_1[] =
1388 {0x90}; /* nop */
1389static const unsigned char f32_2[] =
1390 {0x66,0x90}; /* xchg %ax,%ax */
1391static const unsigned char f32_3[] =
1392 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1393static const unsigned char f32_4[] =
1394 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
62a02d25
L
1395static const unsigned char f32_6[] =
1396 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1397static const unsigned char f32_7[] =
1398 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
62a02d25 1399static const unsigned char f16_3[] =
3ae729d5 1400 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
62a02d25 1401static const unsigned char f16_4[] =
3ae729d5
L
1402 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1403static const unsigned char jump_disp8[] =
1404 {0xeb}; /* jmp disp8 */
1405static const unsigned char jump32_disp32[] =
1406 {0xe9}; /* jmp disp32 */
1407static const unsigned char jump16_disp32[] =
1408 {0x66,0xe9}; /* jmp disp32 */
62a02d25
L
1409/* 32-bit NOPs patterns. */
1410static const unsigned char *const f32_patt[] = {
3ae729d5 1411 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
62a02d25
L
1412};
1413/* 16-bit NOPs patterns. */
1414static const unsigned char *const f16_patt[] = {
3ae729d5 1415 f32_1, f32_2, f16_3, f16_4
62a02d25
L
1416};
1417/* nopl (%[re]ax) */
1418static const unsigned char alt_3[] =
1419 {0x0f,0x1f,0x00};
1420/* nopl 0(%[re]ax) */
1421static const unsigned char alt_4[] =
1422 {0x0f,0x1f,0x40,0x00};
1423/* nopl 0(%[re]ax,%[re]ax,1) */
1424static const unsigned char alt_5[] =
1425 {0x0f,0x1f,0x44,0x00,0x00};
1426/* nopw 0(%[re]ax,%[re]ax,1) */
1427static const unsigned char alt_6[] =
1428 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1429/* nopl 0L(%[re]ax) */
1430static const unsigned char alt_7[] =
1431 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1432/* nopl 0L(%[re]ax,%[re]ax,1) */
1433static const unsigned char alt_8[] =
1434 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1435/* nopw 0L(%[re]ax,%[re]ax,1) */
1436static const unsigned char alt_9[] =
1437 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1438/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1439static const unsigned char alt_10[] =
1440 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
3ae729d5
L
1441/* data16 nopw %cs:0L(%eax,%eax,1) */
1442static const unsigned char alt_11[] =
1443 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
62a02d25
L
1444/* 32-bit and 64-bit NOPs patterns. */
1445static const unsigned char *const alt_patt[] = {
1446 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
3ae729d5 1447 alt_9, alt_10, alt_11
62a02d25
L
1448};
1449
1450/* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1451 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1452
1453static void
1454i386_output_nops (char *where, const unsigned char *const *patt,
1455 int count, int max_single_nop_size)
1456
1457{
3ae729d5
L
1458 /* Place the longer NOP first. */
1459 int last;
1460 int offset;
3076e594
NC
1461 const unsigned char *nops;
1462
1463 if (max_single_nop_size < 1)
1464 {
1465 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1466 max_single_nop_size);
1467 return;
1468 }
1469
1470 nops = patt[max_single_nop_size - 1];
3ae729d5
L
1471
1472 /* Use the smaller one if the requsted one isn't available. */
1473 if (nops == NULL)
62a02d25 1474 {
3ae729d5
L
1475 max_single_nop_size--;
1476 nops = patt[max_single_nop_size - 1];
62a02d25
L
1477 }
1478
3ae729d5
L
1479 last = count % max_single_nop_size;
1480
1481 count -= last;
1482 for (offset = 0; offset < count; offset += max_single_nop_size)
1483 memcpy (where + offset, nops, max_single_nop_size);
1484
1485 if (last)
1486 {
1487 nops = patt[last - 1];
1488 if (nops == NULL)
1489 {
1490 /* Use the smaller one plus one-byte NOP if the needed one
1491 isn't available. */
1492 last--;
1493 nops = patt[last - 1];
1494 memcpy (where + offset, nops, last);
1495 where[offset + last] = *patt[0];
1496 }
1497 else
1498 memcpy (where + offset, nops, last);
1499 }
62a02d25
L
1500}
1501
3ae729d5
L
1502static INLINE int
1503fits_in_imm7 (offsetT num)
1504{
1505 return (num & 0x7f) == num;
1506}
1507
1508static INLINE int
1509fits_in_imm31 (offsetT num)
1510{
1511 return (num & 0x7fffffff) == num;
1512}
62a02d25
L
1513
1514/* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1515 single NOP instruction LIMIT. */
1516
1517void
3ae729d5 1518i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
62a02d25 1519{
3ae729d5 1520 const unsigned char *const *patt = NULL;
62a02d25 1521 int max_single_nop_size;
3ae729d5
L
1522 /* Maximum number of NOPs before switching to jump over NOPs. */
1523 int max_number_of_nops;
62a02d25 1524
3ae729d5 1525 switch (fragP->fr_type)
62a02d25 1526 {
3ae729d5
L
1527 case rs_fill_nop:
1528 case rs_align_code:
1529 break;
e379e5f3
L
1530 case rs_machine_dependent:
1531 /* Allow NOP padding for jumps and calls. */
1532 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1533 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1534 break;
1535 /* Fall through. */
3ae729d5 1536 default:
62a02d25
L
1537 return;
1538 }
1539
ccc9c027
L
1540 /* We need to decide which NOP sequence to use for 32bit and
1541 64bit. When -mtune= is used:
4eed87de 1542
76bc74dc
L
1543 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1544 PROCESSOR_GENERIC32, f32_patt will be used.
80b8656c
L
1545 2. For the rest, alt_patt will be used.
1546
1547 When -mtune= isn't used, alt_patt will be used if
22109423 1548 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
76bc74dc 1549 be used.
ccc9c027
L
1550
1551 When -march= or .arch is used, we can't use anything beyond
1552 cpu_arch_isa_flags. */
1553
1554 if (flag_code == CODE_16BIT)
1555 {
3ae729d5
L
1556 patt = f16_patt;
1557 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1558 /* Limit number of NOPs to 2 in 16-bit mode. */
1559 max_number_of_nops = 2;
252b5132 1560 }
33fef721 1561 else
ccc9c027 1562 {
fbf3f584 1563 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
ccc9c027
L
1564 {
1565 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1566 switch (cpu_arch_tune)
1567 {
1568 case PROCESSOR_UNKNOWN:
1569 /* We use cpu_arch_isa_flags to check if we SHOULD
22109423
L
1570 optimize with nops. */
1571 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1572 patt = alt_patt;
ccc9c027
L
1573 else
1574 patt = f32_patt;
1575 break;
ccc9c027
L
1576 case PROCESSOR_PENTIUM4:
1577 case PROCESSOR_NOCONA:
ef05d495 1578 case PROCESSOR_CORE:
76bc74dc 1579 case PROCESSOR_CORE2:
bd5295b2 1580 case PROCESSOR_COREI7:
3632d14b 1581 case PROCESSOR_L1OM:
7a9068fe 1582 case PROCESSOR_K1OM:
76bc74dc 1583 case PROCESSOR_GENERIC64:
ccc9c027
L
1584 case PROCESSOR_K6:
1585 case PROCESSOR_ATHLON:
1586 case PROCESSOR_K8:
4eed87de 1587 case PROCESSOR_AMDFAM10:
8aedb9fe 1588 case PROCESSOR_BD:
029f3522 1589 case PROCESSOR_ZNVER:
7b458c12 1590 case PROCESSOR_BT:
80b8656c 1591 patt = alt_patt;
ccc9c027 1592 break;
76bc74dc 1593 case PROCESSOR_I386:
ccc9c027
L
1594 case PROCESSOR_I486:
1595 case PROCESSOR_PENTIUM:
2dde1948 1596 case PROCESSOR_PENTIUMPRO:
81486035 1597 case PROCESSOR_IAMCU:
ccc9c027
L
1598 case PROCESSOR_GENERIC32:
1599 patt = f32_patt;
1600 break;
4eed87de 1601 }
ccc9c027
L
1602 }
1603 else
1604 {
fbf3f584 1605 switch (fragP->tc_frag_data.tune)
ccc9c027
L
1606 {
1607 case PROCESSOR_UNKNOWN:
e6a14101 1608 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
ccc9c027
L
1609 PROCESSOR_UNKNOWN. */
1610 abort ();
1611 break;
1612
76bc74dc 1613 case PROCESSOR_I386:
ccc9c027
L
1614 case PROCESSOR_I486:
1615 case PROCESSOR_PENTIUM:
81486035 1616 case PROCESSOR_IAMCU:
ccc9c027
L
1617 case PROCESSOR_K6:
1618 case PROCESSOR_ATHLON:
1619 case PROCESSOR_K8:
4eed87de 1620 case PROCESSOR_AMDFAM10:
8aedb9fe 1621 case PROCESSOR_BD:
029f3522 1622 case PROCESSOR_ZNVER:
7b458c12 1623 case PROCESSOR_BT:
ccc9c027
L
1624 case PROCESSOR_GENERIC32:
1625 /* We use cpu_arch_isa_flags to check if we CAN optimize
22109423
L
1626 with nops. */
1627 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1628 patt = alt_patt;
ccc9c027
L
1629 else
1630 patt = f32_patt;
1631 break;
76bc74dc
L
1632 case PROCESSOR_PENTIUMPRO:
1633 case PROCESSOR_PENTIUM4:
1634 case PROCESSOR_NOCONA:
1635 case PROCESSOR_CORE:
ef05d495 1636 case PROCESSOR_CORE2:
bd5295b2 1637 case PROCESSOR_COREI7:
3632d14b 1638 case PROCESSOR_L1OM:
7a9068fe 1639 case PROCESSOR_K1OM:
22109423 1640 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
80b8656c 1641 patt = alt_patt;
ccc9c027
L
1642 else
1643 patt = f32_patt;
1644 break;
1645 case PROCESSOR_GENERIC64:
80b8656c 1646 patt = alt_patt;
ccc9c027 1647 break;
4eed87de 1648 }
ccc9c027
L
1649 }
1650
76bc74dc
L
1651 if (patt == f32_patt)
1652 {
3ae729d5
L
1653 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1654 /* Limit number of NOPs to 2 for older processors. */
1655 max_number_of_nops = 2;
76bc74dc
L
1656 }
1657 else
1658 {
3ae729d5
L
1659 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1660 /* Limit number of NOPs to 7 for newer processors. */
1661 max_number_of_nops = 7;
1662 }
1663 }
1664
1665 if (limit == 0)
1666 limit = max_single_nop_size;
1667
1668 if (fragP->fr_type == rs_fill_nop)
1669 {
1670 /* Output NOPs for .nop directive. */
1671 if (limit > max_single_nop_size)
1672 {
1673 as_bad_where (fragP->fr_file, fragP->fr_line,
1674 _("invalid single nop size: %d "
1675 "(expect within [0, %d])"),
1676 limit, max_single_nop_size);
1677 return;
1678 }
1679 }
e379e5f3 1680 else if (fragP->fr_type != rs_machine_dependent)
3ae729d5
L
1681 fragP->fr_var = count;
1682
1683 if ((count / max_single_nop_size) > max_number_of_nops)
1684 {
1685 /* Generate jump over NOPs. */
1686 offsetT disp = count - 2;
1687 if (fits_in_imm7 (disp))
1688 {
1689 /* Use "jmp disp8" if possible. */
1690 count = disp;
1691 where[0] = jump_disp8[0];
1692 where[1] = count;
1693 where += 2;
1694 }
1695 else
1696 {
1697 unsigned int size_of_jump;
1698
1699 if (flag_code == CODE_16BIT)
1700 {
1701 where[0] = jump16_disp32[0];
1702 where[1] = jump16_disp32[1];
1703 size_of_jump = 2;
1704 }
1705 else
1706 {
1707 where[0] = jump32_disp32[0];
1708 size_of_jump = 1;
1709 }
1710
1711 count -= size_of_jump + 4;
1712 if (!fits_in_imm31 (count))
1713 {
1714 as_bad_where (fragP->fr_file, fragP->fr_line,
1715 _("jump over nop padding out of range"));
1716 return;
1717 }
1718
1719 md_number_to_chars (where + size_of_jump, count, 4);
1720 where += size_of_jump + 4;
76bc74dc 1721 }
ccc9c027 1722 }
3ae729d5
L
1723
1724 /* Generate multiple NOPs. */
1725 i386_output_nops (where, patt, count, limit);
252b5132
RH
1726}
1727
c6fb90c8 1728static INLINE int
0dfbf9d7 1729operand_type_all_zero (const union i386_operand_type *x)
40fb9820 1730{
0dfbf9d7 1731 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1732 {
1733 case 3:
0dfbf9d7 1734 if (x->array[2])
c6fb90c8 1735 return 0;
1a0670f3 1736 /* Fall through. */
c6fb90c8 1737 case 2:
0dfbf9d7 1738 if (x->array[1])
c6fb90c8 1739 return 0;
1a0670f3 1740 /* Fall through. */
c6fb90c8 1741 case 1:
0dfbf9d7 1742 return !x->array[0];
c6fb90c8
L
1743 default:
1744 abort ();
1745 }
40fb9820
L
1746}
1747
c6fb90c8 1748static INLINE void
0dfbf9d7 1749operand_type_set (union i386_operand_type *x, unsigned int v)
40fb9820 1750{
0dfbf9d7 1751 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1752 {
1753 case 3:
0dfbf9d7 1754 x->array[2] = v;
1a0670f3 1755 /* Fall through. */
c6fb90c8 1756 case 2:
0dfbf9d7 1757 x->array[1] = v;
1a0670f3 1758 /* Fall through. */
c6fb90c8 1759 case 1:
0dfbf9d7 1760 x->array[0] = v;
1a0670f3 1761 /* Fall through. */
c6fb90c8
L
1762 break;
1763 default:
1764 abort ();
1765 }
bab6aec1
JB
1766
1767 x->bitfield.class = ClassNone;
75e5731b 1768 x->bitfield.instance = InstanceNone;
c6fb90c8 1769}
40fb9820 1770
c6fb90c8 1771static INLINE int
0dfbf9d7
L
1772operand_type_equal (const union i386_operand_type *x,
1773 const union i386_operand_type *y)
c6fb90c8 1774{
0dfbf9d7 1775 switch (ARRAY_SIZE(x->array))
c6fb90c8
L
1776 {
1777 case 3:
0dfbf9d7 1778 if (x->array[2] != y->array[2])
c6fb90c8 1779 return 0;
1a0670f3 1780 /* Fall through. */
c6fb90c8 1781 case 2:
0dfbf9d7 1782 if (x->array[1] != y->array[1])
c6fb90c8 1783 return 0;
1a0670f3 1784 /* Fall through. */
c6fb90c8 1785 case 1:
0dfbf9d7 1786 return x->array[0] == y->array[0];
c6fb90c8
L
1787 break;
1788 default:
1789 abort ();
1790 }
1791}
40fb9820 1792
0dfbf9d7
L
1793static INLINE int
1794cpu_flags_all_zero (const union i386_cpu_flags *x)
1795{
1796 switch (ARRAY_SIZE(x->array))
1797 {
53467f57
IT
1798 case 4:
1799 if (x->array[3])
1800 return 0;
1801 /* Fall through. */
0dfbf9d7
L
1802 case 3:
1803 if (x->array[2])
1804 return 0;
1a0670f3 1805 /* Fall through. */
0dfbf9d7
L
1806 case 2:
1807 if (x->array[1])
1808 return 0;
1a0670f3 1809 /* Fall through. */
0dfbf9d7
L
1810 case 1:
1811 return !x->array[0];
1812 default:
1813 abort ();
1814 }
1815}
1816
0dfbf9d7
L
1817static INLINE int
1818cpu_flags_equal (const union i386_cpu_flags *x,
1819 const union i386_cpu_flags *y)
1820{
1821 switch (ARRAY_SIZE(x->array))
1822 {
53467f57
IT
1823 case 4:
1824 if (x->array[3] != y->array[3])
1825 return 0;
1826 /* Fall through. */
0dfbf9d7
L
1827 case 3:
1828 if (x->array[2] != y->array[2])
1829 return 0;
1a0670f3 1830 /* Fall through. */
0dfbf9d7
L
1831 case 2:
1832 if (x->array[1] != y->array[1])
1833 return 0;
1a0670f3 1834 /* Fall through. */
0dfbf9d7
L
1835 case 1:
1836 return x->array[0] == y->array[0];
1837 break;
1838 default:
1839 abort ();
1840 }
1841}
c6fb90c8
L
1842
1843static INLINE int
1844cpu_flags_check_cpu64 (i386_cpu_flags f)
1845{
1846 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1847 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
40fb9820
L
1848}
1849
c6fb90c8
L
1850static INLINE i386_cpu_flags
1851cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
40fb9820 1852{
c6fb90c8
L
1853 switch (ARRAY_SIZE (x.array))
1854 {
53467f57
IT
1855 case 4:
1856 x.array [3] &= y.array [3];
1857 /* Fall through. */
c6fb90c8
L
1858 case 3:
1859 x.array [2] &= y.array [2];
1a0670f3 1860 /* Fall through. */
c6fb90c8
L
1861 case 2:
1862 x.array [1] &= y.array [1];
1a0670f3 1863 /* Fall through. */
c6fb90c8
L
1864 case 1:
1865 x.array [0] &= y.array [0];
1866 break;
1867 default:
1868 abort ();
1869 }
1870 return x;
1871}
40fb9820 1872
c6fb90c8
L
1873static INLINE i386_cpu_flags
1874cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
40fb9820 1875{
c6fb90c8 1876 switch (ARRAY_SIZE (x.array))
40fb9820 1877 {
53467f57
IT
1878 case 4:
1879 x.array [3] |= y.array [3];
1880 /* Fall through. */
c6fb90c8
L
1881 case 3:
1882 x.array [2] |= y.array [2];
1a0670f3 1883 /* Fall through. */
c6fb90c8
L
1884 case 2:
1885 x.array [1] |= y.array [1];
1a0670f3 1886 /* Fall through. */
c6fb90c8
L
1887 case 1:
1888 x.array [0] |= y.array [0];
40fb9820
L
1889 break;
1890 default:
1891 abort ();
1892 }
40fb9820
L
1893 return x;
1894}
1895
309d3373
JB
1896static INLINE i386_cpu_flags
1897cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1898{
1899 switch (ARRAY_SIZE (x.array))
1900 {
53467f57
IT
1901 case 4:
1902 x.array [3] &= ~y.array [3];
1903 /* Fall through. */
309d3373
JB
1904 case 3:
1905 x.array [2] &= ~y.array [2];
1a0670f3 1906 /* Fall through. */
309d3373
JB
1907 case 2:
1908 x.array [1] &= ~y.array [1];
1a0670f3 1909 /* Fall through. */
309d3373
JB
1910 case 1:
1911 x.array [0] &= ~y.array [0];
1912 break;
1913 default:
1914 abort ();
1915 }
1916 return x;
1917}
1918
6c0946d0
JB
1919static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1920
c0f3af97
L
1921#define CPU_FLAGS_ARCH_MATCH 0x1
1922#define CPU_FLAGS_64BIT_MATCH 0x2
1923
c0f3af97 1924#define CPU_FLAGS_PERFECT_MATCH \
db12e14e 1925 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
c0f3af97
L
1926
1927/* Return CPU flags match bits. */
3629bb00 1928
40fb9820 1929static int
d3ce72d0 1930cpu_flags_match (const insn_template *t)
40fb9820 1931{
c0f3af97
L
1932 i386_cpu_flags x = t->cpu_flags;
1933 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
40fb9820
L
1934
1935 x.bitfield.cpu64 = 0;
1936 x.bitfield.cpuno64 = 0;
1937
0dfbf9d7 1938 if (cpu_flags_all_zero (&x))
c0f3af97
L
1939 {
1940 /* This instruction is available on all archs. */
db12e14e 1941 match |= CPU_FLAGS_ARCH_MATCH;
c0f3af97 1942 }
3629bb00
L
1943 else
1944 {
c0f3af97 1945 /* This instruction is available only on some archs. */
3629bb00
L
1946 i386_cpu_flags cpu = cpu_arch_flags;
1947
ab592e75
JB
1948 /* AVX512VL is no standalone feature - match it and then strip it. */
1949 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1950 return match;
1951 x.bitfield.cpuavx512vl = 0;
1952
3629bb00 1953 cpu = cpu_flags_and (x, cpu);
c0f3af97
L
1954 if (!cpu_flags_all_zero (&cpu))
1955 {
a5ff0eb2
L
1956 if (x.bitfield.cpuavx)
1957 {
929f69fa 1958 /* We need to check a few extra flags with AVX. */
b9d49817 1959 if (cpu.bitfield.cpuavx
40d231b4
JB
1960 && (!t->opcode_modifier.sse2avx
1961 || (sse2avx && !i.prefix[DATA_PREFIX]))
b9d49817 1962 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
929f69fa 1963 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
b9d49817
JB
1964 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1965 match |= CPU_FLAGS_ARCH_MATCH;
a5ff0eb2 1966 }
929f69fa
JB
1967 else if (x.bitfield.cpuavx512f)
1968 {
1969 /* We need to check a few extra flags with AVX512F. */
1970 if (cpu.bitfield.cpuavx512f
1971 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1972 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1973 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1974 match |= CPU_FLAGS_ARCH_MATCH;
1975 }
a5ff0eb2 1976 else
db12e14e 1977 match |= CPU_FLAGS_ARCH_MATCH;
c0f3af97 1978 }
3629bb00 1979 }
c0f3af97 1980 return match;
40fb9820
L
1981}
1982
c6fb90c8
L
1983static INLINE i386_operand_type
1984operand_type_and (i386_operand_type x, i386_operand_type y)
40fb9820 1985{
bab6aec1
JB
1986 if (x.bitfield.class != y.bitfield.class)
1987 x.bitfield.class = ClassNone;
75e5731b
JB
1988 if (x.bitfield.instance != y.bitfield.instance)
1989 x.bitfield.instance = InstanceNone;
bab6aec1 1990
c6fb90c8
L
1991 switch (ARRAY_SIZE (x.array))
1992 {
1993 case 3:
1994 x.array [2] &= y.array [2];
1a0670f3 1995 /* Fall through. */
c6fb90c8
L
1996 case 2:
1997 x.array [1] &= y.array [1];
1a0670f3 1998 /* Fall through. */
c6fb90c8
L
1999 case 1:
2000 x.array [0] &= y.array [0];
2001 break;
2002 default:
2003 abort ();
2004 }
2005 return x;
40fb9820
L
2006}
2007
73053c1f
JB
2008static INLINE i386_operand_type
2009operand_type_and_not (i386_operand_type x, i386_operand_type y)
2010{
bab6aec1 2011 gas_assert (y.bitfield.class == ClassNone);
75e5731b 2012 gas_assert (y.bitfield.instance == InstanceNone);
bab6aec1 2013
73053c1f
JB
2014 switch (ARRAY_SIZE (x.array))
2015 {
2016 case 3:
2017 x.array [2] &= ~y.array [2];
2018 /* Fall through. */
2019 case 2:
2020 x.array [1] &= ~y.array [1];
2021 /* Fall through. */
2022 case 1:
2023 x.array [0] &= ~y.array [0];
2024 break;
2025 default:
2026 abort ();
2027 }
2028 return x;
2029}
2030
c6fb90c8
L
2031static INLINE i386_operand_type
2032operand_type_or (i386_operand_type x, i386_operand_type y)
40fb9820 2033{
bab6aec1
JB
2034 gas_assert (x.bitfield.class == ClassNone ||
2035 y.bitfield.class == ClassNone ||
2036 x.bitfield.class == y.bitfield.class);
75e5731b
JB
2037 gas_assert (x.bitfield.instance == InstanceNone ||
2038 y.bitfield.instance == InstanceNone ||
2039 x.bitfield.instance == y.bitfield.instance);
bab6aec1 2040
c6fb90c8 2041 switch (ARRAY_SIZE (x.array))
40fb9820 2042 {
c6fb90c8
L
2043 case 3:
2044 x.array [2] |= y.array [2];
1a0670f3 2045 /* Fall through. */
c6fb90c8
L
2046 case 2:
2047 x.array [1] |= y.array [1];
1a0670f3 2048 /* Fall through. */
c6fb90c8
L
2049 case 1:
2050 x.array [0] |= y.array [0];
40fb9820
L
2051 break;
2052 default:
2053 abort ();
2054 }
c6fb90c8
L
2055 return x;
2056}
40fb9820 2057
c6fb90c8
L
2058static INLINE i386_operand_type
2059operand_type_xor (i386_operand_type x, i386_operand_type y)
2060{
bab6aec1 2061 gas_assert (y.bitfield.class == ClassNone);
75e5731b 2062 gas_assert (y.bitfield.instance == InstanceNone);
bab6aec1 2063
c6fb90c8
L
2064 switch (ARRAY_SIZE (x.array))
2065 {
2066 case 3:
2067 x.array [2] ^= y.array [2];
1a0670f3 2068 /* Fall through. */
c6fb90c8
L
2069 case 2:
2070 x.array [1] ^= y.array [1];
1a0670f3 2071 /* Fall through. */
c6fb90c8
L
2072 case 1:
2073 x.array [0] ^= y.array [0];
2074 break;
2075 default:
2076 abort ();
2077 }
40fb9820
L
2078 return x;
2079}
2080
40fb9820
L
2081static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2082static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2083static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2084static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
bab6aec1
JB
2085static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2086static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
40fb9820 2087static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
43234a1e 2088static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
40fb9820
L
2089static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2090static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2091static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2092static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2093static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2094static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2095static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2096static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2097static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2098
2099enum operand_type
2100{
2101 reg,
40fb9820
L
2102 imm,
2103 disp,
2104 anymem
2105};
2106
c6fb90c8 2107static INLINE int
40fb9820
L
2108operand_type_check (i386_operand_type t, enum operand_type c)
2109{
2110 switch (c)
2111 {
2112 case reg:
bab6aec1 2113 return t.bitfield.class == Reg;
40fb9820 2114
40fb9820
L
2115 case imm:
2116 return (t.bitfield.imm8
2117 || t.bitfield.imm8s
2118 || t.bitfield.imm16
2119 || t.bitfield.imm32
2120 || t.bitfield.imm32s
2121 || t.bitfield.imm64);
2122
2123 case disp:
2124 return (t.bitfield.disp8
2125 || t.bitfield.disp16
2126 || t.bitfield.disp32
2127 || t.bitfield.disp32s
2128 || t.bitfield.disp64);
2129
2130 case anymem:
2131 return (t.bitfield.disp8
2132 || t.bitfield.disp16
2133 || t.bitfield.disp32
2134 || t.bitfield.disp32s
2135 || t.bitfield.disp64
2136 || t.bitfield.baseindex);
2137
2138 default:
2139 abort ();
2140 }
2cfe26b6
AM
2141
2142 return 0;
40fb9820
L
2143}
2144
7a54636a
L
2145/* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2146 between operand GIVEN and opeand WANTED for instruction template T. */
5c07affc
L
2147
2148static INLINE int
7a54636a
L
2149match_operand_size (const insn_template *t, unsigned int wanted,
2150 unsigned int given)
5c07affc 2151{
3ac21baa
JB
2152 return !((i.types[given].bitfield.byte
2153 && !t->operand_types[wanted].bitfield.byte)
2154 || (i.types[given].bitfield.word
2155 && !t->operand_types[wanted].bitfield.word)
2156 || (i.types[given].bitfield.dword
2157 && !t->operand_types[wanted].bitfield.dword)
2158 || (i.types[given].bitfield.qword
2159 && !t->operand_types[wanted].bitfield.qword)
2160 || (i.types[given].bitfield.tbyte
2161 && !t->operand_types[wanted].bitfield.tbyte));
5c07affc
L
2162}
2163
dd40ce22
L
2164/* Return 1 if there is no conflict in SIMD register between operand
2165 GIVEN and opeand WANTED for instruction template T. */
1b54b8d7
JB
2166
2167static INLINE int
dd40ce22
L
2168match_simd_size (const insn_template *t, unsigned int wanted,
2169 unsigned int given)
1b54b8d7 2170{
3ac21baa
JB
2171 return !((i.types[given].bitfield.xmmword
2172 && !t->operand_types[wanted].bitfield.xmmword)
2173 || (i.types[given].bitfield.ymmword
2174 && !t->operand_types[wanted].bitfield.ymmword)
2175 || (i.types[given].bitfield.zmmword
260cd341
LC
2176 && !t->operand_types[wanted].bitfield.zmmword)
2177 || (i.types[given].bitfield.tmmword
2178 && !t->operand_types[wanted].bitfield.tmmword));
1b54b8d7
JB
2179}
2180
7a54636a
L
2181/* Return 1 if there is no conflict in any size between operand GIVEN
2182 and opeand WANTED for instruction template T. */
5c07affc
L
2183
2184static INLINE int
dd40ce22
L
2185match_mem_size (const insn_template *t, unsigned int wanted,
2186 unsigned int given)
5c07affc 2187{
7a54636a 2188 return (match_operand_size (t, wanted, given)
3ac21baa 2189 && !((i.types[given].bitfield.unspecified
af508cb9 2190 && !i.broadcast
3ac21baa
JB
2191 && !t->operand_types[wanted].bitfield.unspecified)
2192 || (i.types[given].bitfield.fword
2193 && !t->operand_types[wanted].bitfield.fword)
1b54b8d7
JB
2194 /* For scalar opcode templates to allow register and memory
2195 operands at the same time, some special casing is needed
d6793fa1
JB
2196 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2197 down-conversion vpmov*. */
3528c362 2198 || ((t->operand_types[wanted].bitfield.class == RegSIMD
bc49bfd8
JB
2199 && t->operand_types[wanted].bitfield.byte
2200 + t->operand_types[wanted].bitfield.word
2201 + t->operand_types[wanted].bitfield.dword
2202 + t->operand_types[wanted].bitfield.qword
2203 > !!t->opcode_modifier.broadcast)
3ac21baa
JB
2204 ? (i.types[given].bitfield.xmmword
2205 || i.types[given].bitfield.ymmword
2206 || i.types[given].bitfield.zmmword)
2207 : !match_simd_size(t, wanted, given))));
5c07affc
L
2208}
2209
3ac21baa
JB
2210/* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2211 operands for instruction template T, and it has MATCH_REVERSE set if there
2212 is no size conflict on any operands for the template with operands reversed
2213 (and the template allows for reversing in the first place). */
5c07affc 2214
3ac21baa
JB
2215#define MATCH_STRAIGHT 1
2216#define MATCH_REVERSE 2
2217
2218static INLINE unsigned int
d3ce72d0 2219operand_size_match (const insn_template *t)
5c07affc 2220{
3ac21baa 2221 unsigned int j, match = MATCH_STRAIGHT;
5c07affc 2222
0cfa3eb3 2223 /* Don't check non-absolute jump instructions. */
5c07affc 2224 if (t->opcode_modifier.jump
0cfa3eb3 2225 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5c07affc
L
2226 return match;
2227
2228 /* Check memory and accumulator operand size. */
2229 for (j = 0; j < i.operands; j++)
2230 {
3528c362
JB
2231 if (i.types[j].bitfield.class != Reg
2232 && i.types[j].bitfield.class != RegSIMD
601e8564 2233 && t->opcode_modifier.anysize)
5c07affc
L
2234 continue;
2235
bab6aec1 2236 if (t->operand_types[j].bitfield.class == Reg
7a54636a 2237 && !match_operand_size (t, j, j))
5c07affc
L
2238 {
2239 match = 0;
2240 break;
2241 }
2242
3528c362 2243 if (t->operand_types[j].bitfield.class == RegSIMD
3ac21baa 2244 && !match_simd_size (t, j, j))
1b54b8d7
JB
2245 {
2246 match = 0;
2247 break;
2248 }
2249
75e5731b 2250 if (t->operand_types[j].bitfield.instance == Accum
7a54636a 2251 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
1b54b8d7
JB
2252 {
2253 match = 0;
2254 break;
2255 }
2256
c48dadc9 2257 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
5c07affc
L
2258 {
2259 match = 0;
2260 break;
2261 }
2262 }
2263
3ac21baa 2264 if (!t->opcode_modifier.d)
891edac4 2265 {
dc1e8a47 2266 mismatch:
3ac21baa
JB
2267 if (!match)
2268 i.error = operand_size_mismatch;
2269 return match;
891edac4 2270 }
5c07affc
L
2271
2272 /* Check reverse. */
f5eb1d70 2273 gas_assert (i.operands >= 2 && i.operands <= 3);
5c07affc 2274
f5eb1d70 2275 for (j = 0; j < i.operands; j++)
5c07affc 2276 {
f5eb1d70
JB
2277 unsigned int given = i.operands - j - 1;
2278
bab6aec1 2279 if (t->operand_types[j].bitfield.class == Reg
f5eb1d70 2280 && !match_operand_size (t, j, given))
891edac4 2281 goto mismatch;
5c07affc 2282
3528c362 2283 if (t->operand_types[j].bitfield.class == RegSIMD
f5eb1d70 2284 && !match_simd_size (t, j, given))
dbbc8b7e
JB
2285 goto mismatch;
2286
75e5731b 2287 if (t->operand_types[j].bitfield.instance == Accum
f5eb1d70
JB
2288 && (!match_operand_size (t, j, given)
2289 || !match_simd_size (t, j, given)))
dbbc8b7e
JB
2290 goto mismatch;
2291
f5eb1d70 2292 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
891edac4 2293 goto mismatch;
5c07affc
L
2294 }
2295
3ac21baa 2296 return match | MATCH_REVERSE;
5c07affc
L
2297}
2298
c6fb90c8 2299static INLINE int
40fb9820
L
2300operand_type_match (i386_operand_type overlap,
2301 i386_operand_type given)
2302{
2303 i386_operand_type temp = overlap;
2304
7d5e4556 2305 temp.bitfield.unspecified = 0;
5c07affc
L
2306 temp.bitfield.byte = 0;
2307 temp.bitfield.word = 0;
2308 temp.bitfield.dword = 0;
2309 temp.bitfield.fword = 0;
2310 temp.bitfield.qword = 0;
2311 temp.bitfield.tbyte = 0;
2312 temp.bitfield.xmmword = 0;
c0f3af97 2313 temp.bitfield.ymmword = 0;
43234a1e 2314 temp.bitfield.zmmword = 0;
260cd341 2315 temp.bitfield.tmmword = 0;
0dfbf9d7 2316 if (operand_type_all_zero (&temp))
891edac4 2317 goto mismatch;
40fb9820 2318
6f2f06be 2319 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
891edac4
L
2320 return 1;
2321
dc1e8a47 2322 mismatch:
a65babc9 2323 i.error = operand_type_mismatch;
891edac4 2324 return 0;
40fb9820
L
2325}
2326
7d5e4556 2327/* If given types g0 and g1 are registers they must be of the same type
10c17abd 2328 unless the expected operand type register overlap is null.
5de4d9ef 2329 Some Intel syntax memory operand size checking also happens here. */
40fb9820 2330
c6fb90c8 2331static INLINE int
dc821c5f 2332operand_type_register_match (i386_operand_type g0,
40fb9820 2333 i386_operand_type t0,
40fb9820
L
2334 i386_operand_type g1,
2335 i386_operand_type t1)
2336{
bab6aec1 2337 if (g0.bitfield.class != Reg
3528c362 2338 && g0.bitfield.class != RegSIMD
10c17abd
JB
2339 && (!operand_type_check (g0, anymem)
2340 || g0.bitfield.unspecified
5de4d9ef
JB
2341 || (t0.bitfield.class != Reg
2342 && t0.bitfield.class != RegSIMD)))
40fb9820
L
2343 return 1;
2344
bab6aec1 2345 if (g1.bitfield.class != Reg
3528c362 2346 && g1.bitfield.class != RegSIMD
10c17abd
JB
2347 && (!operand_type_check (g1, anymem)
2348 || g1.bitfield.unspecified
5de4d9ef
JB
2349 || (t1.bitfield.class != Reg
2350 && t1.bitfield.class != RegSIMD)))
40fb9820
L
2351 return 1;
2352
dc821c5f
JB
2353 if (g0.bitfield.byte == g1.bitfield.byte
2354 && g0.bitfield.word == g1.bitfield.word
2355 && g0.bitfield.dword == g1.bitfield.dword
10c17abd
JB
2356 && g0.bitfield.qword == g1.bitfield.qword
2357 && g0.bitfield.xmmword == g1.bitfield.xmmword
2358 && g0.bitfield.ymmword == g1.bitfield.ymmword
2359 && g0.bitfield.zmmword == g1.bitfield.zmmword)
40fb9820
L
2360 return 1;
2361
dc821c5f
JB
2362 if (!(t0.bitfield.byte & t1.bitfield.byte)
2363 && !(t0.bitfield.word & t1.bitfield.word)
2364 && !(t0.bitfield.dword & t1.bitfield.dword)
10c17abd
JB
2365 && !(t0.bitfield.qword & t1.bitfield.qword)
2366 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2367 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2368 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
891edac4
L
2369 return 1;
2370
a65babc9 2371 i.error = register_type_mismatch;
891edac4
L
2372
2373 return 0;
40fb9820
L
2374}
2375
4c692bc7
JB
2376static INLINE unsigned int
2377register_number (const reg_entry *r)
2378{
2379 unsigned int nr = r->reg_num;
2380
2381 if (r->reg_flags & RegRex)
2382 nr += 8;
2383
200cbe0f
L
2384 if (r->reg_flags & RegVRex)
2385 nr += 16;
2386
4c692bc7
JB
2387 return nr;
2388}
2389
252b5132 2390static INLINE unsigned int
40fb9820 2391mode_from_disp_size (i386_operand_type t)
252b5132 2392{
b5014f7a 2393 if (t.bitfield.disp8)
40fb9820
L
2394 return 1;
2395 else if (t.bitfield.disp16
2396 || t.bitfield.disp32
2397 || t.bitfield.disp32s)
2398 return 2;
2399 else
2400 return 0;
252b5132
RH
2401}
2402
2403static INLINE int
65879393 2404fits_in_signed_byte (addressT num)
252b5132 2405{
65879393 2406 return num + 0x80 <= 0xff;
47926f60 2407}
252b5132
RH
2408
2409static INLINE int
65879393 2410fits_in_unsigned_byte (addressT num)
252b5132 2411{
65879393 2412 return num <= 0xff;
47926f60 2413}
252b5132
RH
2414
2415static INLINE int
65879393 2416fits_in_unsigned_word (addressT num)
252b5132 2417{
65879393 2418 return num <= 0xffff;
47926f60 2419}
252b5132
RH
2420
2421static INLINE int
65879393 2422fits_in_signed_word (addressT num)
252b5132 2423{
65879393 2424 return num + 0x8000 <= 0xffff;
47926f60 2425}
2a962e6d 2426
3e73aa7c 2427static INLINE int
65879393 2428fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
3e73aa7c
JH
2429{
2430#ifndef BFD64
2431 return 1;
2432#else
65879393 2433 return num + 0x80000000 <= 0xffffffff;
3e73aa7c
JH
2434#endif
2435} /* fits_in_signed_long() */
2a962e6d 2436
3e73aa7c 2437static INLINE int
65879393 2438fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
3e73aa7c
JH
2439{
2440#ifndef BFD64
2441 return 1;
2442#else
65879393 2443 return num <= 0xffffffff;
3e73aa7c
JH
2444#endif
2445} /* fits_in_unsigned_long() */
252b5132 2446
43234a1e 2447static INLINE int
b5014f7a 2448fits_in_disp8 (offsetT num)
43234a1e
L
2449{
2450 int shift = i.memshift;
2451 unsigned int mask;
2452
2453 if (shift == -1)
2454 abort ();
2455
2456 mask = (1 << shift) - 1;
2457
2458 /* Return 0 if NUM isn't properly aligned. */
2459 if ((num & mask))
2460 return 0;
2461
2462 /* Check if NUM will fit in 8bit after shift. */
2463 return fits_in_signed_byte (num >> shift);
2464}
2465
a683cc34
SP
2466static INLINE int
2467fits_in_imm4 (offsetT num)
2468{
2469 return (num & 0xf) == num;
2470}
2471
40fb9820 2472static i386_operand_type
e3bb37b5 2473smallest_imm_type (offsetT num)
252b5132 2474{
40fb9820 2475 i386_operand_type t;
7ab9ffdd 2476
0dfbf9d7 2477 operand_type_set (&t, 0);
40fb9820
L
2478 t.bitfield.imm64 = 1;
2479
2480 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
e413e4e9
AM
2481 {
2482 /* This code is disabled on the 486 because all the Imm1 forms
2483 in the opcode table are slower on the i486. They're the
2484 versions with the implicitly specified single-position
2485 displacement, which has another syntax if you really want to
2486 use that form. */
40fb9820
L
2487 t.bitfield.imm1 = 1;
2488 t.bitfield.imm8 = 1;
2489 t.bitfield.imm8s = 1;
2490 t.bitfield.imm16 = 1;
2491 t.bitfield.imm32 = 1;
2492 t.bitfield.imm32s = 1;
2493 }
2494 else if (fits_in_signed_byte (num))
2495 {
2496 t.bitfield.imm8 = 1;
2497 t.bitfield.imm8s = 1;
2498 t.bitfield.imm16 = 1;
2499 t.bitfield.imm32 = 1;
2500 t.bitfield.imm32s = 1;
2501 }
2502 else if (fits_in_unsigned_byte (num))
2503 {
2504 t.bitfield.imm8 = 1;
2505 t.bitfield.imm16 = 1;
2506 t.bitfield.imm32 = 1;
2507 t.bitfield.imm32s = 1;
2508 }
2509 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2510 {
2511 t.bitfield.imm16 = 1;
2512 t.bitfield.imm32 = 1;
2513 t.bitfield.imm32s = 1;
2514 }
2515 else if (fits_in_signed_long (num))
2516 {
2517 t.bitfield.imm32 = 1;
2518 t.bitfield.imm32s = 1;
2519 }
2520 else if (fits_in_unsigned_long (num))
2521 t.bitfield.imm32 = 1;
2522
2523 return t;
47926f60 2524}
252b5132 2525
847f7ad4 2526static offsetT
e3bb37b5 2527offset_in_range (offsetT val, int size)
847f7ad4 2528{
508866be 2529 addressT mask;
ba2adb93 2530
847f7ad4
AM
2531 switch (size)
2532 {
508866be
L
2533 case 1: mask = ((addressT) 1 << 8) - 1; break;
2534 case 2: mask = ((addressT) 1 << 16) - 1; break;
3b0ec529 2535 case 4: mask = ((addressT) 2 << 31) - 1; break;
3e73aa7c
JH
2536#ifdef BFD64
2537 case 8: mask = ((addressT) 2 << 63) - 1; break;
2538#endif
47926f60 2539 default: abort ();
847f7ad4
AM
2540 }
2541
9de868bf
L
2542#ifdef BFD64
2543 /* If BFD64, sign extend val for 32bit address mode. */
2544 if (flag_code != CODE_64BIT
2545 || i.prefix[ADDR_PREFIX])
3e73aa7c
JH
2546 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2547 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
fa289fb8 2548#endif
ba2adb93 2549
47926f60 2550 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
847f7ad4
AM
2551 {
2552 char buf1[40], buf2[40];
2553
2554 sprint_value (buf1, val);
2555 sprint_value (buf2, val & mask);
2556 as_warn (_("%s shortened to %s"), buf1, buf2);
2557 }
2558 return val & mask;
2559}
2560
c32fa91d
L
2561enum PREFIX_GROUP
2562{
2563 PREFIX_EXIST = 0,
2564 PREFIX_LOCK,
2565 PREFIX_REP,
04ef582a 2566 PREFIX_DS,
c32fa91d
L
2567 PREFIX_OTHER
2568};
2569
2570/* Returns
2571 a. PREFIX_EXIST if attempting to add a prefix where one from the
2572 same class already exists.
2573 b. PREFIX_LOCK if lock prefix is added.
2574 c. PREFIX_REP if rep/repne prefix is added.
04ef582a
L
2575 d. PREFIX_DS if ds prefix is added.
2576 e. PREFIX_OTHER if other prefix is added.
c32fa91d
L
2577 */
2578
2579static enum PREFIX_GROUP
e3bb37b5 2580add_prefix (unsigned int prefix)
252b5132 2581{
c32fa91d 2582 enum PREFIX_GROUP ret = PREFIX_OTHER;
b1905489 2583 unsigned int q;
252b5132 2584
29b0f896
AM
2585 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2586 && flag_code == CODE_64BIT)
b1905489 2587 {
161a04f6 2588 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
44846f29
JB
2589 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2590 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2591 || (i.prefix[REX_PREFIX] & prefix & REX_B))
c32fa91d 2592 ret = PREFIX_EXIST;
b1905489
JB
2593 q = REX_PREFIX;
2594 }
3e73aa7c 2595 else
b1905489
JB
2596 {
2597 switch (prefix)
2598 {
2599 default:
2600 abort ();
2601
b1905489 2602 case DS_PREFIX_OPCODE:
04ef582a
L
2603 ret = PREFIX_DS;
2604 /* Fall through. */
2605 case CS_PREFIX_OPCODE:
b1905489
JB
2606 case ES_PREFIX_OPCODE:
2607 case FS_PREFIX_OPCODE:
2608 case GS_PREFIX_OPCODE:
2609 case SS_PREFIX_OPCODE:
2610 q = SEG_PREFIX;
2611 break;
2612
2613 case REPNE_PREFIX_OPCODE:
2614 case REPE_PREFIX_OPCODE:
c32fa91d
L
2615 q = REP_PREFIX;
2616 ret = PREFIX_REP;
2617 break;
2618
b1905489 2619 case LOCK_PREFIX_OPCODE:
c32fa91d
L
2620 q = LOCK_PREFIX;
2621 ret = PREFIX_LOCK;
b1905489
JB
2622 break;
2623
2624 case FWAIT_OPCODE:
2625 q = WAIT_PREFIX;
2626 break;
2627
2628 case ADDR_PREFIX_OPCODE:
2629 q = ADDR_PREFIX;
2630 break;
2631
2632 case DATA_PREFIX_OPCODE:
2633 q = DATA_PREFIX;
2634 break;
2635 }
2636 if (i.prefix[q] != 0)
c32fa91d 2637 ret = PREFIX_EXIST;
b1905489 2638 }
252b5132 2639
b1905489 2640 if (ret)
252b5132 2641 {
b1905489
JB
2642 if (!i.prefix[q])
2643 ++i.prefixes;
2644 i.prefix[q] |= prefix;
252b5132 2645 }
b1905489
JB
2646 else
2647 as_bad (_("same type of prefix used twice"));
252b5132 2648
252b5132
RH
2649 return ret;
2650}
2651
2652static void
78f12dd3 2653update_code_flag (int value, int check)
eecb386c 2654{
78f12dd3
L
2655 PRINTF_LIKE ((*as_error));
2656
1e9cc1c2 2657 flag_code = (enum flag_code) value;
40fb9820
L
2658 if (flag_code == CODE_64BIT)
2659 {
2660 cpu_arch_flags.bitfield.cpu64 = 1;
2661 cpu_arch_flags.bitfield.cpuno64 = 0;
40fb9820
L
2662 }
2663 else
2664 {
2665 cpu_arch_flags.bitfield.cpu64 = 0;
2666 cpu_arch_flags.bitfield.cpuno64 = 1;
40fb9820
L
2667 }
2668 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
3e73aa7c 2669 {
78f12dd3
L
2670 if (check)
2671 as_error = as_fatal;
2672 else
2673 as_error = as_bad;
2674 (*as_error) (_("64bit mode not supported on `%s'."),
2675 cpu_arch_name ? cpu_arch_name : default_arch);
3e73aa7c 2676 }
40fb9820 2677 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
3e73aa7c 2678 {
78f12dd3
L
2679 if (check)
2680 as_error = as_fatal;
2681 else
2682 as_error = as_bad;
2683 (*as_error) (_("32bit mode not supported on `%s'."),
2684 cpu_arch_name ? cpu_arch_name : default_arch);
3e73aa7c 2685 }
eecb386c
AM
2686 stackop_size = '\0';
2687}
2688
78f12dd3
L
2689static void
2690set_code_flag (int value)
2691{
2692 update_code_flag (value, 0);
2693}
2694
eecb386c 2695static void
e3bb37b5 2696set_16bit_gcc_code_flag (int new_code_flag)
252b5132 2697{
1e9cc1c2 2698 flag_code = (enum flag_code) new_code_flag;
40fb9820
L
2699 if (flag_code != CODE_16BIT)
2700 abort ();
2701 cpu_arch_flags.bitfield.cpu64 = 0;
2702 cpu_arch_flags.bitfield.cpuno64 = 1;
9306ca4a 2703 stackop_size = LONG_MNEM_SUFFIX;
252b5132
RH
2704}
2705
2706static void
e3bb37b5 2707set_intel_syntax (int syntax_flag)
252b5132
RH
2708{
2709 /* Find out if register prefixing is specified. */
2710 int ask_naked_reg = 0;
2711
2712 SKIP_WHITESPACE ();
29b0f896 2713 if (!is_end_of_line[(unsigned char) *input_line_pointer])
252b5132 2714 {
d02603dc
NC
2715 char *string;
2716 int e = get_symbol_name (&string);
252b5132 2717
47926f60 2718 if (strcmp (string, "prefix") == 0)
252b5132 2719 ask_naked_reg = 1;
47926f60 2720 else if (strcmp (string, "noprefix") == 0)
252b5132
RH
2721 ask_naked_reg = -1;
2722 else
d0b47220 2723 as_bad (_("bad argument to syntax directive."));
d02603dc 2724 (void) restore_line_pointer (e);
252b5132
RH
2725 }
2726 demand_empty_rest_of_line ();
c3332e24 2727
252b5132
RH
2728 intel_syntax = syntax_flag;
2729
2730 if (ask_naked_reg == 0)
f86103b7
AM
2731 allow_naked_reg = (intel_syntax
2732 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
252b5132
RH
2733 else
2734 allow_naked_reg = (ask_naked_reg < 0);
9306ca4a 2735
ee86248c 2736 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
7ab9ffdd 2737
e4a3b5a4 2738 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
9306ca4a 2739 identifier_chars['$'] = intel_syntax ? '$' : 0;
e4a3b5a4 2740 register_prefix = allow_naked_reg ? "" : "%";
252b5132
RH
2741}
2742
1efbbeb4
L
2743static void
2744set_intel_mnemonic (int mnemonic_flag)
2745{
e1d4d893 2746 intel_mnemonic = mnemonic_flag;
1efbbeb4
L
2747}
2748
db51cc60
L
2749static void
2750set_allow_index_reg (int flag)
2751{
2752 allow_index_reg = flag;
2753}
2754
cb19c032 2755static void
7bab8ab5 2756set_check (int what)
cb19c032 2757{
7bab8ab5
JB
2758 enum check_kind *kind;
2759 const char *str;
2760
2761 if (what)
2762 {
2763 kind = &operand_check;
2764 str = "operand";
2765 }
2766 else
2767 {
2768 kind = &sse_check;
2769 str = "sse";
2770 }
2771
cb19c032
L
2772 SKIP_WHITESPACE ();
2773
2774 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2775 {
d02603dc
NC
2776 char *string;
2777 int e = get_symbol_name (&string);
cb19c032
L
2778
2779 if (strcmp (string, "none") == 0)
7bab8ab5 2780 *kind = check_none;
cb19c032 2781 else if (strcmp (string, "warning") == 0)
7bab8ab5 2782 *kind = check_warning;
cb19c032 2783 else if (strcmp (string, "error") == 0)
7bab8ab5 2784 *kind = check_error;
cb19c032 2785 else
7bab8ab5 2786 as_bad (_("bad argument to %s_check directive."), str);
d02603dc 2787 (void) restore_line_pointer (e);
cb19c032
L
2788 }
2789 else
7bab8ab5 2790 as_bad (_("missing argument for %s_check directive"), str);
cb19c032
L
2791
2792 demand_empty_rest_of_line ();
2793}
2794
8a9036a4
L
2795static void
2796check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
1e9cc1c2 2797 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
8a9036a4
L
2798{
2799#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2800 static const char *arch;
2801
2802 /* Intel LIOM is only supported on ELF. */
2803 if (!IS_ELF)
2804 return;
2805
2806 if (!arch)
2807 {
2808 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2809 use default_arch. */
2810 arch = cpu_arch_name;
2811 if (!arch)
2812 arch = default_arch;
2813 }
2814
81486035
L
2815 /* If we are targeting Intel MCU, we must enable it. */
2816 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2817 || new_flag.bitfield.cpuiamcu)
2818 return;
2819
3632d14b 2820 /* If we are targeting Intel L1OM, we must enable it. */
8a9036a4 2821 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
1e9cc1c2 2822 || new_flag.bitfield.cpul1om)
8a9036a4 2823 return;
76ba9986 2824
7a9068fe
L
2825 /* If we are targeting Intel K1OM, we must enable it. */
2826 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2827 || new_flag.bitfield.cpuk1om)
2828 return;
2829
8a9036a4
L
2830 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2831#endif
2832}
2833
e413e4e9 2834static void
e3bb37b5 2835set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
e413e4e9 2836{
47926f60 2837 SKIP_WHITESPACE ();
e413e4e9 2838
29b0f896 2839 if (!is_end_of_line[(unsigned char) *input_line_pointer])
e413e4e9 2840 {
d02603dc
NC
2841 char *string;
2842 int e = get_symbol_name (&string);
91d6fa6a 2843 unsigned int j;
40fb9820 2844 i386_cpu_flags flags;
e413e4e9 2845
91d6fa6a 2846 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
e413e4e9 2847 {
91d6fa6a 2848 if (strcmp (string, cpu_arch[j].name) == 0)
e413e4e9 2849 {
91d6fa6a 2850 check_cpu_arch_compatible (string, cpu_arch[j].flags);
8a9036a4 2851
5c6af06e
JB
2852 if (*string != '.')
2853 {
91d6fa6a 2854 cpu_arch_name = cpu_arch[j].name;
5c6af06e 2855 cpu_sub_arch_name = NULL;
91d6fa6a 2856 cpu_arch_flags = cpu_arch[j].flags;
40fb9820
L
2857 if (flag_code == CODE_64BIT)
2858 {
2859 cpu_arch_flags.bitfield.cpu64 = 1;
2860 cpu_arch_flags.bitfield.cpuno64 = 0;
2861 }
2862 else
2863 {
2864 cpu_arch_flags.bitfield.cpu64 = 0;
2865 cpu_arch_flags.bitfield.cpuno64 = 1;
2866 }
91d6fa6a
NC
2867 cpu_arch_isa = cpu_arch[j].type;
2868 cpu_arch_isa_flags = cpu_arch[j].flags;
ccc9c027
L
2869 if (!cpu_arch_tune_set)
2870 {
2871 cpu_arch_tune = cpu_arch_isa;
2872 cpu_arch_tune_flags = cpu_arch_isa_flags;
2873 }
5c6af06e
JB
2874 break;
2875 }
40fb9820 2876
293f5f65
L
2877 flags = cpu_flags_or (cpu_arch_flags,
2878 cpu_arch[j].flags);
81486035 2879
5b64d091 2880 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
5c6af06e 2881 {
6305a203
L
2882 if (cpu_sub_arch_name)
2883 {
2884 char *name = cpu_sub_arch_name;
2885 cpu_sub_arch_name = concat (name,
91d6fa6a 2886 cpu_arch[j].name,
1bf57e9f 2887 (const char *) NULL);
6305a203
L
2888 free (name);
2889 }
2890 else
91d6fa6a 2891 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
40fb9820 2892 cpu_arch_flags = flags;
a586129e 2893 cpu_arch_isa_flags = flags;
5c6af06e 2894 }
0089dace
L
2895 else
2896 cpu_arch_isa_flags
2897 = cpu_flags_or (cpu_arch_isa_flags,
2898 cpu_arch[j].flags);
d02603dc 2899 (void) restore_line_pointer (e);
5c6af06e
JB
2900 demand_empty_rest_of_line ();
2901 return;
e413e4e9
AM
2902 }
2903 }
293f5f65
L
2904
2905 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2906 {
33eaf5de 2907 /* Disable an ISA extension. */
293f5f65
L
2908 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2909 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2910 {
2911 flags = cpu_flags_and_not (cpu_arch_flags,
2912 cpu_noarch[j].flags);
2913 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2914 {
2915 if (cpu_sub_arch_name)
2916 {
2917 char *name = cpu_sub_arch_name;
2918 cpu_sub_arch_name = concat (name, string,
2919 (const char *) NULL);
2920 free (name);
2921 }
2922 else
2923 cpu_sub_arch_name = xstrdup (string);
2924 cpu_arch_flags = flags;
2925 cpu_arch_isa_flags = flags;
2926 }
2927 (void) restore_line_pointer (e);
2928 demand_empty_rest_of_line ();
2929 return;
2930 }
2931
2932 j = ARRAY_SIZE (cpu_arch);
2933 }
2934
91d6fa6a 2935 if (j >= ARRAY_SIZE (cpu_arch))
e413e4e9
AM
2936 as_bad (_("no such architecture: `%s'"), string);
2937
2938 *input_line_pointer = e;
2939 }
2940 else
2941 as_bad (_("missing cpu architecture"));
2942
fddf5b5b
AM
2943 no_cond_jump_promotion = 0;
2944 if (*input_line_pointer == ','
29b0f896 2945 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
fddf5b5b 2946 {
d02603dc
NC
2947 char *string;
2948 char e;
2949
2950 ++input_line_pointer;
2951 e = get_symbol_name (&string);
fddf5b5b
AM
2952
2953 if (strcmp (string, "nojumps") == 0)
2954 no_cond_jump_promotion = 1;
2955 else if (strcmp (string, "jumps") == 0)
2956 ;
2957 else
2958 as_bad (_("no such architecture modifier: `%s'"), string);
2959
d02603dc 2960 (void) restore_line_pointer (e);
fddf5b5b
AM
2961 }
2962
e413e4e9
AM
2963 demand_empty_rest_of_line ();
2964}
2965
8a9036a4
L
2966enum bfd_architecture
2967i386_arch (void)
2968{
3632d14b 2969 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4
L
2970 {
2971 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2972 || flag_code != CODE_64BIT)
2973 as_fatal (_("Intel L1OM is 64bit ELF only"));
2974 return bfd_arch_l1om;
2975 }
7a9068fe
L
2976 else if (cpu_arch_isa == PROCESSOR_K1OM)
2977 {
2978 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2979 || flag_code != CODE_64BIT)
2980 as_fatal (_("Intel K1OM is 64bit ELF only"));
2981 return bfd_arch_k1om;
2982 }
81486035
L
2983 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2984 {
2985 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2986 || flag_code == CODE_64BIT)
2987 as_fatal (_("Intel MCU is 32bit ELF only"));
2988 return bfd_arch_iamcu;
2989 }
8a9036a4
L
2990 else
2991 return bfd_arch_i386;
2992}
2993
b9d79e03 2994unsigned long
7016a5d5 2995i386_mach (void)
b9d79e03 2996{
351f65ca 2997 if (!strncmp (default_arch, "x86_64", 6))
8a9036a4 2998 {
3632d14b 2999 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4 3000 {
351f65ca
L
3001 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3002 || default_arch[6] != '\0')
8a9036a4
L
3003 as_fatal (_("Intel L1OM is 64bit ELF only"));
3004 return bfd_mach_l1om;
3005 }
7a9068fe
L
3006 else if (cpu_arch_isa == PROCESSOR_K1OM)
3007 {
3008 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3009 || default_arch[6] != '\0')
3010 as_fatal (_("Intel K1OM is 64bit ELF only"));
3011 return bfd_mach_k1om;
3012 }
351f65ca 3013 else if (default_arch[6] == '\0')
8a9036a4 3014 return bfd_mach_x86_64;
351f65ca
L
3015 else
3016 return bfd_mach_x64_32;
8a9036a4 3017 }
5197d474
L
3018 else if (!strcmp (default_arch, "i386")
3019 || !strcmp (default_arch, "iamcu"))
81486035
L
3020 {
3021 if (cpu_arch_isa == PROCESSOR_IAMCU)
3022 {
3023 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3024 as_fatal (_("Intel MCU is 32bit ELF only"));
3025 return bfd_mach_i386_iamcu;
3026 }
3027 else
3028 return bfd_mach_i386_i386;
3029 }
b9d79e03 3030 else
2b5d6a91 3031 as_fatal (_("unknown architecture"));
b9d79e03 3032}
b9d79e03 3033\f
252b5132 3034void
7016a5d5 3035md_begin (void)
252b5132
RH
3036{
3037 const char *hash_err;
3038
86fa6981
L
3039 /* Support pseudo prefixes like {disp32}. */
3040 lex_type ['{'] = LEX_BEGIN_NAME;
3041
47926f60 3042 /* Initialize op_hash hash table. */
252b5132
RH
3043 op_hash = hash_new ();
3044
3045 {
d3ce72d0 3046 const insn_template *optab;
29b0f896 3047 templates *core_optab;
252b5132 3048
47926f60
KH
3049 /* Setup for loop. */
3050 optab = i386_optab;
add39d23 3051 core_optab = XNEW (templates);
252b5132
RH
3052 core_optab->start = optab;
3053
3054 while (1)
3055 {
3056 ++optab;
3057 if (optab->name == NULL
3058 || strcmp (optab->name, (optab - 1)->name) != 0)
3059 {
3060 /* different name --> ship out current template list;
47926f60 3061 add to hash table; & begin anew. */
252b5132
RH
3062 core_optab->end = optab;
3063 hash_err = hash_insert (op_hash,
3064 (optab - 1)->name,
5a49b8ac 3065 (void *) core_optab);
252b5132
RH
3066 if (hash_err)
3067 {
b37df7c4 3068 as_fatal (_("can't hash %s: %s"),
252b5132
RH
3069 (optab - 1)->name,
3070 hash_err);
3071 }
3072 if (optab->name == NULL)
3073 break;
add39d23 3074 core_optab = XNEW (templates);
252b5132
RH
3075 core_optab->start = optab;
3076 }
3077 }
3078 }
3079
47926f60 3080 /* Initialize reg_hash hash table. */
252b5132
RH
3081 reg_hash = hash_new ();
3082 {
29b0f896 3083 const reg_entry *regtab;
c3fe08fa 3084 unsigned int regtab_size = i386_regtab_size;
252b5132 3085
c3fe08fa 3086 for (regtab = i386_regtab; regtab_size--; regtab++)
252b5132 3087 {
5a49b8ac 3088 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
252b5132 3089 if (hash_err)
b37df7c4 3090 as_fatal (_("can't hash %s: %s"),
3e73aa7c
JH
3091 regtab->reg_name,
3092 hash_err);
252b5132
RH
3093 }
3094 }
3095
47926f60 3096 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
252b5132 3097 {
29b0f896
AM
3098 int c;
3099 char *p;
252b5132
RH
3100
3101 for (c = 0; c < 256; c++)
3102 {
3882b010 3103 if (ISDIGIT (c))
252b5132
RH
3104 {
3105 digit_chars[c] = c;
3106 mnemonic_chars[c] = c;
3107 register_chars[c] = c;
3108 operand_chars[c] = c;
3109 }
3882b010 3110 else if (ISLOWER (c))
252b5132
RH
3111 {
3112 mnemonic_chars[c] = c;
3113 register_chars[c] = c;
3114 operand_chars[c] = c;
3115 }
3882b010 3116 else if (ISUPPER (c))
252b5132 3117 {
3882b010 3118 mnemonic_chars[c] = TOLOWER (c);
252b5132
RH
3119 register_chars[c] = mnemonic_chars[c];
3120 operand_chars[c] = c;
3121 }
43234a1e 3122 else if (c == '{' || c == '}')
86fa6981
L
3123 {
3124 mnemonic_chars[c] = c;
3125 operand_chars[c] = c;
3126 }
252b5132 3127
3882b010 3128 if (ISALPHA (c) || ISDIGIT (c))
252b5132
RH
3129 identifier_chars[c] = c;
3130 else if (c >= 128)
3131 {
3132 identifier_chars[c] = c;
3133 operand_chars[c] = c;
3134 }
3135 }
3136
3137#ifdef LEX_AT
3138 identifier_chars['@'] = '@';
32137342
NC
3139#endif
3140#ifdef LEX_QM
3141 identifier_chars['?'] = '?';
3142 operand_chars['?'] = '?';
252b5132 3143#endif
252b5132 3144 digit_chars['-'] = '-';
c0f3af97 3145 mnemonic_chars['_'] = '_';
791fe849 3146 mnemonic_chars['-'] = '-';
0003779b 3147 mnemonic_chars['.'] = '.';
252b5132
RH
3148 identifier_chars['_'] = '_';
3149 identifier_chars['.'] = '.';
3150
3151 for (p = operand_special_chars; *p != '\0'; p++)
3152 operand_chars[(unsigned char) *p] = *p;
3153 }
3154
a4447b93
RH
3155 if (flag_code == CODE_64BIT)
3156 {
ca19b261
KT
3157#if defined (OBJ_COFF) && defined (TE_PE)
3158 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3159 ? 32 : 16);
3160#else
a4447b93 3161 x86_dwarf2_return_column = 16;
ca19b261 3162#endif
61ff971f 3163 x86_cie_data_alignment = -8;
a4447b93
RH
3164 }
3165 else
3166 {
3167 x86_dwarf2_return_column = 8;
3168 x86_cie_data_alignment = -4;
3169 }
e379e5f3
L
3170
3171 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3172 can be turned into BRANCH_PREFIX frag. */
3173 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3174 abort ();
252b5132
RH
3175}
3176
3177void
e3bb37b5 3178i386_print_statistics (FILE *file)
252b5132
RH
3179{
3180 hash_print_statistics (file, "i386 opcode", op_hash);
3181 hash_print_statistics (file, "i386 register", reg_hash);
3182}
3183\f
252b5132
RH
3184#ifdef DEBUG386
3185
ce8a8b2f 3186/* Debugging routines for md_assemble. */
d3ce72d0 3187static void pte (insn_template *);
40fb9820 3188static void pt (i386_operand_type);
e3bb37b5
L
3189static void pe (expressionS *);
3190static void ps (symbolS *);
252b5132
RH
3191
3192static void
2c703856 3193pi (const char *line, i386_insn *x)
252b5132 3194{
09137c09 3195 unsigned int j;
252b5132
RH
3196
3197 fprintf (stdout, "%s: template ", line);
3198 pte (&x->tm);
09f131f2
JH
3199 fprintf (stdout, " address: base %s index %s scale %x\n",
3200 x->base_reg ? x->base_reg->reg_name : "none",
3201 x->index_reg ? x->index_reg->reg_name : "none",
3202 x->log2_scale_factor);
3203 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
252b5132 3204 x->rm.mode, x->rm.reg, x->rm.regmem);
09f131f2
JH
3205 fprintf (stdout, " sib: base %x index %x scale %x\n",
3206 x->sib.base, x->sib.index, x->sib.scale);
3207 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
161a04f6
L
3208 (x->rex & REX_W) != 0,
3209 (x->rex & REX_R) != 0,
3210 (x->rex & REX_X) != 0,
3211 (x->rex & REX_B) != 0);
09137c09 3212 for (j = 0; j < x->operands; j++)
252b5132 3213 {
09137c09
SP
3214 fprintf (stdout, " #%d: ", j + 1);
3215 pt (x->types[j]);
252b5132 3216 fprintf (stdout, "\n");
bab6aec1 3217 if (x->types[j].bitfield.class == Reg
3528c362
JB
3218 || x->types[j].bitfield.class == RegMMX
3219 || x->types[j].bitfield.class == RegSIMD
dd6b8a0b 3220 || x->types[j].bitfield.class == RegMask
00cee14f 3221 || x->types[j].bitfield.class == SReg
4a5c67ed
JB
3222 || x->types[j].bitfield.class == RegCR
3223 || x->types[j].bitfield.class == RegDR
dd6b8a0b
JB
3224 || x->types[j].bitfield.class == RegTR
3225 || x->types[j].bitfield.class == RegBND)
09137c09
SP
3226 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3227 if (operand_type_check (x->types[j], imm))
3228 pe (x->op[j].imms);
3229 if (operand_type_check (x->types[j], disp))
3230 pe (x->op[j].disps);
252b5132
RH
3231 }
3232}
3233
3234static void
d3ce72d0 3235pte (insn_template *t)
252b5132 3236{
09137c09 3237 unsigned int j;
252b5132 3238 fprintf (stdout, " %d operands ", t->operands);
47926f60 3239 fprintf (stdout, "opcode %x ", t->base_opcode);
252b5132
RH
3240 if (t->extension_opcode != None)
3241 fprintf (stdout, "ext %x ", t->extension_opcode);
40fb9820 3242 if (t->opcode_modifier.d)
252b5132 3243 fprintf (stdout, "D");
40fb9820 3244 if (t->opcode_modifier.w)
252b5132
RH
3245 fprintf (stdout, "W");
3246 fprintf (stdout, "\n");
09137c09 3247 for (j = 0; j < t->operands; j++)
252b5132 3248 {
09137c09
SP
3249 fprintf (stdout, " #%d type ", j + 1);
3250 pt (t->operand_types[j]);
252b5132
RH
3251 fprintf (stdout, "\n");
3252 }
3253}
3254
3255static void
e3bb37b5 3256pe (expressionS *e)
252b5132 3257{
24eab124 3258 fprintf (stdout, " operation %d\n", e->X_op);
b77ad1d4
AM
3259 fprintf (stdout, " add_number %ld (%lx)\n",
3260 (long) e->X_add_number, (long) e->X_add_number);
252b5132
RH
3261 if (e->X_add_symbol)
3262 {
3263 fprintf (stdout, " add_symbol ");
3264 ps (e->X_add_symbol);
3265 fprintf (stdout, "\n");
3266 }
3267 if (e->X_op_symbol)
3268 {
3269 fprintf (stdout, " op_symbol ");
3270 ps (e->X_op_symbol);
3271 fprintf (stdout, "\n");
3272 }
3273}
3274
3275static void
e3bb37b5 3276ps (symbolS *s)
252b5132
RH
3277{
3278 fprintf (stdout, "%s type %s%s",
3279 S_GET_NAME (s),
3280 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3281 segment_name (S_GET_SEGMENT (s)));
3282}
3283
7b81dfbb 3284static struct type_name
252b5132 3285 {
40fb9820
L
3286 i386_operand_type mask;
3287 const char *name;
252b5132 3288 }
7b81dfbb 3289const type_names[] =
252b5132 3290{
40fb9820
L
3291 { OPERAND_TYPE_REG8, "r8" },
3292 { OPERAND_TYPE_REG16, "r16" },
3293 { OPERAND_TYPE_REG32, "r32" },
3294 { OPERAND_TYPE_REG64, "r64" },
2c703856
JB
3295 { OPERAND_TYPE_ACC8, "acc8" },
3296 { OPERAND_TYPE_ACC16, "acc16" },
3297 { OPERAND_TYPE_ACC32, "acc32" },
3298 { OPERAND_TYPE_ACC64, "acc64" },
40fb9820
L
3299 { OPERAND_TYPE_IMM8, "i8" },
3300 { OPERAND_TYPE_IMM8, "i8s" },
3301 { OPERAND_TYPE_IMM16, "i16" },
3302 { OPERAND_TYPE_IMM32, "i32" },
3303 { OPERAND_TYPE_IMM32S, "i32s" },
3304 { OPERAND_TYPE_IMM64, "i64" },
3305 { OPERAND_TYPE_IMM1, "i1" },
3306 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3307 { OPERAND_TYPE_DISP8, "d8" },
3308 { OPERAND_TYPE_DISP16, "d16" },
3309 { OPERAND_TYPE_DISP32, "d32" },
3310 { OPERAND_TYPE_DISP32S, "d32s" },
3311 { OPERAND_TYPE_DISP64, "d64" },
3312 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3313 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3314 { OPERAND_TYPE_CONTROL, "control reg" },
3315 { OPERAND_TYPE_TEST, "test reg" },
3316 { OPERAND_TYPE_DEBUG, "debug reg" },
3317 { OPERAND_TYPE_FLOATREG, "FReg" },
3318 { OPERAND_TYPE_FLOATACC, "FAcc" },
21df382b 3319 { OPERAND_TYPE_SREG, "SReg" },
40fb9820
L
3320 { OPERAND_TYPE_REGMMX, "rMMX" },
3321 { OPERAND_TYPE_REGXMM, "rXMM" },
0349dc08 3322 { OPERAND_TYPE_REGYMM, "rYMM" },
43234a1e 3323 { OPERAND_TYPE_REGZMM, "rZMM" },
260cd341 3324 { OPERAND_TYPE_REGTMM, "rTMM" },
43234a1e 3325 { OPERAND_TYPE_REGMASK, "Mask reg" },
252b5132
RH
3326};
3327
3328static void
40fb9820 3329pt (i386_operand_type t)
252b5132 3330{
40fb9820 3331 unsigned int j;
c6fb90c8 3332 i386_operand_type a;
252b5132 3333
40fb9820 3334 for (j = 0; j < ARRAY_SIZE (type_names); j++)
c6fb90c8
L
3335 {
3336 a = operand_type_and (t, type_names[j].mask);
2c703856 3337 if (operand_type_equal (&a, &type_names[j].mask))
c6fb90c8
L
3338 fprintf (stdout, "%s, ", type_names[j].name);
3339 }
252b5132
RH
3340 fflush (stdout);
3341}
3342
3343#endif /* DEBUG386 */
3344\f
252b5132 3345static bfd_reloc_code_real_type
3956db08 3346reloc (unsigned int size,
64e74474
AM
3347 int pcrel,
3348 int sign,
3349 bfd_reloc_code_real_type other)
252b5132 3350{
47926f60 3351 if (other != NO_RELOC)
3956db08 3352 {
91d6fa6a 3353 reloc_howto_type *rel;
3956db08
JB
3354
3355 if (size == 8)
3356 switch (other)
3357 {
64e74474
AM
3358 case BFD_RELOC_X86_64_GOT32:
3359 return BFD_RELOC_X86_64_GOT64;
3360 break;
553d1284
L
3361 case BFD_RELOC_X86_64_GOTPLT64:
3362 return BFD_RELOC_X86_64_GOTPLT64;
3363 break;
64e74474
AM
3364 case BFD_RELOC_X86_64_PLTOFF64:
3365 return BFD_RELOC_X86_64_PLTOFF64;
3366 break;
3367 case BFD_RELOC_X86_64_GOTPC32:
3368 other = BFD_RELOC_X86_64_GOTPC64;
3369 break;
3370 case BFD_RELOC_X86_64_GOTPCREL:
3371 other = BFD_RELOC_X86_64_GOTPCREL64;
3372 break;
3373 case BFD_RELOC_X86_64_TPOFF32:
3374 other = BFD_RELOC_X86_64_TPOFF64;
3375 break;
3376 case BFD_RELOC_X86_64_DTPOFF32:
3377 other = BFD_RELOC_X86_64_DTPOFF64;
3378 break;
3379 default:
3380 break;
3956db08 3381 }
e05278af 3382
8ce3d284 3383#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
3384 if (other == BFD_RELOC_SIZE32)
3385 {
3386 if (size == 8)
1ab668bf 3387 other = BFD_RELOC_SIZE64;
8fd4256d 3388 if (pcrel)
1ab668bf
AM
3389 {
3390 as_bad (_("there are no pc-relative size relocations"));
3391 return NO_RELOC;
3392 }
8fd4256d 3393 }
8ce3d284 3394#endif
8fd4256d 3395
e05278af 3396 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
f2d8a97c 3397 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
e05278af
JB
3398 sign = -1;
3399
91d6fa6a
NC
3400 rel = bfd_reloc_type_lookup (stdoutput, other);
3401 if (!rel)
3956db08 3402 as_bad (_("unknown relocation (%u)"), other);
91d6fa6a 3403 else if (size != bfd_get_reloc_size (rel))
3956db08 3404 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
91d6fa6a 3405 bfd_get_reloc_size (rel),
3956db08 3406 size);
91d6fa6a 3407 else if (pcrel && !rel->pc_relative)
3956db08 3408 as_bad (_("non-pc-relative relocation for pc-relative field"));
91d6fa6a 3409 else if ((rel->complain_on_overflow == complain_overflow_signed
3956db08 3410 && !sign)
91d6fa6a 3411 || (rel->complain_on_overflow == complain_overflow_unsigned
64e74474 3412 && sign > 0))
3956db08
JB
3413 as_bad (_("relocated field and relocation type differ in signedness"));
3414 else
3415 return other;
3416 return NO_RELOC;
3417 }
252b5132
RH
3418
3419 if (pcrel)
3420 {
3e73aa7c 3421 if (!sign)
3956db08 3422 as_bad (_("there are no unsigned pc-relative relocations"));
252b5132
RH
3423 switch (size)
3424 {
3425 case 1: return BFD_RELOC_8_PCREL;
3426 case 2: return BFD_RELOC_16_PCREL;
d258b828 3427 case 4: return BFD_RELOC_32_PCREL;
d6ab8113 3428 case 8: return BFD_RELOC_64_PCREL;
252b5132 3429 }
3956db08 3430 as_bad (_("cannot do %u byte pc-relative relocation"), size);
252b5132
RH
3431 }
3432 else
3433 {
3956db08 3434 if (sign > 0)
e5cb08ac 3435 switch (size)
3e73aa7c
JH
3436 {
3437 case 4: return BFD_RELOC_X86_64_32S;
3438 }
3439 else
3440 switch (size)
3441 {
3442 case 1: return BFD_RELOC_8;
3443 case 2: return BFD_RELOC_16;
3444 case 4: return BFD_RELOC_32;
3445 case 8: return BFD_RELOC_64;
3446 }
3956db08
JB
3447 as_bad (_("cannot do %s %u byte relocation"),
3448 sign > 0 ? "signed" : "unsigned", size);
252b5132
RH
3449 }
3450
0cc9e1d3 3451 return NO_RELOC;
252b5132
RH
3452}
3453
47926f60
KH
3454/* Here we decide which fixups can be adjusted to make them relative to
3455 the beginning of the section instead of the symbol. Basically we need
3456 to make sure that the dynamic relocations are done correctly, so in
3457 some cases we force the original symbol to be used. */
3458
252b5132 3459int
e3bb37b5 3460tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
252b5132 3461{
6d249963 3462#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 3463 if (!IS_ELF)
31312f95
AM
3464 return 1;
3465
a161fe53
AM
3466 /* Don't adjust pc-relative references to merge sections in 64-bit
3467 mode. */
3468 if (use_rela_relocations
3469 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3470 && fixP->fx_pcrel)
252b5132 3471 return 0;
31312f95 3472
8d01d9a9
AJ
3473 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3474 and changed later by validate_fix. */
3475 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3476 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3477 return 0;
3478
8fd4256d
L
3479 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3480 for size relocations. */
3481 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3482 || fixP->fx_r_type == BFD_RELOC_SIZE64
3483 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
252b5132 3484 || fixP->fx_r_type == BFD_RELOC_386_GOT32
02a86693 3485 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
13ae64f3
JJ
3486 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3487 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3488 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3489 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
37e55690
JJ
3490 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3491 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
13ae64f3
JJ
3492 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3493 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
67a4f2b7
AO
3494 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3495 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3e73aa7c 3496 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
80b3ee89 3497 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
56ceb5b5
L
3498 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3499 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
bffbf940
JJ
3500 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3501 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3502 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
d6ab8113 3503 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
bffbf940
JJ
3504 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3505 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
d6ab8113
JB
3506 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3507 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
67a4f2b7
AO
3508 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3509 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
252b5132
RH
3510 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3511 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3512 return 0;
31312f95 3513#endif
252b5132
RH
3514 return 1;
3515}
252b5132 3516
b4cac588 3517static int
e3bb37b5 3518intel_float_operand (const char *mnemonic)
252b5132 3519{
9306ca4a
JB
3520 /* Note that the value returned is meaningful only for opcodes with (memory)
3521 operands, hence the code here is free to improperly handle opcodes that
3522 have no operands (for better performance and smaller code). */
3523
3524 if (mnemonic[0] != 'f')
3525 return 0; /* non-math */
3526
3527 switch (mnemonic[1])
3528 {
3529 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3530 the fs segment override prefix not currently handled because no
3531 call path can make opcodes without operands get here */
3532 case 'i':
3533 return 2 /* integer op */;
3534 case 'l':
3535 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3536 return 3; /* fldcw/fldenv */
3537 break;
3538 case 'n':
3539 if (mnemonic[2] != 'o' /* fnop */)
3540 return 3; /* non-waiting control op */
3541 break;
3542 case 'r':
3543 if (mnemonic[2] == 's')
3544 return 3; /* frstor/frstpm */
3545 break;
3546 case 's':
3547 if (mnemonic[2] == 'a')
3548 return 3; /* fsave */
3549 if (mnemonic[2] == 't')
3550 {
3551 switch (mnemonic[3])
3552 {
3553 case 'c': /* fstcw */
3554 case 'd': /* fstdw */
3555 case 'e': /* fstenv */
3556 case 's': /* fsts[gw] */
3557 return 3;
3558 }
3559 }
3560 break;
3561 case 'x':
3562 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3563 return 0; /* fxsave/fxrstor are not really math ops */
3564 break;
3565 }
252b5132 3566
9306ca4a 3567 return 1;
252b5132
RH
3568}
3569
c0f3af97
L
3570/* Build the VEX prefix. */
3571
3572static void
d3ce72d0 3573build_vex_prefix (const insn_template *t)
c0f3af97
L
3574{
3575 unsigned int register_specifier;
3576 unsigned int implied_prefix;
3577 unsigned int vector_length;
03751133 3578 unsigned int w;
c0f3af97
L
3579
3580 /* Check register specifier. */
3581 if (i.vex.register_specifier)
43234a1e
L
3582 {
3583 register_specifier =
3584 ~register_number (i.vex.register_specifier) & 0xf;
3585 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3586 }
c0f3af97
L
3587 else
3588 register_specifier = 0xf;
3589
79f0fa25
L
3590 /* Use 2-byte VEX prefix by swapping destination and source operand
3591 if there are more than 1 register operand. */
3592 if (i.reg_operands > 1
3593 && i.vec_encoding != vex_encoding_vex3
86fa6981 3594 && i.dir_encoding == dir_encoding_default
fa99fab2 3595 && i.operands == i.reg_operands
dbbc8b7e 3596 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
7f399153 3597 && i.tm.opcode_modifier.vexopcode == VEX0F
dbbc8b7e 3598 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
fa99fab2
L
3599 && i.rex == REX_B)
3600 {
3601 unsigned int xchg = i.operands - 1;
3602 union i386_op temp_op;
3603 i386_operand_type temp_type;
3604
3605 temp_type = i.types[xchg];
3606 i.types[xchg] = i.types[0];
3607 i.types[0] = temp_type;
3608 temp_op = i.op[xchg];
3609 i.op[xchg] = i.op[0];
3610 i.op[0] = temp_op;
3611
9c2799c2 3612 gas_assert (i.rm.mode == 3);
fa99fab2
L
3613
3614 i.rex = REX_R;
3615 xchg = i.rm.regmem;
3616 i.rm.regmem = i.rm.reg;
3617 i.rm.reg = xchg;
3618
dbbc8b7e
JB
3619 if (i.tm.opcode_modifier.d)
3620 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3621 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3622 else /* Use the next insn. */
3623 i.tm = t[1];
fa99fab2
L
3624 }
3625
79dec6b7
JB
3626 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3627 are no memory operands and at least 3 register ones. */
3628 if (i.reg_operands >= 3
3629 && i.vec_encoding != vex_encoding_vex3
3630 && i.reg_operands == i.operands - i.imm_operands
3631 && i.tm.opcode_modifier.vex
3632 && i.tm.opcode_modifier.commutative
3633 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3634 && i.rex == REX_B
3635 && i.vex.register_specifier
3636 && !(i.vex.register_specifier->reg_flags & RegRex))
3637 {
3638 unsigned int xchg = i.operands - i.reg_operands;
3639 union i386_op temp_op;
3640 i386_operand_type temp_type;
3641
3642 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3643 gas_assert (!i.tm.opcode_modifier.sae);
3644 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3645 &i.types[i.operands - 3]));
3646 gas_assert (i.rm.mode == 3);
3647
3648 temp_type = i.types[xchg];
3649 i.types[xchg] = i.types[xchg + 1];
3650 i.types[xchg + 1] = temp_type;
3651 temp_op = i.op[xchg];
3652 i.op[xchg] = i.op[xchg + 1];
3653 i.op[xchg + 1] = temp_op;
3654
3655 i.rex = 0;
3656 xchg = i.rm.regmem | 8;
3657 i.rm.regmem = ~register_specifier & 0xf;
3658 gas_assert (!(i.rm.regmem & 8));
3659 i.vex.register_specifier += xchg - i.rm.regmem;
3660 register_specifier = ~xchg & 0xf;
3661 }
3662
539f890d
L
3663 if (i.tm.opcode_modifier.vex == VEXScalar)
3664 vector_length = avxscalar;
10c17abd
JB
3665 else if (i.tm.opcode_modifier.vex == VEX256)
3666 vector_length = 1;
539f890d 3667 else
10c17abd 3668 {
56522fc5 3669 unsigned int op;
10c17abd 3670
c7213af9
L
3671 /* Determine vector length from the last multi-length vector
3672 operand. */
10c17abd 3673 vector_length = 0;
56522fc5 3674 for (op = t->operands; op--;)
10c17abd
JB
3675 if (t->operand_types[op].bitfield.xmmword
3676 && t->operand_types[op].bitfield.ymmword
3677 && i.types[op].bitfield.ymmword)
3678 {
3679 vector_length = 1;
3680 break;
3681 }
3682 }
c0f3af97 3683
8c190ce0 3684 switch ((i.tm.base_opcode >> (i.tm.opcode_length << 3)) & 0xff)
c0f3af97
L
3685 {
3686 case 0:
3687 implied_prefix = 0;
3688 break;
3689 case DATA_PREFIX_OPCODE:
3690 implied_prefix = 1;
3691 break;
3692 case REPE_PREFIX_OPCODE:
3693 implied_prefix = 2;
3694 break;
3695 case REPNE_PREFIX_OPCODE:
3696 implied_prefix = 3;
3697 break;
3698 default:
3699 abort ();
3700 }
3701
03751133
L
3702 /* Check the REX.W bit and VEXW. */
3703 if (i.tm.opcode_modifier.vexw == VEXWIG)
3704 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3705 else if (i.tm.opcode_modifier.vexw)
3706 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3707 else
931d03b7 3708 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
03751133 3709
c0f3af97 3710 /* Use 2-byte VEX prefix if possible. */
03751133
L
3711 if (w == 0
3712 && i.vec_encoding != vex_encoding_vex3
86fa6981 3713 && i.tm.opcode_modifier.vexopcode == VEX0F
c0f3af97
L
3714 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3715 {
3716 /* 2-byte VEX prefix. */
3717 unsigned int r;
3718
3719 i.vex.length = 2;
3720 i.vex.bytes[0] = 0xc5;
3721
3722 /* Check the REX.R bit. */
3723 r = (i.rex & REX_R) ? 0 : 1;
3724 i.vex.bytes[1] = (r << 7
3725 | register_specifier << 3
3726 | vector_length << 2
3727 | implied_prefix);
3728 }
3729 else
3730 {
3731 /* 3-byte VEX prefix. */
03751133 3732 unsigned int m;
c0f3af97 3733
f88c9eb0 3734 i.vex.length = 3;
f88c9eb0 3735
7f399153 3736 switch (i.tm.opcode_modifier.vexopcode)
5dd85c99 3737 {
7f399153
L
3738 case VEX0F:
3739 m = 0x1;
80de6e00 3740 i.vex.bytes[0] = 0xc4;
7f399153
L
3741 break;
3742 case VEX0F38:
3743 m = 0x2;
80de6e00 3744 i.vex.bytes[0] = 0xc4;
7f399153
L
3745 break;
3746 case VEX0F3A:
3747 m = 0x3;
80de6e00 3748 i.vex.bytes[0] = 0xc4;
7f399153
L
3749 break;
3750 case XOP08:
5dd85c99
SP
3751 m = 0x8;
3752 i.vex.bytes[0] = 0x8f;
7f399153
L
3753 break;
3754 case XOP09:
f88c9eb0
SP
3755 m = 0x9;
3756 i.vex.bytes[0] = 0x8f;
7f399153
L
3757 break;
3758 case XOP0A:
f88c9eb0
SP
3759 m = 0xa;
3760 i.vex.bytes[0] = 0x8f;
7f399153
L
3761 break;
3762 default:
3763 abort ();
f88c9eb0 3764 }
c0f3af97 3765
c0f3af97
L
3766 /* The high 3 bits of the second VEX byte are 1's compliment
3767 of RXB bits from REX. */
3768 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3769
c0f3af97
L
3770 i.vex.bytes[2] = (w << 7
3771 | register_specifier << 3
3772 | vector_length << 2
3773 | implied_prefix);
3774 }
3775}
3776
e771e7c9
JB
3777static INLINE bfd_boolean
3778is_evex_encoding (const insn_template *t)
3779{
7091c612 3780 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
e771e7c9 3781 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
a80195f1 3782 || t->opcode_modifier.sae;
e771e7c9
JB
3783}
3784
7a8655d2
JB
3785static INLINE bfd_boolean
3786is_any_vex_encoding (const insn_template *t)
3787{
3788 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3789 || is_evex_encoding (t);
3790}
3791
43234a1e
L
3792/* Build the EVEX prefix. */
3793
3794static void
3795build_evex_prefix (void)
3796{
3797 unsigned int register_specifier;
3798 unsigned int implied_prefix;
3799 unsigned int m, w;
3800 rex_byte vrex_used = 0;
3801
3802 /* Check register specifier. */
3803 if (i.vex.register_specifier)
3804 {
3805 gas_assert ((i.vrex & REX_X) == 0);
3806
3807 register_specifier = i.vex.register_specifier->reg_num;
3808 if ((i.vex.register_specifier->reg_flags & RegRex))
3809 register_specifier += 8;
3810 /* The upper 16 registers are encoded in the fourth byte of the
3811 EVEX prefix. */
3812 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3813 i.vex.bytes[3] = 0x8;
3814 register_specifier = ~register_specifier & 0xf;
3815 }
3816 else
3817 {
3818 register_specifier = 0xf;
3819
3820 /* Encode upper 16 vector index register in the fourth byte of
3821 the EVEX prefix. */
3822 if (!(i.vrex & REX_X))
3823 i.vex.bytes[3] = 0x8;
3824 else
3825 vrex_used |= REX_X;
3826 }
3827
3828 switch ((i.tm.base_opcode >> 8) & 0xff)
3829 {
3830 case 0:
3831 implied_prefix = 0;
3832 break;
3833 case DATA_PREFIX_OPCODE:
3834 implied_prefix = 1;
3835 break;
3836 case REPE_PREFIX_OPCODE:
3837 implied_prefix = 2;
3838 break;
3839 case REPNE_PREFIX_OPCODE:
3840 implied_prefix = 3;
3841 break;
3842 default:
3843 abort ();
3844 }
3845
3846 /* 4 byte EVEX prefix. */
3847 i.vex.length = 4;
3848 i.vex.bytes[0] = 0x62;
3849
3850 /* mmmm bits. */
3851 switch (i.tm.opcode_modifier.vexopcode)
3852 {
3853 case VEX0F:
3854 m = 1;
3855 break;
3856 case VEX0F38:
3857 m = 2;
3858 break;
3859 case VEX0F3A:
3860 m = 3;
3861 break;
3862 default:
3863 abort ();
3864 break;
3865 }
3866
3867 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3868 bits from REX. */
3869 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3870
3871 /* The fifth bit of the second EVEX byte is 1's compliment of the
3872 REX_R bit in VREX. */
3873 if (!(i.vrex & REX_R))
3874 i.vex.bytes[1] |= 0x10;
3875 else
3876 vrex_used |= REX_R;
3877
3878 if ((i.reg_operands + i.imm_operands) == i.operands)
3879 {
3880 /* When all operands are registers, the REX_X bit in REX is not
3881 used. We reuse it to encode the upper 16 registers, which is
3882 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3883 as 1's compliment. */
3884 if ((i.vrex & REX_B))
3885 {
3886 vrex_used |= REX_B;
3887 i.vex.bytes[1] &= ~0x40;
3888 }
3889 }
3890
3891 /* EVEX instructions shouldn't need the REX prefix. */
3892 i.vrex &= ~vrex_used;
3893 gas_assert (i.vrex == 0);
3894
6865c043
L
3895 /* Check the REX.W bit and VEXW. */
3896 if (i.tm.opcode_modifier.vexw == VEXWIG)
3897 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3898 else if (i.tm.opcode_modifier.vexw)
3899 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3900 else
931d03b7 3901 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
43234a1e
L
3902
3903 /* Encode the U bit. */
3904 implied_prefix |= 0x4;
3905
3906 /* The third byte of the EVEX prefix. */
3907 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3908
3909 /* The fourth byte of the EVEX prefix. */
3910 /* The zeroing-masking bit. */
3911 if (i.mask && i.mask->zeroing)
3912 i.vex.bytes[3] |= 0x80;
3913
3914 /* Don't always set the broadcast bit if there is no RC. */
3915 if (!i.rounding)
3916 {
3917 /* Encode the vector length. */
3918 unsigned int vec_length;
3919
e771e7c9
JB
3920 if (!i.tm.opcode_modifier.evex
3921 || i.tm.opcode_modifier.evex == EVEXDYN)
3922 {
56522fc5 3923 unsigned int op;
e771e7c9 3924
c7213af9
L
3925 /* Determine vector length from the last multi-length vector
3926 operand. */
56522fc5 3927 for (op = i.operands; op--;)
e771e7c9
JB
3928 if (i.tm.operand_types[op].bitfield.xmmword
3929 + i.tm.operand_types[op].bitfield.ymmword
3930 + i.tm.operand_types[op].bitfield.zmmword > 1)
3931 {
3932 if (i.types[op].bitfield.zmmword)
c7213af9
L
3933 {
3934 i.tm.opcode_modifier.evex = EVEX512;
3935 break;
3936 }
e771e7c9 3937 else if (i.types[op].bitfield.ymmword)
c7213af9
L
3938 {
3939 i.tm.opcode_modifier.evex = EVEX256;
3940 break;
3941 }
e771e7c9 3942 else if (i.types[op].bitfield.xmmword)
c7213af9
L
3943 {
3944 i.tm.opcode_modifier.evex = EVEX128;
3945 break;
3946 }
625cbd7a
JB
3947 else if (i.broadcast && (int) op == i.broadcast->operand)
3948 {
4a1b91ea 3949 switch (i.broadcast->bytes)
625cbd7a
JB
3950 {
3951 case 64:
3952 i.tm.opcode_modifier.evex = EVEX512;
3953 break;
3954 case 32:
3955 i.tm.opcode_modifier.evex = EVEX256;
3956 break;
3957 case 16:
3958 i.tm.opcode_modifier.evex = EVEX128;
3959 break;
3960 default:
c7213af9 3961 abort ();
625cbd7a 3962 }
c7213af9 3963 break;
625cbd7a 3964 }
e771e7c9 3965 }
c7213af9 3966
56522fc5 3967 if (op >= MAX_OPERANDS)
c7213af9 3968 abort ();
e771e7c9
JB
3969 }
3970
43234a1e
L
3971 switch (i.tm.opcode_modifier.evex)
3972 {
3973 case EVEXLIG: /* LL' is ignored */
3974 vec_length = evexlig << 5;
3975 break;
3976 case EVEX128:
3977 vec_length = 0 << 5;
3978 break;
3979 case EVEX256:
3980 vec_length = 1 << 5;
3981 break;
3982 case EVEX512:
3983 vec_length = 2 << 5;
3984 break;
3985 default:
3986 abort ();
3987 break;
3988 }
3989 i.vex.bytes[3] |= vec_length;
3990 /* Encode the broadcast bit. */
3991 if (i.broadcast)
3992 i.vex.bytes[3] |= 0x10;
3993 }
3994 else
3995 {
3996 if (i.rounding->type != saeonly)
3997 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3998 else
d3d3c6db 3999 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
43234a1e
L
4000 }
4001
4002 if (i.mask && i.mask->mask)
4003 i.vex.bytes[3] |= i.mask->mask->reg_num;
4004}
4005
65da13b5
L
4006static void
4007process_immext (void)
4008{
4009 expressionS *exp;
4010
c0f3af97 4011 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
65da13b5
L
4012 which is coded in the same place as an 8-bit immediate field
4013 would be. Here we fake an 8-bit immediate operand from the
4014 opcode suffix stored in tm.extension_opcode.
4015
c1e679ec 4016 AVX instructions also use this encoding, for some of
c0f3af97 4017 3 argument instructions. */
65da13b5 4018
43234a1e 4019 gas_assert (i.imm_operands <= 1
7ab9ffdd 4020 && (i.operands <= 2
7a8655d2 4021 || (is_any_vex_encoding (&i.tm)
7ab9ffdd 4022 && i.operands <= 4)));
65da13b5
L
4023
4024 exp = &im_expressions[i.imm_operands++];
4025 i.op[i.operands].imms = exp;
4026 i.types[i.operands] = imm8;
4027 i.operands++;
4028 exp->X_op = O_constant;
4029 exp->X_add_number = i.tm.extension_opcode;
4030 i.tm.extension_opcode = None;
4031}
4032
42164a71
L
4033
4034static int
4035check_hle (void)
4036{
4037 switch (i.tm.opcode_modifier.hleprefixok)
4038 {
4039 default:
4040 abort ();
82c2def5 4041 case HLEPrefixNone:
165de32a
L
4042 as_bad (_("invalid instruction `%s' after `%s'"),
4043 i.tm.name, i.hle_prefix);
42164a71 4044 return 0;
82c2def5 4045 case HLEPrefixLock:
42164a71
L
4046 if (i.prefix[LOCK_PREFIX])
4047 return 1;
165de32a 4048 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
42164a71 4049 return 0;
82c2def5 4050 case HLEPrefixAny:
42164a71 4051 return 1;
82c2def5 4052 case HLEPrefixRelease:
42164a71
L
4053 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4054 {
4055 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4056 i.tm.name);
4057 return 0;
4058 }
8dc0818e 4059 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
42164a71
L
4060 {
4061 as_bad (_("memory destination needed for instruction `%s'"
4062 " after `xrelease'"), i.tm.name);
4063 return 0;
4064 }
4065 return 1;
4066 }
4067}
4068
b6f8c7c4
L
4069/* Try the shortest encoding by shortening operand size. */
4070
4071static void
4072optimize_encoding (void)
4073{
a0a1771e 4074 unsigned int j;
b6f8c7c4
L
4075
4076 if (optimize_for_space
72aea328 4077 && !is_any_vex_encoding (&i.tm)
b6f8c7c4
L
4078 && i.reg_operands == 1
4079 && i.imm_operands == 1
4080 && !i.types[1].bitfield.byte
4081 && i.op[0].imms->X_op == O_constant
4082 && fits_in_imm7 (i.op[0].imms->X_add_number)
72aea328 4083 && (i.tm.base_opcode == 0xa8
b6f8c7c4
L
4084 || (i.tm.base_opcode == 0xf6
4085 && i.tm.extension_opcode == 0x0)))
4086 {
4087 /* Optimize: -Os:
4088 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4089 */
4090 unsigned int base_regnum = i.op[1].regs->reg_num;
4091 if (flag_code == CODE_64BIT || base_regnum < 4)
4092 {
4093 i.types[1].bitfield.byte = 1;
4094 /* Ignore the suffix. */
4095 i.suffix = 0;
7697afb6
JB
4096 /* Convert to byte registers. */
4097 if (i.types[1].bitfield.word)
4098 j = 16;
4099 else if (i.types[1].bitfield.dword)
4100 j = 32;
4101 else
4102 j = 48;
4103 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4104 j += 8;
4105 i.op[1].regs -= j;
b6f8c7c4
L
4106 }
4107 }
4108 else if (flag_code == CODE_64BIT
72aea328 4109 && !is_any_vex_encoding (&i.tm)
d3d50934
L
4110 && ((i.types[1].bitfield.qword
4111 && i.reg_operands == 1
b6f8c7c4
L
4112 && i.imm_operands == 1
4113 && i.op[0].imms->X_op == O_constant
507916b8 4114 && ((i.tm.base_opcode == 0xb8
b6f8c7c4
L
4115 && i.tm.extension_opcode == None
4116 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4117 || (fits_in_imm31 (i.op[0].imms->X_add_number)
72aea328
JB
4118 && ((i.tm.base_opcode == 0x24
4119 || i.tm.base_opcode == 0xa8)
b6f8c7c4
L
4120 || (i.tm.base_opcode == 0x80
4121 && i.tm.extension_opcode == 0x4)
4122 || ((i.tm.base_opcode == 0xf6
507916b8 4123 || (i.tm.base_opcode | 1) == 0xc7)
b8364fa7
JB
4124 && i.tm.extension_opcode == 0x0)))
4125 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4126 && i.tm.base_opcode == 0x83
4127 && i.tm.extension_opcode == 0x4)))
d3d50934
L
4128 || (i.types[0].bitfield.qword
4129 && ((i.reg_operands == 2
4130 && i.op[0].regs == i.op[1].regs
72aea328
JB
4131 && (i.tm.base_opcode == 0x30
4132 || i.tm.base_opcode == 0x28))
d3d50934
L
4133 || (i.reg_operands == 1
4134 && i.operands == 1
72aea328 4135 && i.tm.base_opcode == 0x30)))))
b6f8c7c4
L
4136 {
4137 /* Optimize: -O:
4138 andq $imm31, %r64 -> andl $imm31, %r32
b8364fa7 4139 andq $imm7, %r64 -> andl $imm7, %r32
b6f8c7c4
L
4140 testq $imm31, %r64 -> testl $imm31, %r32
4141 xorq %r64, %r64 -> xorl %r32, %r32
4142 subq %r64, %r64 -> subl %r32, %r32
4143 movq $imm31, %r64 -> movl $imm31, %r32
4144 movq $imm32, %r64 -> movl $imm32, %r32
4145 */
4146 i.tm.opcode_modifier.norex64 = 1;
507916b8 4147 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
b6f8c7c4
L
4148 {
4149 /* Handle
4150 movq $imm31, %r64 -> movl $imm31, %r32
4151 movq $imm32, %r64 -> movl $imm32, %r32
4152 */
4153 i.tm.operand_types[0].bitfield.imm32 = 1;
4154 i.tm.operand_types[0].bitfield.imm32s = 0;
4155 i.tm.operand_types[0].bitfield.imm64 = 0;
4156 i.types[0].bitfield.imm32 = 1;
4157 i.types[0].bitfield.imm32s = 0;
4158 i.types[0].bitfield.imm64 = 0;
4159 i.types[1].bitfield.dword = 1;
4160 i.types[1].bitfield.qword = 0;
507916b8 4161 if ((i.tm.base_opcode | 1) == 0xc7)
b6f8c7c4
L
4162 {
4163 /* Handle
4164 movq $imm31, %r64 -> movl $imm31, %r32
4165 */
507916b8 4166 i.tm.base_opcode = 0xb8;
b6f8c7c4 4167 i.tm.extension_opcode = None;
507916b8 4168 i.tm.opcode_modifier.w = 0;
b6f8c7c4
L
4169 i.tm.opcode_modifier.modrm = 0;
4170 }
4171 }
4172 }
5641ec01
JB
4173 else if (optimize > 1
4174 && !optimize_for_space
72aea328 4175 && !is_any_vex_encoding (&i.tm)
5641ec01
JB
4176 && i.reg_operands == 2
4177 && i.op[0].regs == i.op[1].regs
4178 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4179 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4180 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4181 {
4182 /* Optimize: -O2:
4183 andb %rN, %rN -> testb %rN, %rN
4184 andw %rN, %rN -> testw %rN, %rN
4185 andq %rN, %rN -> testq %rN, %rN
4186 orb %rN, %rN -> testb %rN, %rN
4187 orw %rN, %rN -> testw %rN, %rN
4188 orq %rN, %rN -> testq %rN, %rN
4189
4190 and outside of 64-bit mode
4191
4192 andl %rN, %rN -> testl %rN, %rN
4193 orl %rN, %rN -> testl %rN, %rN
4194 */
4195 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4196 }
99112332 4197 else if (i.reg_operands == 3
b6f8c7c4
L
4198 && i.op[0].regs == i.op[1].regs
4199 && !i.types[2].bitfield.xmmword
4200 && (i.tm.opcode_modifier.vex
7a69eac3 4201 || ((!i.mask || i.mask->zeroing)
b6f8c7c4 4202 && !i.rounding
e771e7c9 4203 && is_evex_encoding (&i.tm)
80c34c38 4204 && (i.vec_encoding != vex_encoding_evex
dd22218c 4205 || cpu_arch_isa_flags.bitfield.cpuavx512vl
80c34c38 4206 || i.tm.cpu_flags.bitfield.cpuavx512vl
7091c612 4207 || (i.tm.operand_types[2].bitfield.zmmword
dd22218c 4208 && i.types[2].bitfield.ymmword))))
b6f8c7c4
L
4209 && ((i.tm.base_opcode == 0x55
4210 || i.tm.base_opcode == 0x6655
4211 || i.tm.base_opcode == 0x66df
4212 || i.tm.base_opcode == 0x57
4213 || i.tm.base_opcode == 0x6657
8305403a
L
4214 || i.tm.base_opcode == 0x66ef
4215 || i.tm.base_opcode == 0x66f8
4216 || i.tm.base_opcode == 0x66f9
4217 || i.tm.base_opcode == 0x66fa
1424ad86
JB
4218 || i.tm.base_opcode == 0x66fb
4219 || i.tm.base_opcode == 0x42
4220 || i.tm.base_opcode == 0x6642
4221 || i.tm.base_opcode == 0x47
4222 || i.tm.base_opcode == 0x6647)
b6f8c7c4
L
4223 && i.tm.extension_opcode == None))
4224 {
99112332 4225 /* Optimize: -O1:
8305403a
L
4226 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4227 vpsubq and vpsubw:
b6f8c7c4
L
4228 EVEX VOP %zmmM, %zmmM, %zmmN
4229 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4230 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4231 EVEX VOP %ymmM, %ymmM, %ymmN
4232 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4233 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4234 VEX VOP %ymmM, %ymmM, %ymmN
4235 -> VEX VOP %xmmM, %xmmM, %xmmN
4236 VOP, one of vpandn and vpxor:
4237 VEX VOP %ymmM, %ymmM, %ymmN
4238 -> VEX VOP %xmmM, %xmmM, %xmmN
4239 VOP, one of vpandnd and vpandnq:
4240 EVEX VOP %zmmM, %zmmM, %zmmN
4241 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4242 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4243 EVEX VOP %ymmM, %ymmM, %ymmN
4244 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4245 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4246 VOP, one of vpxord and vpxorq:
4247 EVEX VOP %zmmM, %zmmM, %zmmN
4248 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4249 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
b6f8c7c4
L
4250 EVEX VOP %ymmM, %ymmM, %ymmN
4251 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
99112332 4252 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
1424ad86
JB
4253 VOP, one of kxord and kxorq:
4254 VEX VOP %kM, %kM, %kN
4255 -> VEX kxorw %kM, %kM, %kN
4256 VOP, one of kandnd and kandnq:
4257 VEX VOP %kM, %kM, %kN
4258 -> VEX kandnw %kM, %kM, %kN
b6f8c7c4 4259 */
e771e7c9 4260 if (is_evex_encoding (&i.tm))
b6f8c7c4 4261 {
7b1d7ca1 4262 if (i.vec_encoding != vex_encoding_evex)
b6f8c7c4
L
4263 {
4264 i.tm.opcode_modifier.vex = VEX128;
4265 i.tm.opcode_modifier.vexw = VEXW0;
4266 i.tm.opcode_modifier.evex = 0;
4267 }
7b1d7ca1 4268 else if (optimize > 1)
dd22218c
L
4269 i.tm.opcode_modifier.evex = EVEX128;
4270 else
4271 return;
b6f8c7c4 4272 }
f74a6307 4273 else if (i.tm.operand_types[0].bitfield.class == RegMask)
1424ad86
JB
4274 {
4275 i.tm.base_opcode &= 0xff;
4276 i.tm.opcode_modifier.vexw = VEXW0;
4277 }
b6f8c7c4
L
4278 else
4279 i.tm.opcode_modifier.vex = VEX128;
4280
4281 if (i.tm.opcode_modifier.vex)
4282 for (j = 0; j < 3; j++)
4283 {
4284 i.types[j].bitfield.xmmword = 1;
4285 i.types[j].bitfield.ymmword = 0;
4286 }
4287 }
392a5972 4288 else if (i.vec_encoding != vex_encoding_evex
97ed31ae 4289 && !i.types[0].bitfield.zmmword
392a5972 4290 && !i.types[1].bitfield.zmmword
97ed31ae 4291 && !i.mask
a0a1771e 4292 && !i.broadcast
97ed31ae 4293 && is_evex_encoding (&i.tm)
392a5972
L
4294 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4295 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
a0a1771e
JB
4296 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4297 || (i.tm.base_opcode & ~4) == 0x66db
4298 || (i.tm.base_opcode & ~4) == 0x66eb)
97ed31ae
L
4299 && i.tm.extension_opcode == None)
4300 {
4301 /* Optimize: -O1:
4302 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4303 vmovdqu32 and vmovdqu64:
4304 EVEX VOP %xmmM, %xmmN
4305 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4306 EVEX VOP %ymmM, %ymmN
4307 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4308 EVEX VOP %xmmM, mem
4309 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4310 EVEX VOP %ymmM, mem
4311 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4312 EVEX VOP mem, %xmmN
4313 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4314 EVEX VOP mem, %ymmN
4315 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
a0a1771e
JB
4316 VOP, one of vpand, vpandn, vpor, vpxor:
4317 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4318 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4319 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4320 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4321 EVEX VOP{d,q} mem, %xmmM, %xmmN
4322 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4323 EVEX VOP{d,q} mem, %ymmM, %ymmN
4324 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
97ed31ae 4325 */
a0a1771e 4326 for (j = 0; j < i.operands; j++)
392a5972
L
4327 if (operand_type_check (i.types[j], disp)
4328 && i.op[j].disps->X_op == O_constant)
4329 {
4330 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4331 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4332 bytes, we choose EVEX Disp8 over VEX Disp32. */
4333 int evex_disp8, vex_disp8;
4334 unsigned int memshift = i.memshift;
4335 offsetT n = i.op[j].disps->X_add_number;
4336
4337 evex_disp8 = fits_in_disp8 (n);
4338 i.memshift = 0;
4339 vex_disp8 = fits_in_disp8 (n);
4340 if (evex_disp8 != vex_disp8)
4341 {
4342 i.memshift = memshift;
4343 return;
4344 }
4345
4346 i.types[j].bitfield.disp8 = vex_disp8;
4347 break;
4348 }
4349 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4350 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
97ed31ae
L
4351 i.tm.opcode_modifier.vex
4352 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4353 i.tm.opcode_modifier.vexw = VEXW0;
79dec6b7
JB
4354 /* VPAND, VPOR, and VPXOR are commutative. */
4355 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4356 i.tm.opcode_modifier.commutative = 1;
97ed31ae
L
4357 i.tm.opcode_modifier.evex = 0;
4358 i.tm.opcode_modifier.masking = 0;
a0a1771e 4359 i.tm.opcode_modifier.broadcast = 0;
97ed31ae
L
4360 i.tm.opcode_modifier.disp8memshift = 0;
4361 i.memshift = 0;
a0a1771e
JB
4362 if (j < i.operands)
4363 i.types[j].bitfield.disp8
4364 = fits_in_disp8 (i.op[j].disps->X_add_number);
97ed31ae 4365 }
b6f8c7c4
L
4366}
4367
ae531041
L
4368/* Return non-zero for load instruction. */
4369
4370static int
4371load_insn_p (void)
4372{
4373 unsigned int dest;
4374 int any_vex_p = is_any_vex_encoding (&i.tm);
4375 unsigned int base_opcode = i.tm.base_opcode | 1;
4376
4377 if (!any_vex_p)
4378 {
a09f656b 4379 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4380 prefetcht1, prefetcht2, prefetchtw, bndmk, bndcl, bndcu, bndcn,
4381 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4382 if (i.tm.opcode_modifier.anysize)
ae531041
L
4383 return 0;
4384
a09f656b 4385 /* pop, popf, popa. */
4386 if (strcmp (i.tm.name, "pop") == 0
4387 || i.tm.base_opcode == 0x9d
4388 || i.tm.base_opcode == 0x61)
ae531041
L
4389 return 1;
4390
4391 /* movs, cmps, lods, scas. */
4392 if ((i.tm.base_opcode | 0xb) == 0xaf)
4393 return 1;
4394
a09f656b 4395 /* outs, xlatb. */
4396 if (base_opcode == 0x6f
4397 || i.tm.base_opcode == 0xd7)
ae531041 4398 return 1;
a09f656b 4399 /* NB: For AMD-specific insns with implicit memory operands,
4400 they're intentionally not covered. */
ae531041
L
4401 }
4402
4403 /* No memory operand. */
4404 if (!i.mem_operands)
4405 return 0;
4406
4407 if (any_vex_p)
4408 {
4409 /* vldmxcsr. */
4410 if (i.tm.base_opcode == 0xae
4411 && i.tm.opcode_modifier.vex
4412 && i.tm.opcode_modifier.vexopcode == VEX0F
4413 && i.tm.extension_opcode == 2)
4414 return 1;
4415 }
4416 else
4417 {
4418 /* test, not, neg, mul, imul, div, idiv. */
4419 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4420 && i.tm.extension_opcode != 1)
4421 return 1;
4422
4423 /* inc, dec. */
4424 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4425 return 1;
4426
4427 /* add, or, adc, sbb, and, sub, xor, cmp. */
4428 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4429 return 1;
4430
4431 /* bt, bts, btr, btc. */
4432 if (i.tm.base_opcode == 0xfba
4433 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4434 return 1;
4435
4436 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4437 if ((base_opcode == 0xc1
4438 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4439 && i.tm.extension_opcode != 6)
4440 return 1;
4441
4442 /* cmpxchg8b, cmpxchg16b, xrstors. */
4443 if (i.tm.base_opcode == 0xfc7
4444 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4445 return 1;
4446
4447 /* fxrstor, ldmxcsr, xrstor. */
4448 if (i.tm.base_opcode == 0xfae
4449 && (i.tm.extension_opcode == 1
4450 || i.tm.extension_opcode == 2
4451 || i.tm.extension_opcode == 5))
4452 return 1;
4453
4454 /* lgdt, lidt, lmsw. */
4455 if (i.tm.base_opcode == 0xf01
4456 && (i.tm.extension_opcode == 2
4457 || i.tm.extension_opcode == 3
4458 || i.tm.extension_opcode == 6))
4459 return 1;
4460
4461 /* vmptrld */
4462 if (i.tm.base_opcode == 0xfc7
4463 && i.tm.extension_opcode == 6)
4464 return 1;
4465
4466 /* Check for x87 instructions. */
4467 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4468 {
4469 /* Skip fst, fstp, fstenv, fstcw. */
4470 if (i.tm.base_opcode == 0xd9
4471 && (i.tm.extension_opcode == 2
4472 || i.tm.extension_opcode == 3
4473 || i.tm.extension_opcode == 6
4474 || i.tm.extension_opcode == 7))
4475 return 0;
4476
4477 /* Skip fisttp, fist, fistp, fstp. */
4478 if (i.tm.base_opcode == 0xdb
4479 && (i.tm.extension_opcode == 1
4480 || i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 7))
4483 return 0;
4484
4485 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4486 if (i.tm.base_opcode == 0xdd
4487 && (i.tm.extension_opcode == 1
4488 || i.tm.extension_opcode == 2
4489 || i.tm.extension_opcode == 3
4490 || i.tm.extension_opcode == 6
4491 || i.tm.extension_opcode == 7))
4492 return 0;
4493
4494 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4495 if (i.tm.base_opcode == 0xdf
4496 && (i.tm.extension_opcode == 1
4497 || i.tm.extension_opcode == 2
4498 || i.tm.extension_opcode == 3
4499 || i.tm.extension_opcode == 6
4500 || i.tm.extension_opcode == 7))
4501 return 0;
4502
4503 return 1;
4504 }
4505 }
4506
4507 dest = i.operands - 1;
4508
4509 /* Check fake imm8 operand and 3 source operands. */
4510 if ((i.tm.opcode_modifier.immext
4511 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4512 && i.types[dest].bitfield.imm8)
4513 dest--;
4514
4515 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4516 if (!any_vex_p
4517 && (base_opcode == 0x1
4518 || base_opcode == 0x9
4519 || base_opcode == 0x11
4520 || base_opcode == 0x19
4521 || base_opcode == 0x21
4522 || base_opcode == 0x29
4523 || base_opcode == 0x31
4524 || base_opcode == 0x39
4525 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4526 || base_opcode == 0xfc1))
4527 return 1;
4528
4529 /* Check for load instruction. */
4530 return (i.types[dest].bitfield.class != ClassNone
4531 || i.types[dest].bitfield.instance == Accum);
4532}
4533
4534/* Output lfence, 0xfaee8, after instruction. */
4535
4536static void
4537insert_lfence_after (void)
4538{
4539 if (lfence_after_load && load_insn_p ())
4540 {
a09f656b 4541 /* There are also two REP string instructions that require
4542 special treatment. Specifically, the compare string (CMPS)
4543 and scan string (SCAS) instructions set EFLAGS in a manner
4544 that depends on the data being compared/scanned. When used
4545 with a REP prefix, the number of iterations may therefore
4546 vary depending on this data. If the data is a program secret
4547 chosen by the adversary using an LVI method,
4548 then this data-dependent behavior may leak some aspect
4549 of the secret. */
4550 if (((i.tm.base_opcode | 0x1) == 0xa7
4551 || (i.tm.base_opcode | 0x1) == 0xaf)
4552 && i.prefix[REP_PREFIX])
4553 {
4554 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4555 i.tm.name);
4556 }
ae531041
L
4557 char *p = frag_more (3);
4558 *p++ = 0xf;
4559 *p++ = 0xae;
4560 *p = 0xe8;
4561 }
4562}
4563
4564/* Output lfence, 0xfaee8, before instruction. */
4565
4566static void
4567insert_lfence_before (void)
4568{
4569 char *p;
4570
4571 if (is_any_vex_encoding (&i.tm))
4572 return;
4573
4574 if (i.tm.base_opcode == 0xff
4575 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4576 {
4577 /* Insert lfence before indirect branch if needed. */
4578
4579 if (lfence_before_indirect_branch == lfence_branch_none)
4580 return;
4581
4582 if (i.operands != 1)
4583 abort ();
4584
4585 if (i.reg_operands == 1)
4586 {
4587 /* Indirect branch via register. Don't insert lfence with
4588 -mlfence-after-load=yes. */
4589 if (lfence_after_load
4590 || lfence_before_indirect_branch == lfence_branch_memory)
4591 return;
4592 }
4593 else if (i.mem_operands == 1
4594 && lfence_before_indirect_branch != lfence_branch_register)
4595 {
4596 as_warn (_("indirect `%s` with memory operand should be avoided"),
4597 i.tm.name);
4598 return;
4599 }
4600 else
4601 return;
4602
4603 if (last_insn.kind != last_insn_other
4604 && last_insn.seg == now_seg)
4605 {
4606 as_warn_where (last_insn.file, last_insn.line,
4607 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4608 last_insn.name, i.tm.name);
4609 return;
4610 }
4611
4612 p = frag_more (3);
4613 *p++ = 0xf;
4614 *p++ = 0xae;
4615 *p = 0xe8;
4616 return;
4617 }
4618
503648e4 4619 /* Output or/not/shl and lfence before near ret. */
ae531041
L
4620 if (lfence_before_ret != lfence_before_ret_none
4621 && (i.tm.base_opcode == 0xc2
503648e4 4622 || i.tm.base_opcode == 0xc3))
ae531041
L
4623 {
4624 if (last_insn.kind != last_insn_other
4625 && last_insn.seg == now_seg)
4626 {
4627 as_warn_where (last_insn.file, last_insn.line,
4628 _("`%s` skips -mlfence-before-ret on `%s`"),
4629 last_insn.name, i.tm.name);
4630 return;
4631 }
a09f656b 4632
a09f656b 4633 /* Near ret ingore operand size override under CPU64. */
503648e4 4634 char prefix = flag_code == CODE_64BIT
4635 ? 0x48
4636 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
a09f656b 4637
4638 if (lfence_before_ret == lfence_before_ret_not)
4639 {
4640 /* not: 0xf71424, may add prefix
4641 for operand size override or 64-bit code. */
4642 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4643 if (prefix)
4644 *p++ = prefix;
ae531041
L
4645 *p++ = 0xf7;
4646 *p++ = 0x14;
4647 *p++ = 0x24;
a09f656b 4648 if (prefix)
4649 *p++ = prefix;
ae531041
L
4650 *p++ = 0xf7;
4651 *p++ = 0x14;
4652 *p++ = 0x24;
4653 }
a09f656b 4654 else
4655 {
4656 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4657 if (prefix)
4658 *p++ = prefix;
4659 if (lfence_before_ret == lfence_before_ret_or)
4660 {
4661 /* or: 0x830c2400, may add prefix
4662 for operand size override or 64-bit code. */
4663 *p++ = 0x83;
4664 *p++ = 0x0c;
4665 }
4666 else
4667 {
4668 /* shl: 0xc1242400, may add prefix
4669 for operand size override or 64-bit code. */
4670 *p++ = 0xc1;
4671 *p++ = 0x24;
4672 }
4673
4674 *p++ = 0x24;
4675 *p++ = 0x0;
4676 }
4677
ae531041
L
4678 *p++ = 0xf;
4679 *p++ = 0xae;
4680 *p = 0xe8;
4681 }
4682}
4683
252b5132
RH
4684/* This is the guts of the machine-dependent assembler. LINE points to a
4685 machine dependent instruction. This function is supposed to emit
4686 the frags/bytes it assembles to. */
4687
4688void
65da13b5 4689md_assemble (char *line)
252b5132 4690{
40fb9820 4691 unsigned int j;
83b16ac6 4692 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
d3ce72d0 4693 const insn_template *t;
252b5132 4694
47926f60 4695 /* Initialize globals. */
252b5132
RH
4696 memset (&i, '\0', sizeof (i));
4697 for (j = 0; j < MAX_OPERANDS; j++)
1ae12ab7 4698 i.reloc[j] = NO_RELOC;
252b5132
RH
4699 memset (disp_expressions, '\0', sizeof (disp_expressions));
4700 memset (im_expressions, '\0', sizeof (im_expressions));
ce8a8b2f 4701 save_stack_p = save_stack;
252b5132
RH
4702
4703 /* First parse an instruction mnemonic & call i386_operand for the operands.
4704 We assume that the scrubber has arranged it so that line[0] is the valid
47926f60 4705 start of a (possibly prefixed) mnemonic. */
252b5132 4706
29b0f896
AM
4707 line = parse_insn (line, mnemonic);
4708 if (line == NULL)
4709 return;
83b16ac6 4710 mnem_suffix = i.suffix;
252b5132 4711
29b0f896 4712 line = parse_operands (line, mnemonic);
ee86248c 4713 this_operand = -1;
8325cc63
JB
4714 xfree (i.memop1_string);
4715 i.memop1_string = NULL;
29b0f896
AM
4716 if (line == NULL)
4717 return;
252b5132 4718
29b0f896
AM
4719 /* Now we've parsed the mnemonic into a set of templates, and have the
4720 operands at hand. */
4721
b630c145
JB
4722 /* All Intel opcodes have reversed operands except for "bound", "enter",
4723 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4724 intersegment "jmp" and "call" instructions with 2 immediate operands so
4725 that the immediate segment precedes the offset, as it does when in AT&T
4726 mode. */
4d456e3d
L
4727 if (intel_syntax
4728 && i.operands > 1
29b0f896 4729 && (strcmp (mnemonic, "bound") != 0)
30123838 4730 && (strcmp (mnemonic, "invlpga") != 0)
eedb0f2c
JB
4731 && (strncmp (mnemonic, "monitor", 7) != 0)
4732 && (strncmp (mnemonic, "mwait", 5) != 0)
b630c145
JB
4733 && (strcmp (mnemonic, "tpause") != 0)
4734 && (strcmp (mnemonic, "umwait") != 0)
40fb9820
L
4735 && !(operand_type_check (i.types[0], imm)
4736 && operand_type_check (i.types[1], imm)))
29b0f896
AM
4737 swap_operands ();
4738
ec56d5c0
JB
4739 /* The order of the immediates should be reversed
4740 for 2 immediates extrq and insertq instructions */
4741 if (i.imm_operands == 2
4742 && (strcmp (mnemonic, "extrq") == 0
4743 || strcmp (mnemonic, "insertq") == 0))
4744 swap_2_operands (0, 1);
4745
29b0f896
AM
4746 if (i.imm_operands)
4747 optimize_imm ();
4748
b300c311
L
4749 /* Don't optimize displacement for movabs since it only takes 64bit
4750 displacement. */
4751 if (i.disp_operands
a501d77e 4752 && i.disp_encoding != disp_encoding_32bit
862be3fb
L
4753 && (flag_code != CODE_64BIT
4754 || strcmp (mnemonic, "movabs") != 0))
4755 optimize_disp ();
29b0f896
AM
4756
4757 /* Next, we find a template that matches the given insn,
4758 making sure the overlap of the given operands types is consistent
4759 with the template operand types. */
252b5132 4760
83b16ac6 4761 if (!(t = match_template (mnem_suffix)))
29b0f896 4762 return;
252b5132 4763
7bab8ab5 4764 if (sse_check != check_none
81f8a913 4765 && !i.tm.opcode_modifier.noavx
6e3e5c9e 4766 && !i.tm.cpu_flags.bitfield.cpuavx
569d50f1 4767 && !i.tm.cpu_flags.bitfield.cpuavx512f
daf50ae7
L
4768 && (i.tm.cpu_flags.bitfield.cpusse
4769 || i.tm.cpu_flags.bitfield.cpusse2
4770 || i.tm.cpu_flags.bitfield.cpusse3
4771 || i.tm.cpu_flags.bitfield.cpussse3
4772 || i.tm.cpu_flags.bitfield.cpusse4_1
6e3e5c9e
JB
4773 || i.tm.cpu_flags.bitfield.cpusse4_2
4774 || i.tm.cpu_flags.bitfield.cpupclmul
4775 || i.tm.cpu_flags.bitfield.cpuaes
569d50f1 4776 || i.tm.cpu_flags.bitfield.cpusha
6e3e5c9e 4777 || i.tm.cpu_flags.bitfield.cpugfni))
daf50ae7 4778 {
7bab8ab5 4779 (sse_check == check_warning
daf50ae7
L
4780 ? as_warn
4781 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4782 }
4783
40fb9820 4784 if (i.tm.opcode_modifier.fwait)
29b0f896
AM
4785 if (!add_prefix (FWAIT_OPCODE))
4786 return;
252b5132 4787
d5de92cf
L
4788 /* Check if REP prefix is OK. */
4789 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4790 {
4791 as_bad (_("invalid instruction `%s' after `%s'"),
4792 i.tm.name, i.rep_prefix);
4793 return;
4794 }
4795
c1ba0266
L
4796 /* Check for lock without a lockable instruction. Destination operand
4797 must be memory unless it is xchg (0x86). */
c32fa91d
L
4798 if (i.prefix[LOCK_PREFIX]
4799 && (!i.tm.opcode_modifier.islockable
c1ba0266
L
4800 || i.mem_operands == 0
4801 || (i.tm.base_opcode != 0x86
8dc0818e 4802 && !(i.flags[i.operands - 1] & Operand_Mem))))
c32fa91d
L
4803 {
4804 as_bad (_("expecting lockable instruction after `lock'"));
4805 return;
4806 }
4807
40d231b4
JB
4808 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4809 if (i.prefix[DATA_PREFIX]
4810 && (is_any_vex_encoding (&i.tm)
4811 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4812 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
7a8655d2
JB
4813 {
4814 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4815 return;
4816 }
4817
42164a71 4818 /* Check if HLE prefix is OK. */
165de32a 4819 if (i.hle_prefix && !check_hle ())
42164a71
L
4820 return;
4821
7e8b059b
L
4822 /* Check BND prefix. */
4823 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4824 as_bad (_("expecting valid branch instruction after `bnd'"));
4825
04ef582a 4826 /* Check NOTRACK prefix. */
9fef80d6
L
4827 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4828 as_bad (_("expecting indirect branch instruction after `notrack'"));
04ef582a 4829
327e8c42
JB
4830 if (i.tm.cpu_flags.bitfield.cpumpx)
4831 {
4832 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4833 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4834 else if (flag_code != CODE_16BIT
4835 ? i.prefix[ADDR_PREFIX]
4836 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4837 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4838 }
7e8b059b
L
4839
4840 /* Insert BND prefix. */
76d3a78a
JB
4841 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4842 {
4843 if (!i.prefix[BND_PREFIX])
4844 add_prefix (BND_PREFIX_OPCODE);
4845 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4846 {
4847 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4848 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4849 }
4850 }
7e8b059b 4851
29b0f896 4852 /* Check string instruction segment overrides. */
51c8edf6 4853 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
29b0f896 4854 {
51c8edf6 4855 gas_assert (i.mem_operands);
29b0f896 4856 if (!check_string ())
5dd0794d 4857 return;
fc0763e6 4858 i.disp_operands = 0;
29b0f896 4859 }
5dd0794d 4860
b6f8c7c4
L
4861 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4862 optimize_encoding ();
4863
29b0f896
AM
4864 if (!process_suffix ())
4865 return;
e413e4e9 4866
921eafea 4867 /* Update operand types and check extended states. */
bc0844ae 4868 for (j = 0; j < i.operands; j++)
921eafea
L
4869 {
4870 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4871 switch (i.tm.operand_types[j].bitfield.class)
4872 {
4873 default:
4874 break;
4875 case RegMMX:
4876 i.xstate |= xstate_mmx;
4877 break;
4878 case RegMask:
4879 i.xstate |= xstate_zmm;
4880 break;
4881 case RegSIMD:
4882 if (i.tm.operand_types[j].bitfield.tmmword)
4883 i.xstate |= xstate_tmm;
4884 else if (i.tm.operand_types[j].bitfield.zmmword)
4885 i.xstate |= xstate_zmm;
4886 else if (i.tm.operand_types[j].bitfield.ymmword)
4887 i.xstate |= xstate_ymm;
4888 else if (i.tm.operand_types[j].bitfield.xmmword)
4889 i.xstate |= xstate_xmm;
4890 break;
4891 }
4892 }
bc0844ae 4893
29b0f896
AM
4894 /* Make still unresolved immediate matches conform to size of immediate
4895 given in i.suffix. */
4896 if (!finalize_imm ())
4897 return;
252b5132 4898
40fb9820 4899 if (i.types[0].bitfield.imm1)
29b0f896 4900 i.imm_operands = 0; /* kludge for shift insns. */
252b5132 4901
9afe6eb8
L
4902 /* We only need to check those implicit registers for instructions
4903 with 3 operands or less. */
4904 if (i.operands <= 3)
4905 for (j = 0; j < i.operands; j++)
75e5731b
JB
4906 if (i.types[j].bitfield.instance != InstanceNone
4907 && !i.types[j].bitfield.xmmword)
9afe6eb8 4908 i.reg_operands--;
40fb9820 4909
29b0f896
AM
4910 /* For insns with operands there are more diddles to do to the opcode. */
4911 if (i.operands)
4912 {
4913 if (!process_operands ())
4914 return;
4915 }
8c190ce0 4916 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
29b0f896
AM
4917 {
4918 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4919 as_warn (_("translating to `%sp'"), i.tm.name);
4920 }
252b5132 4921
7a8655d2 4922 if (is_any_vex_encoding (&i.tm))
9e5e5283 4923 {
c1dc7af5 4924 if (!cpu_arch_flags.bitfield.cpui286)
9e5e5283 4925 {
c1dc7af5 4926 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
9e5e5283
L
4927 i.tm.name);
4928 return;
4929 }
c0f3af97 4930
0b9404fd
JB
4931 /* Check for explicit REX prefix. */
4932 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4933 {
4934 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4935 return;
4936 }
4937
9e5e5283
L
4938 if (i.tm.opcode_modifier.vex)
4939 build_vex_prefix (t);
4940 else
4941 build_evex_prefix ();
0b9404fd
JB
4942
4943 /* The individual REX.RXBW bits got consumed. */
4944 i.rex &= REX_OPCODE;
9e5e5283 4945 }
43234a1e 4946
5dd85c99
SP
4947 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4948 instructions may define INT_OPCODE as well, so avoid this corner
4949 case for those instructions that use MODRM. */
4950 if (i.tm.base_opcode == INT_OPCODE
a6461c02
SP
4951 && !i.tm.opcode_modifier.modrm
4952 && i.op[0].imms->X_add_number == 3)
29b0f896
AM
4953 {
4954 i.tm.base_opcode = INT3_OPCODE;
4955 i.imm_operands = 0;
4956 }
252b5132 4957
0cfa3eb3
JB
4958 if ((i.tm.opcode_modifier.jump == JUMP
4959 || i.tm.opcode_modifier.jump == JUMP_BYTE
4960 || i.tm.opcode_modifier.jump == JUMP_DWORD)
29b0f896
AM
4961 && i.op[0].disps->X_op == O_constant)
4962 {
4963 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4964 the absolute address given by the constant. Since ix86 jumps and
4965 calls are pc relative, we need to generate a reloc. */
4966 i.op[0].disps->X_add_symbol = &abs_symbol;
4967 i.op[0].disps->X_op = O_symbol;
4968 }
252b5132 4969
29b0f896
AM
4970 /* For 8 bit registers we need an empty rex prefix. Also if the
4971 instruction already has a prefix, we need to convert old
4972 registers to new ones. */
773f551c 4973
bab6aec1 4974 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
29b0f896 4975 && (i.op[0].regs->reg_flags & RegRex64) != 0)
bab6aec1 4976 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
29b0f896 4977 && (i.op[1].regs->reg_flags & RegRex64) != 0)
bab6aec1
JB
4978 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4979 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
29b0f896
AM
4980 && i.rex != 0))
4981 {
4982 int x;
726c5dcd 4983
29b0f896
AM
4984 i.rex |= REX_OPCODE;
4985 for (x = 0; x < 2; x++)
4986 {
4987 /* Look for 8 bit operand that uses old registers. */
bab6aec1 4988 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
29b0f896 4989 && (i.op[x].regs->reg_flags & RegRex64) == 0)
773f551c 4990 {
3f93af61 4991 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
29b0f896
AM
4992 /* In case it is "hi" register, give up. */
4993 if (i.op[x].regs->reg_num > 3)
a540244d 4994 as_bad (_("can't encode register '%s%s' in an "
4eed87de 4995 "instruction requiring REX prefix."),
a540244d 4996 register_prefix, i.op[x].regs->reg_name);
773f551c 4997
29b0f896
AM
4998 /* Otherwise it is equivalent to the extended register.
4999 Since the encoding doesn't change this is merely
5000 cosmetic cleanup for debug output. */
5001
5002 i.op[x].regs = i.op[x].regs + 8;
773f551c 5003 }
29b0f896
AM
5004 }
5005 }
773f551c 5006
6b6b6807
L
5007 if (i.rex == 0 && i.rex_encoding)
5008 {
5009 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
3f93af61 5010 that uses legacy register. If it is "hi" register, don't add
6b6b6807
L
5011 the REX_OPCODE byte. */
5012 int x;
5013 for (x = 0; x < 2; x++)
bab6aec1 5014 if (i.types[x].bitfield.class == Reg
6b6b6807
L
5015 && i.types[x].bitfield.byte
5016 && (i.op[x].regs->reg_flags & RegRex64) == 0
5017 && i.op[x].regs->reg_num > 3)
5018 {
3f93af61 5019 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
6b6b6807
L
5020 i.rex_encoding = FALSE;
5021 break;
5022 }
5023
5024 if (i.rex_encoding)
5025 i.rex = REX_OPCODE;
5026 }
5027
7ab9ffdd 5028 if (i.rex != 0)
29b0f896
AM
5029 add_prefix (REX_OPCODE | i.rex);
5030
ae531041
L
5031 insert_lfence_before ();
5032
29b0f896
AM
5033 /* We are ready to output the insn. */
5034 output_insn ();
e379e5f3 5035
ae531041
L
5036 insert_lfence_after ();
5037
e379e5f3
L
5038 last_insn.seg = now_seg;
5039
5040 if (i.tm.opcode_modifier.isprefix)
5041 {
5042 last_insn.kind = last_insn_prefix;
5043 last_insn.name = i.tm.name;
5044 last_insn.file = as_where (&last_insn.line);
5045 }
5046 else
5047 last_insn.kind = last_insn_other;
29b0f896
AM
5048}
5049
5050static char *
e3bb37b5 5051parse_insn (char *line, char *mnemonic)
29b0f896
AM
5052{
5053 char *l = line;
5054 char *token_start = l;
5055 char *mnem_p;
5c6af06e 5056 int supported;
d3ce72d0 5057 const insn_template *t;
b6169b20 5058 char *dot_p = NULL;
29b0f896 5059
29b0f896
AM
5060 while (1)
5061 {
5062 mnem_p = mnemonic;
5063 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5064 {
b6169b20
L
5065 if (*mnem_p == '.')
5066 dot_p = mnem_p;
29b0f896
AM
5067 mnem_p++;
5068 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
45288df1 5069 {
29b0f896
AM
5070 as_bad (_("no such instruction: `%s'"), token_start);
5071 return NULL;
5072 }
5073 l++;
5074 }
5075 if (!is_space_char (*l)
5076 && *l != END_OF_INSN
e44823cf
JB
5077 && (intel_syntax
5078 || (*l != PREFIX_SEPARATOR
5079 && *l != ',')))
29b0f896
AM
5080 {
5081 as_bad (_("invalid character %s in mnemonic"),
5082 output_invalid (*l));
5083 return NULL;
5084 }
5085 if (token_start == l)
5086 {
e44823cf 5087 if (!intel_syntax && *l == PREFIX_SEPARATOR)
29b0f896
AM
5088 as_bad (_("expecting prefix; got nothing"));
5089 else
5090 as_bad (_("expecting mnemonic; got nothing"));
5091 return NULL;
5092 }
45288df1 5093
29b0f896 5094 /* Look up instruction (or prefix) via hash table. */
d3ce72d0 5095 current_templates = (const templates *) hash_find (op_hash, mnemonic);
47926f60 5096
29b0f896
AM
5097 if (*l != END_OF_INSN
5098 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5099 && current_templates
40fb9820 5100 && current_templates->start->opcode_modifier.isprefix)
29b0f896 5101 {
c6fb90c8 5102 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
2dd88dca
JB
5103 {
5104 as_bad ((flag_code != CODE_64BIT
5105 ? _("`%s' is only supported in 64-bit mode")
5106 : _("`%s' is not supported in 64-bit mode")),
5107 current_templates->start->name);
5108 return NULL;
5109 }
29b0f896
AM
5110 /* If we are in 16-bit mode, do not allow addr16 or data16.
5111 Similarly, in 32-bit mode, do not allow addr32 or data32. */
673fe0f0
JB
5112 if ((current_templates->start->opcode_modifier.size == SIZE16
5113 || current_templates->start->opcode_modifier.size == SIZE32)
29b0f896 5114 && flag_code != CODE_64BIT
673fe0f0 5115 && ((current_templates->start->opcode_modifier.size == SIZE32)
29b0f896
AM
5116 ^ (flag_code == CODE_16BIT)))
5117 {
5118 as_bad (_("redundant %s prefix"),
5119 current_templates->start->name);
5120 return NULL;
45288df1 5121 }
86fa6981 5122 if (current_templates->start->opcode_length == 0)
29b0f896 5123 {
86fa6981
L
5124 /* Handle pseudo prefixes. */
5125 switch (current_templates->start->base_opcode)
5126 {
5127 case 0x0:
5128 /* {disp8} */
5129 i.disp_encoding = disp_encoding_8bit;
5130 break;
5131 case 0x1:
5132 /* {disp32} */
5133 i.disp_encoding = disp_encoding_32bit;
5134 break;
5135 case 0x2:
5136 /* {load} */
5137 i.dir_encoding = dir_encoding_load;
5138 break;
5139 case 0x3:
5140 /* {store} */
5141 i.dir_encoding = dir_encoding_store;
5142 break;
5143 case 0x4:
42e04b36
L
5144 /* {vex} */
5145 i.vec_encoding = vex_encoding_vex;
86fa6981
L
5146 break;
5147 case 0x5:
5148 /* {vex3} */
5149 i.vec_encoding = vex_encoding_vex3;
5150 break;
5151 case 0x6:
5152 /* {evex} */
5153 i.vec_encoding = vex_encoding_evex;
5154 break;
6b6b6807
L
5155 case 0x7:
5156 /* {rex} */
5157 i.rex_encoding = TRUE;
5158 break;
b6f8c7c4
L
5159 case 0x8:
5160 /* {nooptimize} */
5161 i.no_optimize = TRUE;
5162 break;
86fa6981
L
5163 default:
5164 abort ();
5165 }
5166 }
5167 else
5168 {
5169 /* Add prefix, checking for repeated prefixes. */
4e9ac44a 5170 switch (add_prefix (current_templates->start->base_opcode))
86fa6981 5171 {
4e9ac44a
L
5172 case PREFIX_EXIST:
5173 return NULL;
5174 case PREFIX_DS:
d777820b 5175 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4e9ac44a
L
5176 i.notrack_prefix = current_templates->start->name;
5177 break;
5178 case PREFIX_REP:
5179 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5180 i.hle_prefix = current_templates->start->name;
5181 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5182 i.bnd_prefix = current_templates->start->name;
5183 else
5184 i.rep_prefix = current_templates->start->name;
5185 break;
5186 default:
5187 break;
86fa6981 5188 }
29b0f896
AM
5189 }
5190 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5191 token_start = ++l;
5192 }
5193 else
5194 break;
5195 }
45288df1 5196
30a55f88 5197 if (!current_templates)
b6169b20 5198 {
07d5e953
JB
5199 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5200 Check if we should swap operand or force 32bit displacement in
f8a5c266 5201 encoding. */
30a55f88 5202 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
64c49ab3 5203 i.dir_encoding = dir_encoding_swap;
8d63c93e 5204 else if (mnem_p - 3 == dot_p
a501d77e
L
5205 && dot_p[1] == 'd'
5206 && dot_p[2] == '8')
5207 i.disp_encoding = disp_encoding_8bit;
8d63c93e 5208 else if (mnem_p - 4 == dot_p
f8a5c266
L
5209 && dot_p[1] == 'd'
5210 && dot_p[2] == '3'
5211 && dot_p[3] == '2')
a501d77e 5212 i.disp_encoding = disp_encoding_32bit;
30a55f88
L
5213 else
5214 goto check_suffix;
5215 mnem_p = dot_p;
5216 *dot_p = '\0';
d3ce72d0 5217 current_templates = (const templates *) hash_find (op_hash, mnemonic);
b6169b20
L
5218 }
5219
29b0f896
AM
5220 if (!current_templates)
5221 {
dc1e8a47 5222 check_suffix:
1c529385 5223 if (mnem_p > mnemonic)
29b0f896 5224 {
1c529385
LH
5225 /* See if we can get a match by trimming off a suffix. */
5226 switch (mnem_p[-1])
29b0f896 5227 {
1c529385
LH
5228 case WORD_MNEM_SUFFIX:
5229 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
29b0f896
AM
5230 i.suffix = SHORT_MNEM_SUFFIX;
5231 else
1c529385
LH
5232 /* Fall through. */
5233 case BYTE_MNEM_SUFFIX:
5234 case QWORD_MNEM_SUFFIX:
5235 i.suffix = mnem_p[-1];
29b0f896 5236 mnem_p[-1] = '\0';
d3ce72d0 5237 current_templates = (const templates *) hash_find (op_hash,
1c529385
LH
5238 mnemonic);
5239 break;
5240 case SHORT_MNEM_SUFFIX:
5241 case LONG_MNEM_SUFFIX:
5242 if (!intel_syntax)
5243 {
5244 i.suffix = mnem_p[-1];
5245 mnem_p[-1] = '\0';
5246 current_templates = (const templates *) hash_find (op_hash,
5247 mnemonic);
5248 }
5249 break;
5250
5251 /* Intel Syntax. */
5252 case 'd':
5253 if (intel_syntax)
5254 {
5255 if (intel_float_operand (mnemonic) == 1)
5256 i.suffix = SHORT_MNEM_SUFFIX;
5257 else
5258 i.suffix = LONG_MNEM_SUFFIX;
5259 mnem_p[-1] = '\0';
5260 current_templates = (const templates *) hash_find (op_hash,
5261 mnemonic);
5262 }
5263 break;
29b0f896 5264 }
29b0f896 5265 }
1c529385 5266
29b0f896
AM
5267 if (!current_templates)
5268 {
5269 as_bad (_("no such instruction: `%s'"), token_start);
5270 return NULL;
5271 }
5272 }
252b5132 5273
0cfa3eb3
JB
5274 if (current_templates->start->opcode_modifier.jump == JUMP
5275 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
29b0f896
AM
5276 {
5277 /* Check for a branch hint. We allow ",pt" and ",pn" for
5278 predict taken and predict not taken respectively.
5279 I'm not sure that branch hints actually do anything on loop
5280 and jcxz insns (JumpByte) for current Pentium4 chips. They
5281 may work in the future and it doesn't hurt to accept them
5282 now. */
5283 if (l[0] == ',' && l[1] == 'p')
5284 {
5285 if (l[2] == 't')
5286 {
5287 if (!add_prefix (DS_PREFIX_OPCODE))
5288 return NULL;
5289 l += 3;
5290 }
5291 else if (l[2] == 'n')
5292 {
5293 if (!add_prefix (CS_PREFIX_OPCODE))
5294 return NULL;
5295 l += 3;
5296 }
5297 }
5298 }
5299 /* Any other comma loses. */
5300 if (*l == ',')
5301 {
5302 as_bad (_("invalid character %s in mnemonic"),
5303 output_invalid (*l));
5304 return NULL;
5305 }
252b5132 5306
29b0f896 5307 /* Check if instruction is supported on specified architecture. */
5c6af06e
JB
5308 supported = 0;
5309 for (t = current_templates->start; t < current_templates->end; ++t)
5310 {
c0f3af97
L
5311 supported |= cpu_flags_match (t);
5312 if (supported == CPU_FLAGS_PERFECT_MATCH)
548d0ee6
JB
5313 {
5314 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5315 as_warn (_("use .code16 to ensure correct addressing mode"));
3629bb00 5316
548d0ee6
JB
5317 return l;
5318 }
29b0f896 5319 }
3629bb00 5320
548d0ee6
JB
5321 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5322 as_bad (flag_code == CODE_64BIT
5323 ? _("`%s' is not supported in 64-bit mode")
5324 : _("`%s' is only supported in 64-bit mode"),
5325 current_templates->start->name);
5326 else
5327 as_bad (_("`%s' is not supported on `%s%s'"),
5328 current_templates->start->name,
5329 cpu_arch_name ? cpu_arch_name : default_arch,
5330 cpu_sub_arch_name ? cpu_sub_arch_name : "");
252b5132 5331
548d0ee6 5332 return NULL;
29b0f896 5333}
252b5132 5334
29b0f896 5335static char *
e3bb37b5 5336parse_operands (char *l, const char *mnemonic)
29b0f896
AM
5337{
5338 char *token_start;
3138f287 5339
29b0f896
AM
5340 /* 1 if operand is pending after ','. */
5341 unsigned int expecting_operand = 0;
252b5132 5342
29b0f896
AM
5343 /* Non-zero if operand parens not balanced. */
5344 unsigned int paren_not_balanced;
5345
5346 while (*l != END_OF_INSN)
5347 {
5348 /* Skip optional white space before operand. */
5349 if (is_space_char (*l))
5350 ++l;
d02603dc 5351 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
29b0f896
AM
5352 {
5353 as_bad (_("invalid character %s before operand %d"),
5354 output_invalid (*l),
5355 i.operands + 1);
5356 return NULL;
5357 }
d02603dc 5358 token_start = l; /* After white space. */
29b0f896
AM
5359 paren_not_balanced = 0;
5360 while (paren_not_balanced || *l != ',')
5361 {
5362 if (*l == END_OF_INSN)
5363 {
5364 if (paren_not_balanced)
5365 {
5366 if (!intel_syntax)
5367 as_bad (_("unbalanced parenthesis in operand %d."),
5368 i.operands + 1);
5369 else
5370 as_bad (_("unbalanced brackets in operand %d."),
5371 i.operands + 1);
5372 return NULL;
5373 }
5374 else
5375 break; /* we are done */
5376 }
d02603dc 5377 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
29b0f896
AM
5378 {
5379 as_bad (_("invalid character %s in operand %d"),
5380 output_invalid (*l),
5381 i.operands + 1);
5382 return NULL;
5383 }
5384 if (!intel_syntax)
5385 {
5386 if (*l == '(')
5387 ++paren_not_balanced;
5388 if (*l == ')')
5389 --paren_not_balanced;
5390 }
5391 else
5392 {
5393 if (*l == '[')
5394 ++paren_not_balanced;
5395 if (*l == ']')
5396 --paren_not_balanced;
5397 }
5398 l++;
5399 }
5400 if (l != token_start)
5401 { /* Yes, we've read in another operand. */
5402 unsigned int operand_ok;
5403 this_operand = i.operands++;
5404 if (i.operands > MAX_OPERANDS)
5405 {
5406 as_bad (_("spurious operands; (%d operands/instruction max)"),
5407 MAX_OPERANDS);
5408 return NULL;
5409 }
9d46ce34 5410 i.types[this_operand].bitfield.unspecified = 1;
29b0f896
AM
5411 /* Now parse operand adding info to 'i' as we go along. */
5412 END_STRING_AND_SAVE (l);
5413
1286ab78
L
5414 if (i.mem_operands > 1)
5415 {
5416 as_bad (_("too many memory references for `%s'"),
5417 mnemonic);
5418 return 0;
5419 }
5420
29b0f896
AM
5421 if (intel_syntax)
5422 operand_ok =
5423 i386_intel_operand (token_start,
5424 intel_float_operand (mnemonic));
5425 else
a7619375 5426 operand_ok = i386_att_operand (token_start);
29b0f896
AM
5427
5428 RESTORE_END_STRING (l);
5429 if (!operand_ok)
5430 return NULL;
5431 }
5432 else
5433 {
5434 if (expecting_operand)
5435 {
5436 expecting_operand_after_comma:
5437 as_bad (_("expecting operand after ','; got nothing"));
5438 return NULL;
5439 }
5440 if (*l == ',')
5441 {
5442 as_bad (_("expecting operand before ','; got nothing"));
5443 return NULL;
5444 }
5445 }
7f3f1ea2 5446
29b0f896
AM
5447 /* Now *l must be either ',' or END_OF_INSN. */
5448 if (*l == ',')
5449 {
5450 if (*++l == END_OF_INSN)
5451 {
5452 /* Just skip it, if it's \n complain. */
5453 goto expecting_operand_after_comma;
5454 }
5455 expecting_operand = 1;
5456 }
5457 }
5458 return l;
5459}
7f3f1ea2 5460
050dfa73 5461static void
4d456e3d 5462swap_2_operands (int xchg1, int xchg2)
050dfa73
MM
5463{
5464 union i386_op temp_op;
40fb9820 5465 i386_operand_type temp_type;
c48dadc9 5466 unsigned int temp_flags;
050dfa73 5467 enum bfd_reloc_code_real temp_reloc;
4eed87de 5468
050dfa73
MM
5469 temp_type = i.types[xchg2];
5470 i.types[xchg2] = i.types[xchg1];
5471 i.types[xchg1] = temp_type;
c48dadc9
JB
5472
5473 temp_flags = i.flags[xchg2];
5474 i.flags[xchg2] = i.flags[xchg1];
5475 i.flags[xchg1] = temp_flags;
5476
050dfa73
MM
5477 temp_op = i.op[xchg2];
5478 i.op[xchg2] = i.op[xchg1];
5479 i.op[xchg1] = temp_op;
c48dadc9 5480
050dfa73
MM
5481 temp_reloc = i.reloc[xchg2];
5482 i.reloc[xchg2] = i.reloc[xchg1];
5483 i.reloc[xchg1] = temp_reloc;
43234a1e
L
5484
5485 if (i.mask)
5486 {
5487 if (i.mask->operand == xchg1)
5488 i.mask->operand = xchg2;
5489 else if (i.mask->operand == xchg2)
5490 i.mask->operand = xchg1;
5491 }
5492 if (i.broadcast)
5493 {
5494 if (i.broadcast->operand == xchg1)
5495 i.broadcast->operand = xchg2;
5496 else if (i.broadcast->operand == xchg2)
5497 i.broadcast->operand = xchg1;
5498 }
5499 if (i.rounding)
5500 {
5501 if (i.rounding->operand == xchg1)
5502 i.rounding->operand = xchg2;
5503 else if (i.rounding->operand == xchg2)
5504 i.rounding->operand = xchg1;
5505 }
050dfa73
MM
5506}
5507
29b0f896 5508static void
e3bb37b5 5509swap_operands (void)
29b0f896 5510{
b7c61d9a 5511 switch (i.operands)
050dfa73 5512 {
c0f3af97 5513 case 5:
b7c61d9a 5514 case 4:
4d456e3d 5515 swap_2_operands (1, i.operands - 2);
1a0670f3 5516 /* Fall through. */
b7c61d9a
L
5517 case 3:
5518 case 2:
4d456e3d 5519 swap_2_operands (0, i.operands - 1);
b7c61d9a
L
5520 break;
5521 default:
5522 abort ();
29b0f896 5523 }
29b0f896
AM
5524
5525 if (i.mem_operands == 2)
5526 {
5527 const seg_entry *temp_seg;
5528 temp_seg = i.seg[0];
5529 i.seg[0] = i.seg[1];
5530 i.seg[1] = temp_seg;
5531 }
5532}
252b5132 5533
29b0f896
AM
5534/* Try to ensure constant immediates are represented in the smallest
5535 opcode possible. */
5536static void
e3bb37b5 5537optimize_imm (void)
29b0f896
AM
5538{
5539 char guess_suffix = 0;
5540 int op;
252b5132 5541
29b0f896
AM
5542 if (i.suffix)
5543 guess_suffix = i.suffix;
5544 else if (i.reg_operands)
5545 {
5546 /* Figure out a suffix from the last register operand specified.
75e5731b
JB
5547 We can't do this properly yet, i.e. excluding special register
5548 instances, but the following works for instructions with
5549 immediates. In any case, we can't set i.suffix yet. */
29b0f896 5550 for (op = i.operands; --op >= 0;)
bab6aec1
JB
5551 if (i.types[op].bitfield.class != Reg)
5552 continue;
5553 else if (i.types[op].bitfield.byte)
7ab9ffdd 5554 {
40fb9820
L
5555 guess_suffix = BYTE_MNEM_SUFFIX;
5556 break;
5557 }
bab6aec1 5558 else if (i.types[op].bitfield.word)
252b5132 5559 {
40fb9820
L
5560 guess_suffix = WORD_MNEM_SUFFIX;
5561 break;
5562 }
bab6aec1 5563 else if (i.types[op].bitfield.dword)
40fb9820
L
5564 {
5565 guess_suffix = LONG_MNEM_SUFFIX;
5566 break;
5567 }
bab6aec1 5568 else if (i.types[op].bitfield.qword)
40fb9820
L
5569 {
5570 guess_suffix = QWORD_MNEM_SUFFIX;
29b0f896 5571 break;
252b5132 5572 }
29b0f896
AM
5573 }
5574 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5575 guess_suffix = WORD_MNEM_SUFFIX;
5576
5577 for (op = i.operands; --op >= 0;)
40fb9820 5578 if (operand_type_check (i.types[op], imm))
29b0f896
AM
5579 {
5580 switch (i.op[op].imms->X_op)
252b5132 5581 {
29b0f896
AM
5582 case O_constant:
5583 /* If a suffix is given, this operand may be shortened. */
5584 switch (guess_suffix)
252b5132 5585 {
29b0f896 5586 case LONG_MNEM_SUFFIX:
40fb9820
L
5587 i.types[op].bitfield.imm32 = 1;
5588 i.types[op].bitfield.imm64 = 1;
29b0f896
AM
5589 break;
5590 case WORD_MNEM_SUFFIX:
40fb9820
L
5591 i.types[op].bitfield.imm16 = 1;
5592 i.types[op].bitfield.imm32 = 1;
5593 i.types[op].bitfield.imm32s = 1;
5594 i.types[op].bitfield.imm64 = 1;
29b0f896
AM
5595 break;
5596 case BYTE_MNEM_SUFFIX:
40fb9820
L
5597 i.types[op].bitfield.imm8 = 1;
5598 i.types[op].bitfield.imm8s = 1;
5599 i.types[op].bitfield.imm16 = 1;
5600 i.types[op].bitfield.imm32 = 1;
5601 i.types[op].bitfield.imm32s = 1;
5602 i.types[op].bitfield.imm64 = 1;
29b0f896 5603 break;
252b5132 5604 }
252b5132 5605
29b0f896
AM
5606 /* If this operand is at most 16 bits, convert it
5607 to a signed 16 bit number before trying to see
5608 whether it will fit in an even smaller size.
5609 This allows a 16-bit operand such as $0xffe0 to
5610 be recognised as within Imm8S range. */
40fb9820 5611 if ((i.types[op].bitfield.imm16)
29b0f896 5612 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
252b5132 5613 {
29b0f896
AM
5614 i.op[op].imms->X_add_number =
5615 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5616 }
a28def75
L
5617#ifdef BFD64
5618 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
40fb9820 5619 if ((i.types[op].bitfield.imm32)
29b0f896
AM
5620 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5621 == 0))
5622 {
5623 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5624 ^ ((offsetT) 1 << 31))
5625 - ((offsetT) 1 << 31));
5626 }
a28def75 5627#endif
40fb9820 5628 i.types[op]
c6fb90c8
L
5629 = operand_type_or (i.types[op],
5630 smallest_imm_type (i.op[op].imms->X_add_number));
252b5132 5631
29b0f896
AM
5632 /* We must avoid matching of Imm32 templates when 64bit
5633 only immediate is available. */
5634 if (guess_suffix == QWORD_MNEM_SUFFIX)
40fb9820 5635 i.types[op].bitfield.imm32 = 0;
29b0f896 5636 break;
252b5132 5637
29b0f896
AM
5638 case O_absent:
5639 case O_register:
5640 abort ();
5641
5642 /* Symbols and expressions. */
5643 default:
9cd96992
JB
5644 /* Convert symbolic operand to proper sizes for matching, but don't
5645 prevent matching a set of insns that only supports sizes other
5646 than those matching the insn suffix. */
5647 {
40fb9820 5648 i386_operand_type mask, allowed;
d3ce72d0 5649 const insn_template *t;
9cd96992 5650
0dfbf9d7
L
5651 operand_type_set (&mask, 0);
5652 operand_type_set (&allowed, 0);
40fb9820 5653
4eed87de
AM
5654 for (t = current_templates->start;
5655 t < current_templates->end;
5656 ++t)
bab6aec1
JB
5657 {
5658 allowed = operand_type_or (allowed, t->operand_types[op]);
5659 allowed = operand_type_and (allowed, anyimm);
5660 }
9cd96992
JB
5661 switch (guess_suffix)
5662 {
5663 case QWORD_MNEM_SUFFIX:
40fb9820
L
5664 mask.bitfield.imm64 = 1;
5665 mask.bitfield.imm32s = 1;
9cd96992
JB
5666 break;
5667 case LONG_MNEM_SUFFIX:
40fb9820 5668 mask.bitfield.imm32 = 1;
9cd96992
JB
5669 break;
5670 case WORD_MNEM_SUFFIX:
40fb9820 5671 mask.bitfield.imm16 = 1;
9cd96992
JB
5672 break;
5673 case BYTE_MNEM_SUFFIX:
40fb9820 5674 mask.bitfield.imm8 = 1;
9cd96992
JB
5675 break;
5676 default:
9cd96992
JB
5677 break;
5678 }
c6fb90c8 5679 allowed = operand_type_and (mask, allowed);
0dfbf9d7 5680 if (!operand_type_all_zero (&allowed))
c6fb90c8 5681 i.types[op] = operand_type_and (i.types[op], mask);
9cd96992 5682 }
29b0f896 5683 break;
252b5132 5684 }
29b0f896
AM
5685 }
5686}
47926f60 5687
29b0f896
AM
5688/* Try to use the smallest displacement type too. */
5689static void
e3bb37b5 5690optimize_disp (void)
29b0f896
AM
5691{
5692 int op;
3e73aa7c 5693
29b0f896 5694 for (op = i.operands; --op >= 0;)
40fb9820 5695 if (operand_type_check (i.types[op], disp))
252b5132 5696 {
b300c311 5697 if (i.op[op].disps->X_op == O_constant)
252b5132 5698 {
91d6fa6a 5699 offsetT op_disp = i.op[op].disps->X_add_number;
29b0f896 5700
40fb9820 5701 if (i.types[op].bitfield.disp16
91d6fa6a 5702 && (op_disp & ~(offsetT) 0xffff) == 0)
b300c311
L
5703 {
5704 /* If this operand is at most 16 bits, convert
5705 to a signed 16 bit number and don't use 64bit
5706 displacement. */
91d6fa6a 5707 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
40fb9820 5708 i.types[op].bitfield.disp64 = 0;
b300c311 5709 }
a28def75
L
5710#ifdef BFD64
5711 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
40fb9820 5712 if (i.types[op].bitfield.disp32
91d6fa6a 5713 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
b300c311
L
5714 {
5715 /* If this operand is at most 32 bits, convert
5716 to a signed 32 bit number and don't use 64bit
5717 displacement. */
91d6fa6a
NC
5718 op_disp &= (((offsetT) 2 << 31) - 1);
5719 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
40fb9820 5720 i.types[op].bitfield.disp64 = 0;
b300c311 5721 }
a28def75 5722#endif
91d6fa6a 5723 if (!op_disp && i.types[op].bitfield.baseindex)
b300c311 5724 {
40fb9820
L
5725 i.types[op].bitfield.disp8 = 0;
5726 i.types[op].bitfield.disp16 = 0;
5727 i.types[op].bitfield.disp32 = 0;
5728 i.types[op].bitfield.disp32s = 0;
5729 i.types[op].bitfield.disp64 = 0;
b300c311
L
5730 i.op[op].disps = 0;
5731 i.disp_operands--;
5732 }
5733 else if (flag_code == CODE_64BIT)
5734 {
91d6fa6a 5735 if (fits_in_signed_long (op_disp))
28a9d8f5 5736 {
40fb9820
L
5737 i.types[op].bitfield.disp64 = 0;
5738 i.types[op].bitfield.disp32s = 1;
28a9d8f5 5739 }
0e1147d9 5740 if (i.prefix[ADDR_PREFIX]
91d6fa6a 5741 && fits_in_unsigned_long (op_disp))
40fb9820 5742 i.types[op].bitfield.disp32 = 1;
b300c311 5743 }
40fb9820
L
5744 if ((i.types[op].bitfield.disp32
5745 || i.types[op].bitfield.disp32s
5746 || i.types[op].bitfield.disp16)
b5014f7a 5747 && fits_in_disp8 (op_disp))
40fb9820 5748 i.types[op].bitfield.disp8 = 1;
252b5132 5749 }
67a4f2b7
AO
5750 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5751 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5752 {
5753 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5754 i.op[op].disps, 0, i.reloc[op]);
40fb9820
L
5755 i.types[op].bitfield.disp8 = 0;
5756 i.types[op].bitfield.disp16 = 0;
5757 i.types[op].bitfield.disp32 = 0;
5758 i.types[op].bitfield.disp32s = 0;
5759 i.types[op].bitfield.disp64 = 0;
67a4f2b7
AO
5760 }
5761 else
b300c311 5762 /* We only support 64bit displacement on constants. */
40fb9820 5763 i.types[op].bitfield.disp64 = 0;
252b5132 5764 }
29b0f896
AM
5765}
5766
4a1b91ea
L
5767/* Return 1 if there is a match in broadcast bytes between operand
5768 GIVEN and instruction template T. */
5769
5770static INLINE int
5771match_broadcast_size (const insn_template *t, unsigned int given)
5772{
5773 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5774 && i.types[given].bitfield.byte)
5775 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5776 && i.types[given].bitfield.word)
5777 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5778 && i.types[given].bitfield.dword)
5779 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5780 && i.types[given].bitfield.qword));
5781}
5782
6c30d220
L
5783/* Check if operands are valid for the instruction. */
5784
5785static int
5786check_VecOperands (const insn_template *t)
5787{
43234a1e 5788 unsigned int op;
e2195274 5789 i386_cpu_flags cpu;
e2195274
JB
5790
5791 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5792 any one operand are implicity requiring AVX512VL support if the actual
5793 operand size is YMMword or XMMword. Since this function runs after
5794 template matching, there's no need to check for YMMword/XMMword in
5795 the template. */
5796 cpu = cpu_flags_and (t->cpu_flags, avx512);
5797 if (!cpu_flags_all_zero (&cpu)
5798 && !t->cpu_flags.bitfield.cpuavx512vl
5799 && !cpu_arch_flags.bitfield.cpuavx512vl)
5800 {
5801 for (op = 0; op < t->operands; ++op)
5802 {
5803 if (t->operand_types[op].bitfield.zmmword
5804 && (i.types[op].bitfield.ymmword
5805 || i.types[op].bitfield.xmmword))
5806 {
5807 i.error = unsupported;
5808 return 1;
5809 }
5810 }
5811 }
43234a1e 5812
6c30d220 5813 /* Without VSIB byte, we can't have a vector register for index. */
63112cd6 5814 if (!t->opcode_modifier.sib
6c30d220 5815 && i.index_reg
1b54b8d7
JB
5816 && (i.index_reg->reg_type.bitfield.xmmword
5817 || i.index_reg->reg_type.bitfield.ymmword
5818 || i.index_reg->reg_type.bitfield.zmmword))
6c30d220
L
5819 {
5820 i.error = unsupported_vector_index_register;
5821 return 1;
5822 }
5823
ad8ecc81
MZ
5824 /* Check if default mask is allowed. */
5825 if (t->opcode_modifier.nodefmask
5826 && (!i.mask || i.mask->mask->reg_num == 0))
5827 {
5828 i.error = no_default_mask;
5829 return 1;
5830 }
5831
7bab8ab5
JB
5832 /* For VSIB byte, we need a vector register for index, and all vector
5833 registers must be distinct. */
260cd341 5834 if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
7bab8ab5
JB
5835 {
5836 if (!i.index_reg
63112cd6 5837 || !((t->opcode_modifier.sib == VECSIB128
1b54b8d7 5838 && i.index_reg->reg_type.bitfield.xmmword)
63112cd6 5839 || (t->opcode_modifier.sib == VECSIB256
1b54b8d7 5840 && i.index_reg->reg_type.bitfield.ymmword)
63112cd6 5841 || (t->opcode_modifier.sib == VECSIB512
1b54b8d7 5842 && i.index_reg->reg_type.bitfield.zmmword)))
7bab8ab5
JB
5843 {
5844 i.error = invalid_vsib_address;
5845 return 1;
5846 }
5847
43234a1e
L
5848 gas_assert (i.reg_operands == 2 || i.mask);
5849 if (i.reg_operands == 2 && !i.mask)
5850 {
3528c362 5851 gas_assert (i.types[0].bitfield.class == RegSIMD);
1b54b8d7
JB
5852 gas_assert (i.types[0].bitfield.xmmword
5853 || i.types[0].bitfield.ymmword);
3528c362 5854 gas_assert (i.types[2].bitfield.class == RegSIMD);
1b54b8d7
JB
5855 gas_assert (i.types[2].bitfield.xmmword
5856 || i.types[2].bitfield.ymmword);
43234a1e
L
5857 if (operand_check == check_none)
5858 return 0;
5859 if (register_number (i.op[0].regs)
5860 != register_number (i.index_reg)
5861 && register_number (i.op[2].regs)
5862 != register_number (i.index_reg)
5863 && register_number (i.op[0].regs)
5864 != register_number (i.op[2].regs))
5865 return 0;
5866 if (operand_check == check_error)
5867 {
5868 i.error = invalid_vector_register_set;
5869 return 1;
5870 }
5871 as_warn (_("mask, index, and destination registers should be distinct"));
5872 }
8444f82a
MZ
5873 else if (i.reg_operands == 1 && i.mask)
5874 {
3528c362 5875 if (i.types[1].bitfield.class == RegSIMD
1b54b8d7
JB
5876 && (i.types[1].bitfield.xmmword
5877 || i.types[1].bitfield.ymmword
5878 || i.types[1].bitfield.zmmword)
8444f82a
MZ
5879 && (register_number (i.op[1].regs)
5880 == register_number (i.index_reg)))
5881 {
5882 if (operand_check == check_error)
5883 {
5884 i.error = invalid_vector_register_set;
5885 return 1;
5886 }
5887 if (operand_check != check_none)
5888 as_warn (_("index and destination registers should be distinct"));
5889 }
5890 }
43234a1e 5891 }
7bab8ab5 5892
260cd341
LC
5893 /* For AMX instructions with three tmmword operands, all tmmword operand must be
5894 distinct */
5895 if (t->operand_types[0].bitfield.tmmword
5896 && i.reg_operands == 3)
5897 {
5898 if (register_number (i.op[0].regs)
5899 == register_number (i.op[1].regs)
5900 || register_number (i.op[0].regs)
5901 == register_number (i.op[2].regs)
5902 || register_number (i.op[1].regs)
5903 == register_number (i.op[2].regs))
5904 {
5905 i.error = invalid_tmm_register_set;
5906 return 1;
5907 }
5908 }
5909
43234a1e
L
5910 /* Check if broadcast is supported by the instruction and is applied
5911 to the memory operand. */
5912 if (i.broadcast)
5913 {
8e6e0792 5914 i386_operand_type type, overlap;
43234a1e
L
5915
5916 /* Check if specified broadcast is supported in this instruction,
4a1b91ea 5917 and its broadcast bytes match the memory operand. */
32546502 5918 op = i.broadcast->operand;
8e6e0792 5919 if (!t->opcode_modifier.broadcast
c48dadc9 5920 || !(i.flags[op] & Operand_Mem)
c39e5b26 5921 || (!i.types[op].bitfield.unspecified
4a1b91ea 5922 && !match_broadcast_size (t, op)))
43234a1e
L
5923 {
5924 bad_broadcast:
5925 i.error = unsupported_broadcast;
5926 return 1;
5927 }
8e6e0792 5928
4a1b91ea
L
5929 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5930 * i.broadcast->type);
8e6e0792 5931 operand_type_set (&type, 0);
4a1b91ea 5932 switch (i.broadcast->bytes)
8e6e0792 5933 {
4a1b91ea
L
5934 case 2:
5935 type.bitfield.word = 1;
5936 break;
5937 case 4:
5938 type.bitfield.dword = 1;
5939 break;
8e6e0792
JB
5940 case 8:
5941 type.bitfield.qword = 1;
5942 break;
5943 case 16:
5944 type.bitfield.xmmword = 1;
5945 break;
5946 case 32:
5947 type.bitfield.ymmword = 1;
5948 break;
5949 case 64:
5950 type.bitfield.zmmword = 1;
5951 break;
5952 default:
5953 goto bad_broadcast;
5954 }
5955
5956 overlap = operand_type_and (type, t->operand_types[op]);
bc49bfd8
JB
5957 if (t->operand_types[op].bitfield.class == RegSIMD
5958 && t->operand_types[op].bitfield.byte
5959 + t->operand_types[op].bitfield.word
5960 + t->operand_types[op].bitfield.dword
5961 + t->operand_types[op].bitfield.qword > 1)
5962 {
5963 overlap.bitfield.xmmword = 0;
5964 overlap.bitfield.ymmword = 0;
5965 overlap.bitfield.zmmword = 0;
5966 }
8e6e0792
JB
5967 if (operand_type_all_zero (&overlap))
5968 goto bad_broadcast;
5969
5970 if (t->opcode_modifier.checkregsize)
5971 {
5972 unsigned int j;
5973
e2195274 5974 type.bitfield.baseindex = 1;
8e6e0792
JB
5975 for (j = 0; j < i.operands; ++j)
5976 {
5977 if (j != op
5978 && !operand_type_register_match(i.types[j],
5979 t->operand_types[j],
5980 type,
5981 t->operand_types[op]))
5982 goto bad_broadcast;
5983 }
5984 }
43234a1e
L
5985 }
5986 /* If broadcast is supported in this instruction, we need to check if
5987 operand of one-element size isn't specified without broadcast. */
5988 else if (t->opcode_modifier.broadcast && i.mem_operands)
5989 {
5990 /* Find memory operand. */
5991 for (op = 0; op < i.operands; op++)
8dc0818e 5992 if (i.flags[op] & Operand_Mem)
43234a1e
L
5993 break;
5994 gas_assert (op < i.operands);
5995 /* Check size of the memory operand. */
4a1b91ea 5996 if (match_broadcast_size (t, op))
43234a1e
L
5997 {
5998 i.error = broadcast_needed;
5999 return 1;
6000 }
6001 }
c39e5b26
JB
6002 else
6003 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
43234a1e
L
6004
6005 /* Check if requested masking is supported. */
ae2387fe 6006 if (i.mask)
43234a1e 6007 {
ae2387fe
JB
6008 switch (t->opcode_modifier.masking)
6009 {
6010 case BOTH_MASKING:
6011 break;
6012 case MERGING_MASKING:
6013 if (i.mask->zeroing)
6014 {
6015 case 0:
6016 i.error = unsupported_masking;
6017 return 1;
6018 }
6019 break;
6020 case DYNAMIC_MASKING:
6021 /* Memory destinations allow only merging masking. */
6022 if (i.mask->zeroing && i.mem_operands)
6023 {
6024 /* Find memory operand. */
6025 for (op = 0; op < i.operands; op++)
c48dadc9 6026 if (i.flags[op] & Operand_Mem)
ae2387fe
JB
6027 break;
6028 gas_assert (op < i.operands);
6029 if (op == i.operands - 1)
6030 {
6031 i.error = unsupported_masking;
6032 return 1;
6033 }
6034 }
6035 break;
6036 default:
6037 abort ();
6038 }
43234a1e
L
6039 }
6040
6041 /* Check if masking is applied to dest operand. */
6042 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
6043 {
6044 i.error = mask_not_on_destination;
6045 return 1;
6046 }
6047
43234a1e
L
6048 /* Check RC/SAE. */
6049 if (i.rounding)
6050 {
a80195f1
JB
6051 if (!t->opcode_modifier.sae
6052 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
43234a1e
L
6053 {
6054 i.error = unsupported_rc_sae;
6055 return 1;
6056 }
6057 /* If the instruction has several immediate operands and one of
6058 them is rounding, the rounding operand should be the last
6059 immediate operand. */
6060 if (i.imm_operands > 1
6061 && i.rounding->operand != (int) (i.imm_operands - 1))
7bab8ab5 6062 {
43234a1e 6063 i.error = rc_sae_operand_not_last_imm;
7bab8ab5
JB
6064 return 1;
6065 }
6c30d220
L
6066 }
6067
da4977e0
JB
6068 /* Check the special Imm4 cases; must be the first operand. */
6069 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6070 {
6071 if (i.op[0].imms->X_op != O_constant
6072 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6073 {
6074 i.error = bad_imm4;
6075 return 1;
6076 }
6077
6078 /* Turn off Imm<N> so that update_imm won't complain. */
6079 operand_type_set (&i.types[0], 0);
6080 }
6081
43234a1e 6082 /* Check vector Disp8 operand. */
b5014f7a
JB
6083 if (t->opcode_modifier.disp8memshift
6084 && i.disp_encoding != disp_encoding_32bit)
43234a1e
L
6085 {
6086 if (i.broadcast)
4a1b91ea 6087 i.memshift = t->opcode_modifier.broadcast - 1;
7091c612 6088 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
43234a1e 6089 i.memshift = t->opcode_modifier.disp8memshift;
7091c612
JB
6090 else
6091 {
6092 const i386_operand_type *type = NULL;
6093
6094 i.memshift = 0;
6095 for (op = 0; op < i.operands; op++)
8dc0818e 6096 if (i.flags[op] & Operand_Mem)
7091c612 6097 {
4174bfff
JB
6098 if (t->opcode_modifier.evex == EVEXLIG)
6099 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6100 else if (t->operand_types[op].bitfield.xmmword
6101 + t->operand_types[op].bitfield.ymmword
6102 + t->operand_types[op].bitfield.zmmword <= 1)
7091c612
JB
6103 type = &t->operand_types[op];
6104 else if (!i.types[op].bitfield.unspecified)
6105 type = &i.types[op];
6106 }
3528c362 6107 else if (i.types[op].bitfield.class == RegSIMD
4174bfff 6108 && t->opcode_modifier.evex != EVEXLIG)
7091c612
JB
6109 {
6110 if (i.types[op].bitfield.zmmword)
6111 i.memshift = 6;
6112 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6113 i.memshift = 5;
6114 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6115 i.memshift = 4;
6116 }
6117
6118 if (type)
6119 {
6120 if (type->bitfield.zmmword)
6121 i.memshift = 6;
6122 else if (type->bitfield.ymmword)
6123 i.memshift = 5;
6124 else if (type->bitfield.xmmword)
6125 i.memshift = 4;
6126 }
6127
6128 /* For the check in fits_in_disp8(). */
6129 if (i.memshift == 0)
6130 i.memshift = -1;
6131 }
43234a1e
L
6132
6133 for (op = 0; op < i.operands; op++)
6134 if (operand_type_check (i.types[op], disp)
6135 && i.op[op].disps->X_op == O_constant)
6136 {
b5014f7a 6137 if (fits_in_disp8 (i.op[op].disps->X_add_number))
43234a1e 6138 {
b5014f7a
JB
6139 i.types[op].bitfield.disp8 = 1;
6140 return 0;
43234a1e 6141 }
b5014f7a 6142 i.types[op].bitfield.disp8 = 0;
43234a1e
L
6143 }
6144 }
b5014f7a
JB
6145
6146 i.memshift = 0;
43234a1e 6147
6c30d220
L
6148 return 0;
6149}
6150
da4977e0 6151/* Check if encoding requirements are met by the instruction. */
a683cc34
SP
6152
6153static int
da4977e0 6154VEX_check_encoding (const insn_template *t)
a683cc34 6155{
da4977e0
JB
6156 if (i.vec_encoding == vex_encoding_error)
6157 {
6158 i.error = unsupported;
6159 return 1;
6160 }
6161
86fa6981 6162 if (i.vec_encoding == vex_encoding_evex)
43234a1e 6163 {
86fa6981 6164 /* This instruction must be encoded with EVEX prefix. */
e771e7c9 6165 if (!is_evex_encoding (t))
86fa6981
L
6166 {
6167 i.error = unsupported;
6168 return 1;
6169 }
6170 return 0;
43234a1e
L
6171 }
6172
a683cc34 6173 if (!t->opcode_modifier.vex)
86fa6981
L
6174 {
6175 /* This instruction template doesn't have VEX prefix. */
6176 if (i.vec_encoding != vex_encoding_default)
6177 {
6178 i.error = unsupported;
6179 return 1;
6180 }
6181 return 0;
6182 }
a683cc34 6183
a683cc34
SP
6184 return 0;
6185}
6186
d3ce72d0 6187static const insn_template *
83b16ac6 6188match_template (char mnem_suffix)
29b0f896
AM
6189{
6190 /* Points to template once we've found it. */
d3ce72d0 6191 const insn_template *t;
40fb9820 6192 i386_operand_type overlap0, overlap1, overlap2, overlap3;
c0f3af97 6193 i386_operand_type overlap4;
29b0f896 6194 unsigned int found_reverse_match;
dc2be329 6195 i386_opcode_modifier suffix_check;
40fb9820 6196 i386_operand_type operand_types [MAX_OPERANDS];
539e75ad 6197 int addr_prefix_disp;
45a4bb20 6198 unsigned int j, size_match, check_register;
5614d22c 6199 enum i386_error specific_error = 0;
29b0f896 6200
c0f3af97
L
6201#if MAX_OPERANDS != 5
6202# error "MAX_OPERANDS must be 5."
f48ff2ae
L
6203#endif
6204
29b0f896 6205 found_reverse_match = 0;
539e75ad 6206 addr_prefix_disp = -1;
40fb9820 6207
dc2be329 6208 /* Prepare for mnemonic suffix check. */
40fb9820 6209 memset (&suffix_check, 0, sizeof (suffix_check));
dc2be329
L
6210 switch (mnem_suffix)
6211 {
6212 case BYTE_MNEM_SUFFIX:
6213 suffix_check.no_bsuf = 1;
6214 break;
6215 case WORD_MNEM_SUFFIX:
6216 suffix_check.no_wsuf = 1;
6217 break;
6218 case SHORT_MNEM_SUFFIX:
6219 suffix_check.no_ssuf = 1;
6220 break;
6221 case LONG_MNEM_SUFFIX:
6222 suffix_check.no_lsuf = 1;
6223 break;
6224 case QWORD_MNEM_SUFFIX:
6225 suffix_check.no_qsuf = 1;
6226 break;
6227 default:
6228 /* NB: In Intel syntax, normally we can check for memory operand
6229 size when there is no mnemonic suffix. But jmp and call have
6230 2 different encodings with Dword memory operand size, one with
6231 No_ldSuf and the other without. i.suffix is set to
6232 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6233 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6234 suffix_check.no_ldsuf = 1;
83b16ac6
JB
6235 }
6236
01559ecc
L
6237 /* Must have right number of operands. */
6238 i.error = number_of_operands_mismatch;
6239
45aa61fe 6240 for (t = current_templates->start; t < current_templates->end; t++)
29b0f896 6241 {
539e75ad 6242 addr_prefix_disp = -1;
dbbc8b7e 6243 found_reverse_match = 0;
539e75ad 6244
29b0f896
AM
6245 if (i.operands != t->operands)
6246 continue;
6247
50aecf8c 6248 /* Check processor support. */
a65babc9 6249 i.error = unsupported;
45a4bb20 6250 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
50aecf8c
L
6251 continue;
6252
e1d4d893 6253 /* Check AT&T mnemonic. */
a65babc9 6254 i.error = unsupported_with_intel_mnemonic;
e1d4d893 6255 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
1efbbeb4
L
6256 continue;
6257
4b5aaf5f 6258 /* Check AT&T/Intel syntax. */
a65babc9 6259 i.error = unsupported_syntax;
5c07affc 6260 if ((intel_syntax && t->opcode_modifier.attsyntax)
4b5aaf5f 6261 || (!intel_syntax && t->opcode_modifier.intelsyntax))
1efbbeb4
L
6262 continue;
6263
4b5aaf5f
L
6264 /* Check Intel64/AMD64 ISA. */
6265 switch (isa64)
6266 {
6267 default:
6268 /* Default: Don't accept Intel64. */
6269 if (t->opcode_modifier.isa64 == INTEL64)
6270 continue;
6271 break;
6272 case amd64:
6273 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6274 if (t->opcode_modifier.isa64 >= INTEL64)
6275 continue;
6276 break;
6277 case intel64:
6278 /* -mintel64: Don't accept AMD64. */
5990e377 6279 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
4b5aaf5f
L
6280 continue;
6281 break;
6282 }
6283
dc2be329 6284 /* Check the suffix. */
a65babc9 6285 i.error = invalid_instruction_suffix;
dc2be329
L
6286 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6287 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6288 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6289 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6290 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6291 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
83b16ac6 6292 continue;
29b0f896 6293
3ac21baa
JB
6294 size_match = operand_size_match (t);
6295 if (!size_match)
7d5e4556 6296 continue;
539e75ad 6297
6f2f06be
JB
6298 /* This is intentionally not
6299
0cfa3eb3 6300 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6f2f06be
JB
6301
6302 as the case of a missing * on the operand is accepted (perhaps with
6303 a warning, issued further down). */
0cfa3eb3 6304 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6f2f06be
JB
6305 {
6306 i.error = operand_type_mismatch;
6307 continue;
6308 }
6309
5c07affc
L
6310 for (j = 0; j < MAX_OPERANDS; j++)
6311 operand_types[j] = t->operand_types[j];
6312
e365e234
JB
6313 /* In general, don't allow
6314 - 64-bit operands outside of 64-bit mode,
6315 - 32-bit operands on pre-386. */
4873e243 6316 j = i.imm_operands + (t->operands > i.imm_operands + 1);
e365e234
JB
6317 if (((i.suffix == QWORD_MNEM_SUFFIX
6318 && flag_code != CODE_64BIT
6319 && (t->base_opcode != 0x0fc7
6320 || t->extension_opcode != 1 /* cmpxchg8b */))
6321 || (i.suffix == LONG_MNEM_SUFFIX
6322 && !cpu_arch_flags.bitfield.cpui386))
45aa61fe 6323 && (intel_syntax
3cd7f3e3 6324 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
45aa61fe
AM
6325 && !intel_float_operand (t->name))
6326 : intel_float_operand (t->name) != 2)
4873e243
JB
6327 && (t->operands == i.imm_operands
6328 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6329 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6330 && operand_types[i.imm_operands].bitfield.class != RegMask)
6331 || (operand_types[j].bitfield.class != RegMMX
6332 && operand_types[j].bitfield.class != RegSIMD
6333 && operand_types[j].bitfield.class != RegMask))
63112cd6 6334 && !t->opcode_modifier.sib)
192dc9c6
JB
6335 continue;
6336
29b0f896 6337 /* Do not verify operands when there are none. */
e365e234 6338 if (!t->operands)
da4977e0
JB
6339 {
6340 if (VEX_check_encoding (t))
6341 {
6342 specific_error = i.error;
6343 continue;
6344 }
6345
6346 /* We've found a match; break out of loop. */
6347 break;
6348 }
252b5132 6349
48bcea9f
JB
6350 if (!t->opcode_modifier.jump
6351 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6352 {
6353 /* There should be only one Disp operand. */
6354 for (j = 0; j < MAX_OPERANDS; j++)
6355 if (operand_type_check (operand_types[j], disp))
539e75ad 6356 break;
48bcea9f
JB
6357 if (j < MAX_OPERANDS)
6358 {
6359 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6360
6361 addr_prefix_disp = j;
6362
6363 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6364 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6365 switch (flag_code)
40fb9820 6366 {
48bcea9f
JB
6367 case CODE_16BIT:
6368 override = !override;
6369 /* Fall through. */
6370 case CODE_32BIT:
6371 if (operand_types[j].bitfield.disp32
6372 && operand_types[j].bitfield.disp16)
40fb9820 6373 {
48bcea9f
JB
6374 operand_types[j].bitfield.disp16 = override;
6375 operand_types[j].bitfield.disp32 = !override;
40fb9820 6376 }
48bcea9f
JB
6377 operand_types[j].bitfield.disp32s = 0;
6378 operand_types[j].bitfield.disp64 = 0;
6379 break;
6380
6381 case CODE_64BIT:
6382 if (operand_types[j].bitfield.disp32s
6383 || operand_types[j].bitfield.disp64)
40fb9820 6384 {
48bcea9f
JB
6385 operand_types[j].bitfield.disp64 &= !override;
6386 operand_types[j].bitfield.disp32s &= !override;
6387 operand_types[j].bitfield.disp32 = override;
40fb9820 6388 }
48bcea9f
JB
6389 operand_types[j].bitfield.disp16 = 0;
6390 break;
40fb9820 6391 }
539e75ad 6392 }
48bcea9f 6393 }
539e75ad 6394
02a86693
L
6395 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6396 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6397 continue;
6398
56ffb741 6399 /* We check register size if needed. */
e2195274
JB
6400 if (t->opcode_modifier.checkregsize)
6401 {
6402 check_register = (1 << t->operands) - 1;
6403 if (i.broadcast)
6404 check_register &= ~(1 << i.broadcast->operand);
6405 }
6406 else
6407 check_register = 0;
6408
c6fb90c8 6409 overlap0 = operand_type_and (i.types[0], operand_types[0]);
29b0f896
AM
6410 switch (t->operands)
6411 {
6412 case 1:
40fb9820 6413 if (!operand_type_match (overlap0, i.types[0]))
29b0f896
AM
6414 continue;
6415 break;
6416 case 2:
33eaf5de 6417 /* xchg %eax, %eax is a special case. It is an alias for nop
8b38ad71
L
6418 only in 32bit mode and we can use opcode 0x90. In 64bit
6419 mode, we can't use 0x90 for xchg %eax, %eax since it should
6420 zero-extend %eax to %rax. */
6421 if (flag_code == CODE_64BIT
6422 && t->base_opcode == 0x90
75e5731b
JB
6423 && i.types[0].bitfield.instance == Accum
6424 && i.types[0].bitfield.dword
6425 && i.types[1].bitfield.instance == Accum
6426 && i.types[1].bitfield.dword)
8b38ad71 6427 continue;
1212781b
JB
6428 /* xrelease mov %eax, <disp> is another special case. It must not
6429 match the accumulator-only encoding of mov. */
6430 if (flag_code != CODE_64BIT
6431 && i.hle_prefix
6432 && t->base_opcode == 0xa0
75e5731b 6433 && i.types[0].bitfield.instance == Accum
8dc0818e 6434 && (i.flags[1] & Operand_Mem))
1212781b 6435 continue;
f5eb1d70
JB
6436 /* Fall through. */
6437
6438 case 3:
3ac21baa
JB
6439 if (!(size_match & MATCH_STRAIGHT))
6440 goto check_reverse;
64c49ab3
JB
6441 /* Reverse direction of operands if swapping is possible in the first
6442 place (operands need to be symmetric) and
6443 - the load form is requested, and the template is a store form,
6444 - the store form is requested, and the template is a load form,
6445 - the non-default (swapped) form is requested. */
6446 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
f5eb1d70 6447 if (t->opcode_modifier.d && i.reg_operands == i.operands
64c49ab3
JB
6448 && !operand_type_all_zero (&overlap1))
6449 switch (i.dir_encoding)
6450 {
6451 case dir_encoding_load:
6452 if (operand_type_check (operand_types[i.operands - 1], anymem)
dfd69174 6453 || t->opcode_modifier.regmem)
64c49ab3
JB
6454 goto check_reverse;
6455 break;
6456
6457 case dir_encoding_store:
6458 if (!operand_type_check (operand_types[i.operands - 1], anymem)
dfd69174 6459 && !t->opcode_modifier.regmem)
64c49ab3
JB
6460 goto check_reverse;
6461 break;
6462
6463 case dir_encoding_swap:
6464 goto check_reverse;
6465
6466 case dir_encoding_default:
6467 break;
6468 }
86fa6981 6469 /* If we want store form, we skip the current load. */
64c49ab3
JB
6470 if ((i.dir_encoding == dir_encoding_store
6471 || i.dir_encoding == dir_encoding_swap)
86fa6981
L
6472 && i.mem_operands == 0
6473 && t->opcode_modifier.load)
fa99fab2 6474 continue;
1a0670f3 6475 /* Fall through. */
f48ff2ae 6476 case 4:
c0f3af97 6477 case 5:
c6fb90c8 6478 overlap1 = operand_type_and (i.types[1], operand_types[1]);
40fb9820
L
6479 if (!operand_type_match (overlap0, i.types[0])
6480 || !operand_type_match (overlap1, i.types[1])
e2195274 6481 || ((check_register & 3) == 3
dc821c5f 6482 && !operand_type_register_match (i.types[0],
40fb9820 6483 operand_types[0],
dc821c5f 6484 i.types[1],
40fb9820 6485 operand_types[1])))
29b0f896
AM
6486 {
6487 /* Check if other direction is valid ... */
38e314eb 6488 if (!t->opcode_modifier.d)
29b0f896
AM
6489 continue;
6490
dc1e8a47 6491 check_reverse:
3ac21baa
JB
6492 if (!(size_match & MATCH_REVERSE))
6493 continue;
29b0f896 6494 /* Try reversing direction of operands. */
f5eb1d70
JB
6495 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6496 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
40fb9820 6497 if (!operand_type_match (overlap0, i.types[0])
f5eb1d70 6498 || !operand_type_match (overlap1, i.types[i.operands - 1])
45664ddb 6499 || (check_register
dc821c5f 6500 && !operand_type_register_match (i.types[0],
f5eb1d70
JB
6501 operand_types[i.operands - 1],
6502 i.types[i.operands - 1],
45664ddb 6503 operand_types[0])))
29b0f896
AM
6504 {
6505 /* Does not match either direction. */
6506 continue;
6507 }
38e314eb 6508 /* found_reverse_match holds which of D or FloatR
29b0f896 6509 we've found. */
38e314eb
JB
6510 if (!t->opcode_modifier.d)
6511 found_reverse_match = 0;
6512 else if (operand_types[0].bitfield.tbyte)
8a2ed489 6513 found_reverse_match = Opcode_FloatD;
dbbc8b7e 6514 else if (operand_types[0].bitfield.xmmword
f5eb1d70 6515 || operand_types[i.operands - 1].bitfield.xmmword
3528c362
JB
6516 || operand_types[0].bitfield.class == RegMMX
6517 || operand_types[i.operands - 1].bitfield.class == RegMMX
dbbc8b7e
JB
6518 || is_any_vex_encoding(t))
6519 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6520 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
8a2ed489 6521 else
38e314eb 6522 found_reverse_match = Opcode_D;
40fb9820 6523 if (t->opcode_modifier.floatr)
8a2ed489 6524 found_reverse_match |= Opcode_FloatR;
29b0f896 6525 }
f48ff2ae 6526 else
29b0f896 6527 {
f48ff2ae 6528 /* Found a forward 2 operand match here. */
d1cbb4db
L
6529 switch (t->operands)
6530 {
c0f3af97
L
6531 case 5:
6532 overlap4 = operand_type_and (i.types[4],
6533 operand_types[4]);
1a0670f3 6534 /* Fall through. */
d1cbb4db 6535 case 4:
c6fb90c8
L
6536 overlap3 = operand_type_and (i.types[3],
6537 operand_types[3]);
1a0670f3 6538 /* Fall through. */
d1cbb4db 6539 case 3:
c6fb90c8
L
6540 overlap2 = operand_type_and (i.types[2],
6541 operand_types[2]);
d1cbb4db
L
6542 break;
6543 }
29b0f896 6544
f48ff2ae
L
6545 switch (t->operands)
6546 {
c0f3af97
L
6547 case 5:
6548 if (!operand_type_match (overlap4, i.types[4])
dc821c5f 6549 || !operand_type_register_match (i.types[3],
c0f3af97 6550 operand_types[3],
c0f3af97
L
6551 i.types[4],
6552 operand_types[4]))
6553 continue;
1a0670f3 6554 /* Fall through. */
f48ff2ae 6555 case 4:
40fb9820 6556 if (!operand_type_match (overlap3, i.types[3])
e2195274
JB
6557 || ((check_register & 0xa) == 0xa
6558 && !operand_type_register_match (i.types[1],
f7768225
JB
6559 operand_types[1],
6560 i.types[3],
e2195274
JB
6561 operand_types[3]))
6562 || ((check_register & 0xc) == 0xc
6563 && !operand_type_register_match (i.types[2],
6564 operand_types[2],
6565 i.types[3],
6566 operand_types[3])))
f48ff2ae 6567 continue;
1a0670f3 6568 /* Fall through. */
f48ff2ae
L
6569 case 3:
6570 /* Here we make use of the fact that there are no
23e42951 6571 reverse match 3 operand instructions. */
40fb9820 6572 if (!operand_type_match (overlap2, i.types[2])
e2195274
JB
6573 || ((check_register & 5) == 5
6574 && !operand_type_register_match (i.types[0],
23e42951
JB
6575 operand_types[0],
6576 i.types[2],
e2195274
JB
6577 operand_types[2]))
6578 || ((check_register & 6) == 6
6579 && !operand_type_register_match (i.types[1],
6580 operand_types[1],
6581 i.types[2],
6582 operand_types[2])))
f48ff2ae
L
6583 continue;
6584 break;
6585 }
29b0f896 6586 }
f48ff2ae 6587 /* Found either forward/reverse 2, 3 or 4 operand match here:
29b0f896
AM
6588 slip through to break. */
6589 }
c0f3af97 6590
da4977e0
JB
6591 /* Check if vector operands are valid. */
6592 if (check_VecOperands (t))
6593 {
6594 specific_error = i.error;
6595 continue;
6596 }
6597
6598 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6599 if (VEX_check_encoding (t))
5614d22c
JB
6600 {
6601 specific_error = i.error;
6602 continue;
6603 }
a683cc34 6604
29b0f896
AM
6605 /* We've found a match; break out of loop. */
6606 break;
6607 }
6608
6609 if (t == current_templates->end)
6610 {
6611 /* We found no match. */
a65babc9 6612 const char *err_msg;
5614d22c 6613 switch (specific_error ? specific_error : i.error)
a65babc9
L
6614 {
6615 default:
6616 abort ();
86e026a4 6617 case operand_size_mismatch:
a65babc9
L
6618 err_msg = _("operand size mismatch");
6619 break;
6620 case operand_type_mismatch:
6621 err_msg = _("operand type mismatch");
6622 break;
6623 case register_type_mismatch:
6624 err_msg = _("register type mismatch");
6625 break;
6626 case number_of_operands_mismatch:
6627 err_msg = _("number of operands mismatch");
6628 break;
6629 case invalid_instruction_suffix:
6630 err_msg = _("invalid instruction suffix");
6631 break;
6632 case bad_imm4:
4a2608e3 6633 err_msg = _("constant doesn't fit in 4 bits");
a65babc9 6634 break;
a65babc9
L
6635 case unsupported_with_intel_mnemonic:
6636 err_msg = _("unsupported with Intel mnemonic");
6637 break;
6638 case unsupported_syntax:
6639 err_msg = _("unsupported syntax");
6640 break;
6641 case unsupported:
35262a23 6642 as_bad (_("unsupported instruction `%s'"),
10efe3f6
L
6643 current_templates->start->name);
6644 return NULL;
260cd341
LC
6645 case invalid_sib_address:
6646 err_msg = _("invalid SIB address");
6647 break;
6c30d220
L
6648 case invalid_vsib_address:
6649 err_msg = _("invalid VSIB address");
6650 break;
7bab8ab5
JB
6651 case invalid_vector_register_set:
6652 err_msg = _("mask, index, and destination registers must be distinct");
6653 break;
260cd341
LC
6654 case invalid_tmm_register_set:
6655 err_msg = _("all tmm registers must be distinct");
6656 break;
6c30d220
L
6657 case unsupported_vector_index_register:
6658 err_msg = _("unsupported vector index register");
6659 break;
43234a1e
L
6660 case unsupported_broadcast:
6661 err_msg = _("unsupported broadcast");
6662 break;
43234a1e
L
6663 case broadcast_needed:
6664 err_msg = _("broadcast is needed for operand of such type");
6665 break;
6666 case unsupported_masking:
6667 err_msg = _("unsupported masking");
6668 break;
6669 case mask_not_on_destination:
6670 err_msg = _("mask not on destination operand");
6671 break;
6672 case no_default_mask:
6673 err_msg = _("default mask isn't allowed");
6674 break;
6675 case unsupported_rc_sae:
6676 err_msg = _("unsupported static rounding/sae");
6677 break;
6678 case rc_sae_operand_not_last_imm:
6679 if (intel_syntax)
6680 err_msg = _("RC/SAE operand must precede immediate operands");
6681 else
6682 err_msg = _("RC/SAE operand must follow immediate operands");
6683 break;
6684 case invalid_register_operand:
6685 err_msg = _("invalid register operand");
6686 break;
a65babc9
L
6687 }
6688 as_bad (_("%s for `%s'"), err_msg,
891edac4 6689 current_templates->start->name);
fa99fab2 6690 return NULL;
29b0f896 6691 }
252b5132 6692
29b0f896
AM
6693 if (!quiet_warnings)
6694 {
6695 if (!intel_syntax
0cfa3eb3 6696 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6f2f06be 6697 as_warn (_("indirect %s without `*'"), t->name);
29b0f896 6698
40fb9820 6699 if (t->opcode_modifier.isprefix
3cd7f3e3 6700 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
29b0f896
AM
6701 {
6702 /* Warn them that a data or address size prefix doesn't
6703 affect assembly of the next line of code. */
6704 as_warn (_("stand-alone `%s' prefix"), t->name);
6705 }
6706 }
6707
6708 /* Copy the template we found. */
6709 i.tm = *t;
539e75ad
L
6710
6711 if (addr_prefix_disp != -1)
6712 i.tm.operand_types[addr_prefix_disp]
6713 = operand_types[addr_prefix_disp];
6714
29b0f896
AM
6715 if (found_reverse_match)
6716 {
dfd69174
JB
6717 /* If we found a reverse match we must alter the opcode direction
6718 bit and clear/flip the regmem modifier one. found_reverse_match
6719 holds bits to change (different for int & float insns). */
29b0f896
AM
6720
6721 i.tm.base_opcode ^= found_reverse_match;
6722
f5eb1d70
JB
6723 i.tm.operand_types[0] = operand_types[i.operands - 1];
6724 i.tm.operand_types[i.operands - 1] = operand_types[0];
dfd69174
JB
6725
6726 /* Certain SIMD insns have their load forms specified in the opcode
6727 table, and hence we need to _set_ RegMem instead of clearing it.
6728 We need to avoid setting the bit though on insns like KMOVW. */
6729 i.tm.opcode_modifier.regmem
6730 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6731 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6732 && !i.tm.opcode_modifier.regmem;
29b0f896
AM
6733 }
6734
fa99fab2 6735 return t;
29b0f896
AM
6736}
6737
6738static int
e3bb37b5 6739check_string (void)
29b0f896 6740{
51c8edf6
JB
6741 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6742 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
8dc0818e 6743
51c8edf6 6744 if (i.seg[op] != NULL && i.seg[op] != &es)
29b0f896 6745 {
51c8edf6
JB
6746 as_bad (_("`%s' operand %u must use `%ses' segment"),
6747 i.tm.name,
6748 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6749 register_prefix);
6750 return 0;
29b0f896 6751 }
51c8edf6
JB
6752
6753 /* There's only ever one segment override allowed per instruction.
6754 This instruction possibly has a legal segment override on the
6755 second operand, so copy the segment to where non-string
6756 instructions store it, allowing common code. */
6757 i.seg[op] = i.seg[1];
6758
29b0f896
AM
6759 return 1;
6760}
6761
6762static int
543613e9 6763process_suffix (void)
29b0f896
AM
6764{
6765 /* If matched instruction specifies an explicit instruction mnemonic
6766 suffix, use it. */
673fe0f0 6767 if (i.tm.opcode_modifier.size == SIZE16)
40fb9820 6768 i.suffix = WORD_MNEM_SUFFIX;
673fe0f0 6769 else if (i.tm.opcode_modifier.size == SIZE32)
40fb9820 6770 i.suffix = LONG_MNEM_SUFFIX;
673fe0f0 6771 else if (i.tm.opcode_modifier.size == SIZE64)
40fb9820 6772 i.suffix = QWORD_MNEM_SUFFIX;
13e600d0 6773 else if (i.reg_operands
c8f8eebc
JB
6774 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6775 && !i.tm.opcode_modifier.addrprefixopreg)
29b0f896 6776 {
65fca059
JB
6777 unsigned int numop = i.operands;
6778
6779 /* movsx/movzx want only their source operand considered here, for the
6780 ambiguity checking below. The suffix will be replaced afterwards
6781 to represent the destination (register). */
6782 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6783 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6784 --i.operands;
6785
643bb870
JB
6786 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6787 if (i.tm.base_opcode == 0xf20f38f0
6788 && i.tm.operand_types[1].bitfield.qword)
6789 i.rex |= REX_W;
6790
29b0f896 6791 /* If there's no instruction mnemonic suffix we try to invent one
13e600d0 6792 based on GPR operands. */
29b0f896
AM
6793 if (!i.suffix)
6794 {
6795 /* We take i.suffix from the last register operand specified,
6796 Destination register type is more significant than source
381d071f
L
6797 register type. crc32 in SSE4.2 prefers source register
6798 type. */
1a035124 6799 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
20592a94 6800
1a035124
JB
6801 while (op--)
6802 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6803 || i.tm.operand_types[op].bitfield.instance == Accum)
6804 {
6805 if (i.types[op].bitfield.class != Reg)
6806 continue;
6807 if (i.types[op].bitfield.byte)
6808 i.suffix = BYTE_MNEM_SUFFIX;
6809 else if (i.types[op].bitfield.word)
6810 i.suffix = WORD_MNEM_SUFFIX;
6811 else if (i.types[op].bitfield.dword)
6812 i.suffix = LONG_MNEM_SUFFIX;
6813 else if (i.types[op].bitfield.qword)
6814 i.suffix = QWORD_MNEM_SUFFIX;
6815 else
6816 continue;
6817 break;
6818 }
65fca059
JB
6819
6820 /* As an exception, movsx/movzx silently default to a byte source
6821 in AT&T mode. */
6822 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6823 && !i.suffix && !intel_syntax)
6824 i.suffix = BYTE_MNEM_SUFFIX;
29b0f896
AM
6825 }
6826 else if (i.suffix == BYTE_MNEM_SUFFIX)
6827 {
2eb952a4 6828 if (intel_syntax
3cd7f3e3 6829 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
2eb952a4
L
6830 && i.tm.opcode_modifier.no_bsuf)
6831 i.suffix = 0;
6832 else if (!check_byte_reg ())
29b0f896
AM
6833 return 0;
6834 }
6835 else if (i.suffix == LONG_MNEM_SUFFIX)
6836 {
2eb952a4 6837 if (intel_syntax
3cd7f3e3 6838 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
9f123b91
JB
6839 && i.tm.opcode_modifier.no_lsuf
6840 && !i.tm.opcode_modifier.todword
6841 && !i.tm.opcode_modifier.toqword)
2eb952a4
L
6842 i.suffix = 0;
6843 else if (!check_long_reg ())
29b0f896
AM
6844 return 0;
6845 }
6846 else if (i.suffix == QWORD_MNEM_SUFFIX)
6847 {
955e1e6a 6848 if (intel_syntax
3cd7f3e3 6849 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
9f123b91
JB
6850 && i.tm.opcode_modifier.no_qsuf
6851 && !i.tm.opcode_modifier.todword
6852 && !i.tm.opcode_modifier.toqword)
955e1e6a
L
6853 i.suffix = 0;
6854 else if (!check_qword_reg ())
29b0f896
AM
6855 return 0;
6856 }
6857 else if (i.suffix == WORD_MNEM_SUFFIX)
6858 {
2eb952a4 6859 if (intel_syntax
3cd7f3e3 6860 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
2eb952a4
L
6861 && i.tm.opcode_modifier.no_wsuf)
6862 i.suffix = 0;
6863 else if (!check_word_reg ())
29b0f896
AM
6864 return 0;
6865 }
3cd7f3e3
L
6866 else if (intel_syntax
6867 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
29b0f896
AM
6868 /* Do nothing if the instruction is going to ignore the prefix. */
6869 ;
6870 else
6871 abort ();
65fca059
JB
6872
6873 /* Undo the movsx/movzx change done above. */
6874 i.operands = numop;
29b0f896 6875 }
3cd7f3e3
L
6876 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6877 && !i.suffix)
29b0f896 6878 {
13e600d0
JB
6879 i.suffix = stackop_size;
6880 if (stackop_size == LONG_MNEM_SUFFIX)
06f74c5c
L
6881 {
6882 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6883 .code16gcc directive to support 16-bit mode with
6884 32-bit address. For IRET without a suffix, generate
6885 16-bit IRET (opcode 0xcf) to return from an interrupt
6886 handler. */
13e600d0
JB
6887 if (i.tm.base_opcode == 0xcf)
6888 {
6889 i.suffix = WORD_MNEM_SUFFIX;
6890 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6891 }
6892 /* Warn about changed behavior for segment register push/pop. */
6893 else if ((i.tm.base_opcode | 1) == 0x07)
6894 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6895 i.tm.name);
06f74c5c 6896 }
29b0f896 6897 }
c006a730 6898 else if (!i.suffix
0cfa3eb3
JB
6899 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6900 || i.tm.opcode_modifier.jump == JUMP_BYTE
6901 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
64e74474
AM
6902 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6903 && i.tm.extension_opcode <= 3)))
9306ca4a
JB
6904 {
6905 switch (flag_code)
6906 {
6907 case CODE_64BIT:
40fb9820 6908 if (!i.tm.opcode_modifier.no_qsuf)
9306ca4a 6909 {
828c2a25
JB
6910 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6911 || i.tm.opcode_modifier.no_lsuf)
6912 i.suffix = QWORD_MNEM_SUFFIX;
9306ca4a
JB
6913 break;
6914 }
1a0670f3 6915 /* Fall through. */
9306ca4a 6916 case CODE_32BIT:
40fb9820 6917 if (!i.tm.opcode_modifier.no_lsuf)
9306ca4a
JB
6918 i.suffix = LONG_MNEM_SUFFIX;
6919 break;
6920 case CODE_16BIT:
40fb9820 6921 if (!i.tm.opcode_modifier.no_wsuf)
9306ca4a
JB
6922 i.suffix = WORD_MNEM_SUFFIX;
6923 break;
6924 }
6925 }
252b5132 6926
c006a730 6927 if (!i.suffix
3cd7f3e3 6928 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
873494c8
JB
6929 /* Also cover lret/retf/iret in 64-bit mode. */
6930 || (flag_code == CODE_64BIT
6931 && !i.tm.opcode_modifier.no_lsuf
6932 && !i.tm.opcode_modifier.no_qsuf))
3cd7f3e3 6933 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
8bbb3ad8
JB
6934 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6935 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
62b3f548
JB
6936 /* Accept FLDENV et al without suffix. */
6937 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
29b0f896 6938 {
6c0946d0 6939 unsigned int suffixes, evex = 0;
c006a730
JB
6940
6941 suffixes = !i.tm.opcode_modifier.no_bsuf;
6942 if (!i.tm.opcode_modifier.no_wsuf)
6943 suffixes |= 1 << 1;
6944 if (!i.tm.opcode_modifier.no_lsuf)
6945 suffixes |= 1 << 2;
6946 if (!i.tm.opcode_modifier.no_ldsuf)
6947 suffixes |= 1 << 3;
6948 if (!i.tm.opcode_modifier.no_ssuf)
6949 suffixes |= 1 << 4;
6950 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6951 suffixes |= 1 << 5;
6952
6c0946d0
JB
6953 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6954 also suitable for AT&T syntax mode, it was requested that this be
6955 restricted to just Intel syntax. */
b9915cbc 6956 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6c0946d0 6957 {
b9915cbc 6958 unsigned int op;
6c0946d0 6959
b9915cbc 6960 for (op = 0; op < i.tm.operands; ++op)
6c0946d0 6961 {
b9915cbc
JB
6962 if (is_evex_encoding (&i.tm)
6963 && !cpu_arch_flags.bitfield.cpuavx512vl)
6c0946d0 6964 {
b9915cbc
JB
6965 if (i.tm.operand_types[op].bitfield.ymmword)
6966 i.tm.operand_types[op].bitfield.xmmword = 0;
6967 if (i.tm.operand_types[op].bitfield.zmmword)
6968 i.tm.operand_types[op].bitfield.ymmword = 0;
6969 if (!i.tm.opcode_modifier.evex
6970 || i.tm.opcode_modifier.evex == EVEXDYN)
6971 i.tm.opcode_modifier.evex = EVEX512;
6972 }
6c0946d0 6973
b9915cbc
JB
6974 if (i.tm.operand_types[op].bitfield.xmmword
6975 + i.tm.operand_types[op].bitfield.ymmword
6976 + i.tm.operand_types[op].bitfield.zmmword < 2)
6977 continue;
6c0946d0 6978
b9915cbc
JB
6979 /* Any properly sized operand disambiguates the insn. */
6980 if (i.types[op].bitfield.xmmword
6981 || i.types[op].bitfield.ymmword
6982 || i.types[op].bitfield.zmmword)
6983 {
6984 suffixes &= ~(7 << 6);
6985 evex = 0;
6986 break;
6987 }
6c0946d0 6988
b9915cbc
JB
6989 if ((i.flags[op] & Operand_Mem)
6990 && i.tm.operand_types[op].bitfield.unspecified)
6991 {
6992 if (i.tm.operand_types[op].bitfield.xmmword)
6993 suffixes |= 1 << 6;
6994 if (i.tm.operand_types[op].bitfield.ymmword)
6995 suffixes |= 1 << 7;
6996 if (i.tm.operand_types[op].bitfield.zmmword)
6997 suffixes |= 1 << 8;
6998 if (is_evex_encoding (&i.tm))
6999 evex = EVEX512;
6c0946d0
JB
7000 }
7001 }
7002 }
7003
7004 /* Are multiple suffixes / operand sizes allowed? */
c006a730 7005 if (suffixes & (suffixes - 1))
9306ca4a 7006 {
873494c8 7007 if (intel_syntax
3cd7f3e3 7008 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
873494c8 7009 || operand_check == check_error))
9306ca4a 7010 {
c006a730 7011 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
9306ca4a
JB
7012 return 0;
7013 }
c006a730 7014 if (operand_check == check_error)
9306ca4a 7015 {
c006a730
JB
7016 as_bad (_("no instruction mnemonic suffix given and "
7017 "no register operands; can't size `%s'"), i.tm.name);
9306ca4a
JB
7018 return 0;
7019 }
c006a730 7020 if (operand_check == check_warning)
873494c8
JB
7021 as_warn (_("%s; using default for `%s'"),
7022 intel_syntax
7023 ? _("ambiguous operand size")
7024 : _("no instruction mnemonic suffix given and "
7025 "no register operands"),
7026 i.tm.name);
c006a730
JB
7027
7028 if (i.tm.opcode_modifier.floatmf)
7029 i.suffix = SHORT_MNEM_SUFFIX;
65fca059
JB
7030 else if ((i.tm.base_opcode | 8) == 0xfbe
7031 || (i.tm.base_opcode == 0x63
7032 && i.tm.cpu_flags.bitfield.cpu64))
7033 /* handled below */;
6c0946d0
JB
7034 else if (evex)
7035 i.tm.opcode_modifier.evex = evex;
c006a730
JB
7036 else if (flag_code == CODE_16BIT)
7037 i.suffix = WORD_MNEM_SUFFIX;
1a035124 7038 else if (!i.tm.opcode_modifier.no_lsuf)
c006a730 7039 i.suffix = LONG_MNEM_SUFFIX;
1a035124
JB
7040 else
7041 i.suffix = QWORD_MNEM_SUFFIX;
9306ca4a 7042 }
29b0f896 7043 }
252b5132 7044
65fca059
JB
7045 if ((i.tm.base_opcode | 8) == 0xfbe
7046 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
7047 {
7048 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7049 In AT&T syntax, if there is no suffix (warned about above), the default
7050 will be byte extension. */
7051 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7052 i.tm.base_opcode |= 1;
7053
7054 /* For further processing, the suffix should represent the destination
7055 (register). This is already the case when one was used with
7056 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7057 no suffix to begin with. */
7058 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7059 {
7060 if (i.types[1].bitfield.word)
7061 i.suffix = WORD_MNEM_SUFFIX;
7062 else if (i.types[1].bitfield.qword)
7063 i.suffix = QWORD_MNEM_SUFFIX;
7064 else
7065 i.suffix = LONG_MNEM_SUFFIX;
7066
7067 i.tm.opcode_modifier.w = 0;
7068 }
7069 }
7070
50128d0c
JB
7071 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7072 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7073 != (i.tm.operand_types[1].bitfield.class == Reg);
7074
d2224064
JB
7075 /* Change the opcode based on the operand size given by i.suffix. */
7076 switch (i.suffix)
29b0f896 7077 {
d2224064
JB
7078 /* Size floating point instruction. */
7079 case LONG_MNEM_SUFFIX:
7080 if (i.tm.opcode_modifier.floatmf)
7081 {
7082 i.tm.base_opcode ^= 4;
7083 break;
7084 }
7085 /* fall through */
7086 case WORD_MNEM_SUFFIX:
7087 case QWORD_MNEM_SUFFIX:
29b0f896 7088 /* It's not a byte, select word/dword operation. */
40fb9820 7089 if (i.tm.opcode_modifier.w)
29b0f896 7090 {
50128d0c 7091 if (i.short_form)
29b0f896
AM
7092 i.tm.base_opcode |= 8;
7093 else
7094 i.tm.base_opcode |= 1;
7095 }
d2224064
JB
7096 /* fall through */
7097 case SHORT_MNEM_SUFFIX:
29b0f896
AM
7098 /* Now select between word & dword operations via the operand
7099 size prefix, except for instructions that will ignore this
7100 prefix anyway. */
c8f8eebc 7101 if (i.suffix != QWORD_MNEM_SUFFIX
3cd7f3e3 7102 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
c8f8eebc
JB
7103 && !i.tm.opcode_modifier.floatmf
7104 && !is_any_vex_encoding (&i.tm)
7105 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7106 || (flag_code == CODE_64BIT
7107 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
24eab124
AM
7108 {
7109 unsigned int prefix = DATA_PREFIX_OPCODE;
543613e9 7110
0cfa3eb3 7111 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
29b0f896 7112 prefix = ADDR_PREFIX_OPCODE;
252b5132 7113
29b0f896
AM
7114 if (!add_prefix (prefix))
7115 return 0;
24eab124 7116 }
252b5132 7117
29b0f896
AM
7118 /* Set mode64 for an operand. */
7119 if (i.suffix == QWORD_MNEM_SUFFIX
9146926a 7120 && flag_code == CODE_64BIT
d2224064 7121 && !i.tm.opcode_modifier.norex64
4ed21b58 7122 && !i.tm.opcode_modifier.vexw
46e883c5 7123 /* Special case for xchg %rax,%rax. It is NOP and doesn't
d2224064
JB
7124 need rex64. */
7125 && ! (i.operands == 2
7126 && i.tm.base_opcode == 0x90
7127 && i.tm.extension_opcode == None
75e5731b
JB
7128 && i.types[0].bitfield.instance == Accum
7129 && i.types[0].bitfield.qword
7130 && i.types[1].bitfield.instance == Accum
7131 && i.types[1].bitfield.qword))
d2224064 7132 i.rex |= REX_W;
3e73aa7c 7133
d2224064 7134 break;
8bbb3ad8
JB
7135
7136 case 0:
7137 /* Select word/dword/qword operation with explict data sizing prefix
7138 when there are no suitable register operands. */
7139 if (i.tm.opcode_modifier.w
7140 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7141 && (!i.reg_operands
7142 || (i.reg_operands == 1
7143 /* ShiftCount */
7144 && (i.tm.operand_types[0].bitfield.instance == RegC
7145 /* InOutPortReg */
7146 || i.tm.operand_types[0].bitfield.instance == RegD
7147 || i.tm.operand_types[1].bitfield.instance == RegD
7148 /* CRC32 */
7149 || i.tm.base_opcode == 0xf20f38f0))))
7150 i.tm.base_opcode |= 1;
7151 break;
29b0f896 7152 }
7ecd2f8b 7153
c8f8eebc 7154 if (i.tm.opcode_modifier.addrprefixopreg)
c0a30a9f 7155 {
c8f8eebc
JB
7156 gas_assert (!i.suffix);
7157 gas_assert (i.reg_operands);
c0a30a9f 7158
c8f8eebc
JB
7159 if (i.tm.operand_types[0].bitfield.instance == Accum
7160 || i.operands == 1)
7161 {
7162 /* The address size override prefix changes the size of the
7163 first operand. */
7164 if (flag_code == CODE_64BIT
7165 && i.op[0].regs->reg_type.bitfield.word)
7166 {
7167 as_bad (_("16-bit addressing unavailable for `%s'"),
7168 i.tm.name);
7169 return 0;
7170 }
7171
7172 if ((flag_code == CODE_32BIT
7173 ? i.op[0].regs->reg_type.bitfield.word
7174 : i.op[0].regs->reg_type.bitfield.dword)
7175 && !add_prefix (ADDR_PREFIX_OPCODE))
7176 return 0;
7177 }
c0a30a9f
L
7178 else
7179 {
c8f8eebc
JB
7180 /* Check invalid register operand when the address size override
7181 prefix changes the size of register operands. */
7182 unsigned int op;
7183 enum { need_word, need_dword, need_qword } need;
7184
7185 if (flag_code == CODE_32BIT)
7186 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7187 else if (i.prefix[ADDR_PREFIX])
c0a30a9f
L
7188 need = need_dword;
7189 else
7190 need = flag_code == CODE_64BIT ? need_qword : need_word;
c0a30a9f 7191
c8f8eebc
JB
7192 for (op = 0; op < i.operands; op++)
7193 {
7194 if (i.types[op].bitfield.class != Reg)
7195 continue;
7196
7197 switch (need)
7198 {
7199 case need_word:
7200 if (i.op[op].regs->reg_type.bitfield.word)
7201 continue;
7202 break;
7203 case need_dword:
7204 if (i.op[op].regs->reg_type.bitfield.dword)
7205 continue;
7206 break;
7207 case need_qword:
7208 if (i.op[op].regs->reg_type.bitfield.qword)
7209 continue;
7210 break;
7211 }
7212
7213 as_bad (_("invalid register operand size for `%s'"),
7214 i.tm.name);
7215 return 0;
7216 }
7217 }
c0a30a9f
L
7218 }
7219
29b0f896
AM
7220 return 1;
7221}
3e73aa7c 7222
29b0f896 7223static int
543613e9 7224check_byte_reg (void)
29b0f896
AM
7225{
7226 int op;
543613e9 7227
29b0f896
AM
7228 for (op = i.operands; --op >= 0;)
7229 {
dc821c5f 7230 /* Skip non-register operands. */
bab6aec1 7231 if (i.types[op].bitfield.class != Reg)
dc821c5f
JB
7232 continue;
7233
29b0f896
AM
7234 /* If this is an eight bit register, it's OK. If it's the 16 or
7235 32 bit version of an eight bit register, we will just use the
7236 low portion, and that's OK too. */
dc821c5f 7237 if (i.types[op].bitfield.byte)
29b0f896
AM
7238 continue;
7239
5a819eb9 7240 /* I/O port address operands are OK too. */
75e5731b
JB
7241 if (i.tm.operand_types[op].bitfield.instance == RegD
7242 && i.tm.operand_types[op].bitfield.word)
5a819eb9
JB
7243 continue;
7244
9706160a
JB
7245 /* crc32 only wants its source operand checked here. */
7246 if (i.tm.base_opcode == 0xf20f38f0 && op)
9344ff29
L
7247 continue;
7248
29b0f896 7249 /* Any other register is bad. */
73c76375
JB
7250 as_bad (_("`%s%s' not allowed with `%s%c'"),
7251 register_prefix, i.op[op].regs->reg_name,
7252 i.tm.name, i.suffix);
7253 return 0;
29b0f896
AM
7254 }
7255 return 1;
7256}
7257
7258static int
e3bb37b5 7259check_long_reg (void)
29b0f896
AM
7260{
7261 int op;
7262
7263 for (op = i.operands; --op >= 0;)
dc821c5f 7264 /* Skip non-register operands. */
bab6aec1 7265 if (i.types[op].bitfield.class != Reg)
dc821c5f 7266 continue;
29b0f896
AM
7267 /* Reject eight bit registers, except where the template requires
7268 them. (eg. movzb) */
dc821c5f 7269 else if (i.types[op].bitfield.byte
bab6aec1 7270 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7271 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7272 && (i.tm.operand_types[op].bitfield.word
7273 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7274 {
a540244d
L
7275 as_bad (_("`%s%s' not allowed with `%s%c'"),
7276 register_prefix,
29b0f896
AM
7277 i.op[op].regs->reg_name,
7278 i.tm.name,
7279 i.suffix);
7280 return 0;
7281 }
be4c5e58
L
7282 /* Error if the e prefix on a general reg is missing. */
7283 else if (i.types[op].bitfield.word
bab6aec1 7284 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7285 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7286 && i.tm.operand_types[op].bitfield.dword)
29b0f896 7287 {
be4c5e58
L
7288 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7289 register_prefix, i.op[op].regs->reg_name,
7290 i.suffix);
7291 return 0;
252b5132 7292 }
e4630f71 7293 /* Warn if the r prefix on a general reg is present. */
dc821c5f 7294 else if (i.types[op].bitfield.qword
bab6aec1 7295 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7296 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7297 && i.tm.operand_types[op].bitfield.dword)
252b5132 7298 {
34828aad 7299 if (intel_syntax
65fca059 7300 && i.tm.opcode_modifier.toqword
3528c362 7301 && i.types[0].bitfield.class != RegSIMD)
34828aad 7302 {
ca61edf2 7303 /* Convert to QWORD. We want REX byte. */
34828aad
L
7304 i.suffix = QWORD_MNEM_SUFFIX;
7305 }
7306 else
7307 {
2b5d6a91 7308 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
34828aad
L
7309 register_prefix, i.op[op].regs->reg_name,
7310 i.suffix);
7311 return 0;
7312 }
29b0f896
AM
7313 }
7314 return 1;
7315}
252b5132 7316
29b0f896 7317static int
e3bb37b5 7318check_qword_reg (void)
29b0f896
AM
7319{
7320 int op;
252b5132 7321
29b0f896 7322 for (op = i.operands; --op >= 0; )
dc821c5f 7323 /* Skip non-register operands. */
bab6aec1 7324 if (i.types[op].bitfield.class != Reg)
dc821c5f 7325 continue;
29b0f896
AM
7326 /* Reject eight bit registers, except where the template requires
7327 them. (eg. movzb) */
dc821c5f 7328 else if (i.types[op].bitfield.byte
bab6aec1 7329 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7330 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7331 && (i.tm.operand_types[op].bitfield.word
7332 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7333 {
a540244d
L
7334 as_bad (_("`%s%s' not allowed with `%s%c'"),
7335 register_prefix,
29b0f896
AM
7336 i.op[op].regs->reg_name,
7337 i.tm.name,
7338 i.suffix);
7339 return 0;
7340 }
e4630f71 7341 /* Warn if the r prefix on a general reg is missing. */
dc821c5f
JB
7342 else if ((i.types[op].bitfield.word
7343 || i.types[op].bitfield.dword)
bab6aec1 7344 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7345 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7346 && i.tm.operand_types[op].bitfield.qword)
29b0f896
AM
7347 {
7348 /* Prohibit these changes in the 64bit mode, since the
7349 lowering is more complicated. */
34828aad 7350 if (intel_syntax
ca61edf2 7351 && i.tm.opcode_modifier.todword
3528c362 7352 && i.types[0].bitfield.class != RegSIMD)
34828aad 7353 {
ca61edf2 7354 /* Convert to DWORD. We don't want REX byte. */
34828aad
L
7355 i.suffix = LONG_MNEM_SUFFIX;
7356 }
7357 else
7358 {
2b5d6a91 7359 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
34828aad
L
7360 register_prefix, i.op[op].regs->reg_name,
7361 i.suffix);
7362 return 0;
7363 }
252b5132 7364 }
29b0f896
AM
7365 return 1;
7366}
252b5132 7367
29b0f896 7368static int
e3bb37b5 7369check_word_reg (void)
29b0f896
AM
7370{
7371 int op;
7372 for (op = i.operands; --op >= 0;)
dc821c5f 7373 /* Skip non-register operands. */
bab6aec1 7374 if (i.types[op].bitfield.class != Reg)
dc821c5f 7375 continue;
29b0f896
AM
7376 /* Reject eight bit registers, except where the template requires
7377 them. (eg. movzb) */
dc821c5f 7378 else if (i.types[op].bitfield.byte
bab6aec1 7379 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7380 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f
JB
7381 && (i.tm.operand_types[op].bitfield.word
7382 || i.tm.operand_types[op].bitfield.dword))
29b0f896 7383 {
a540244d
L
7384 as_bad (_("`%s%s' not allowed with `%s%c'"),
7385 register_prefix,
29b0f896
AM
7386 i.op[op].regs->reg_name,
7387 i.tm.name,
7388 i.suffix);
7389 return 0;
7390 }
9706160a
JB
7391 /* Error if the e or r prefix on a general reg is present. */
7392 else if ((i.types[op].bitfield.dword
dc821c5f 7393 || i.types[op].bitfield.qword)
bab6aec1 7394 && (i.tm.operand_types[op].bitfield.class == Reg
75e5731b 7395 || i.tm.operand_types[op].bitfield.instance == Accum)
dc821c5f 7396 && i.tm.operand_types[op].bitfield.word)
252b5132 7397 {
9706160a
JB
7398 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7399 register_prefix, i.op[op].regs->reg_name,
7400 i.suffix);
7401 return 0;
29b0f896
AM
7402 }
7403 return 1;
7404}
252b5132 7405
29b0f896 7406static int
40fb9820 7407update_imm (unsigned int j)
29b0f896 7408{
bc0844ae 7409 i386_operand_type overlap = i.types[j];
40fb9820
L
7410 if ((overlap.bitfield.imm8
7411 || overlap.bitfield.imm8s
7412 || overlap.bitfield.imm16
7413 || overlap.bitfield.imm32
7414 || overlap.bitfield.imm32s
7415 || overlap.bitfield.imm64)
0dfbf9d7
L
7416 && !operand_type_equal (&overlap, &imm8)
7417 && !operand_type_equal (&overlap, &imm8s)
7418 && !operand_type_equal (&overlap, &imm16)
7419 && !operand_type_equal (&overlap, &imm32)
7420 && !operand_type_equal (&overlap, &imm32s)
7421 && !operand_type_equal (&overlap, &imm64))
29b0f896
AM
7422 {
7423 if (i.suffix)
7424 {
40fb9820
L
7425 i386_operand_type temp;
7426
0dfbf9d7 7427 operand_type_set (&temp, 0);
7ab9ffdd 7428 if (i.suffix == BYTE_MNEM_SUFFIX)
40fb9820
L
7429 {
7430 temp.bitfield.imm8 = overlap.bitfield.imm8;
7431 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7432 }
7433 else if (i.suffix == WORD_MNEM_SUFFIX)
7434 temp.bitfield.imm16 = overlap.bitfield.imm16;
7435 else if (i.suffix == QWORD_MNEM_SUFFIX)
7436 {
7437 temp.bitfield.imm64 = overlap.bitfield.imm64;
7438 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7439 }
7440 else
7441 temp.bitfield.imm32 = overlap.bitfield.imm32;
7442 overlap = temp;
29b0f896 7443 }
0dfbf9d7
L
7444 else if (operand_type_equal (&overlap, &imm16_32_32s)
7445 || operand_type_equal (&overlap, &imm16_32)
7446 || operand_type_equal (&overlap, &imm16_32s))
29b0f896 7447 {
40fb9820 7448 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
65da13b5 7449 overlap = imm16;
40fb9820 7450 else
65da13b5 7451 overlap = imm32s;
29b0f896 7452 }
8bbb3ad8
JB
7453 else if (i.prefix[REX_PREFIX] & REX_W)
7454 overlap = operand_type_and (overlap, imm32s);
7455 else if (i.prefix[DATA_PREFIX])
7456 overlap = operand_type_and (overlap,
7457 flag_code != CODE_16BIT ? imm16 : imm32);
0dfbf9d7
L
7458 if (!operand_type_equal (&overlap, &imm8)
7459 && !operand_type_equal (&overlap, &imm8s)
7460 && !operand_type_equal (&overlap, &imm16)
7461 && !operand_type_equal (&overlap, &imm32)
7462 && !operand_type_equal (&overlap, &imm32s)
7463 && !operand_type_equal (&overlap, &imm64))
29b0f896 7464 {
4eed87de
AM
7465 as_bad (_("no instruction mnemonic suffix given; "
7466 "can't determine immediate size"));
29b0f896
AM
7467 return 0;
7468 }
7469 }
40fb9820 7470 i.types[j] = overlap;
29b0f896 7471
40fb9820
L
7472 return 1;
7473}
7474
7475static int
7476finalize_imm (void)
7477{
bc0844ae 7478 unsigned int j, n;
29b0f896 7479
bc0844ae
L
7480 /* Update the first 2 immediate operands. */
7481 n = i.operands > 2 ? 2 : i.operands;
7482 if (n)
7483 {
7484 for (j = 0; j < n; j++)
7485 if (update_imm (j) == 0)
7486 return 0;
40fb9820 7487
bc0844ae
L
7488 /* The 3rd operand can't be immediate operand. */
7489 gas_assert (operand_type_check (i.types[2], imm) == 0);
7490 }
29b0f896
AM
7491
7492 return 1;
7493}
7494
7495static int
e3bb37b5 7496process_operands (void)
29b0f896
AM
7497{
7498 /* Default segment register this instruction will use for memory
7499 accesses. 0 means unknown. This is only for optimizing out
7500 unnecessary segment overrides. */
7501 const seg_entry *default_seg = 0;
7502
a5aeccd9
JB
7503 if (i.tm.opcode_modifier.sse2avx)
7504 {
7505 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7506 need converting. */
7507 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7508 i.prefix[REX_PREFIX] = 0;
7509 i.rex_encoding = 0;
7510 }
c423d21a
JB
7511 /* ImmExt should be processed after SSE2AVX. */
7512 else if (i.tm.opcode_modifier.immext)
7513 process_immext ();
a5aeccd9 7514
2426c15f 7515 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
29b0f896 7516 {
91d6fa6a
NC
7517 unsigned int dupl = i.operands;
7518 unsigned int dest = dupl - 1;
9fcfb3d7
L
7519 unsigned int j;
7520
c0f3af97 7521 /* The destination must be an xmm register. */
9c2799c2 7522 gas_assert (i.reg_operands
91d6fa6a 7523 && MAX_OPERANDS > dupl
7ab9ffdd 7524 && operand_type_equal (&i.types[dest], &regxmm));
c0f3af97 7525
75e5731b 7526 if (i.tm.operand_types[0].bitfield.instance == Accum
1b54b8d7 7527 && i.tm.operand_types[0].bitfield.xmmword)
e2ec9d29 7528 {
8cd7925b 7529 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
c0f3af97
L
7530 {
7531 /* Keep xmm0 for instructions with VEX prefix and 3
7532 sources. */
75e5731b 7533 i.tm.operand_types[0].bitfield.instance = InstanceNone;
3528c362 7534 i.tm.operand_types[0].bitfield.class = RegSIMD;
c0f3af97
L
7535 goto duplicate;
7536 }
e2ec9d29 7537 else
c0f3af97
L
7538 {
7539 /* We remove the first xmm0 and keep the number of
7540 operands unchanged, which in fact duplicates the
7541 destination. */
7542 for (j = 1; j < i.operands; j++)
7543 {
7544 i.op[j - 1] = i.op[j];
7545 i.types[j - 1] = i.types[j];
7546 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
8dc0818e 7547 i.flags[j - 1] = i.flags[j];
c0f3af97
L
7548 }
7549 }
7550 }
7551 else if (i.tm.opcode_modifier.implicit1stxmm0)
7ab9ffdd 7552 {
91d6fa6a 7553 gas_assert ((MAX_OPERANDS - 1) > dupl
8cd7925b
L
7554 && (i.tm.opcode_modifier.vexsources
7555 == VEX3SOURCES));
c0f3af97
L
7556
7557 /* Add the implicit xmm0 for instructions with VEX prefix
7558 and 3 sources. */
7559 for (j = i.operands; j > 0; j--)
7560 {
7561 i.op[j] = i.op[j - 1];
7562 i.types[j] = i.types[j - 1];
7563 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
8dc0818e 7564 i.flags[j] = i.flags[j - 1];
c0f3af97
L
7565 }
7566 i.op[0].regs
7567 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7ab9ffdd 7568 i.types[0] = regxmm;
c0f3af97
L
7569 i.tm.operand_types[0] = regxmm;
7570
7571 i.operands += 2;
7572 i.reg_operands += 2;
7573 i.tm.operands += 2;
7574
91d6fa6a 7575 dupl++;
c0f3af97 7576 dest++;
91d6fa6a
NC
7577 i.op[dupl] = i.op[dest];
7578 i.types[dupl] = i.types[dest];
7579 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8dc0818e 7580 i.flags[dupl] = i.flags[dest];
e2ec9d29 7581 }
c0f3af97
L
7582 else
7583 {
dc1e8a47 7584 duplicate:
c0f3af97
L
7585 i.operands++;
7586 i.reg_operands++;
7587 i.tm.operands++;
7588
91d6fa6a
NC
7589 i.op[dupl] = i.op[dest];
7590 i.types[dupl] = i.types[dest];
7591 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8dc0818e 7592 i.flags[dupl] = i.flags[dest];
c0f3af97
L
7593 }
7594
7595 if (i.tm.opcode_modifier.immext)
7596 process_immext ();
7597 }
75e5731b 7598 else if (i.tm.operand_types[0].bitfield.instance == Accum
1b54b8d7 7599 && i.tm.operand_types[0].bitfield.xmmword)
c0f3af97
L
7600 {
7601 unsigned int j;
7602
9fcfb3d7
L
7603 for (j = 1; j < i.operands; j++)
7604 {
7605 i.op[j - 1] = i.op[j];
7606 i.types[j - 1] = i.types[j];
7607
7608 /* We need to adjust fields in i.tm since they are used by
7609 build_modrm_byte. */
7610 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
8dc0818e
JB
7611
7612 i.flags[j - 1] = i.flags[j];
9fcfb3d7
L
7613 }
7614
e2ec9d29
L
7615 i.operands--;
7616 i.reg_operands--;
e2ec9d29
L
7617 i.tm.operands--;
7618 }
920d2ddc
IT
7619 else if (i.tm.opcode_modifier.implicitquadgroup)
7620 {
a477a8c4
JB
7621 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7622
920d2ddc 7623 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
3528c362 7624 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
a477a8c4
JB
7625 regnum = register_number (i.op[1].regs);
7626 first_reg_in_group = regnum & ~3;
7627 last_reg_in_group = first_reg_in_group + 3;
7628 if (regnum != first_reg_in_group)
7629 as_warn (_("source register `%s%s' implicitly denotes"
7630 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7631 register_prefix, i.op[1].regs->reg_name,
7632 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7633 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7634 i.tm.name);
7635 }
e2ec9d29
L
7636 else if (i.tm.opcode_modifier.regkludge)
7637 {
7638 /* The imul $imm, %reg instruction is converted into
7639 imul $imm, %reg, %reg, and the clr %reg instruction
7640 is converted into xor %reg, %reg. */
7641
7642 unsigned int first_reg_op;
7643
7644 if (operand_type_check (i.types[0], reg))
7645 first_reg_op = 0;
7646 else
7647 first_reg_op = 1;
7648 /* Pretend we saw the extra register operand. */
9c2799c2 7649 gas_assert (i.reg_operands == 1
7ab9ffdd 7650 && i.op[first_reg_op + 1].regs == 0);
e2ec9d29
L
7651 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7652 i.types[first_reg_op + 1] = i.types[first_reg_op];
7653 i.operands++;
7654 i.reg_operands++;
29b0f896
AM
7655 }
7656
85b80b0f 7657 if (i.tm.opcode_modifier.modrm)
29b0f896
AM
7658 {
7659 /* The opcode is completed (modulo i.tm.extension_opcode which
52271982
AM
7660 must be put into the modrm byte). Now, we make the modrm and
7661 index base bytes based on all the info we've collected. */
29b0f896
AM
7662
7663 default_seg = build_modrm_byte ();
7664 }
00cee14f 7665 else if (i.types[0].bitfield.class == SReg)
85b80b0f
JB
7666 {
7667 if (flag_code != CODE_64BIT
7668 ? i.tm.base_opcode == POP_SEG_SHORT
7669 && i.op[0].regs->reg_num == 1
7670 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7671 && i.op[0].regs->reg_num < 4)
7672 {
7673 as_bad (_("you can't `%s %s%s'"),
7674 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7675 return 0;
7676 }
7677 if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7678 {
7679 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7680 i.tm.opcode_length = 2;
7681 }
7682 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7683 }
8a2ed489 7684 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
29b0f896
AM
7685 {
7686 default_seg = &ds;
7687 }
40fb9820 7688 else if (i.tm.opcode_modifier.isstring)
29b0f896
AM
7689 {
7690 /* For the string instructions that allow a segment override
7691 on one of their operands, the default segment is ds. */
7692 default_seg = &ds;
7693 }
50128d0c 7694 else if (i.short_form)
85b80b0f
JB
7695 {
7696 /* The register or float register operand is in operand
7697 0 or 1. */
bab6aec1 7698 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
85b80b0f
JB
7699
7700 /* Register goes in low 3 bits of opcode. */
7701 i.tm.base_opcode |= i.op[op].regs->reg_num;
7702 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7703 i.rex |= REX_B;
7704 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7705 {
7706 /* Warn about some common errors, but press on regardless.
7707 The first case can be generated by gcc (<= 2.8.1). */
7708 if (i.operands == 2)
7709 {
7710 /* Reversed arguments on faddp, fsubp, etc. */
7711 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7712 register_prefix, i.op[!intel_syntax].regs->reg_name,
7713 register_prefix, i.op[intel_syntax].regs->reg_name);
7714 }
7715 else
7716 {
7717 /* Extraneous `l' suffix on fp insn. */
7718 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7719 register_prefix, i.op[0].regs->reg_name);
7720 }
7721 }
7722 }
29b0f896 7723
514a8bb0 7724 if ((i.seg[0] || i.prefix[SEG_PREFIX])
514a8bb0
JB
7725 && i.tm.base_opcode == 0x8d /* lea */
7726 && !is_any_vex_encoding(&i.tm))
92334ad2
JB
7727 {
7728 if (!quiet_warnings)
7729 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7730 if (optimize)
7731 {
7732 i.seg[0] = NULL;
7733 i.prefix[SEG_PREFIX] = 0;
7734 }
7735 }
52271982
AM
7736
7737 /* If a segment was explicitly specified, and the specified segment
b6773884
JB
7738 is neither the default nor the one already recorded from a prefix,
7739 use an opcode prefix to select it. If we never figured out what
7740 the default segment is, then default_seg will be zero at this
7741 point, and the specified segment prefix will always be used. */
7742 if (i.seg[0]
7743 && i.seg[0] != default_seg
7744 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
29b0f896
AM
7745 {
7746 if (!add_prefix (i.seg[0]->seg_prefix))
7747 return 0;
7748 }
7749 return 1;
7750}
7751
a5aeccd9
JB
7752static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7753 bfd_boolean do_sse2avx)
7754{
7755 if (r->reg_flags & RegRex)
7756 {
7757 if (i.rex & rex_bit)
7758 as_bad (_("same type of prefix used twice"));
7759 i.rex |= rex_bit;
7760 }
7761 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7762 {
7763 gas_assert (i.vex.register_specifier == r);
7764 i.vex.register_specifier += 8;
7765 }
7766
7767 if (r->reg_flags & RegVRex)
7768 i.vrex |= rex_bit;
7769}
7770
29b0f896 7771static const seg_entry *
e3bb37b5 7772build_modrm_byte (void)
29b0f896
AM
7773{
7774 const seg_entry *default_seg = 0;
c0f3af97 7775 unsigned int source, dest;
8cd7925b 7776 int vex_3_sources;
c0f3af97 7777
8cd7925b 7778 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
c0f3af97
L
7779 if (vex_3_sources)
7780 {
91d6fa6a 7781 unsigned int nds, reg_slot;
4c2c6516 7782 expressionS *exp;
c0f3af97 7783
6b8d3588 7784 dest = i.operands - 1;
c0f3af97 7785 nds = dest - 1;
922d8de8 7786
a683cc34 7787 /* There are 2 kinds of instructions:
bed3d976 7788 1. 5 operands: 4 register operands or 3 register operands
9d3bf266 7789 plus 1 memory operand plus one Imm4 operand, VexXDS, and
bed3d976 7790 VexW0 or VexW1. The destination must be either XMM, YMM or
43234a1e 7791 ZMM register.
bed3d976 7792 2. 4 operands: 4 register operands or 3 register operands
2f1bada2 7793 plus 1 memory operand, with VexXDS. */
922d8de8 7794 gas_assert ((i.reg_operands == 4
bed3d976
JB
7795 || (i.reg_operands == 3 && i.mem_operands == 1))
7796 && i.tm.opcode_modifier.vexvvvv == VEXXDS
dcd7e323 7797 && i.tm.opcode_modifier.vexw
3528c362 7798 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
a683cc34 7799
48db9223
JB
7800 /* If VexW1 is set, the first non-immediate operand is the source and
7801 the second non-immediate one is encoded in the immediate operand. */
7802 if (i.tm.opcode_modifier.vexw == VEXW1)
7803 {
7804 source = i.imm_operands;
7805 reg_slot = i.imm_operands + 1;
7806 }
7807 else
7808 {
7809 source = i.imm_operands + 1;
7810 reg_slot = i.imm_operands;
7811 }
7812
a683cc34 7813 if (i.imm_operands == 0)
bed3d976
JB
7814 {
7815 /* When there is no immediate operand, generate an 8bit
7816 immediate operand to encode the first operand. */
7817 exp = &im_expressions[i.imm_operands++];
7818 i.op[i.operands].imms = exp;
7819 i.types[i.operands] = imm8;
7820 i.operands++;
7821
3528c362 7822 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
bed3d976
JB
7823 exp->X_op = O_constant;
7824 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
43234a1e
L
7825 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7826 }
922d8de8 7827 else
bed3d976 7828 {
9d3bf266
JB
7829 gas_assert (i.imm_operands == 1);
7830 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7831 gas_assert (!i.tm.opcode_modifier.immext);
a683cc34 7832
9d3bf266
JB
7833 /* Turn on Imm8 again so that output_imm will generate it. */
7834 i.types[0].bitfield.imm8 = 1;
bed3d976 7835
3528c362 7836 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
9d3bf266 7837 i.op[0].imms->X_add_number
bed3d976 7838 |= register_number (i.op[reg_slot].regs) << 4;
43234a1e 7839 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
bed3d976 7840 }
a683cc34 7841
3528c362 7842 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
dae39acc 7843 i.vex.register_specifier = i.op[nds].regs;
c0f3af97
L
7844 }
7845 else
7846 source = dest = 0;
29b0f896
AM
7847
7848 /* i.reg_operands MUST be the number of real register operands;
c0f3af97
L
7849 implicit registers do not count. If there are 3 register
7850 operands, it must be a instruction with VexNDS. For a
7851 instruction with VexNDD, the destination register is encoded
7852 in VEX prefix. If there are 4 register operands, it must be
7853 a instruction with VEX prefix and 3 sources. */
7ab9ffdd
L
7854 if (i.mem_operands == 0
7855 && ((i.reg_operands == 2
2426c15f 7856 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7ab9ffdd 7857 || (i.reg_operands == 3
2426c15f 7858 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7ab9ffdd 7859 || (i.reg_operands == 4 && vex_3_sources)))
29b0f896 7860 {
cab737b9
L
7861 switch (i.operands)
7862 {
7863 case 2:
7864 source = 0;
7865 break;
7866 case 3:
c81128dc
L
7867 /* When there are 3 operands, one of them may be immediate,
7868 which may be the first or the last operand. Otherwise,
c0f3af97
L
7869 the first operand must be shift count register (cl) or it
7870 is an instruction with VexNDS. */
9c2799c2 7871 gas_assert (i.imm_operands == 1
7ab9ffdd 7872 || (i.imm_operands == 0
2426c15f 7873 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
75e5731b
JB
7874 || (i.types[0].bitfield.instance == RegC
7875 && i.types[0].bitfield.byte))));
40fb9820 7876 if (operand_type_check (i.types[0], imm)
75e5731b
JB
7877 || (i.types[0].bitfield.instance == RegC
7878 && i.types[0].bitfield.byte))
40fb9820
L
7879 source = 1;
7880 else
7881 source = 0;
cab737b9
L
7882 break;
7883 case 4:
368d64cc
L
7884 /* When there are 4 operands, the first two must be 8bit
7885 immediate operands. The source operand will be the 3rd
c0f3af97
L
7886 one.
7887
7888 For instructions with VexNDS, if the first operand
7889 an imm8, the source operand is the 2nd one. If the last
7890 operand is imm8, the source operand is the first one. */
9c2799c2 7891 gas_assert ((i.imm_operands == 2
7ab9ffdd
L
7892 && i.types[0].bitfield.imm8
7893 && i.types[1].bitfield.imm8)
2426c15f 7894 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7ab9ffdd
L
7895 && i.imm_operands == 1
7896 && (i.types[0].bitfield.imm8
43234a1e
L
7897 || i.types[i.operands - 1].bitfield.imm8
7898 || i.rounding)));
9f2670f2
L
7899 if (i.imm_operands == 2)
7900 source = 2;
7901 else
c0f3af97
L
7902 {
7903 if (i.types[0].bitfield.imm8)
7904 source = 1;
7905 else
7906 source = 0;
7907 }
c0f3af97
L
7908 break;
7909 case 5:
e771e7c9 7910 if (is_evex_encoding (&i.tm))
43234a1e
L
7911 {
7912 /* For EVEX instructions, when there are 5 operands, the
7913 first one must be immediate operand. If the second one
7914 is immediate operand, the source operand is the 3th
7915 one. If the last one is immediate operand, the source
7916 operand is the 2nd one. */
7917 gas_assert (i.imm_operands == 2
7918 && i.tm.opcode_modifier.sae
7919 && operand_type_check (i.types[0], imm));
7920 if (operand_type_check (i.types[1], imm))
7921 source = 2;
7922 else if (operand_type_check (i.types[4], imm))
7923 source = 1;
7924 else
7925 abort ();
7926 }
cab737b9
L
7927 break;
7928 default:
7929 abort ();
7930 }
7931
c0f3af97
L
7932 if (!vex_3_sources)
7933 {
7934 dest = source + 1;
7935
43234a1e
L
7936 /* RC/SAE operand could be between DEST and SRC. That happens
7937 when one operand is GPR and the other one is XMM/YMM/ZMM
7938 register. */
7939 if (i.rounding && i.rounding->operand == (int) dest)
7940 dest++;
7941
2426c15f 7942 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
c0f3af97 7943 {
43234a1e 7944 /* For instructions with VexNDS, the register-only source
c5d0745b 7945 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
dfd69174 7946 register. It is encoded in VEX prefix. */
f12dc422
L
7947
7948 i386_operand_type op;
7949 unsigned int vvvv;
7950
c2ecccb3
L
7951 /* Swap two source operands if needed. */
7952 if (i.tm.opcode_modifier.swapsources)
f12dc422
L
7953 {
7954 vvvv = source;
7955 source = dest;
7956 }
7957 else
7958 vvvv = dest;
7959
7960 op = i.tm.operand_types[vvvv];
c0f3af97 7961 if ((dest + 1) >= i.operands
bab6aec1 7962 || ((op.bitfield.class != Reg
dc821c5f 7963 || (!op.bitfield.dword && !op.bitfield.qword))
3528c362 7964 && op.bitfield.class != RegSIMD
43234a1e 7965 && !operand_type_equal (&op, &regmask)))
c0f3af97 7966 abort ();
f12dc422 7967 i.vex.register_specifier = i.op[vvvv].regs;
c0f3af97
L
7968 dest++;
7969 }
7970 }
29b0f896
AM
7971
7972 i.rm.mode = 3;
dfd69174
JB
7973 /* One of the register operands will be encoded in the i.rm.reg
7974 field, the other in the combined i.rm.mode and i.rm.regmem
29b0f896
AM
7975 fields. If no form of this instruction supports a memory
7976 destination operand, then we assume the source operand may
7977 sometimes be a memory operand and so we need to store the
7978 destination in the i.rm.reg field. */
dfd69174 7979 if (!i.tm.opcode_modifier.regmem
40fb9820 7980 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
29b0f896
AM
7981 {
7982 i.rm.reg = i.op[dest].regs->reg_num;
7983 i.rm.regmem = i.op[source].regs->reg_num;
a5aeccd9
JB
7984 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7985 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
29b0f896
AM
7986 }
7987 else
7988 {
7989 i.rm.reg = i.op[source].regs->reg_num;
7990 i.rm.regmem = i.op[dest].regs->reg_num;
a5aeccd9
JB
7991 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
7992 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
29b0f896 7993 }
e0c7f900 7994 if (flag_code != CODE_64BIT && (i.rex & REX_R))
c4a530c5 7995 {
4a5c67ed 7996 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
c4a530c5 7997 abort ();
e0c7f900 7998 i.rex &= ~REX_R;
c4a530c5
JB
7999 add_prefix (LOCK_PREFIX_OPCODE);
8000 }
29b0f896
AM
8001 }
8002 else
8003 { /* If it's not 2 reg operands... */
c0f3af97
L
8004 unsigned int mem;
8005
29b0f896
AM
8006 if (i.mem_operands)
8007 {
8008 unsigned int fake_zero_displacement = 0;
99018f42 8009 unsigned int op;
4eed87de 8010
7ab9ffdd 8011 for (op = 0; op < i.operands; op++)
8dc0818e 8012 if (i.flags[op] & Operand_Mem)
7ab9ffdd 8013 break;
7ab9ffdd 8014 gas_assert (op < i.operands);
29b0f896 8015
63112cd6 8016 if (i.tm.opcode_modifier.sib)
6c30d220 8017 {
260cd341
LC
8018 /* The index register of VSIB shouldn't be RegIZ. */
8019 if (i.tm.opcode_modifier.sib != SIBMEM
8020 && i.index_reg->reg_num == RegIZ)
6c30d220
L
8021 abort ();
8022
8023 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8024 if (!i.base_reg)
8025 {
8026 i.sib.base = NO_BASE_REGISTER;
8027 i.sib.scale = i.log2_scale_factor;
8028 i.types[op].bitfield.disp8 = 0;
8029 i.types[op].bitfield.disp16 = 0;
8030 i.types[op].bitfield.disp64 = 0;
43083a50 8031 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
6c30d220
L
8032 {
8033 /* Must be 32 bit */
8034 i.types[op].bitfield.disp32 = 1;
8035 i.types[op].bitfield.disp32s = 0;
8036 }
8037 else
8038 {
8039 i.types[op].bitfield.disp32 = 0;
8040 i.types[op].bitfield.disp32s = 1;
8041 }
8042 }
260cd341
LC
8043
8044 /* Since the mandatory SIB always has index register, so
8045 the code logic remains unchanged. The non-mandatory SIB
8046 without index register is allowed and will be handled
8047 later. */
8048 if (i.index_reg)
8049 {
8050 if (i.index_reg->reg_num == RegIZ)
8051 i.sib.index = NO_INDEX_REGISTER;
8052 else
8053 i.sib.index = i.index_reg->reg_num;
8054 set_rex_vrex (i.index_reg, REX_X, FALSE);
8055 }
6c30d220
L
8056 }
8057
29b0f896
AM
8058 default_seg = &ds;
8059
8060 if (i.base_reg == 0)
8061 {
8062 i.rm.mode = 0;
8063 if (!i.disp_operands)
9bb129e8 8064 fake_zero_displacement = 1;
29b0f896
AM
8065 if (i.index_reg == 0)
8066 {
73053c1f
JB
8067 i386_operand_type newdisp;
8068
260cd341
LC
8069 /* Both check for VSIB and mandatory non-vector SIB. */
8070 gas_assert (!i.tm.opcode_modifier.sib
8071 || i.tm.opcode_modifier.sib == SIBMEM);
29b0f896 8072 /* Operand is just <disp> */
20f0a1fc 8073 if (flag_code == CODE_64BIT)
29b0f896
AM
8074 {
8075 /* 64bit mode overwrites the 32bit absolute
8076 addressing by RIP relative addressing and
8077 absolute addressing is encoded by one of the
8078 redundant SIB forms. */
8079 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8080 i.sib.base = NO_BASE_REGISTER;
8081 i.sib.index = NO_INDEX_REGISTER;
73053c1f 8082 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
20f0a1fc 8083 }
fc225355
L
8084 else if ((flag_code == CODE_16BIT)
8085 ^ (i.prefix[ADDR_PREFIX] != 0))
20f0a1fc
NC
8086 {
8087 i.rm.regmem = NO_BASE_REGISTER_16;
73053c1f 8088 newdisp = disp16;
20f0a1fc
NC
8089 }
8090 else
8091 {
8092 i.rm.regmem = NO_BASE_REGISTER;
73053c1f 8093 newdisp = disp32;
29b0f896 8094 }
73053c1f
JB
8095 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8096 i.types[op] = operand_type_or (i.types[op], newdisp);
29b0f896 8097 }
63112cd6 8098 else if (!i.tm.opcode_modifier.sib)
29b0f896 8099 {
6c30d220 8100 /* !i.base_reg && i.index_reg */
e968fc9b 8101 if (i.index_reg->reg_num == RegIZ)
db51cc60
L
8102 i.sib.index = NO_INDEX_REGISTER;
8103 else
8104 i.sib.index = i.index_reg->reg_num;
29b0f896
AM
8105 i.sib.base = NO_BASE_REGISTER;
8106 i.sib.scale = i.log2_scale_factor;
8107 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
40fb9820
L
8108 i.types[op].bitfield.disp8 = 0;
8109 i.types[op].bitfield.disp16 = 0;
8110 i.types[op].bitfield.disp64 = 0;
43083a50 8111 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
40fb9820
L
8112 {
8113 /* Must be 32 bit */
8114 i.types[op].bitfield.disp32 = 1;
8115 i.types[op].bitfield.disp32s = 0;
8116 }
29b0f896 8117 else
40fb9820
L
8118 {
8119 i.types[op].bitfield.disp32 = 0;
8120 i.types[op].bitfield.disp32s = 1;
8121 }
29b0f896 8122 if ((i.index_reg->reg_flags & RegRex) != 0)
161a04f6 8123 i.rex |= REX_X;
29b0f896
AM
8124 }
8125 }
8126 /* RIP addressing for 64bit mode. */
e968fc9b 8127 else if (i.base_reg->reg_num == RegIP)
29b0f896 8128 {
63112cd6 8129 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896 8130 i.rm.regmem = NO_BASE_REGISTER;
40fb9820
L
8131 i.types[op].bitfield.disp8 = 0;
8132 i.types[op].bitfield.disp16 = 0;
8133 i.types[op].bitfield.disp32 = 0;
8134 i.types[op].bitfield.disp32s = 1;
8135 i.types[op].bitfield.disp64 = 0;
71903a11 8136 i.flags[op] |= Operand_PCrel;
20f0a1fc
NC
8137 if (! i.disp_operands)
8138 fake_zero_displacement = 1;
29b0f896 8139 }
dc821c5f 8140 else if (i.base_reg->reg_type.bitfield.word)
29b0f896 8141 {
63112cd6 8142 gas_assert (!i.tm.opcode_modifier.sib);
29b0f896
AM
8143 switch (i.base_reg->reg_num)
8144 {
8145 case 3: /* (%bx) */
8146 if (i.index_reg == 0)
8147 i.rm.regmem = 7;
8148 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8149 i.rm.regmem = i.index_reg->reg_num - 6;
8150 break;
8151 case 5: /* (%bp) */
8152 default_seg = &ss;
8153 if (i.index_reg == 0)
8154 {
8155 i.rm.regmem = 6;
40fb9820 8156 if (operand_type_check (i.types[op], disp) == 0)
29b0f896
AM
8157 {
8158 /* fake (%bp) into 0(%bp) */
b5014f7a 8159 i.types[op].bitfield.disp8 = 1;
252b5132 8160 fake_zero_displacement = 1;
29b0f896
AM
8161 }
8162 }
8163 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8164 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8165 break;
8166 default: /* (%si) -> 4 or (%di) -> 5 */
8167 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8168 }
8169 i.rm.mode = mode_from_disp_size (i.types[op]);
8170 }
8171 else /* i.base_reg and 32/64 bit mode */
8172 {
8173 if (flag_code == CODE_64BIT
40fb9820
L
8174 && operand_type_check (i.types[op], disp))
8175 {
73053c1f
JB
8176 i.types[op].bitfield.disp16 = 0;
8177 i.types[op].bitfield.disp64 = 0;
40fb9820 8178 if (i.prefix[ADDR_PREFIX] == 0)
73053c1f
JB
8179 {
8180 i.types[op].bitfield.disp32 = 0;
8181 i.types[op].bitfield.disp32s = 1;
8182 }
40fb9820 8183 else
73053c1f
JB
8184 {
8185 i.types[op].bitfield.disp32 = 1;
8186 i.types[op].bitfield.disp32s = 0;
8187 }
40fb9820 8188 }
20f0a1fc 8189
63112cd6 8190 if (!i.tm.opcode_modifier.sib)
6c30d220 8191 i.rm.regmem = i.base_reg->reg_num;
29b0f896 8192 if ((i.base_reg->reg_flags & RegRex) != 0)
161a04f6 8193 i.rex |= REX_B;
29b0f896
AM
8194 i.sib.base = i.base_reg->reg_num;
8195 /* x86-64 ignores REX prefix bit here to avoid decoder
8196 complications. */
848930b2
JB
8197 if (!(i.base_reg->reg_flags & RegRex)
8198 && (i.base_reg->reg_num == EBP_REG_NUM
8199 || i.base_reg->reg_num == ESP_REG_NUM))
29b0f896 8200 default_seg = &ss;
848930b2 8201 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
29b0f896 8202 {
848930b2 8203 fake_zero_displacement = 1;
b5014f7a 8204 i.types[op].bitfield.disp8 = 1;
29b0f896
AM
8205 }
8206 i.sib.scale = i.log2_scale_factor;
8207 if (i.index_reg == 0)
8208 {
260cd341
LC
8209 /* Only check for VSIB. */
8210 gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8211 && i.tm.opcode_modifier.sib != VECSIB256
8212 && i.tm.opcode_modifier.sib != VECSIB512);
8213
29b0f896
AM
8214 /* <disp>(%esp) becomes two byte modrm with no index
8215 register. We've already stored the code for esp
8216 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8217 Any base register besides %esp will not use the
8218 extra modrm byte. */
8219 i.sib.index = NO_INDEX_REGISTER;
29b0f896 8220 }
63112cd6 8221 else if (!i.tm.opcode_modifier.sib)
29b0f896 8222 {
e968fc9b 8223 if (i.index_reg->reg_num == RegIZ)
db51cc60
L
8224 i.sib.index = NO_INDEX_REGISTER;
8225 else
8226 i.sib.index = i.index_reg->reg_num;
29b0f896
AM
8227 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8228 if ((i.index_reg->reg_flags & RegRex) != 0)
161a04f6 8229 i.rex |= REX_X;
29b0f896 8230 }
67a4f2b7
AO
8231
8232 if (i.disp_operands
8233 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8234 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8235 i.rm.mode = 0;
8236 else
a501d77e
L
8237 {
8238 if (!fake_zero_displacement
8239 && !i.disp_operands
8240 && i.disp_encoding)
8241 {
8242 fake_zero_displacement = 1;
8243 if (i.disp_encoding == disp_encoding_8bit)
8244 i.types[op].bitfield.disp8 = 1;
8245 else
8246 i.types[op].bitfield.disp32 = 1;
8247 }
8248 i.rm.mode = mode_from_disp_size (i.types[op]);
8249 }
29b0f896 8250 }
252b5132 8251
29b0f896
AM
8252 if (fake_zero_displacement)
8253 {
8254 /* Fakes a zero displacement assuming that i.types[op]
8255 holds the correct displacement size. */
8256 expressionS *exp;
8257
9c2799c2 8258 gas_assert (i.op[op].disps == 0);
29b0f896
AM
8259 exp = &disp_expressions[i.disp_operands++];
8260 i.op[op].disps = exp;
8261 exp->X_op = O_constant;
8262 exp->X_add_number = 0;
8263 exp->X_add_symbol = (symbolS *) 0;
8264 exp->X_op_symbol = (symbolS *) 0;
8265 }
c0f3af97
L
8266
8267 mem = op;
29b0f896 8268 }
c0f3af97
L
8269 else
8270 mem = ~0;
252b5132 8271
8c43a48b 8272 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
5dd85c99
SP
8273 {
8274 if (operand_type_check (i.types[0], imm))
8275 i.vex.register_specifier = NULL;
8276 else
8277 {
8278 /* VEX.vvvv encodes one of the sources when the first
8279 operand is not an immediate. */
1ef99a7b 8280 if (i.tm.opcode_modifier.vexw == VEXW0)
5dd85c99
SP
8281 i.vex.register_specifier = i.op[0].regs;
8282 else
8283 i.vex.register_specifier = i.op[1].regs;
8284 }
8285
8286 /* Destination is a XMM register encoded in the ModRM.reg
8287 and VEX.R bit. */
8288 i.rm.reg = i.op[2].regs->reg_num;
8289 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8290 i.rex |= REX_R;
8291
8292 /* ModRM.rm and VEX.B encodes the other source. */
8293 if (!i.mem_operands)
8294 {
8295 i.rm.mode = 3;
8296
1ef99a7b 8297 if (i.tm.opcode_modifier.vexw == VEXW0)
5dd85c99
SP
8298 i.rm.regmem = i.op[1].regs->reg_num;
8299 else
8300 i.rm.regmem = i.op[0].regs->reg_num;
8301
8302 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8303 i.rex |= REX_B;
8304 }
8305 }
2426c15f 8306 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
f88c9eb0
SP
8307 {
8308 i.vex.register_specifier = i.op[2].regs;
8309 if (!i.mem_operands)
8310 {
8311 i.rm.mode = 3;
8312 i.rm.regmem = i.op[1].regs->reg_num;
8313 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8314 i.rex |= REX_B;
8315 }
8316 }
29b0f896
AM
8317 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8318 (if any) based on i.tm.extension_opcode. Again, we must be
8319 careful to make sure that segment/control/debug/test/MMX
8320 registers are coded into the i.rm.reg field. */
f88c9eb0 8321 else if (i.reg_operands)
29b0f896 8322 {
99018f42 8323 unsigned int op;
7ab9ffdd
L
8324 unsigned int vex_reg = ~0;
8325
8326 for (op = 0; op < i.operands; op++)
921eafea
L
8327 if (i.types[op].bitfield.class == Reg
8328 || i.types[op].bitfield.class == RegBND
8329 || i.types[op].bitfield.class == RegMask
8330 || i.types[op].bitfield.class == SReg
8331 || i.types[op].bitfield.class == RegCR
8332 || i.types[op].bitfield.class == RegDR
8333 || i.types[op].bitfield.class == RegTR
8334 || i.types[op].bitfield.class == RegSIMD
8335 || i.types[op].bitfield.class == RegMMX)
8336 break;
c0209578 8337
7ab9ffdd
L
8338 if (vex_3_sources)
8339 op = dest;
2426c15f 8340 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7ab9ffdd
L
8341 {
8342 /* For instructions with VexNDS, the register-only
8343 source operand is encoded in VEX prefix. */
8344 gas_assert (mem != (unsigned int) ~0);
c0f3af97 8345
7ab9ffdd 8346 if (op > mem)
c0f3af97 8347 {
7ab9ffdd
L
8348 vex_reg = op++;
8349 gas_assert (op < i.operands);
c0f3af97
L
8350 }
8351 else
c0f3af97 8352 {
f12dc422
L
8353 /* Check register-only source operand when two source
8354 operands are swapped. */
8355 if (!i.tm.operand_types[op].bitfield.baseindex
8356 && i.tm.operand_types[op + 1].bitfield.baseindex)
8357 {
8358 vex_reg = op;
8359 op += 2;
8360 gas_assert (mem == (vex_reg + 1)
8361 && op < i.operands);
8362 }
8363 else
8364 {
8365 vex_reg = op + 1;
8366 gas_assert (vex_reg < i.operands);
8367 }
c0f3af97 8368 }
7ab9ffdd 8369 }
2426c15f 8370 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7ab9ffdd 8371 {
f12dc422 8372 /* For instructions with VexNDD, the register destination
7ab9ffdd 8373 is encoded in VEX prefix. */
f12dc422
L
8374 if (i.mem_operands == 0)
8375 {
8376 /* There is no memory operand. */
8377 gas_assert ((op + 2) == i.operands);
8378 vex_reg = op + 1;
8379 }
8380 else
8d63c93e 8381 {
ed438a93
JB
8382 /* There are only 2 non-immediate operands. */
8383 gas_assert (op < i.imm_operands + 2
8384 && i.operands == i.imm_operands + 2);
8385 vex_reg = i.imm_operands + 1;
f12dc422 8386 }
7ab9ffdd
L
8387 }
8388 else
8389 gas_assert (op < i.operands);
99018f42 8390
7ab9ffdd
L
8391 if (vex_reg != (unsigned int) ~0)
8392 {
f12dc422 8393 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7ab9ffdd 8394
bab6aec1 8395 if ((type->bitfield.class != Reg
dc821c5f 8396 || (!type->bitfield.dword && !type->bitfield.qword))
3528c362 8397 && type->bitfield.class != RegSIMD
43234a1e 8398 && !operand_type_equal (type, &regmask))
7ab9ffdd 8399 abort ();
f88c9eb0 8400
7ab9ffdd
L
8401 i.vex.register_specifier = i.op[vex_reg].regs;
8402 }
8403
1b9f0c97
L
8404 /* Don't set OP operand twice. */
8405 if (vex_reg != op)
7ab9ffdd 8406 {
1b9f0c97
L
8407 /* If there is an extension opcode to put here, the
8408 register number must be put into the regmem field. */
8409 if (i.tm.extension_opcode != None)
8410 {
8411 i.rm.regmem = i.op[op].regs->reg_num;
a5aeccd9
JB
8412 set_rex_vrex (i.op[op].regs, REX_B,
8413 i.tm.opcode_modifier.sse2avx);
1b9f0c97
L
8414 }
8415 else
8416 {
8417 i.rm.reg = i.op[op].regs->reg_num;
a5aeccd9
JB
8418 set_rex_vrex (i.op[op].regs, REX_R,
8419 i.tm.opcode_modifier.sse2avx);
1b9f0c97 8420 }
7ab9ffdd 8421 }
252b5132 8422
29b0f896
AM
8423 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8424 must set it to 3 to indicate this is a register operand
8425 in the regmem field. */
8426 if (!i.mem_operands)
8427 i.rm.mode = 3;
8428 }
252b5132 8429
29b0f896 8430 /* Fill in i.rm.reg field with extension opcode (if any). */
c1e679ec 8431 if (i.tm.extension_opcode != None)
29b0f896
AM
8432 i.rm.reg = i.tm.extension_opcode;
8433 }
8434 return default_seg;
8435}
252b5132 8436
376cd056
JB
8437static unsigned int
8438flip_code16 (unsigned int code16)
8439{
8440 gas_assert (i.tm.operands == 1);
8441
8442 return !(i.prefix[REX_PREFIX] & REX_W)
8443 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8444 || i.tm.operand_types[0].bitfield.disp32s
8445 : i.tm.operand_types[0].bitfield.disp16)
8446 ? CODE16 : 0;
8447}
8448
29b0f896 8449static void
e3bb37b5 8450output_branch (void)
29b0f896
AM
8451{
8452 char *p;
f8a5c266 8453 int size;
29b0f896
AM
8454 int code16;
8455 int prefix;
8456 relax_substateT subtype;
8457 symbolS *sym;
8458 offsetT off;
8459
f8a5c266 8460 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
a501d77e 8461 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
29b0f896
AM
8462
8463 prefix = 0;
8464 if (i.prefix[DATA_PREFIX] != 0)
252b5132 8465 {
29b0f896
AM
8466 prefix = 1;
8467 i.prefixes -= 1;
376cd056 8468 code16 ^= flip_code16(code16);
252b5132 8469 }
29b0f896
AM
8470 /* Pentium4 branch hints. */
8471 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8472 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
2f66722d 8473 {
29b0f896
AM
8474 prefix++;
8475 i.prefixes--;
8476 }
8477 if (i.prefix[REX_PREFIX] != 0)
8478 {
8479 prefix++;
8480 i.prefixes--;
2f66722d
AM
8481 }
8482
7e8b059b
L
8483 /* BND prefixed jump. */
8484 if (i.prefix[BND_PREFIX] != 0)
8485 {
6cb0a70e
JB
8486 prefix++;
8487 i.prefixes--;
7e8b059b
L
8488 }
8489
f2810fe0
JB
8490 if (i.prefixes != 0)
8491 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
29b0f896
AM
8492
8493 /* It's always a symbol; End frag & setup for relax.
8494 Make sure there is enough room in this frag for the largest
8495 instruction we may generate in md_convert_frag. This is 2
8496 bytes for the opcode and room for the prefix and largest
8497 displacement. */
8498 frag_grow (prefix + 2 + 4);
8499 /* Prefix and 1 opcode byte go in fr_fix. */
8500 p = frag_more (prefix + 1);
8501 if (i.prefix[DATA_PREFIX] != 0)
8502 *p++ = DATA_PREFIX_OPCODE;
8503 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8504 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8505 *p++ = i.prefix[SEG_PREFIX];
6cb0a70e
JB
8506 if (i.prefix[BND_PREFIX] != 0)
8507 *p++ = BND_PREFIX_OPCODE;
29b0f896
AM
8508 if (i.prefix[REX_PREFIX] != 0)
8509 *p++ = i.prefix[REX_PREFIX];
8510 *p = i.tm.base_opcode;
8511
8512 if ((unsigned char) *p == JUMP_PC_RELATIVE)
f8a5c266 8513 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
40fb9820 8514 else if (cpu_arch_flags.bitfield.cpui386)
f8a5c266 8515 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
29b0f896 8516 else
f8a5c266 8517 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
29b0f896 8518 subtype |= code16;
3e73aa7c 8519
29b0f896
AM
8520 sym = i.op[0].disps->X_add_symbol;
8521 off = i.op[0].disps->X_add_number;
3e73aa7c 8522
29b0f896
AM
8523 if (i.op[0].disps->X_op != O_constant
8524 && i.op[0].disps->X_op != O_symbol)
3e73aa7c 8525 {
29b0f896
AM
8526 /* Handle complex expressions. */
8527 sym = make_expr_symbol (i.op[0].disps);
8528 off = 0;
8529 }
3e73aa7c 8530
29b0f896
AM
8531 /* 1 possible extra opcode + 4 byte displacement go in var part.
8532 Pass reloc in fr_var. */
d258b828 8533 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
29b0f896 8534}
3e73aa7c 8535
bd7ab16b
L
8536#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8537/* Return TRUE iff PLT32 relocation should be used for branching to
8538 symbol S. */
8539
8540static bfd_boolean
8541need_plt32_p (symbolS *s)
8542{
8543 /* PLT32 relocation is ELF only. */
8544 if (!IS_ELF)
8545 return FALSE;
8546
a5def729
RO
8547#ifdef TE_SOLARIS
8548 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8549 krtld support it. */
8550 return FALSE;
8551#endif
8552
bd7ab16b
L
8553 /* Since there is no need to prepare for PLT branch on x86-64, we
8554 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8555 be used as a marker for 32-bit PC-relative branches. */
8556 if (!object_64bit)
8557 return FALSE;
8558
8559 /* Weak or undefined symbol need PLT32 relocation. */
8560 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8561 return TRUE;
8562
8563 /* Non-global symbol doesn't need PLT32 relocation. */
8564 if (! S_IS_EXTERNAL (s))
8565 return FALSE;
8566
8567 /* Other global symbols need PLT32 relocation. NB: Symbol with
8568 non-default visibilities are treated as normal global symbol
8569 so that PLT32 relocation can be used as a marker for 32-bit
8570 PC-relative branches. It is useful for linker relaxation. */
8571 return TRUE;
8572}
8573#endif
8574
29b0f896 8575static void
e3bb37b5 8576output_jump (void)
29b0f896
AM
8577{
8578 char *p;
8579 int size;
3e02c1cc 8580 fixS *fixP;
bd7ab16b 8581 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
29b0f896 8582
0cfa3eb3 8583 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
29b0f896
AM
8584 {
8585 /* This is a loop or jecxz type instruction. */
8586 size = 1;
8587 if (i.prefix[ADDR_PREFIX] != 0)
8588 {
8589 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8590 i.prefixes -= 1;
8591 }
8592 /* Pentium4 branch hints. */
8593 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8594 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8595 {
8596 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8597 i.prefixes--;
3e73aa7c
JH
8598 }
8599 }
29b0f896
AM
8600 else
8601 {
8602 int code16;
3e73aa7c 8603
29b0f896
AM
8604 code16 = 0;
8605 if (flag_code == CODE_16BIT)
8606 code16 = CODE16;
3e73aa7c 8607
29b0f896
AM
8608 if (i.prefix[DATA_PREFIX] != 0)
8609 {
8610 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8611 i.prefixes -= 1;
376cd056 8612 code16 ^= flip_code16(code16);
29b0f896 8613 }
252b5132 8614
29b0f896
AM
8615 size = 4;
8616 if (code16)
8617 size = 2;
8618 }
9fcc94b6 8619
6cb0a70e
JB
8620 /* BND prefixed jump. */
8621 if (i.prefix[BND_PREFIX] != 0)
29b0f896 8622 {
6cb0a70e 8623 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
29b0f896
AM
8624 i.prefixes -= 1;
8625 }
252b5132 8626
6cb0a70e 8627 if (i.prefix[REX_PREFIX] != 0)
7e8b059b 8628 {
6cb0a70e 8629 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7e8b059b
L
8630 i.prefixes -= 1;
8631 }
8632
f2810fe0
JB
8633 if (i.prefixes != 0)
8634 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
e0890092 8635
42164a71
L
8636 p = frag_more (i.tm.opcode_length + size);
8637 switch (i.tm.opcode_length)
8638 {
8639 case 2:
8640 *p++ = i.tm.base_opcode >> 8;
1a0670f3 8641 /* Fall through. */
42164a71
L
8642 case 1:
8643 *p++ = i.tm.base_opcode;
8644 break;
8645 default:
8646 abort ();
8647 }
e0890092 8648
bd7ab16b
L
8649#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8650 if (size == 4
8651 && jump_reloc == NO_RELOC
8652 && need_plt32_p (i.op[0].disps->X_add_symbol))
8653 jump_reloc = BFD_RELOC_X86_64_PLT32;
8654#endif
8655
8656 jump_reloc = reloc (size, 1, 1, jump_reloc);
8657
3e02c1cc 8658 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
bd7ab16b 8659 i.op[0].disps, 1, jump_reloc);
3e02c1cc
AM
8660
8661 /* All jumps handled here are signed, but don't use a signed limit
8662 check for 32 and 16 bit jumps as we want to allow wrap around at
8663 4G and 64k respectively. */
8664 if (size == 1)
8665 fixP->fx_signed = 1;
29b0f896 8666}
e0890092 8667
29b0f896 8668static void
e3bb37b5 8669output_interseg_jump (void)
29b0f896
AM
8670{
8671 char *p;
8672 int size;
8673 int prefix;
8674 int code16;
252b5132 8675
29b0f896
AM
8676 code16 = 0;
8677 if (flag_code == CODE_16BIT)
8678 code16 = CODE16;
a217f122 8679
29b0f896
AM
8680 prefix = 0;
8681 if (i.prefix[DATA_PREFIX] != 0)
8682 {
8683 prefix = 1;
8684 i.prefixes -= 1;
8685 code16 ^= CODE16;
8686 }
6cb0a70e
JB
8687
8688 gas_assert (!i.prefix[REX_PREFIX]);
252b5132 8689
29b0f896
AM
8690 size = 4;
8691 if (code16)
8692 size = 2;
252b5132 8693
f2810fe0
JB
8694 if (i.prefixes != 0)
8695 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
252b5132 8696
29b0f896
AM
8697 /* 1 opcode; 2 segment; offset */
8698 p = frag_more (prefix + 1 + 2 + size);
3e73aa7c 8699
29b0f896
AM
8700 if (i.prefix[DATA_PREFIX] != 0)
8701 *p++ = DATA_PREFIX_OPCODE;
252b5132 8702
29b0f896
AM
8703 if (i.prefix[REX_PREFIX] != 0)
8704 *p++ = i.prefix[REX_PREFIX];
252b5132 8705
29b0f896
AM
8706 *p++ = i.tm.base_opcode;
8707 if (i.op[1].imms->X_op == O_constant)
8708 {
8709 offsetT n = i.op[1].imms->X_add_number;
252b5132 8710
29b0f896
AM
8711 if (size == 2
8712 && !fits_in_unsigned_word (n)
8713 && !fits_in_signed_word (n))
8714 {
8715 as_bad (_("16-bit jump out of range"));
8716 return;
8717 }
8718 md_number_to_chars (p, n, size);
8719 }
8720 else
8721 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
d258b828 8722 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
29b0f896
AM
8723 if (i.op[0].imms->X_op != O_constant)
8724 as_bad (_("can't handle non absolute segment in `%s'"),
8725 i.tm.name);
8726 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8727}
a217f122 8728
b4a3a7b4
L
8729#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8730void
8731x86_cleanup (void)
8732{
8733 char *p;
8734 asection *seg = now_seg;
8735 subsegT subseg = now_subseg;
8736 asection *sec;
8737 unsigned int alignment, align_size_1;
8738 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8739 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8740 unsigned int padding;
8741
8742 if (!IS_ELF || !x86_used_note)
8743 return;
8744
b4a3a7b4
L
8745 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8746
8747 /* The .note.gnu.property section layout:
8748
8749 Field Length Contents
8750 ---- ---- ----
8751 n_namsz 4 4
8752 n_descsz 4 The note descriptor size
8753 n_type 4 NT_GNU_PROPERTY_TYPE_0
8754 n_name 4 "GNU"
8755 n_desc n_descsz The program property array
8756 .... .... ....
8757 */
8758
8759 /* Create the .note.gnu.property section. */
8760 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
fd361982 8761 bfd_set_section_flags (sec,
b4a3a7b4
L
8762 (SEC_ALLOC
8763 | SEC_LOAD
8764 | SEC_DATA
8765 | SEC_HAS_CONTENTS
8766 | SEC_READONLY));
8767
8768 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8769 {
8770 align_size_1 = 7;
8771 alignment = 3;
8772 }
8773 else
8774 {
8775 align_size_1 = 3;
8776 alignment = 2;
8777 }
8778
fd361982 8779 bfd_set_section_alignment (sec, alignment);
b4a3a7b4
L
8780 elf_section_type (sec) = SHT_NOTE;
8781
8782 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8783 + 4-byte data */
8784 isa_1_descsz_raw = 4 + 4 + 4;
8785 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8786 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8787
8788 feature_2_descsz_raw = isa_1_descsz;
8789 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8790 + 4-byte data */
8791 feature_2_descsz_raw += 4 + 4 + 4;
8792 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8793 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8794 & ~align_size_1);
8795
8796 descsz = feature_2_descsz;
8797 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8798 p = frag_more (4 + 4 + 4 + 4 + descsz);
8799
8800 /* Write n_namsz. */
8801 md_number_to_chars (p, (valueT) 4, 4);
8802
8803 /* Write n_descsz. */
8804 md_number_to_chars (p + 4, (valueT) descsz, 4);
8805
8806 /* Write n_type. */
8807 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8808
8809 /* Write n_name. */
8810 memcpy (p + 4 * 3, "GNU", 4);
8811
8812 /* Write 4-byte type. */
8813 md_number_to_chars (p + 4 * 4,
8814 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8815
8816 /* Write 4-byte data size. */
8817 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8818
8819 /* Write 4-byte data. */
8820 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8821
8822 /* Zero out paddings. */
8823 padding = isa_1_descsz - isa_1_descsz_raw;
8824 if (padding)
8825 memset (p + 4 * 7, 0, padding);
8826
8827 /* Write 4-byte type. */
8828 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8829 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8830
8831 /* Write 4-byte data size. */
8832 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8833
8834 /* Write 4-byte data. */
8835 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8836 (valueT) x86_feature_2_used, 4);
8837
8838 /* Zero out paddings. */
8839 padding = feature_2_descsz - feature_2_descsz_raw;
8840 if (padding)
8841 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8842
8843 /* We probably can't restore the current segment, for there likely
8844 isn't one yet... */
8845 if (seg && subseg)
8846 subseg_set (seg, subseg);
8847}
8848#endif
8849
9c33702b
JB
8850static unsigned int
8851encoding_length (const fragS *start_frag, offsetT start_off,
8852 const char *frag_now_ptr)
8853{
8854 unsigned int len = 0;
8855
8856 if (start_frag != frag_now)
8857 {
8858 const fragS *fr = start_frag;
8859
8860 do {
8861 len += fr->fr_fix;
8862 fr = fr->fr_next;
8863 } while (fr && fr != frag_now);
8864 }
8865
8866 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8867}
8868
e379e5f3 8869/* Return 1 for test, and, cmp, add, sub, inc and dec which may
79d72f45
HL
8870 be macro-fused with conditional jumps.
8871 NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
8872 or is one of the following format:
8873
8874 cmp m, imm
8875 add m, imm
8876 sub m, imm
8877 test m, imm
8878 and m, imm
8879 inc m
8880 dec m
8881
8882 it is unfusible. */
e379e5f3
L
8883
8884static int
79d72f45 8885maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
e379e5f3
L
8886{
8887 /* No RIP address. */
8888 if (i.base_reg && i.base_reg->reg_num == RegIP)
8889 return 0;
8890
8891 /* No VEX/EVEX encoding. */
8892 if (is_any_vex_encoding (&i.tm))
8893 return 0;
8894
79d72f45
HL
8895 /* add, sub without add/sub m, imm. */
8896 if (i.tm.base_opcode <= 5
e379e5f3
L
8897 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8898 || ((i.tm.base_opcode | 3) == 0x83
79d72f45 8899 && (i.tm.extension_opcode == 0x5
e379e5f3 8900 || i.tm.extension_opcode == 0x0)))
79d72f45
HL
8901 {
8902 *mf_cmp_p = mf_cmp_alu_cmp;
8903 return !(i.mem_operands && i.imm_operands);
8904 }
e379e5f3 8905
79d72f45
HL
8906 /* and without and m, imm. */
8907 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8908 || ((i.tm.base_opcode | 3) == 0x83
8909 && i.tm.extension_opcode == 0x4))
8910 {
8911 *mf_cmp_p = mf_cmp_test_and;
8912 return !(i.mem_operands && i.imm_operands);
8913 }
8914
8915 /* test without test m imm. */
e379e5f3
L
8916 if ((i.tm.base_opcode | 1) == 0x85
8917 || (i.tm.base_opcode | 1) == 0xa9
8918 || ((i.tm.base_opcode | 1) == 0xf7
79d72f45
HL
8919 && i.tm.extension_opcode == 0))
8920 {
8921 *mf_cmp_p = mf_cmp_test_and;
8922 return !(i.mem_operands && i.imm_operands);
8923 }
8924
8925 /* cmp without cmp m, imm. */
8926 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
e379e5f3
L
8927 || ((i.tm.base_opcode | 3) == 0x83
8928 && (i.tm.extension_opcode == 0x7)))
79d72f45
HL
8929 {
8930 *mf_cmp_p = mf_cmp_alu_cmp;
8931 return !(i.mem_operands && i.imm_operands);
8932 }
e379e5f3 8933
79d72f45 8934 /* inc, dec without inc/dec m. */
e379e5f3
L
8935 if ((i.tm.cpu_flags.bitfield.cpuno64
8936 && (i.tm.base_opcode | 0xf) == 0x4f)
8937 || ((i.tm.base_opcode | 1) == 0xff
8938 && i.tm.extension_opcode <= 0x1))
79d72f45
HL
8939 {
8940 *mf_cmp_p = mf_cmp_incdec;
8941 return !i.mem_operands;
8942 }
e379e5f3
L
8943
8944 return 0;
8945}
8946
8947/* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8948
8949static int
79d72f45 8950add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
e379e5f3
L
8951{
8952 /* NB: Don't work with COND_JUMP86 without i386. */
8953 if (!align_branch_power
8954 || now_seg == absolute_section
8955 || !cpu_arch_flags.bitfield.cpui386
8956 || !(align_branch & align_branch_fused_bit))
8957 return 0;
8958
79d72f45 8959 if (maybe_fused_with_jcc_p (mf_cmp_p))
e379e5f3
L
8960 {
8961 if (last_insn.kind == last_insn_other
8962 || last_insn.seg != now_seg)
8963 return 1;
8964 if (flag_debug)
8965 as_warn_where (last_insn.file, last_insn.line,
8966 _("`%s` skips -malign-branch-boundary on `%s`"),
8967 last_insn.name, i.tm.name);
8968 }
8969
8970 return 0;
8971}
8972
8973/* Return 1 if a BRANCH_PREFIX frag should be generated. */
8974
8975static int
8976add_branch_prefix_frag_p (void)
8977{
8978 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
8979 to PadLock instructions since they include prefixes in opcode. */
8980 if (!align_branch_power
8981 || !align_branch_prefix_size
8982 || now_seg == absolute_section
8983 || i.tm.cpu_flags.bitfield.cpupadlock
8984 || !cpu_arch_flags.bitfield.cpui386)
8985 return 0;
8986
8987 /* Don't add prefix if it is a prefix or there is no operand in case
8988 that segment prefix is special. */
8989 if (!i.operands || i.tm.opcode_modifier.isprefix)
8990 return 0;
8991
8992 if (last_insn.kind == last_insn_other
8993 || last_insn.seg != now_seg)
8994 return 1;
8995
8996 if (flag_debug)
8997 as_warn_where (last_insn.file, last_insn.line,
8998 _("`%s` skips -malign-branch-boundary on `%s`"),
8999 last_insn.name, i.tm.name);
9000
9001 return 0;
9002}
9003
9004/* Return 1 if a BRANCH_PADDING frag should be generated. */
9005
9006static int
79d72f45
HL
9007add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9008 enum mf_jcc_kind *mf_jcc_p)
e379e5f3
L
9009{
9010 int add_padding;
9011
9012 /* NB: Don't work with COND_JUMP86 without i386. */
9013 if (!align_branch_power
9014 || now_seg == absolute_section
9015 || !cpu_arch_flags.bitfield.cpui386)
9016 return 0;
9017
9018 add_padding = 0;
9019
9020 /* Check for jcc and direct jmp. */
9021 if (i.tm.opcode_modifier.jump == JUMP)
9022 {
9023 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9024 {
9025 *branch_p = align_branch_jmp;
9026 add_padding = align_branch & align_branch_jmp_bit;
9027 }
9028 else
9029 {
79d72f45
HL
9030 /* Because J<cc> and JN<cc> share same group in macro-fusible table,
9031 igore the lowest bit. */
9032 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
e379e5f3
L
9033 *branch_p = align_branch_jcc;
9034 if ((align_branch & align_branch_jcc_bit))
9035 add_padding = 1;
9036 }
9037 }
9038 else if (is_any_vex_encoding (&i.tm))
9039 return 0;
9040 else if ((i.tm.base_opcode | 1) == 0xc3)
9041 {
9042 /* Near ret. */
9043 *branch_p = align_branch_ret;
9044 if ((align_branch & align_branch_ret_bit))
9045 add_padding = 1;
9046 }
9047 else
9048 {
9049 /* Check for indirect jmp, direct and indirect calls. */
9050 if (i.tm.base_opcode == 0xe8)
9051 {
9052 /* Direct call. */
9053 *branch_p = align_branch_call;
9054 if ((align_branch & align_branch_call_bit))
9055 add_padding = 1;
9056 }
9057 else if (i.tm.base_opcode == 0xff
9058 && (i.tm.extension_opcode == 2
9059 || i.tm.extension_opcode == 4))
9060 {
9061 /* Indirect call and jmp. */
9062 *branch_p = align_branch_indirect;
9063 if ((align_branch & align_branch_indirect_bit))
9064 add_padding = 1;
9065 }
9066
9067 if (add_padding
9068 && i.disp_operands
9069 && tls_get_addr
9070 && (i.op[0].disps->X_op == O_symbol
9071 || (i.op[0].disps->X_op == O_subtract
9072 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9073 {
9074 symbolS *s = i.op[0].disps->X_add_symbol;
9075 /* No padding to call to global or undefined tls_get_addr. */
9076 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9077 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9078 return 0;
9079 }
9080 }
9081
9082 if (add_padding
9083 && last_insn.kind != last_insn_other
9084 && last_insn.seg == now_seg)
9085 {
9086 if (flag_debug)
9087 as_warn_where (last_insn.file, last_insn.line,
9088 _("`%s` skips -malign-branch-boundary on `%s`"),
9089 last_insn.name, i.tm.name);
9090 return 0;
9091 }
9092
9093 return add_padding;
9094}
9095
29b0f896 9096static void
e3bb37b5 9097output_insn (void)
29b0f896 9098{
2bbd9c25
JJ
9099 fragS *insn_start_frag;
9100 offsetT insn_start_off;
e379e5f3
L
9101 fragS *fragP = NULL;
9102 enum align_branch_kind branch = align_branch_none;
79d72f45
HL
9103 /* The initializer is arbitrary just to avoid uninitialized error.
9104 it's actually either assigned in add_branch_padding_frag_p
9105 or never be used. */
9106 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
2bbd9c25 9107
b4a3a7b4
L
9108#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9109 if (IS_ELF && x86_used_note)
9110 {
9111 if (i.tm.cpu_flags.bitfield.cpucmov)
9112 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9113 if (i.tm.cpu_flags.bitfield.cpusse)
9114 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9115 if (i.tm.cpu_flags.bitfield.cpusse2)
9116 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9117 if (i.tm.cpu_flags.bitfield.cpusse3)
9118 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9119 if (i.tm.cpu_flags.bitfield.cpussse3)
9120 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9121 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9122 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9123 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9124 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9125 if (i.tm.cpu_flags.bitfield.cpuavx)
9126 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9127 if (i.tm.cpu_flags.bitfield.cpuavx2)
9128 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9129 if (i.tm.cpu_flags.bitfield.cpufma)
9130 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9131 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9132 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9133 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9134 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9135 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9136 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9137 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9138 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9139 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9140 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9141 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9142 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9143 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9144 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9145 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9146 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9147 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9148 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9149 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9150 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9151 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9152 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9153 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9154 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9155 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9156 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9157 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9158 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
462cac58
L
9159 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9160 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
b4a3a7b4
L
9161
9162 if (i.tm.cpu_flags.bitfield.cpu8087
9163 || i.tm.cpu_flags.bitfield.cpu287
9164 || i.tm.cpu_flags.bitfield.cpu387
9165 || i.tm.cpu_flags.bitfield.cpu687
9166 || i.tm.cpu_flags.bitfield.cpufisttp)
9167 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
921eafea 9168 if ((i.xstate & xstate_mmx)
319ff62c 9169 || i.tm.base_opcode == 0xf77 /* emms */
921eafea 9170 || i.tm.base_opcode == 0xf0e /* femms */)
b4a3a7b4 9171 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
921eafea 9172 if ((i.xstate & xstate_xmm))
b4a3a7b4 9173 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
921eafea 9174 if ((i.xstate & xstate_ymm) == xstate_ymm)
b4a3a7b4 9175 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
921eafea 9176 if ((i.xstate & xstate_zmm) == xstate_zmm)
b4a3a7b4
L
9177 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9178 if (i.tm.cpu_flags.bitfield.cpufxsr)
9179 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9180 if (i.tm.cpu_flags.bitfield.cpuxsave)
9181 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9182 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9183 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9184 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9185 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9186 }
9187#endif
9188
29b0f896
AM
9189 /* Tie dwarf2 debug info to the address at the start of the insn.
9190 We can't do this after the insn has been output as the current
9191 frag may have been closed off. eg. by frag_var. */
9192 dwarf2_emit_insn (0);
9193
2bbd9c25
JJ
9194 insn_start_frag = frag_now;
9195 insn_start_off = frag_now_fix ();
9196
79d72f45 9197 if (add_branch_padding_frag_p (&branch, &mf_jcc))
e379e5f3
L
9198 {
9199 char *p;
9200 /* Branch can be 8 bytes. Leave some room for prefixes. */
9201 unsigned int max_branch_padding_size = 14;
9202
9203 /* Align section to boundary. */
9204 record_alignment (now_seg, align_branch_power);
9205
9206 /* Make room for padding. */
9207 frag_grow (max_branch_padding_size);
9208
9209 /* Start of the padding. */
9210 p = frag_more (0);
9211
9212 fragP = frag_now;
9213
9214 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9215 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9216 NULL, 0, p);
9217
79d72f45 9218 fragP->tc_frag_data.mf_type = mf_jcc;
e379e5f3
L
9219 fragP->tc_frag_data.branch_type = branch;
9220 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9221 }
9222
29b0f896 9223 /* Output jumps. */
0cfa3eb3 9224 if (i.tm.opcode_modifier.jump == JUMP)
29b0f896 9225 output_branch ();
0cfa3eb3
JB
9226 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9227 || i.tm.opcode_modifier.jump == JUMP_DWORD)
29b0f896 9228 output_jump ();
0cfa3eb3 9229 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
29b0f896
AM
9230 output_interseg_jump ();
9231 else
9232 {
9233 /* Output normal instructions here. */
9234 char *p;
9235 unsigned char *q;
47465058 9236 unsigned int j;
331d2d0d 9237 unsigned int prefix;
79d72f45 9238 enum mf_cmp_kind mf_cmp;
4dffcebc 9239
e4e00185 9240 if (avoid_fence
c3949f43
JB
9241 && (i.tm.base_opcode == 0xfaee8
9242 || i.tm.base_opcode == 0xfaef0
9243 || i.tm.base_opcode == 0xfaef8))
e4e00185
AS
9244 {
9245 /* Encode lfence, mfence, and sfence as
9246 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9247 offsetT val = 0x240483f0ULL;
9248 p = frag_more (5);
9249 md_number_to_chars (p, val, 5);
9250 return;
9251 }
9252
d022bddd
IT
9253 /* Some processors fail on LOCK prefix. This options makes
9254 assembler ignore LOCK prefix and serves as a workaround. */
9255 if (omit_lock_prefix)
9256 {
9257 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9258 return;
9259 i.prefix[LOCK_PREFIX] = 0;
9260 }
9261
e379e5f3
L
9262 if (branch)
9263 /* Skip if this is a branch. */
9264 ;
79d72f45 9265 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
e379e5f3
L
9266 {
9267 /* Make room for padding. */
9268 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9269 p = frag_more (0);
9270
9271 fragP = frag_now;
9272
9273 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9274 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9275 NULL, 0, p);
9276
79d72f45 9277 fragP->tc_frag_data.mf_type = mf_cmp;
e379e5f3
L
9278 fragP->tc_frag_data.branch_type = align_branch_fused;
9279 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9280 }
9281 else if (add_branch_prefix_frag_p ())
9282 {
9283 unsigned int max_prefix_size = align_branch_prefix_size;
9284
9285 /* Make room for padding. */
9286 frag_grow (max_prefix_size);
9287 p = frag_more (0);
9288
9289 fragP = frag_now;
9290
9291 frag_var (rs_machine_dependent, max_prefix_size, 0,
9292 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9293 NULL, 0, p);
9294
9295 fragP->tc_frag_data.max_bytes = max_prefix_size;
9296 }
9297
43234a1e
L
9298 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9299 don't need the explicit prefix. */
9300 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
bc4bd9ab 9301 {
c0f3af97 9302 switch (i.tm.opcode_length)
bc4bd9ab 9303 {
c0f3af97
L
9304 case 3:
9305 if (i.tm.base_opcode & 0xff000000)
4dffcebc 9306 {
c0f3af97 9307 prefix = (i.tm.base_opcode >> 24) & 0xff;
c3949f43
JB
9308 if (!i.tm.cpu_flags.bitfield.cpupadlock
9309 || prefix != REPE_PREFIX_OPCODE
9310 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9311 add_prefix (prefix);
c0f3af97
L
9312 }
9313 break;
9314 case 2:
9315 if ((i.tm.base_opcode & 0xff0000) != 0)
9316 {
9317 prefix = (i.tm.base_opcode >> 16) & 0xff;
c3949f43 9318 add_prefix (prefix);
4dffcebc 9319 }
c0f3af97
L
9320 break;
9321 case 1:
9322 break;
390c91cf
L
9323 case 0:
9324 /* Check for pseudo prefixes. */
9325 as_bad_where (insn_start_frag->fr_file,
9326 insn_start_frag->fr_line,
9327 _("pseudo prefix without instruction"));
9328 return;
c0f3af97
L
9329 default:
9330 abort ();
bc4bd9ab 9331 }
c0f3af97 9332
6d19a37a 9333#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
cf61b747
L
9334 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9335 R_X86_64_GOTTPOFF relocation so that linker can safely
14470f07
L
9336 perform IE->LE optimization. A dummy REX_OPCODE prefix
9337 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9338 relocation for GDesc -> IE/LE optimization. */
cf61b747
L
9339 if (x86_elf_abi == X86_64_X32_ABI
9340 && i.operands == 2
14470f07
L
9341 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9342 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
cf61b747
L
9343 && i.prefix[REX_PREFIX] == 0)
9344 add_prefix (REX_OPCODE);
6d19a37a 9345#endif
cf61b747 9346
c0f3af97
L
9347 /* The prefix bytes. */
9348 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9349 if (*q)
9350 FRAG_APPEND_1_CHAR (*q);
0f10071e 9351 }
ae5c1c7b 9352 else
c0f3af97
L
9353 {
9354 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9355 if (*q)
9356 switch (j)
9357 {
c0f3af97
L
9358 case SEG_PREFIX:
9359 case ADDR_PREFIX:
9360 FRAG_APPEND_1_CHAR (*q);
9361 break;
9362 default:
9363 /* There should be no other prefixes for instructions
9364 with VEX prefix. */
9365 abort ();
9366 }
9367
43234a1e
L
9368 /* For EVEX instructions i.vrex should become 0 after
9369 build_evex_prefix. For VEX instructions upper 16 registers
9370 aren't available, so VREX should be 0. */
9371 if (i.vrex)
9372 abort ();
c0f3af97
L
9373 /* Now the VEX prefix. */
9374 p = frag_more (i.vex.length);
9375 for (j = 0; j < i.vex.length; j++)
9376 p[j] = i.vex.bytes[j];
9377 }
252b5132 9378
29b0f896 9379 /* Now the opcode; be careful about word order here! */
4dffcebc 9380 if (i.tm.opcode_length == 1)
29b0f896
AM
9381 {
9382 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9383 }
9384 else
9385 {
4dffcebc 9386 switch (i.tm.opcode_length)
331d2d0d 9387 {
43234a1e
L
9388 case 4:
9389 p = frag_more (4);
9390 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9391 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9392 break;
4dffcebc 9393 case 3:
331d2d0d
L
9394 p = frag_more (3);
9395 *p++ = (i.tm.base_opcode >> 16) & 0xff;
4dffcebc
L
9396 break;
9397 case 2:
9398 p = frag_more (2);
9399 break;
9400 default:
9401 abort ();
9402 break;
331d2d0d 9403 }
0f10071e 9404
29b0f896
AM
9405 /* Put out high byte first: can't use md_number_to_chars! */
9406 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9407 *p = i.tm.base_opcode & 0xff;
9408 }
3e73aa7c 9409
29b0f896 9410 /* Now the modrm byte and sib byte (if present). */
40fb9820 9411 if (i.tm.opcode_modifier.modrm)
29b0f896 9412 {
4a3523fa
L
9413 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
9414 | i.rm.reg << 3
9415 | i.rm.mode << 6));
29b0f896
AM
9416 /* If i.rm.regmem == ESP (4)
9417 && i.rm.mode != (Register mode)
9418 && not 16 bit
9419 ==> need second modrm byte. */
9420 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9421 && i.rm.mode != 3
dc821c5f 9422 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
4a3523fa
L
9423 FRAG_APPEND_1_CHAR ((i.sib.base << 0
9424 | i.sib.index << 3
9425 | i.sib.scale << 6));
29b0f896 9426 }
3e73aa7c 9427
29b0f896 9428 if (i.disp_operands)
2bbd9c25 9429 output_disp (insn_start_frag, insn_start_off);
3e73aa7c 9430
29b0f896 9431 if (i.imm_operands)
2bbd9c25 9432 output_imm (insn_start_frag, insn_start_off);
9c33702b
JB
9433
9434 /*
9435 * frag_now_fix () returning plain abs_section_offset when we're in the
9436 * absolute section, and abs_section_offset not getting updated as data
9437 * gets added to the frag breaks the logic below.
9438 */
9439 if (now_seg != absolute_section)
9440 {
9441 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9442 if (j > 15)
9443 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9444 j);
e379e5f3
L
9445 else if (fragP)
9446 {
9447 /* NB: Don't add prefix with GOTPC relocation since
9448 output_disp() above depends on the fixed encoding
9449 length. Can't add prefix with TLS relocation since
9450 it breaks TLS linker optimization. */
9451 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9452 /* Prefix count on the current instruction. */
9453 unsigned int count = i.vex.length;
9454 unsigned int k;
9455 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9456 /* REX byte is encoded in VEX/EVEX prefix. */
9457 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9458 count++;
9459
9460 /* Count prefixes for extended opcode maps. */
9461 if (!i.vex.length)
9462 switch (i.tm.opcode_length)
9463 {
9464 case 3:
9465 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9466 {
9467 count++;
9468 switch ((i.tm.base_opcode >> 8) & 0xff)
9469 {
9470 case 0x38:
9471 case 0x3a:
9472 count++;
9473 break;
9474 default:
9475 break;
9476 }
9477 }
9478 break;
9479 case 2:
9480 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9481 count++;
9482 break;
9483 case 1:
9484 break;
9485 default:
9486 abort ();
9487 }
9488
9489 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9490 == BRANCH_PREFIX)
9491 {
9492 /* Set the maximum prefix size in BRANCH_PREFIX
9493 frag. */
9494 if (fragP->tc_frag_data.max_bytes > max)
9495 fragP->tc_frag_data.max_bytes = max;
9496 if (fragP->tc_frag_data.max_bytes > count)
9497 fragP->tc_frag_data.max_bytes -= count;
9498 else
9499 fragP->tc_frag_data.max_bytes = 0;
9500 }
9501 else
9502 {
9503 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9504 frag. */
9505 unsigned int max_prefix_size;
9506 if (align_branch_prefix_size > max)
9507 max_prefix_size = max;
9508 else
9509 max_prefix_size = align_branch_prefix_size;
9510 if (max_prefix_size > count)
9511 fragP->tc_frag_data.max_prefix_length
9512 = max_prefix_size - count;
9513 }
9514
9515 /* Use existing segment prefix if possible. Use CS
9516 segment prefix in 64-bit mode. In 32-bit mode, use SS
9517 segment prefix with ESP/EBP base register and use DS
9518 segment prefix without ESP/EBP base register. */
9519 if (i.prefix[SEG_PREFIX])
9520 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9521 else if (flag_code == CODE_64BIT)
9522 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9523 else if (i.base_reg
9524 && (i.base_reg->reg_num == 4
9525 || i.base_reg->reg_num == 5))
9526 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9527 else
9528 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9529 }
9c33702b 9530 }
29b0f896 9531 }
252b5132 9532
e379e5f3
L
9533 /* NB: Don't work with COND_JUMP86 without i386. */
9534 if (align_branch_power
9535 && now_seg != absolute_section
9536 && cpu_arch_flags.bitfield.cpui386)
9537 {
9538 /* Terminate each frag so that we can add prefix and check for
9539 fused jcc. */
9540 frag_wane (frag_now);
9541 frag_new (0);
9542 }
9543
29b0f896
AM
9544#ifdef DEBUG386
9545 if (flag_debug)
9546 {
7b81dfbb 9547 pi ("" /*line*/, &i);
29b0f896
AM
9548 }
9549#endif /* DEBUG386 */
9550}
252b5132 9551
e205caa7
L
9552/* Return the size of the displacement operand N. */
9553
9554static int
9555disp_size (unsigned int n)
9556{
9557 int size = 4;
43234a1e 9558
b5014f7a 9559 if (i.types[n].bitfield.disp64)
40fb9820
L
9560 size = 8;
9561 else if (i.types[n].bitfield.disp8)
9562 size = 1;
9563 else if (i.types[n].bitfield.disp16)
9564 size = 2;
e205caa7
L
9565 return size;
9566}
9567
9568/* Return the size of the immediate operand N. */
9569
9570static int
9571imm_size (unsigned int n)
9572{
9573 int size = 4;
40fb9820
L
9574 if (i.types[n].bitfield.imm64)
9575 size = 8;
9576 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9577 size = 1;
9578 else if (i.types[n].bitfield.imm16)
9579 size = 2;
e205caa7
L
9580 return size;
9581}
9582
29b0f896 9583static void
64e74474 9584output_disp (fragS *insn_start_frag, offsetT insn_start_off)
29b0f896
AM
9585{
9586 char *p;
9587 unsigned int n;
252b5132 9588
29b0f896
AM
9589 for (n = 0; n < i.operands; n++)
9590 {
b5014f7a 9591 if (operand_type_check (i.types[n], disp))
29b0f896
AM
9592 {
9593 if (i.op[n].disps->X_op == O_constant)
9594 {
e205caa7 9595 int size = disp_size (n);
43234a1e 9596 offsetT val = i.op[n].disps->X_add_number;
252b5132 9597
629cfaf1
JB
9598 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9599 size);
29b0f896
AM
9600 p = frag_more (size);
9601 md_number_to_chars (p, val, size);
9602 }
9603 else
9604 {
f86103b7 9605 enum bfd_reloc_code_real reloc_type;
e205caa7 9606 int size = disp_size (n);
40fb9820 9607 int sign = i.types[n].bitfield.disp32s;
29b0f896 9608 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
02a86693 9609 fixS *fixP;
29b0f896 9610
e205caa7 9611 /* We can't have 8 bit displacement here. */
9c2799c2 9612 gas_assert (!i.types[n].bitfield.disp8);
e205caa7 9613
29b0f896
AM
9614 /* The PC relative address is computed relative
9615 to the instruction boundary, so in case immediate
9616 fields follows, we need to adjust the value. */
9617 if (pcrel && i.imm_operands)
9618 {
29b0f896 9619 unsigned int n1;
e205caa7 9620 int sz = 0;
252b5132 9621
29b0f896 9622 for (n1 = 0; n1 < i.operands; n1++)
40fb9820 9623 if (operand_type_check (i.types[n1], imm))
252b5132 9624 {
e205caa7
L
9625 /* Only one immediate is allowed for PC
9626 relative address. */
9c2799c2 9627 gas_assert (sz == 0);
e205caa7
L
9628 sz = imm_size (n1);
9629 i.op[n].disps->X_add_number -= sz;
252b5132 9630 }
29b0f896 9631 /* We should find the immediate. */
9c2799c2 9632 gas_assert (sz != 0);
29b0f896 9633 }
520dc8e8 9634
29b0f896 9635 p = frag_more (size);
d258b828 9636 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
d6ab8113 9637 if (GOT_symbol
2bbd9c25 9638 && GOT_symbol == i.op[n].disps->X_add_symbol
d6ab8113 9639 && (((reloc_type == BFD_RELOC_32
7b81dfbb
AJ
9640 || reloc_type == BFD_RELOC_X86_64_32S
9641 || (reloc_type == BFD_RELOC_64
9642 && object_64bit))
d6ab8113
JB
9643 && (i.op[n].disps->X_op == O_symbol
9644 || (i.op[n].disps->X_op == O_add
9645 && ((symbol_get_value_expression
9646 (i.op[n].disps->X_op_symbol)->X_op)
9647 == O_subtract))))
9648 || reloc_type == BFD_RELOC_32_PCREL))
2bbd9c25 9649 {
4fa24527 9650 if (!object_64bit)
7b81dfbb
AJ
9651 {
9652 reloc_type = BFD_RELOC_386_GOTPC;
e379e5f3 9653 i.has_gotpc_tls_reloc = TRUE;
d583596c
JB
9654 i.op[n].imms->X_add_number +=
9655 encoding_length (insn_start_frag, insn_start_off, p);
7b81dfbb
AJ
9656 }
9657 else if (reloc_type == BFD_RELOC_64)
9658 reloc_type = BFD_RELOC_X86_64_GOTPC64;
d6ab8113 9659 else
7b81dfbb
AJ
9660 /* Don't do the adjustment for x86-64, as there
9661 the pcrel addressing is relative to the _next_
9662 insn, and that is taken care of in other code. */
d6ab8113 9663 reloc_type = BFD_RELOC_X86_64_GOTPC32;
2bbd9c25 9664 }
e379e5f3
L
9665 else if (align_branch_power)
9666 {
9667 switch (reloc_type)
9668 {
9669 case BFD_RELOC_386_TLS_GD:
9670 case BFD_RELOC_386_TLS_LDM:
9671 case BFD_RELOC_386_TLS_IE:
9672 case BFD_RELOC_386_TLS_IE_32:
9673 case BFD_RELOC_386_TLS_GOTIE:
9674 case BFD_RELOC_386_TLS_GOTDESC:
9675 case BFD_RELOC_386_TLS_DESC_CALL:
9676 case BFD_RELOC_X86_64_TLSGD:
9677 case BFD_RELOC_X86_64_TLSLD:
9678 case BFD_RELOC_X86_64_GOTTPOFF:
9679 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9680 case BFD_RELOC_X86_64_TLSDESC_CALL:
9681 i.has_gotpc_tls_reloc = TRUE;
9682 default:
9683 break;
9684 }
9685 }
02a86693
L
9686 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9687 size, i.op[n].disps, pcrel,
9688 reloc_type);
9689 /* Check for "call/jmp *mem", "mov mem, %reg",
9690 "test %reg, mem" and "binop mem, %reg" where binop
9691 is one of adc, add, and, cmp, or, sbb, sub, xor
e60f4d3b
L
9692 instructions without data prefix. Always generate
9693 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9694 if (i.prefix[DATA_PREFIX] == 0
9695 && (generate_relax_relocations
9696 || (!object_64bit
9697 && i.rm.mode == 0
9698 && i.rm.regmem == 5))
0cb4071e
L
9699 && (i.rm.mode == 2
9700 || (i.rm.mode == 0 && i.rm.regmem == 5))
2ae4c703 9701 && !is_any_vex_encoding(&i.tm)
02a86693
L
9702 && ((i.operands == 1
9703 && i.tm.base_opcode == 0xff
9704 && (i.rm.reg == 2 || i.rm.reg == 4))
9705 || (i.operands == 2
9706 && (i.tm.base_opcode == 0x8b
9707 || i.tm.base_opcode == 0x85
2ae4c703 9708 || (i.tm.base_opcode & ~0x38) == 0x03))))
02a86693
L
9709 {
9710 if (object_64bit)
9711 {
9712 fixP->fx_tcbit = i.rex != 0;
9713 if (i.base_reg
e968fc9b 9714 && (i.base_reg->reg_num == RegIP))
02a86693
L
9715 fixP->fx_tcbit2 = 1;
9716 }
9717 else
9718 fixP->fx_tcbit2 = 1;
9719 }
29b0f896
AM
9720 }
9721 }
9722 }
9723}
252b5132 9724
29b0f896 9725static void
64e74474 9726output_imm (fragS *insn_start_frag, offsetT insn_start_off)
29b0f896
AM
9727{
9728 char *p;
9729 unsigned int n;
252b5132 9730
29b0f896
AM
9731 for (n = 0; n < i.operands; n++)
9732 {
43234a1e
L
9733 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9734 if (i.rounding && (int) n == i.rounding->operand)
9735 continue;
9736
40fb9820 9737 if (operand_type_check (i.types[n], imm))
29b0f896
AM
9738 {
9739 if (i.op[n].imms->X_op == O_constant)
9740 {
e205caa7 9741 int size = imm_size (n);
29b0f896 9742 offsetT val;
b4cac588 9743
29b0f896
AM
9744 val = offset_in_range (i.op[n].imms->X_add_number,
9745 size);
9746 p = frag_more (size);
9747 md_number_to_chars (p, val, size);
9748 }
9749 else
9750 {
9751 /* Not absolute_section.
9752 Need a 32-bit fixup (don't support 8bit
9753 non-absolute imms). Try to support other
9754 sizes ... */
f86103b7 9755 enum bfd_reloc_code_real reloc_type;
e205caa7
L
9756 int size = imm_size (n);
9757 int sign;
29b0f896 9758
40fb9820 9759 if (i.types[n].bitfield.imm32s
a7d61044 9760 && (i.suffix == QWORD_MNEM_SUFFIX
40fb9820 9761 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
29b0f896 9762 sign = 1;
e205caa7
L
9763 else
9764 sign = 0;
520dc8e8 9765
29b0f896 9766 p = frag_more (size);
d258b828 9767 reloc_type = reloc (size, 0, sign, i.reloc[n]);
f86103b7 9768
2bbd9c25
JJ
9769 /* This is tough to explain. We end up with this one if we
9770 * have operands that look like
9771 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9772 * obtain the absolute address of the GOT, and it is strongly
9773 * preferable from a performance point of view to avoid using
9774 * a runtime relocation for this. The actual sequence of
9775 * instructions often look something like:
9776 *
9777 * call .L66
9778 * .L66:
9779 * popl %ebx
9780 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9781 *
9782 * The call and pop essentially return the absolute address
9783 * of the label .L66 and store it in %ebx. The linker itself
9784 * will ultimately change the first operand of the addl so
9785 * that %ebx points to the GOT, but to keep things simple, the
9786 * .o file must have this operand set so that it generates not
9787 * the absolute address of .L66, but the absolute address of
9788 * itself. This allows the linker itself simply treat a GOTPC
9789 * relocation as asking for a pcrel offset to the GOT to be
9790 * added in, and the addend of the relocation is stored in the
9791 * operand field for the instruction itself.
9792 *
9793 * Our job here is to fix the operand so that it would add
9794 * the correct offset so that %ebx would point to itself. The
9795 * thing that is tricky is that .-.L66 will point to the
9796 * beginning of the instruction, so we need to further modify
9797 * the operand so that it will point to itself. There are
9798 * other cases where you have something like:
9799 *
9800 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9801 *
9802 * and here no correction would be required. Internally in
9803 * the assembler we treat operands of this form as not being
9804 * pcrel since the '.' is explicitly mentioned, and I wonder
9805 * whether it would simplify matters to do it this way. Who
9806 * knows. In earlier versions of the PIC patches, the
9807 * pcrel_adjust field was used to store the correction, but
9808 * since the expression is not pcrel, I felt it would be
9809 * confusing to do it this way. */
9810
d6ab8113 9811 if ((reloc_type == BFD_RELOC_32
7b81dfbb
AJ
9812 || reloc_type == BFD_RELOC_X86_64_32S
9813 || reloc_type == BFD_RELOC_64)
29b0f896
AM
9814 && GOT_symbol
9815 && GOT_symbol == i.op[n].imms->X_add_symbol
9816 && (i.op[n].imms->X_op == O_symbol
9817 || (i.op[n].imms->X_op == O_add
9818 && ((symbol_get_value_expression
9819 (i.op[n].imms->X_op_symbol)->X_op)
9820 == O_subtract))))
9821 {
4fa24527 9822 if (!object_64bit)
d6ab8113 9823 reloc_type = BFD_RELOC_386_GOTPC;
7b81dfbb 9824 else if (size == 4)
d6ab8113 9825 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7b81dfbb
AJ
9826 else if (size == 8)
9827 reloc_type = BFD_RELOC_X86_64_GOTPC64;
e379e5f3 9828 i.has_gotpc_tls_reloc = TRUE;
d583596c
JB
9829 i.op[n].imms->X_add_number +=
9830 encoding_length (insn_start_frag, insn_start_off, p);
29b0f896 9831 }
29b0f896
AM
9832 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9833 i.op[n].imms, 0, reloc_type);
9834 }
9835 }
9836 }
252b5132
RH
9837}
9838\f
d182319b
JB
9839/* x86_cons_fix_new is called via the expression parsing code when a
9840 reloc is needed. We use this hook to get the correct .got reloc. */
d182319b
JB
9841static int cons_sign = -1;
9842
9843void
e3bb37b5 9844x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
62ebcb5c 9845 expressionS *exp, bfd_reloc_code_real_type r)
d182319b 9846{
d258b828 9847 r = reloc (len, 0, cons_sign, r);
d182319b
JB
9848
9849#ifdef TE_PE
9850 if (exp->X_op == O_secrel)
9851 {
9852 exp->X_op = O_symbol;
9853 r = BFD_RELOC_32_SECREL;
9854 }
9855#endif
9856
9857 fix_new_exp (frag, off, len, exp, 0, r);
9858}
9859
357d1bd8
L
9860/* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9861 purpose of the `.dc.a' internal pseudo-op. */
9862
9863int
9864x86_address_bytes (void)
9865{
9866 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9867 return 4;
9868 return stdoutput->arch_info->bits_per_address / 8;
9869}
9870
d382c579
TG
9871#if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9872 || defined (LEX_AT)
d258b828 9873# define lex_got(reloc, adjust, types) NULL
718ddfc0 9874#else
f3c180ae
AM
9875/* Parse operands of the form
9876 <symbol>@GOTOFF+<nnn>
9877 and similar .plt or .got references.
9878
9879 If we find one, set up the correct relocation in RELOC and copy the
9880 input string, minus the `@GOTOFF' into a malloc'd buffer for
9881 parsing by the calling routine. Return this buffer, and if ADJUST
9882 is non-null set it to the length of the string we removed from the
9883 input line. Otherwise return NULL. */
9884static char *
91d6fa6a 9885lex_got (enum bfd_reloc_code_real *rel,
64e74474 9886 int *adjust,
d258b828 9887 i386_operand_type *types)
f3c180ae 9888{
7b81dfbb
AJ
9889 /* Some of the relocations depend on the size of what field is to
9890 be relocated. But in our callers i386_immediate and i386_displacement
9891 we don't yet know the operand size (this will be set by insn
9892 matching). Hence we record the word32 relocation here,
9893 and adjust the reloc according to the real size in reloc(). */
f3c180ae
AM
9894 static const struct {
9895 const char *str;
cff8d58a 9896 int len;
4fa24527 9897 const enum bfd_reloc_code_real rel[2];
40fb9820 9898 const i386_operand_type types64;
f3c180ae 9899 } gotrel[] = {
8ce3d284 9900#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
9901 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9902 BFD_RELOC_SIZE32 },
9903 OPERAND_TYPE_IMM32_64 },
8ce3d284 9904#endif
cff8d58a
L
9905 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9906 BFD_RELOC_X86_64_PLTOFF64 },
40fb9820 9907 OPERAND_TYPE_IMM64 },
cff8d58a
L
9908 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9909 BFD_RELOC_X86_64_PLT32 },
40fb9820 9910 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9911 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9912 BFD_RELOC_X86_64_GOTPLT64 },
40fb9820 9913 OPERAND_TYPE_IMM64_DISP64 },
cff8d58a
L
9914 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9915 BFD_RELOC_X86_64_GOTOFF64 },
40fb9820 9916 OPERAND_TYPE_IMM64_DISP64 },
cff8d58a
L
9917 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9918 BFD_RELOC_X86_64_GOTPCREL },
40fb9820 9919 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9920 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9921 BFD_RELOC_X86_64_TLSGD },
40fb9820 9922 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9923 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9924 _dummy_first_bfd_reloc_code_real },
40fb9820 9925 OPERAND_TYPE_NONE },
cff8d58a
L
9926 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9927 BFD_RELOC_X86_64_TLSLD },
40fb9820 9928 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9929 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9930 BFD_RELOC_X86_64_GOTTPOFF },
40fb9820 9931 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9932 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9933 BFD_RELOC_X86_64_TPOFF32 },
40fb9820 9934 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
cff8d58a
L
9935 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9936 _dummy_first_bfd_reloc_code_real },
40fb9820 9937 OPERAND_TYPE_NONE },
cff8d58a
L
9938 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9939 BFD_RELOC_X86_64_DTPOFF32 },
40fb9820 9940 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
cff8d58a
L
9941 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9942 _dummy_first_bfd_reloc_code_real },
40fb9820 9943 OPERAND_TYPE_NONE },
cff8d58a
L
9944 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9945 _dummy_first_bfd_reloc_code_real },
40fb9820 9946 OPERAND_TYPE_NONE },
cff8d58a
L
9947 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9948 BFD_RELOC_X86_64_GOT32 },
40fb9820 9949 OPERAND_TYPE_IMM32_32S_64_DISP32 },
cff8d58a
L
9950 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9951 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
40fb9820 9952 OPERAND_TYPE_IMM32_32S_DISP32 },
cff8d58a
L
9953 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9954 BFD_RELOC_X86_64_TLSDESC_CALL },
40fb9820 9955 OPERAND_TYPE_IMM32_32S_DISP32 },
f3c180ae
AM
9956 };
9957 char *cp;
9958 unsigned int j;
9959
d382c579 9960#if defined (OBJ_MAYBE_ELF)
718ddfc0
JB
9961 if (!IS_ELF)
9962 return NULL;
d382c579 9963#endif
718ddfc0 9964
f3c180ae 9965 for (cp = input_line_pointer; *cp != '@'; cp++)
67c11a9b 9966 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
f3c180ae
AM
9967 return NULL;
9968
47465058 9969 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
f3c180ae 9970 {
cff8d58a 9971 int len = gotrel[j].len;
28f81592 9972 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
f3c180ae 9973 {
4fa24527 9974 if (gotrel[j].rel[object_64bit] != 0)
f3c180ae 9975 {
28f81592
AM
9976 int first, second;
9977 char *tmpbuf, *past_reloc;
f3c180ae 9978
91d6fa6a 9979 *rel = gotrel[j].rel[object_64bit];
f3c180ae 9980
3956db08
JB
9981 if (types)
9982 {
9983 if (flag_code != CODE_64BIT)
40fb9820
L
9984 {
9985 types->bitfield.imm32 = 1;
9986 types->bitfield.disp32 = 1;
9987 }
3956db08
JB
9988 else
9989 *types = gotrel[j].types64;
9990 }
9991
8fd4256d 9992 if (j != 0 && GOT_symbol == NULL)
f3c180ae
AM
9993 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9994
28f81592 9995 /* The length of the first part of our input line. */
f3c180ae 9996 first = cp - input_line_pointer;
28f81592
AM
9997
9998 /* The second part goes from after the reloc token until
67c11a9b 9999 (and including) an end_of_line char or comma. */
28f81592 10000 past_reloc = cp + 1 + len;
67c11a9b
AM
10001 cp = past_reloc;
10002 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10003 ++cp;
10004 second = cp + 1 - past_reloc;
28f81592
AM
10005
10006 /* Allocate and copy string. The trailing NUL shouldn't
10007 be necessary, but be safe. */
add39d23 10008 tmpbuf = XNEWVEC (char, first + second + 2);
f3c180ae 10009 memcpy (tmpbuf, input_line_pointer, first);
0787a12d
AM
10010 if (second != 0 && *past_reloc != ' ')
10011 /* Replace the relocation token with ' ', so that
10012 errors like foo@GOTOFF1 will be detected. */
10013 tmpbuf[first++] = ' ';
af89796a
L
10014 else
10015 /* Increment length by 1 if the relocation token is
10016 removed. */
10017 len++;
10018 if (adjust)
10019 *adjust = len;
0787a12d
AM
10020 memcpy (tmpbuf + first, past_reloc, second);
10021 tmpbuf[first + second] = '\0';
f3c180ae
AM
10022 return tmpbuf;
10023 }
10024
4fa24527
JB
10025 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10026 gotrel[j].str, 1 << (5 + object_64bit));
f3c180ae
AM
10027 return NULL;
10028 }
10029 }
10030
10031 /* Might be a symbol version string. Don't as_bad here. */
10032 return NULL;
10033}
4e4f7c87 10034#endif
f3c180ae 10035
a988325c
NC
10036#ifdef TE_PE
10037#ifdef lex_got
10038#undef lex_got
10039#endif
10040/* Parse operands of the form
10041 <symbol>@SECREL32+<nnn>
10042
10043 If we find one, set up the correct relocation in RELOC and copy the
10044 input string, minus the `@SECREL32' into a malloc'd buffer for
10045 parsing by the calling routine. Return this buffer, and if ADJUST
10046 is non-null set it to the length of the string we removed from the
34bca508
L
10047 input line. Otherwise return NULL.
10048
a988325c
NC
10049 This function is copied from the ELF version above adjusted for PE targets. */
10050
10051static char *
10052lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10053 int *adjust ATTRIBUTE_UNUSED,
d258b828 10054 i386_operand_type *types)
a988325c
NC
10055{
10056 static const struct
10057 {
10058 const char *str;
10059 int len;
10060 const enum bfd_reloc_code_real rel[2];
10061 const i386_operand_type types64;
10062 }
10063 gotrel[] =
10064 {
10065 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10066 BFD_RELOC_32_SECREL },
10067 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10068 };
10069
10070 char *cp;
10071 unsigned j;
10072
10073 for (cp = input_line_pointer; *cp != '@'; cp++)
10074 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10075 return NULL;
10076
10077 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10078 {
10079 int len = gotrel[j].len;
10080
10081 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10082 {
10083 if (gotrel[j].rel[object_64bit] != 0)
10084 {
10085 int first, second;
10086 char *tmpbuf, *past_reloc;
10087
10088 *rel = gotrel[j].rel[object_64bit];
10089 if (adjust)
10090 *adjust = len;
10091
10092 if (types)
10093 {
10094 if (flag_code != CODE_64BIT)
10095 {
10096 types->bitfield.imm32 = 1;
10097 types->bitfield.disp32 = 1;
10098 }
10099 else
10100 *types = gotrel[j].types64;
10101 }
10102
10103 /* The length of the first part of our input line. */
10104 first = cp - input_line_pointer;
10105
10106 /* The second part goes from after the reloc token until
10107 (and including) an end_of_line char or comma. */
10108 past_reloc = cp + 1 + len;
10109 cp = past_reloc;
10110 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10111 ++cp;
10112 second = cp + 1 - past_reloc;
10113
10114 /* Allocate and copy string. The trailing NUL shouldn't
10115 be necessary, but be safe. */
add39d23 10116 tmpbuf = XNEWVEC (char, first + second + 2);
a988325c
NC
10117 memcpy (tmpbuf, input_line_pointer, first);
10118 if (second != 0 && *past_reloc != ' ')
10119 /* Replace the relocation token with ' ', so that
10120 errors like foo@SECLREL321 will be detected. */
10121 tmpbuf[first++] = ' ';
10122 memcpy (tmpbuf + first, past_reloc, second);
10123 tmpbuf[first + second] = '\0';
10124 return tmpbuf;
10125 }
10126
10127 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10128 gotrel[j].str, 1 << (5 + object_64bit));
10129 return NULL;
10130 }
10131 }
10132
10133 /* Might be a symbol version string. Don't as_bad here. */
10134 return NULL;
10135}
10136
10137#endif /* TE_PE */
10138
62ebcb5c 10139bfd_reloc_code_real_type
e3bb37b5 10140x86_cons (expressionS *exp, int size)
f3c180ae 10141{
62ebcb5c
AM
10142 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10143
ee86248c
JB
10144 intel_syntax = -intel_syntax;
10145
3c7b9c2c 10146 exp->X_md = 0;
4fa24527 10147 if (size == 4 || (object_64bit && size == 8))
f3c180ae
AM
10148 {
10149 /* Handle @GOTOFF and the like in an expression. */
10150 char *save;
10151 char *gotfree_input_line;
4a57f2cf 10152 int adjust = 0;
f3c180ae
AM
10153
10154 save = input_line_pointer;
d258b828 10155 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
f3c180ae
AM
10156 if (gotfree_input_line)
10157 input_line_pointer = gotfree_input_line;
10158
10159 expression (exp);
10160
10161 if (gotfree_input_line)
10162 {
10163 /* expression () has merrily parsed up to the end of line,
10164 or a comma - in the wrong buffer. Transfer how far
10165 input_line_pointer has moved to the right buffer. */
10166 input_line_pointer = (save
10167 + (input_line_pointer - gotfree_input_line)
10168 + adjust);
10169 free (gotfree_input_line);
3992d3b7
AM
10170 if (exp->X_op == O_constant
10171 || exp->X_op == O_absent
10172 || exp->X_op == O_illegal
0398aac5 10173 || exp->X_op == O_register
3992d3b7
AM
10174 || exp->X_op == O_big)
10175 {
10176 char c = *input_line_pointer;
10177 *input_line_pointer = 0;
10178 as_bad (_("missing or invalid expression `%s'"), save);
10179 *input_line_pointer = c;
10180 }
b9519cfe
L
10181 else if ((got_reloc == BFD_RELOC_386_PLT32
10182 || got_reloc == BFD_RELOC_X86_64_PLT32)
10183 && exp->X_op != O_symbol)
10184 {
10185 char c = *input_line_pointer;
10186 *input_line_pointer = 0;
10187 as_bad (_("invalid PLT expression `%s'"), save);
10188 *input_line_pointer = c;
10189 }
f3c180ae
AM
10190 }
10191 }
10192 else
10193 expression (exp);
ee86248c
JB
10194
10195 intel_syntax = -intel_syntax;
10196
10197 if (intel_syntax)
10198 i386_intel_simplify (exp);
62ebcb5c
AM
10199
10200 return got_reloc;
f3c180ae 10201}
f3c180ae 10202
9f32dd5b
L
10203static void
10204signed_cons (int size)
6482c264 10205{
d182319b
JB
10206 if (flag_code == CODE_64BIT)
10207 cons_sign = 1;
10208 cons (size);
10209 cons_sign = -1;
6482c264
NC
10210}
10211
d182319b 10212#ifdef TE_PE
6482c264 10213static void
7016a5d5 10214pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
6482c264
NC
10215{
10216 expressionS exp;
10217
10218 do
10219 {
10220 expression (&exp);
10221 if (exp.X_op == O_symbol)
10222 exp.X_op = O_secrel;
10223
10224 emit_expr (&exp, 4);
10225 }
10226 while (*input_line_pointer++ == ',');
10227
10228 input_line_pointer--;
10229 demand_empty_rest_of_line ();
10230}
6482c264
NC
10231#endif
10232
43234a1e
L
10233/* Handle Vector operations. */
10234
10235static char *
10236check_VecOperations (char *op_string, char *op_end)
10237{
10238 const reg_entry *mask;
10239 const char *saved;
10240 char *end_op;
10241
10242 while (*op_string
10243 && (op_end == NULL || op_string < op_end))
10244 {
10245 saved = op_string;
10246 if (*op_string == '{')
10247 {
10248 op_string++;
10249
10250 /* Check broadcasts. */
10251 if (strncmp (op_string, "1to", 3) == 0)
10252 {
10253 int bcst_type;
10254
10255 if (i.broadcast)
10256 goto duplicated_vec_op;
10257
10258 op_string += 3;
10259 if (*op_string == '8')
8e6e0792 10260 bcst_type = 8;
b28d1bda 10261 else if (*op_string == '4')
8e6e0792 10262 bcst_type = 4;
b28d1bda 10263 else if (*op_string == '2')
8e6e0792 10264 bcst_type = 2;
43234a1e
L
10265 else if (*op_string == '1'
10266 && *(op_string+1) == '6')
10267 {
8e6e0792 10268 bcst_type = 16;
43234a1e
L
10269 op_string++;
10270 }
10271 else
10272 {
10273 as_bad (_("Unsupported broadcast: `%s'"), saved);
10274 return NULL;
10275 }
10276 op_string++;
10277
10278 broadcast_op.type = bcst_type;
10279 broadcast_op.operand = this_operand;
1f75763a 10280 broadcast_op.bytes = 0;
43234a1e
L
10281 i.broadcast = &broadcast_op;
10282 }
10283 /* Check masking operation. */
10284 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10285 {
8a6fb3f9
JB
10286 if (mask == &bad_reg)
10287 return NULL;
10288
43234a1e 10289 /* k0 can't be used for write mask. */
f74a6307 10290 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
43234a1e 10291 {
6d2cd6b2
JB
10292 as_bad (_("`%s%s' can't be used for write mask"),
10293 register_prefix, mask->reg_name);
43234a1e
L
10294 return NULL;
10295 }
10296
10297 if (!i.mask)
10298 {
10299 mask_op.mask = mask;
10300 mask_op.zeroing = 0;
10301 mask_op.operand = this_operand;
10302 i.mask = &mask_op;
10303 }
10304 else
10305 {
10306 if (i.mask->mask)
10307 goto duplicated_vec_op;
10308
10309 i.mask->mask = mask;
10310
10311 /* Only "{z}" is allowed here. No need to check
10312 zeroing mask explicitly. */
10313 if (i.mask->operand != this_operand)
10314 {
10315 as_bad (_("invalid write mask `%s'"), saved);
10316 return NULL;
10317 }
10318 }
10319
10320 op_string = end_op;
10321 }
10322 /* Check zeroing-flag for masking operation. */
10323 else if (*op_string == 'z')
10324 {
10325 if (!i.mask)
10326 {
10327 mask_op.mask = NULL;
10328 mask_op.zeroing = 1;
10329 mask_op.operand = this_operand;
10330 i.mask = &mask_op;
10331 }
10332 else
10333 {
10334 if (i.mask->zeroing)
10335 {
10336 duplicated_vec_op:
10337 as_bad (_("duplicated `%s'"), saved);
10338 return NULL;
10339 }
10340
10341 i.mask->zeroing = 1;
10342
10343 /* Only "{%k}" is allowed here. No need to check mask
10344 register explicitly. */
10345 if (i.mask->operand != this_operand)
10346 {
10347 as_bad (_("invalid zeroing-masking `%s'"),
10348 saved);
10349 return NULL;
10350 }
10351 }
10352
10353 op_string++;
10354 }
10355 else
10356 goto unknown_vec_op;
10357
10358 if (*op_string != '}')
10359 {
10360 as_bad (_("missing `}' in `%s'"), saved);
10361 return NULL;
10362 }
10363 op_string++;
0ba3a731
L
10364
10365 /* Strip whitespace since the addition of pseudo prefixes
10366 changed how the scrubber treats '{'. */
10367 if (is_space_char (*op_string))
10368 ++op_string;
10369
43234a1e
L
10370 continue;
10371 }
10372 unknown_vec_op:
10373 /* We don't know this one. */
10374 as_bad (_("unknown vector operation: `%s'"), saved);
10375 return NULL;
10376 }
10377
6d2cd6b2
JB
10378 if (i.mask && i.mask->zeroing && !i.mask->mask)
10379 {
10380 as_bad (_("zeroing-masking only allowed with write mask"));
10381 return NULL;
10382 }
10383
43234a1e
L
10384 return op_string;
10385}
10386
252b5132 10387static int
70e41ade 10388i386_immediate (char *imm_start)
252b5132
RH
10389{
10390 char *save_input_line_pointer;
f3c180ae 10391 char *gotfree_input_line;
252b5132 10392 segT exp_seg = 0;
47926f60 10393 expressionS *exp;
40fb9820
L
10394 i386_operand_type types;
10395
0dfbf9d7 10396 operand_type_set (&types, ~0);
252b5132
RH
10397
10398 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10399 {
31b2323c
L
10400 as_bad (_("at most %d immediate operands are allowed"),
10401 MAX_IMMEDIATE_OPERANDS);
252b5132
RH
10402 return 0;
10403 }
10404
10405 exp = &im_expressions[i.imm_operands++];
520dc8e8 10406 i.op[this_operand].imms = exp;
252b5132
RH
10407
10408 if (is_space_char (*imm_start))
10409 ++imm_start;
10410
10411 save_input_line_pointer = input_line_pointer;
10412 input_line_pointer = imm_start;
10413
d258b828 10414 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
f3c180ae
AM
10415 if (gotfree_input_line)
10416 input_line_pointer = gotfree_input_line;
252b5132
RH
10417
10418 exp_seg = expression (exp);
10419
83183c0c 10420 SKIP_WHITESPACE ();
43234a1e
L
10421
10422 /* Handle vector operations. */
10423 if (*input_line_pointer == '{')
10424 {
10425 input_line_pointer = check_VecOperations (input_line_pointer,
10426 NULL);
10427 if (input_line_pointer == NULL)
10428 return 0;
10429 }
10430
252b5132 10431 if (*input_line_pointer)
f3c180ae 10432 as_bad (_("junk `%s' after expression"), input_line_pointer);
252b5132
RH
10433
10434 input_line_pointer = save_input_line_pointer;
f3c180ae 10435 if (gotfree_input_line)
ee86248c
JB
10436 {
10437 free (gotfree_input_line);
10438
10439 if (exp->X_op == O_constant || exp->X_op == O_register)
10440 exp->X_op = O_illegal;
10441 }
10442
10443 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10444}
252b5132 10445
ee86248c
JB
10446static int
10447i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10448 i386_operand_type types, const char *imm_start)
10449{
10450 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
252b5132 10451 {
313c53d1
L
10452 if (imm_start)
10453 as_bad (_("missing or invalid immediate expression `%s'"),
10454 imm_start);
3992d3b7 10455 return 0;
252b5132 10456 }
3e73aa7c 10457 else if (exp->X_op == O_constant)
252b5132 10458 {
47926f60 10459 /* Size it properly later. */
40fb9820 10460 i.types[this_operand].bitfield.imm64 = 1;
13f864ae
L
10461 /* If not 64bit, sign extend val. */
10462 if (flag_code != CODE_64BIT
4eed87de
AM
10463 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10464 exp->X_add_number
10465 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
252b5132 10466 }
4c63da97 10467#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
f86103b7 10468 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
31312f95 10469 && exp_seg != absolute_section
47926f60 10470 && exp_seg != text_section
24eab124
AM
10471 && exp_seg != data_section
10472 && exp_seg != bss_section
10473 && exp_seg != undefined_section
f86103b7 10474 && !bfd_is_com_section (exp_seg))
252b5132 10475 {
d0b47220 10476 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
252b5132
RH
10477 return 0;
10478 }
10479#endif
a841bdf5 10480 else if (!intel_syntax && exp_seg == reg_section)
bb8f5920 10481 {
313c53d1
L
10482 if (imm_start)
10483 as_bad (_("illegal immediate register operand %s"), imm_start);
bb8f5920
L
10484 return 0;
10485 }
252b5132
RH
10486 else
10487 {
10488 /* This is an address. The size of the address will be
24eab124 10489 determined later, depending on destination register,
3e73aa7c 10490 suffix, or the default for the section. */
40fb9820
L
10491 i.types[this_operand].bitfield.imm8 = 1;
10492 i.types[this_operand].bitfield.imm16 = 1;
10493 i.types[this_operand].bitfield.imm32 = 1;
10494 i.types[this_operand].bitfield.imm32s = 1;
10495 i.types[this_operand].bitfield.imm64 = 1;
c6fb90c8
L
10496 i.types[this_operand] = operand_type_and (i.types[this_operand],
10497 types);
252b5132
RH
10498 }
10499
10500 return 1;
10501}
10502
551c1ca1 10503static char *
e3bb37b5 10504i386_scale (char *scale)
252b5132 10505{
551c1ca1
AM
10506 offsetT val;
10507 char *save = input_line_pointer;
252b5132 10508
551c1ca1
AM
10509 input_line_pointer = scale;
10510 val = get_absolute_expression ();
10511
10512 switch (val)
252b5132 10513 {
551c1ca1 10514 case 1:
252b5132
RH
10515 i.log2_scale_factor = 0;
10516 break;
551c1ca1 10517 case 2:
252b5132
RH
10518 i.log2_scale_factor = 1;
10519 break;
551c1ca1 10520 case 4:
252b5132
RH
10521 i.log2_scale_factor = 2;
10522 break;
551c1ca1 10523 case 8:
252b5132
RH
10524 i.log2_scale_factor = 3;
10525 break;
10526 default:
a724f0f4
JB
10527 {
10528 char sep = *input_line_pointer;
10529
10530 *input_line_pointer = '\0';
10531 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10532 scale);
10533 *input_line_pointer = sep;
10534 input_line_pointer = save;
10535 return NULL;
10536 }
252b5132 10537 }
29b0f896 10538 if (i.log2_scale_factor != 0 && i.index_reg == 0)
252b5132
RH
10539 {
10540 as_warn (_("scale factor of %d without an index register"),
24eab124 10541 1 << i.log2_scale_factor);
252b5132 10542 i.log2_scale_factor = 0;
252b5132 10543 }
551c1ca1
AM
10544 scale = input_line_pointer;
10545 input_line_pointer = save;
10546 return scale;
252b5132
RH
10547}
10548
252b5132 10549static int
e3bb37b5 10550i386_displacement (char *disp_start, char *disp_end)
252b5132 10551{
29b0f896 10552 expressionS *exp;
252b5132
RH
10553 segT exp_seg = 0;
10554 char *save_input_line_pointer;
f3c180ae 10555 char *gotfree_input_line;
40fb9820
L
10556 int override;
10557 i386_operand_type bigdisp, types = anydisp;
3992d3b7 10558 int ret;
252b5132 10559
31b2323c
L
10560 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10561 {
10562 as_bad (_("at most %d displacement operands are allowed"),
10563 MAX_MEMORY_OPERANDS);
10564 return 0;
10565 }
10566
0dfbf9d7 10567 operand_type_set (&bigdisp, 0);
6f2f06be 10568 if (i.jumpabsolute
48bcea9f 10569 || i.types[this_operand].bitfield.baseindex
0cfa3eb3
JB
10570 || (current_templates->start->opcode_modifier.jump != JUMP
10571 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
e05278af 10572 {
48bcea9f 10573 i386_addressing_mode ();
e05278af 10574 override = (i.prefix[ADDR_PREFIX] != 0);
40fb9820
L
10575 if (flag_code == CODE_64BIT)
10576 {
10577 if (!override)
10578 {
10579 bigdisp.bitfield.disp32s = 1;
10580 bigdisp.bitfield.disp64 = 1;
10581 }
48bcea9f
JB
10582 else
10583 bigdisp.bitfield.disp32 = 1;
40fb9820
L
10584 }
10585 else if ((flag_code == CODE_16BIT) ^ override)
40fb9820 10586 bigdisp.bitfield.disp16 = 1;
48bcea9f
JB
10587 else
10588 bigdisp.bitfield.disp32 = 1;
e05278af
JB
10589 }
10590 else
10591 {
376cd056
JB
10592 /* For PC-relative branches, the width of the displacement may be
10593 dependent upon data size, but is never dependent upon address size.
10594 Also make sure to not unintentionally match against a non-PC-relative
10595 branch template. */
10596 static templates aux_templates;
10597 const insn_template *t = current_templates->start;
10598 bfd_boolean has_intel64 = FALSE;
10599
10600 aux_templates.start = t;
10601 while (++t < current_templates->end)
10602 {
10603 if (t->opcode_modifier.jump
10604 != current_templates->start->opcode_modifier.jump)
10605 break;
4b5aaf5f 10606 if ((t->opcode_modifier.isa64 >= INTEL64))
376cd056
JB
10607 has_intel64 = TRUE;
10608 }
10609 if (t < current_templates->end)
10610 {
10611 aux_templates.end = t;
10612 current_templates = &aux_templates;
10613 }
10614
e05278af 10615 override = (i.prefix[DATA_PREFIX] != 0);
40fb9820
L
10616 if (flag_code == CODE_64BIT)
10617 {
376cd056
JB
10618 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10619 && (!intel64 || !has_intel64))
40fb9820
L
10620 bigdisp.bitfield.disp16 = 1;
10621 else
48bcea9f 10622 bigdisp.bitfield.disp32s = 1;
40fb9820
L
10623 }
10624 else
e05278af
JB
10625 {
10626 if (!override)
10627 override = (i.suffix == (flag_code != CODE_16BIT
10628 ? WORD_MNEM_SUFFIX
10629 : LONG_MNEM_SUFFIX));
40fb9820
L
10630 bigdisp.bitfield.disp32 = 1;
10631 if ((flag_code == CODE_16BIT) ^ override)
10632 {
10633 bigdisp.bitfield.disp32 = 0;
10634 bigdisp.bitfield.disp16 = 1;
10635 }
e05278af 10636 }
e05278af 10637 }
c6fb90c8
L
10638 i.types[this_operand] = operand_type_or (i.types[this_operand],
10639 bigdisp);
252b5132
RH
10640
10641 exp = &disp_expressions[i.disp_operands];
520dc8e8 10642 i.op[this_operand].disps = exp;
252b5132
RH
10643 i.disp_operands++;
10644 save_input_line_pointer = input_line_pointer;
10645 input_line_pointer = disp_start;
10646 END_STRING_AND_SAVE (disp_end);
10647
10648#ifndef GCC_ASM_O_HACK
10649#define GCC_ASM_O_HACK 0
10650#endif
10651#if GCC_ASM_O_HACK
10652 END_STRING_AND_SAVE (disp_end + 1);
40fb9820 10653 if (i.types[this_operand].bitfield.baseIndex
24eab124 10654 && displacement_string_end[-1] == '+')
252b5132
RH
10655 {
10656 /* This hack is to avoid a warning when using the "o"
24eab124
AM
10657 constraint within gcc asm statements.
10658 For instance:
10659
10660 #define _set_tssldt_desc(n,addr,limit,type) \
10661 __asm__ __volatile__ ( \
10662 "movw %w2,%0\n\t" \
10663 "movw %w1,2+%0\n\t" \
10664 "rorl $16,%1\n\t" \
10665 "movb %b1,4+%0\n\t" \
10666 "movb %4,5+%0\n\t" \
10667 "movb $0,6+%0\n\t" \
10668 "movb %h1,7+%0\n\t" \
10669 "rorl $16,%1" \
10670 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10671
10672 This works great except that the output assembler ends
10673 up looking a bit weird if it turns out that there is
10674 no offset. You end up producing code that looks like:
10675
10676 #APP
10677 movw $235,(%eax)
10678 movw %dx,2+(%eax)
10679 rorl $16,%edx
10680 movb %dl,4+(%eax)
10681 movb $137,5+(%eax)
10682 movb $0,6+(%eax)
10683 movb %dh,7+(%eax)
10684 rorl $16,%edx
10685 #NO_APP
10686
47926f60 10687 So here we provide the missing zero. */
24eab124
AM
10688
10689 *displacement_string_end = '0';
252b5132
RH
10690 }
10691#endif
d258b828 10692 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
f3c180ae
AM
10693 if (gotfree_input_line)
10694 input_line_pointer = gotfree_input_line;
252b5132 10695
24eab124 10696 exp_seg = expression (exp);
252b5132 10697
636c26b0
AM
10698 SKIP_WHITESPACE ();
10699 if (*input_line_pointer)
10700 as_bad (_("junk `%s' after expression"), input_line_pointer);
10701#if GCC_ASM_O_HACK
10702 RESTORE_END_STRING (disp_end + 1);
10703#endif
636c26b0 10704 input_line_pointer = save_input_line_pointer;
636c26b0 10705 if (gotfree_input_line)
ee86248c
JB
10706 {
10707 free (gotfree_input_line);
10708
10709 if (exp->X_op == O_constant || exp->X_op == O_register)
10710 exp->X_op = O_illegal;
10711 }
10712
10713 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10714
10715 RESTORE_END_STRING (disp_end);
10716
10717 return ret;
10718}
10719
10720static int
10721i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10722 i386_operand_type types, const char *disp_start)
10723{
10724 i386_operand_type bigdisp;
10725 int ret = 1;
636c26b0 10726
24eab124
AM
10727 /* We do this to make sure that the section symbol is in
10728 the symbol table. We will ultimately change the relocation
47926f60 10729 to be relative to the beginning of the section. */
1ae12ab7 10730 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
d6ab8113
JB
10731 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10732 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
24eab124 10733 {
636c26b0 10734 if (exp->X_op != O_symbol)
3992d3b7 10735 goto inv_disp;
636c26b0 10736
e5cb08ac 10737 if (S_IS_LOCAL (exp->X_add_symbol)
c64efb4b
L
10738 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10739 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
24eab124 10740 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
24eab124
AM
10741 exp->X_op = O_subtract;
10742 exp->X_op_symbol = GOT_symbol;
1ae12ab7 10743 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
29b0f896 10744 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
d6ab8113
JB
10745 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10746 i.reloc[this_operand] = BFD_RELOC_64;
23df1078 10747 else
29b0f896 10748 i.reloc[this_operand] = BFD_RELOC_32;
24eab124 10749 }
252b5132 10750
3992d3b7
AM
10751 else if (exp->X_op == O_absent
10752 || exp->X_op == O_illegal
ee86248c 10753 || exp->X_op == O_big)
2daf4fd8 10754 {
3992d3b7
AM
10755 inv_disp:
10756 as_bad (_("missing or invalid displacement expression `%s'"),
2daf4fd8 10757 disp_start);
3992d3b7 10758 ret = 0;
2daf4fd8
AM
10759 }
10760
0e1147d9
L
10761 else if (flag_code == CODE_64BIT
10762 && !i.prefix[ADDR_PREFIX]
10763 && exp->X_op == O_constant)
10764 {
10765 /* Since displacement is signed extended to 64bit, don't allow
10766 disp32 and turn off disp32s if they are out of range. */
10767 i.types[this_operand].bitfield.disp32 = 0;
10768 if (!fits_in_signed_long (exp->X_add_number))
10769 {
10770 i.types[this_operand].bitfield.disp32s = 0;
10771 if (i.types[this_operand].bitfield.baseindex)
10772 {
10773 as_bad (_("0x%lx out range of signed 32bit displacement"),
10774 (long) exp->X_add_number);
10775 ret = 0;
10776 }
10777 }
10778 }
10779
4c63da97 10780#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
3992d3b7
AM
10781 else if (exp->X_op != O_constant
10782 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10783 && exp_seg != absolute_section
10784 && exp_seg != text_section
10785 && exp_seg != data_section
10786 && exp_seg != bss_section
10787 && exp_seg != undefined_section
10788 && !bfd_is_com_section (exp_seg))
24eab124 10789 {
d0b47220 10790 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
3992d3b7 10791 ret = 0;
24eab124 10792 }
252b5132 10793#endif
3956db08 10794
48bcea9f
JB
10795 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10796 /* Constants get taken care of by optimize_disp(). */
10797 && exp->X_op != O_constant)
10798 i.types[this_operand].bitfield.disp8 = 1;
10799
40fb9820
L
10800 /* Check if this is a displacement only operand. */
10801 bigdisp = i.types[this_operand];
10802 bigdisp.bitfield.disp8 = 0;
10803 bigdisp.bitfield.disp16 = 0;
10804 bigdisp.bitfield.disp32 = 0;
10805 bigdisp.bitfield.disp32s = 0;
10806 bigdisp.bitfield.disp64 = 0;
0dfbf9d7 10807 if (operand_type_all_zero (&bigdisp))
c6fb90c8
L
10808 i.types[this_operand] = operand_type_and (i.types[this_operand],
10809 types);
3956db08 10810
3992d3b7 10811 return ret;
252b5132
RH
10812}
10813
2abc2bec
JB
10814/* Return the active addressing mode, taking address override and
10815 registers forming the address into consideration. Update the
10816 address override prefix if necessary. */
47926f60 10817
2abc2bec
JB
10818static enum flag_code
10819i386_addressing_mode (void)
252b5132 10820{
be05d201
L
10821 enum flag_code addr_mode;
10822
10823 if (i.prefix[ADDR_PREFIX])
10824 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
a23b33b3
JB
10825 else if (flag_code == CODE_16BIT
10826 && current_templates->start->cpu_flags.bitfield.cpumpx
10827 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10828 from md_assemble() by "is not a valid base/index expression"
10829 when there is a base and/or index. */
10830 && !i.types[this_operand].bitfield.baseindex)
10831 {
10832 /* MPX insn memory operands with neither base nor index must be forced
10833 to use 32-bit addressing in 16-bit mode. */
10834 addr_mode = CODE_32BIT;
10835 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10836 ++i.prefixes;
10837 gas_assert (!i.types[this_operand].bitfield.disp16);
10838 gas_assert (!i.types[this_operand].bitfield.disp32);
10839 }
be05d201
L
10840 else
10841 {
10842 addr_mode = flag_code;
10843
24eab124 10844#if INFER_ADDR_PREFIX
be05d201
L
10845 if (i.mem_operands == 0)
10846 {
10847 /* Infer address prefix from the first memory operand. */
10848 const reg_entry *addr_reg = i.base_reg;
10849
10850 if (addr_reg == NULL)
10851 addr_reg = i.index_reg;
eecb386c 10852
be05d201
L
10853 if (addr_reg)
10854 {
e968fc9b 10855 if (addr_reg->reg_type.bitfield.dword)
be05d201
L
10856 addr_mode = CODE_32BIT;
10857 else if (flag_code != CODE_64BIT
dc821c5f 10858 && addr_reg->reg_type.bitfield.word)
be05d201
L
10859 addr_mode = CODE_16BIT;
10860
10861 if (addr_mode != flag_code)
10862 {
10863 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10864 i.prefixes += 1;
10865 /* Change the size of any displacement too. At most one
10866 of Disp16 or Disp32 is set.
10867 FIXME. There doesn't seem to be any real need for
10868 separate Disp16 and Disp32 flags. The same goes for
10869 Imm16 and Imm32. Removing them would probably clean
10870 up the code quite a lot. */
10871 if (flag_code != CODE_64BIT
10872 && (i.types[this_operand].bitfield.disp16
10873 || i.types[this_operand].bitfield.disp32))
10874 i.types[this_operand]
10875 = operand_type_xor (i.types[this_operand], disp16_32);
10876 }
10877 }
10878 }
24eab124 10879#endif
be05d201
L
10880 }
10881
2abc2bec
JB
10882 return addr_mode;
10883}
10884
10885/* Make sure the memory operand we've been dealt is valid.
10886 Return 1 on success, 0 on a failure. */
10887
10888static int
10889i386_index_check (const char *operand_string)
10890{
10891 const char *kind = "base/index";
10892 enum flag_code addr_mode = i386_addressing_mode ();
10893
fc0763e6 10894 if (current_templates->start->opcode_modifier.isstring
c3949f43 10895 && !current_templates->start->cpu_flags.bitfield.cpupadlock
fc0763e6
JB
10896 && (current_templates->end[-1].opcode_modifier.isstring
10897 || i.mem_operands))
10898 {
10899 /* Memory operands of string insns are special in that they only allow
10900 a single register (rDI, rSI, or rBX) as their memory address. */
be05d201
L
10901 const reg_entry *expected_reg;
10902 static const char *di_si[][2] =
10903 {
10904 { "esi", "edi" },
10905 { "si", "di" },
10906 { "rsi", "rdi" }
10907 };
10908 static const char *bx[] = { "ebx", "bx", "rbx" };
fc0763e6
JB
10909
10910 kind = "string address";
10911
8325cc63 10912 if (current_templates->start->opcode_modifier.repprefixok)
fc0763e6 10913 {
51c8edf6
JB
10914 int es_op = current_templates->end[-1].opcode_modifier.isstring
10915 - IS_STRING_ES_OP0;
10916 int op = 0;
fc0763e6 10917
51c8edf6 10918 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
fc0763e6
JB
10919 || ((!i.mem_operands != !intel_syntax)
10920 && current_templates->end[-1].operand_types[1]
10921 .bitfield.baseindex))
51c8edf6
JB
10922 op = 1;
10923 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
fc0763e6
JB
10924 }
10925 else
be05d201 10926 expected_reg = hash_find (reg_hash, bx[addr_mode]);
fc0763e6 10927
be05d201
L
10928 if (i.base_reg != expected_reg
10929 || i.index_reg
fc0763e6 10930 || operand_type_check (i.types[this_operand], disp))
fc0763e6 10931 {
be05d201
L
10932 /* The second memory operand must have the same size as
10933 the first one. */
10934 if (i.mem_operands
10935 && i.base_reg
10936 && !((addr_mode == CODE_64BIT
dc821c5f 10937 && i.base_reg->reg_type.bitfield.qword)
be05d201 10938 || (addr_mode == CODE_32BIT
dc821c5f
JB
10939 ? i.base_reg->reg_type.bitfield.dword
10940 : i.base_reg->reg_type.bitfield.word)))
be05d201
L
10941 goto bad_address;
10942
fc0763e6
JB
10943 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10944 operand_string,
10945 intel_syntax ? '[' : '(',
10946 register_prefix,
be05d201 10947 expected_reg->reg_name,
fc0763e6 10948 intel_syntax ? ']' : ')');
be05d201 10949 return 1;
fc0763e6 10950 }
be05d201
L
10951 else
10952 return 1;
10953
dc1e8a47 10954 bad_address:
be05d201
L
10955 as_bad (_("`%s' is not a valid %s expression"),
10956 operand_string, kind);
10957 return 0;
3e73aa7c
JH
10958 }
10959 else
10960 {
be05d201
L
10961 if (addr_mode != CODE_16BIT)
10962 {
10963 /* 32-bit/64-bit checks. */
10964 if ((i.base_reg
e968fc9b
JB
10965 && ((addr_mode == CODE_64BIT
10966 ? !i.base_reg->reg_type.bitfield.qword
10967 : !i.base_reg->reg_type.bitfield.dword)
10968 || (i.index_reg && i.base_reg->reg_num == RegIP)
10969 || i.base_reg->reg_num == RegIZ))
be05d201 10970 || (i.index_reg
1b54b8d7
JB
10971 && !i.index_reg->reg_type.bitfield.xmmword
10972 && !i.index_reg->reg_type.bitfield.ymmword
10973 && !i.index_reg->reg_type.bitfield.zmmword
be05d201 10974 && ((addr_mode == CODE_64BIT
e968fc9b
JB
10975 ? !i.index_reg->reg_type.bitfield.qword
10976 : !i.index_reg->reg_type.bitfield.dword)
be05d201
L
10977 || !i.index_reg->reg_type.bitfield.baseindex)))
10978 goto bad_address;
8178be5b 10979
260cd341 10980 /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
8178be5b 10981 if (current_templates->start->base_opcode == 0xf30f1b
260cd341
LC
10982 || (current_templates->start->base_opcode & ~1) == 0x0f1a
10983 || current_templates->start->opcode_modifier.sib == SIBMEM)
8178be5b
JB
10984 {
10985 /* They cannot use RIP-relative addressing. */
e968fc9b 10986 if (i.base_reg && i.base_reg->reg_num == RegIP)
8178be5b
JB
10987 {
10988 as_bad (_("`%s' cannot be used here"), operand_string);
10989 return 0;
10990 }
10991
10992 /* bndldx and bndstx ignore their scale factor. */
260cd341 10993 if ((current_templates->start->base_opcode & ~1) == 0x0f1a
8178be5b
JB
10994 && i.log2_scale_factor)
10995 as_warn (_("register scaling is being ignored here"));
10996 }
be05d201
L
10997 }
10998 else
3e73aa7c 10999 {
be05d201 11000 /* 16-bit checks. */
3e73aa7c 11001 if ((i.base_reg
dc821c5f 11002 && (!i.base_reg->reg_type.bitfield.word
40fb9820 11003 || !i.base_reg->reg_type.bitfield.baseindex))
3e73aa7c 11004 || (i.index_reg
dc821c5f 11005 && (!i.index_reg->reg_type.bitfield.word
40fb9820 11006 || !i.index_reg->reg_type.bitfield.baseindex
29b0f896
AM
11007 || !(i.base_reg
11008 && i.base_reg->reg_num < 6
11009 && i.index_reg->reg_num >= 6
11010 && i.log2_scale_factor == 0))))
be05d201 11011 goto bad_address;
3e73aa7c
JH
11012 }
11013 }
be05d201 11014 return 1;
24eab124 11015}
252b5132 11016
43234a1e
L
11017/* Handle vector immediates. */
11018
11019static int
11020RC_SAE_immediate (const char *imm_start)
11021{
11022 unsigned int match_found, j;
11023 const char *pstr = imm_start;
11024 expressionS *exp;
11025
11026 if (*pstr != '{')
11027 return 0;
11028
11029 pstr++;
11030 match_found = 0;
11031 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11032 {
11033 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11034 {
11035 if (!i.rounding)
11036 {
11037 rc_op.type = RC_NamesTable[j].type;
11038 rc_op.operand = this_operand;
11039 i.rounding = &rc_op;
11040 }
11041 else
11042 {
11043 as_bad (_("duplicated `%s'"), imm_start);
11044 return 0;
11045 }
11046 pstr += RC_NamesTable[j].len;
11047 match_found = 1;
11048 break;
11049 }
11050 }
11051 if (!match_found)
11052 return 0;
11053
11054 if (*pstr++ != '}')
11055 {
11056 as_bad (_("Missing '}': '%s'"), imm_start);
11057 return 0;
11058 }
11059 /* RC/SAE immediate string should contain nothing more. */;
11060 if (*pstr != 0)
11061 {
11062 as_bad (_("Junk after '}': '%s'"), imm_start);
11063 return 0;
11064 }
11065
11066 exp = &im_expressions[i.imm_operands++];
11067 i.op[this_operand].imms = exp;
11068
11069 exp->X_op = O_constant;
11070 exp->X_add_number = 0;
11071 exp->X_add_symbol = (symbolS *) 0;
11072 exp->X_op_symbol = (symbolS *) 0;
11073
11074 i.types[this_operand].bitfield.imm8 = 1;
11075 return 1;
11076}
11077
8325cc63
JB
11078/* Only string instructions can have a second memory operand, so
11079 reduce current_templates to just those if it contains any. */
11080static int
11081maybe_adjust_templates (void)
11082{
11083 const insn_template *t;
11084
11085 gas_assert (i.mem_operands == 1);
11086
11087 for (t = current_templates->start; t < current_templates->end; ++t)
11088 if (t->opcode_modifier.isstring)
11089 break;
11090
11091 if (t < current_templates->end)
11092 {
11093 static templates aux_templates;
11094 bfd_boolean recheck;
11095
11096 aux_templates.start = t;
11097 for (; t < current_templates->end; ++t)
11098 if (!t->opcode_modifier.isstring)
11099 break;
11100 aux_templates.end = t;
11101
11102 /* Determine whether to re-check the first memory operand. */
11103 recheck = (aux_templates.start != current_templates->start
11104 || t != current_templates->end);
11105
11106 current_templates = &aux_templates;
11107
11108 if (recheck)
11109 {
11110 i.mem_operands = 0;
11111 if (i.memop1_string != NULL
11112 && i386_index_check (i.memop1_string) == 0)
11113 return 0;
11114 i.mem_operands = 1;
11115 }
11116 }
11117
11118 return 1;
11119}
11120
fc0763e6 11121/* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
47926f60 11122 on error. */
252b5132 11123
252b5132 11124static int
a7619375 11125i386_att_operand (char *operand_string)
252b5132 11126{
af6bdddf
AM
11127 const reg_entry *r;
11128 char *end_op;
24eab124 11129 char *op_string = operand_string;
252b5132 11130
24eab124 11131 if (is_space_char (*op_string))
252b5132
RH
11132 ++op_string;
11133
24eab124 11134 /* We check for an absolute prefix (differentiating,
47926f60 11135 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
24eab124
AM
11136 if (*op_string == ABSOLUTE_PREFIX)
11137 {
11138 ++op_string;
11139 if (is_space_char (*op_string))
11140 ++op_string;
6f2f06be 11141 i.jumpabsolute = TRUE;
24eab124 11142 }
252b5132 11143
47926f60 11144 /* Check if operand is a register. */
4d1bb795 11145 if ((r = parse_register (op_string, &end_op)) != NULL)
24eab124 11146 {
40fb9820
L
11147 i386_operand_type temp;
11148
8a6fb3f9
JB
11149 if (r == &bad_reg)
11150 return 0;
11151
24eab124
AM
11152 /* Check for a segment override by searching for ':' after a
11153 segment register. */
11154 op_string = end_op;
11155 if (is_space_char (*op_string))
11156 ++op_string;
00cee14f 11157 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
24eab124
AM
11158 {
11159 switch (r->reg_num)
11160 {
11161 case 0:
11162 i.seg[i.mem_operands] = &es;
11163 break;
11164 case 1:
11165 i.seg[i.mem_operands] = &cs;
11166 break;
11167 case 2:
11168 i.seg[i.mem_operands] = &ss;
11169 break;
11170 case 3:
11171 i.seg[i.mem_operands] = &ds;
11172 break;
11173 case 4:
11174 i.seg[i.mem_operands] = &fs;
11175 break;
11176 case 5:
11177 i.seg[i.mem_operands] = &gs;
11178 break;
11179 }
252b5132 11180
24eab124 11181 /* Skip the ':' and whitespace. */
252b5132
RH
11182 ++op_string;
11183 if (is_space_char (*op_string))
24eab124 11184 ++op_string;
252b5132 11185
24eab124
AM
11186 if (!is_digit_char (*op_string)
11187 && !is_identifier_char (*op_string)
11188 && *op_string != '('
11189 && *op_string != ABSOLUTE_PREFIX)
11190 {
11191 as_bad (_("bad memory operand `%s'"), op_string);
11192 return 0;
11193 }
47926f60 11194 /* Handle case of %es:*foo. */
24eab124
AM
11195 if (*op_string == ABSOLUTE_PREFIX)
11196 {
11197 ++op_string;
11198 if (is_space_char (*op_string))
11199 ++op_string;
6f2f06be 11200 i.jumpabsolute = TRUE;
24eab124
AM
11201 }
11202 goto do_memory_reference;
11203 }
43234a1e
L
11204
11205 /* Handle vector operations. */
11206 if (*op_string == '{')
11207 {
11208 op_string = check_VecOperations (op_string, NULL);
11209 if (op_string == NULL)
11210 return 0;
11211 }
11212
24eab124
AM
11213 if (*op_string)
11214 {
d0b47220 11215 as_bad (_("junk `%s' after register"), op_string);
24eab124
AM
11216 return 0;
11217 }
40fb9820
L
11218 temp = r->reg_type;
11219 temp.bitfield.baseindex = 0;
c6fb90c8
L
11220 i.types[this_operand] = operand_type_or (i.types[this_operand],
11221 temp);
7d5e4556 11222 i.types[this_operand].bitfield.unspecified = 0;
520dc8e8 11223 i.op[this_operand].regs = r;
24eab124
AM
11224 i.reg_operands++;
11225 }
af6bdddf
AM
11226 else if (*op_string == REGISTER_PREFIX)
11227 {
11228 as_bad (_("bad register name `%s'"), op_string);
11229 return 0;
11230 }
24eab124 11231 else if (*op_string == IMMEDIATE_PREFIX)
ce8a8b2f 11232 {
24eab124 11233 ++op_string;
6f2f06be 11234 if (i.jumpabsolute)
24eab124 11235 {
d0b47220 11236 as_bad (_("immediate operand illegal with absolute jump"));
24eab124
AM
11237 return 0;
11238 }
11239 if (!i386_immediate (op_string))
11240 return 0;
11241 }
43234a1e
L
11242 else if (RC_SAE_immediate (operand_string))
11243 {
11244 /* If it is a RC or SAE immediate, do nothing. */
11245 ;
11246 }
24eab124
AM
11247 else if (is_digit_char (*op_string)
11248 || is_identifier_char (*op_string)
d02603dc 11249 || *op_string == '"'
e5cb08ac 11250 || *op_string == '(')
24eab124 11251 {
47926f60 11252 /* This is a memory reference of some sort. */
af6bdddf 11253 char *base_string;
252b5132 11254
47926f60 11255 /* Start and end of displacement string expression (if found). */
eecb386c
AM
11256 char *displacement_string_start;
11257 char *displacement_string_end;
43234a1e 11258 char *vop_start;
252b5132 11259
24eab124 11260 do_memory_reference:
8325cc63
JB
11261 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11262 return 0;
24eab124 11263 if ((i.mem_operands == 1
40fb9820 11264 && !current_templates->start->opcode_modifier.isstring)
24eab124
AM
11265 || i.mem_operands == 2)
11266 {
11267 as_bad (_("too many memory references for `%s'"),
11268 current_templates->start->name);
11269 return 0;
11270 }
252b5132 11271
24eab124
AM
11272 /* Check for base index form. We detect the base index form by
11273 looking for an ')' at the end of the operand, searching
11274 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11275 after the '('. */
af6bdddf 11276 base_string = op_string + strlen (op_string);
c3332e24 11277
43234a1e
L
11278 /* Handle vector operations. */
11279 vop_start = strchr (op_string, '{');
11280 if (vop_start && vop_start < base_string)
11281 {
11282 if (check_VecOperations (vop_start, base_string) == NULL)
11283 return 0;
11284 base_string = vop_start;
11285 }
11286
af6bdddf
AM
11287 --base_string;
11288 if (is_space_char (*base_string))
11289 --base_string;
252b5132 11290
47926f60 11291 /* If we only have a displacement, set-up for it to be parsed later. */
af6bdddf
AM
11292 displacement_string_start = op_string;
11293 displacement_string_end = base_string + 1;
252b5132 11294
24eab124
AM
11295 if (*base_string == ')')
11296 {
af6bdddf 11297 char *temp_string;
24eab124
AM
11298 unsigned int parens_balanced = 1;
11299 /* We've already checked that the number of left & right ()'s are
47926f60 11300 equal, so this loop will not be infinite. */
24eab124
AM
11301 do
11302 {
11303 base_string--;
11304 if (*base_string == ')')
11305 parens_balanced++;
11306 if (*base_string == '(')
11307 parens_balanced--;
11308 }
11309 while (parens_balanced);
c3332e24 11310
af6bdddf 11311 temp_string = base_string;
c3332e24 11312
24eab124 11313 /* Skip past '(' and whitespace. */
252b5132
RH
11314 ++base_string;
11315 if (is_space_char (*base_string))
24eab124 11316 ++base_string;
252b5132 11317
af6bdddf 11318 if (*base_string == ','
4eed87de
AM
11319 || ((i.base_reg = parse_register (base_string, &end_op))
11320 != NULL))
252b5132 11321 {
af6bdddf 11322 displacement_string_end = temp_string;
252b5132 11323
40fb9820 11324 i.types[this_operand].bitfield.baseindex = 1;
252b5132 11325
af6bdddf 11326 if (i.base_reg)
24eab124 11327 {
8a6fb3f9
JB
11328 if (i.base_reg == &bad_reg)
11329 return 0;
24eab124
AM
11330 base_string = end_op;
11331 if (is_space_char (*base_string))
11332 ++base_string;
af6bdddf
AM
11333 }
11334
11335 /* There may be an index reg or scale factor here. */
11336 if (*base_string == ',')
11337 {
11338 ++base_string;
11339 if (is_space_char (*base_string))
11340 ++base_string;
11341
4eed87de
AM
11342 if ((i.index_reg = parse_register (base_string, &end_op))
11343 != NULL)
24eab124 11344 {
8a6fb3f9
JB
11345 if (i.index_reg == &bad_reg)
11346 return 0;
af6bdddf 11347 base_string = end_op;
24eab124
AM
11348 if (is_space_char (*base_string))
11349 ++base_string;
af6bdddf
AM
11350 if (*base_string == ',')
11351 {
11352 ++base_string;
11353 if (is_space_char (*base_string))
11354 ++base_string;
11355 }
e5cb08ac 11356 else if (*base_string != ')')
af6bdddf 11357 {
4eed87de
AM
11358 as_bad (_("expecting `,' or `)' "
11359 "after index register in `%s'"),
af6bdddf
AM
11360 operand_string);
11361 return 0;
11362 }
24eab124 11363 }
af6bdddf 11364 else if (*base_string == REGISTER_PREFIX)
24eab124 11365 {
f76bf5e0
L
11366 end_op = strchr (base_string, ',');
11367 if (end_op)
11368 *end_op = '\0';
af6bdddf 11369 as_bad (_("bad register name `%s'"), base_string);
24eab124
AM
11370 return 0;
11371 }
252b5132 11372
47926f60 11373 /* Check for scale factor. */
551c1ca1 11374 if (*base_string != ')')
af6bdddf 11375 {
551c1ca1
AM
11376 char *end_scale = i386_scale (base_string);
11377
11378 if (!end_scale)
af6bdddf 11379 return 0;
24eab124 11380
551c1ca1 11381 base_string = end_scale;
af6bdddf
AM
11382 if (is_space_char (*base_string))
11383 ++base_string;
11384 if (*base_string != ')')
11385 {
4eed87de
AM
11386 as_bad (_("expecting `)' "
11387 "after scale factor in `%s'"),
af6bdddf
AM
11388 operand_string);
11389 return 0;
11390 }
11391 }
11392 else if (!i.index_reg)
24eab124 11393 {
4eed87de
AM
11394 as_bad (_("expecting index register or scale factor "
11395 "after `,'; got '%c'"),
af6bdddf 11396 *base_string);
24eab124
AM
11397 return 0;
11398 }
11399 }
af6bdddf 11400 else if (*base_string != ')')
24eab124 11401 {
4eed87de
AM
11402 as_bad (_("expecting `,' or `)' "
11403 "after base register in `%s'"),
af6bdddf 11404 operand_string);
24eab124
AM
11405 return 0;
11406 }
c3332e24 11407 }
af6bdddf 11408 else if (*base_string == REGISTER_PREFIX)
c3332e24 11409 {
f76bf5e0
L
11410 end_op = strchr (base_string, ',');
11411 if (end_op)
11412 *end_op = '\0';
af6bdddf 11413 as_bad (_("bad register name `%s'"), base_string);
24eab124 11414 return 0;
c3332e24 11415 }
24eab124
AM
11416 }
11417
11418 /* If there's an expression beginning the operand, parse it,
11419 assuming displacement_string_start and
11420 displacement_string_end are meaningful. */
11421 if (displacement_string_start != displacement_string_end)
11422 {
11423 if (!i386_displacement (displacement_string_start,
11424 displacement_string_end))
11425 return 0;
11426 }
11427
11428 /* Special case for (%dx) while doing input/output op. */
11429 if (i.base_reg
75e5731b
JB
11430 && i.base_reg->reg_type.bitfield.instance == RegD
11431 && i.base_reg->reg_type.bitfield.word
24eab124
AM
11432 && i.index_reg == 0
11433 && i.log2_scale_factor == 0
11434 && i.seg[i.mem_operands] == 0
40fb9820 11435 && !operand_type_check (i.types[this_operand], disp))
24eab124 11436 {
2fb5be8d 11437 i.types[this_operand] = i.base_reg->reg_type;
24eab124
AM
11438 return 1;
11439 }
11440
eecb386c
AM
11441 if (i386_index_check (operand_string) == 0)
11442 return 0;
c48dadc9 11443 i.flags[this_operand] |= Operand_Mem;
8325cc63
JB
11444 if (i.mem_operands == 0)
11445 i.memop1_string = xstrdup (operand_string);
24eab124
AM
11446 i.mem_operands++;
11447 }
11448 else
ce8a8b2f
AM
11449 {
11450 /* It's not a memory operand; argh! */
24eab124
AM
11451 as_bad (_("invalid char %s beginning operand %d `%s'"),
11452 output_invalid (*op_string),
11453 this_operand + 1,
11454 op_string);
11455 return 0;
11456 }
47926f60 11457 return 1; /* Normal return. */
252b5132
RH
11458}
11459\f
fa94de6b
RM
11460/* Calculate the maximum variable size (i.e., excluding fr_fix)
11461 that an rs_machine_dependent frag may reach. */
11462
11463unsigned int
11464i386_frag_max_var (fragS *frag)
11465{
11466 /* The only relaxable frags are for jumps.
11467 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11468 gas_assert (frag->fr_type == rs_machine_dependent);
11469 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11470}
11471
b084df0b
L
11472#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11473static int
8dcea932 11474elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
b084df0b
L
11475{
11476 /* STT_GNU_IFUNC symbol must go through PLT. */
11477 if ((symbol_get_bfdsym (fr_symbol)->flags
11478 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11479 return 0;
11480
11481 if (!S_IS_EXTERNAL (fr_symbol))
11482 /* Symbol may be weak or local. */
11483 return !S_IS_WEAK (fr_symbol);
11484
8dcea932
L
11485 /* Global symbols with non-default visibility can't be preempted. */
11486 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11487 return 1;
11488
11489 if (fr_var != NO_RELOC)
11490 switch ((enum bfd_reloc_code_real) fr_var)
11491 {
11492 case BFD_RELOC_386_PLT32:
11493 case BFD_RELOC_X86_64_PLT32:
33eaf5de 11494 /* Symbol with PLT relocation may be preempted. */
8dcea932
L
11495 return 0;
11496 default:
11497 abort ();
11498 }
11499
b084df0b
L
11500 /* Global symbols with default visibility in a shared library may be
11501 preempted by another definition. */
8dcea932 11502 return !shared;
b084df0b
L
11503}
11504#endif
11505
79d72f45
HL
11506/* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11507 Note also work for Skylake and Cascadelake.
11508---------------------------------------------------------------------
11509| JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11510| ------ | ----------- | ------- | -------- |
11511| Jo | N | N | Y |
11512| Jno | N | N | Y |
11513| Jc/Jb | Y | N | Y |
11514| Jae/Jnb | Y | N | Y |
11515| Je/Jz | Y | Y | Y |
11516| Jne/Jnz | Y | Y | Y |
11517| Jna/Jbe | Y | N | Y |
11518| Ja/Jnbe | Y | N | Y |
11519| Js | N | N | Y |
11520| Jns | N | N | Y |
11521| Jp/Jpe | N | N | Y |
11522| Jnp/Jpo | N | N | Y |
11523| Jl/Jnge | Y | Y | Y |
11524| Jge/Jnl | Y | Y | Y |
11525| Jle/Jng | Y | Y | Y |
11526| Jg/Jnle | Y | Y | Y |
11527--------------------------------------------------------------------- */
11528static int
11529i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11530{
11531 if (mf_cmp == mf_cmp_alu_cmp)
11532 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11533 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11534 if (mf_cmp == mf_cmp_incdec)
11535 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11536 || mf_jcc == mf_jcc_jle);
11537 if (mf_cmp == mf_cmp_test_and)
11538 return 1;
11539 return 0;
11540}
11541
e379e5f3
L
11542/* Return the next non-empty frag. */
11543
11544static fragS *
11545i386_next_non_empty_frag (fragS *fragP)
11546{
11547 /* There may be a frag with a ".fill 0" when there is no room in
11548 the current frag for frag_grow in output_insn. */
11549 for (fragP = fragP->fr_next;
11550 (fragP != NULL
11551 && fragP->fr_type == rs_fill
11552 && fragP->fr_fix == 0);
11553 fragP = fragP->fr_next)
11554 ;
11555 return fragP;
11556}
11557
11558/* Return the next jcc frag after BRANCH_PADDING. */
11559
11560static fragS *
79d72f45 11561i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
e379e5f3 11562{
79d72f45
HL
11563 fragS *branch_fragP;
11564 if (!pad_fragP)
e379e5f3
L
11565 return NULL;
11566
79d72f45
HL
11567 if (pad_fragP->fr_type == rs_machine_dependent
11568 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
e379e5f3
L
11569 == BRANCH_PADDING))
11570 {
79d72f45
HL
11571 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11572 if (branch_fragP->fr_type != rs_machine_dependent)
e379e5f3 11573 return NULL;
79d72f45
HL
11574 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11575 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11576 pad_fragP->tc_frag_data.mf_type))
11577 return branch_fragP;
e379e5f3
L
11578 }
11579
11580 return NULL;
11581}
11582
11583/* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11584
11585static void
11586i386_classify_machine_dependent_frag (fragS *fragP)
11587{
11588 fragS *cmp_fragP;
11589 fragS *pad_fragP;
11590 fragS *branch_fragP;
11591 fragS *next_fragP;
11592 unsigned int max_prefix_length;
11593
11594 if (fragP->tc_frag_data.classified)
11595 return;
11596
11597 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11598 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11599 for (next_fragP = fragP;
11600 next_fragP != NULL;
11601 next_fragP = next_fragP->fr_next)
11602 {
11603 next_fragP->tc_frag_data.classified = 1;
11604 if (next_fragP->fr_type == rs_machine_dependent)
11605 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11606 {
11607 case BRANCH_PADDING:
11608 /* The BRANCH_PADDING frag must be followed by a branch
11609 frag. */
11610 branch_fragP = i386_next_non_empty_frag (next_fragP);
11611 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11612 break;
11613 case FUSED_JCC_PADDING:
11614 /* Check if this is a fused jcc:
11615 FUSED_JCC_PADDING
11616 CMP like instruction
11617 BRANCH_PADDING
11618 COND_JUMP
11619 */
11620 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11621 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
79d72f45 11622 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
e379e5f3
L
11623 if (branch_fragP)
11624 {
11625 /* The BRANCH_PADDING frag is merged with the
11626 FUSED_JCC_PADDING frag. */
11627 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11628 /* CMP like instruction size. */
11629 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11630 frag_wane (pad_fragP);
11631 /* Skip to branch_fragP. */
11632 next_fragP = branch_fragP;
11633 }
11634 else if (next_fragP->tc_frag_data.max_prefix_length)
11635 {
11636 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11637 a fused jcc. */
11638 next_fragP->fr_subtype
11639 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11640 next_fragP->tc_frag_data.max_bytes
11641 = next_fragP->tc_frag_data.max_prefix_length;
11642 /* This will be updated in the BRANCH_PREFIX scan. */
11643 next_fragP->tc_frag_data.max_prefix_length = 0;
11644 }
11645 else
11646 frag_wane (next_fragP);
11647 break;
11648 }
11649 }
11650
11651 /* Stop if there is no BRANCH_PREFIX. */
11652 if (!align_branch_prefix_size)
11653 return;
11654
11655 /* Scan for BRANCH_PREFIX. */
11656 for (; fragP != NULL; fragP = fragP->fr_next)
11657 {
11658 if (fragP->fr_type != rs_machine_dependent
11659 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11660 != BRANCH_PREFIX))
11661 continue;
11662
11663 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11664 COND_JUMP_PREFIX. */
11665 max_prefix_length = 0;
11666 for (next_fragP = fragP;
11667 next_fragP != NULL;
11668 next_fragP = next_fragP->fr_next)
11669 {
11670 if (next_fragP->fr_type == rs_fill)
11671 /* Skip rs_fill frags. */
11672 continue;
11673 else if (next_fragP->fr_type != rs_machine_dependent)
11674 /* Stop for all other frags. */
11675 break;
11676
11677 /* rs_machine_dependent frags. */
11678 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11679 == BRANCH_PREFIX)
11680 {
11681 /* Count BRANCH_PREFIX frags. */
11682 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11683 {
11684 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11685 frag_wane (next_fragP);
11686 }
11687 else
11688 max_prefix_length
11689 += next_fragP->tc_frag_data.max_bytes;
11690 }
11691 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11692 == BRANCH_PADDING)
11693 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11694 == FUSED_JCC_PADDING))
11695 {
11696 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11697 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11698 break;
11699 }
11700 else
11701 /* Stop for other rs_machine_dependent frags. */
11702 break;
11703 }
11704
11705 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11706
11707 /* Skip to the next frag. */
11708 fragP = next_fragP;
11709 }
11710}
11711
11712/* Compute padding size for
11713
11714 FUSED_JCC_PADDING
11715 CMP like instruction
11716 BRANCH_PADDING
11717 COND_JUMP/UNCOND_JUMP
11718
11719 or
11720
11721 BRANCH_PADDING
11722 COND_JUMP/UNCOND_JUMP
11723 */
11724
11725static int
11726i386_branch_padding_size (fragS *fragP, offsetT address)
11727{
11728 unsigned int offset, size, padding_size;
11729 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11730
11731 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11732 if (!address)
11733 address = fragP->fr_address;
11734 address += fragP->fr_fix;
11735
11736 /* CMP like instrunction size. */
11737 size = fragP->tc_frag_data.cmp_size;
11738
11739 /* The base size of the branch frag. */
11740 size += branch_fragP->fr_fix;
11741
11742 /* Add opcode and displacement bytes for the rs_machine_dependent
11743 branch frag. */
11744 if (branch_fragP->fr_type == rs_machine_dependent)
11745 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11746
11747 /* Check if branch is within boundary and doesn't end at the last
11748 byte. */
11749 offset = address & ((1U << align_branch_power) - 1);
11750 if ((offset + size) >= (1U << align_branch_power))
11751 /* Padding needed to avoid crossing boundary. */
11752 padding_size = (1U << align_branch_power) - offset;
11753 else
11754 /* No padding needed. */
11755 padding_size = 0;
11756
11757 /* The return value may be saved in tc_frag_data.length which is
11758 unsigned byte. */
11759 if (!fits_in_unsigned_byte (padding_size))
11760 abort ();
11761
11762 return padding_size;
11763}
11764
11765/* i386_generic_table_relax_frag()
11766
11767 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11768 grow/shrink padding to align branch frags. Hand others to
11769 relax_frag(). */
11770
11771long
11772i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11773{
11774 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11775 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11776 {
11777 long padding_size = i386_branch_padding_size (fragP, 0);
11778 long grow = padding_size - fragP->tc_frag_data.length;
11779
11780 /* When the BRANCH_PREFIX frag is used, the computed address
11781 must match the actual address and there should be no padding. */
11782 if (fragP->tc_frag_data.padding_address
11783 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11784 || padding_size))
11785 abort ();
11786
11787 /* Update the padding size. */
11788 if (grow)
11789 fragP->tc_frag_data.length = padding_size;
11790
11791 return grow;
11792 }
11793 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11794 {
11795 fragS *padding_fragP, *next_fragP;
11796 long padding_size, left_size, last_size;
11797
11798 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11799 if (!padding_fragP)
11800 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11801 return (fragP->tc_frag_data.length
11802 - fragP->tc_frag_data.last_length);
11803
11804 /* Compute the relative address of the padding frag in the very
11805 first time where the BRANCH_PREFIX frag sizes are zero. */
11806 if (!fragP->tc_frag_data.padding_address)
11807 fragP->tc_frag_data.padding_address
11808 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11809
11810 /* First update the last length from the previous interation. */
11811 left_size = fragP->tc_frag_data.prefix_length;
11812 for (next_fragP = fragP;
11813 next_fragP != padding_fragP;
11814 next_fragP = next_fragP->fr_next)
11815 if (next_fragP->fr_type == rs_machine_dependent
11816 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11817 == BRANCH_PREFIX))
11818 {
11819 if (left_size)
11820 {
11821 int max = next_fragP->tc_frag_data.max_bytes;
11822 if (max)
11823 {
11824 int size;
11825 if (max > left_size)
11826 size = left_size;
11827 else
11828 size = max;
11829 left_size -= size;
11830 next_fragP->tc_frag_data.last_length = size;
11831 }
11832 }
11833 else
11834 next_fragP->tc_frag_data.last_length = 0;
11835 }
11836
11837 /* Check the padding size for the padding frag. */
11838 padding_size = i386_branch_padding_size
11839 (padding_fragP, (fragP->fr_address
11840 + fragP->tc_frag_data.padding_address));
11841
11842 last_size = fragP->tc_frag_data.prefix_length;
11843 /* Check if there is change from the last interation. */
11844 if (padding_size == last_size)
11845 {
11846 /* Update the expected address of the padding frag. */
11847 padding_fragP->tc_frag_data.padding_address
11848 = (fragP->fr_address + padding_size
11849 + fragP->tc_frag_data.padding_address);
11850 return 0;
11851 }
11852
11853 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11854 {
11855 /* No padding if there is no sufficient room. Clear the
11856 expected address of the padding frag. */
11857 padding_fragP->tc_frag_data.padding_address = 0;
11858 padding_size = 0;
11859 }
11860 else
11861 /* Store the expected address of the padding frag. */
11862 padding_fragP->tc_frag_data.padding_address
11863 = (fragP->fr_address + padding_size
11864 + fragP->tc_frag_data.padding_address);
11865
11866 fragP->tc_frag_data.prefix_length = padding_size;
11867
11868 /* Update the length for the current interation. */
11869 left_size = padding_size;
11870 for (next_fragP = fragP;
11871 next_fragP != padding_fragP;
11872 next_fragP = next_fragP->fr_next)
11873 if (next_fragP->fr_type == rs_machine_dependent
11874 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11875 == BRANCH_PREFIX))
11876 {
11877 if (left_size)
11878 {
11879 int max = next_fragP->tc_frag_data.max_bytes;
11880 if (max)
11881 {
11882 int size;
11883 if (max > left_size)
11884 size = left_size;
11885 else
11886 size = max;
11887 left_size -= size;
11888 next_fragP->tc_frag_data.length = size;
11889 }
11890 }
11891 else
11892 next_fragP->tc_frag_data.length = 0;
11893 }
11894
11895 return (fragP->tc_frag_data.length
11896 - fragP->tc_frag_data.last_length);
11897 }
11898 return relax_frag (segment, fragP, stretch);
11899}
11900
ee7fcc42
AM
11901/* md_estimate_size_before_relax()
11902
11903 Called just before relax() for rs_machine_dependent frags. The x86
11904 assembler uses these frags to handle variable size jump
11905 instructions.
11906
11907 Any symbol that is now undefined will not become defined.
11908 Return the correct fr_subtype in the frag.
11909 Return the initial "guess for variable size of frag" to caller.
11910 The guess is actually the growth beyond the fixed part. Whatever
11911 we do to grow the fixed or variable part contributes to our
11912 returned value. */
11913
252b5132 11914int
7016a5d5 11915md_estimate_size_before_relax (fragS *fragP, segT segment)
252b5132 11916{
e379e5f3
L
11917 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11918 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11919 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11920 {
11921 i386_classify_machine_dependent_frag (fragP);
11922 return fragP->tc_frag_data.length;
11923 }
11924
252b5132 11925 /* We've already got fragP->fr_subtype right; all we have to do is
b98ef147
AM
11926 check for un-relaxable symbols. On an ELF system, we can't relax
11927 an externally visible symbol, because it may be overridden by a
11928 shared library. */
11929 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
6d249963 11930#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 11931 || (IS_ELF
8dcea932
L
11932 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11933 fragP->fr_var))
fbeb56a4
DK
11934#endif
11935#if defined (OBJ_COFF) && defined (TE_PE)
7ab9ffdd 11936 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
fbeb56a4 11937 && S_IS_WEAK (fragP->fr_symbol))
b98ef147
AM
11938#endif
11939 )
252b5132 11940 {
b98ef147
AM
11941 /* Symbol is undefined in this segment, or we need to keep a
11942 reloc so that weak symbols can be overridden. */
11943 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
f86103b7 11944 enum bfd_reloc_code_real reloc_type;
ee7fcc42
AM
11945 unsigned char *opcode;
11946 int old_fr_fix;
f6af82bd 11947
ee7fcc42 11948 if (fragP->fr_var != NO_RELOC)
1e9cc1c2 11949 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
b98ef147 11950 else if (size == 2)
f6af82bd 11951 reloc_type = BFD_RELOC_16_PCREL;
bd7ab16b
L
11952#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11953 else if (need_plt32_p (fragP->fr_symbol))
11954 reloc_type = BFD_RELOC_X86_64_PLT32;
11955#endif
f6af82bd
AM
11956 else
11957 reloc_type = BFD_RELOC_32_PCREL;
252b5132 11958
ee7fcc42
AM
11959 old_fr_fix = fragP->fr_fix;
11960 opcode = (unsigned char *) fragP->fr_opcode;
11961
fddf5b5b 11962 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
252b5132 11963 {
fddf5b5b
AM
11964 case UNCOND_JUMP:
11965 /* Make jmp (0xeb) a (d)word displacement jump. */
47926f60 11966 opcode[0] = 0xe9;
252b5132 11967 fragP->fr_fix += size;
062cd5e7
AS
11968 fix_new (fragP, old_fr_fix, size,
11969 fragP->fr_symbol,
11970 fragP->fr_offset, 1,
11971 reloc_type);
252b5132
RH
11972 break;
11973
fddf5b5b 11974 case COND_JUMP86:
412167cb
AM
11975 if (size == 2
11976 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
fddf5b5b
AM
11977 {
11978 /* Negate the condition, and branch past an
11979 unconditional jump. */
11980 opcode[0] ^= 1;
11981 opcode[1] = 3;
11982 /* Insert an unconditional jump. */
11983 opcode[2] = 0xe9;
11984 /* We added two extra opcode bytes, and have a two byte
11985 offset. */
11986 fragP->fr_fix += 2 + 2;
062cd5e7
AS
11987 fix_new (fragP, old_fr_fix + 2, 2,
11988 fragP->fr_symbol,
11989 fragP->fr_offset, 1,
11990 reloc_type);
fddf5b5b
AM
11991 break;
11992 }
11993 /* Fall through. */
11994
11995 case COND_JUMP:
412167cb
AM
11996 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11997 {
3e02c1cc
AM
11998 fixS *fixP;
11999
412167cb 12000 fragP->fr_fix += 1;
3e02c1cc
AM
12001 fixP = fix_new (fragP, old_fr_fix, 1,
12002 fragP->fr_symbol,
12003 fragP->fr_offset, 1,
12004 BFD_RELOC_8_PCREL);
12005 fixP->fx_signed = 1;
412167cb
AM
12006 break;
12007 }
93c2a809 12008
24eab124 12009 /* This changes the byte-displacement jump 0x7N
fddf5b5b 12010 to the (d)word-displacement jump 0x0f,0x8N. */
252b5132 12011 opcode[1] = opcode[0] + 0x10;
f6af82bd 12012 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
47926f60
KH
12013 /* We've added an opcode byte. */
12014 fragP->fr_fix += 1 + size;
062cd5e7
AS
12015 fix_new (fragP, old_fr_fix + 1, size,
12016 fragP->fr_symbol,
12017 fragP->fr_offset, 1,
12018 reloc_type);
252b5132 12019 break;
fddf5b5b
AM
12020
12021 default:
12022 BAD_CASE (fragP->fr_subtype);
12023 break;
252b5132
RH
12024 }
12025 frag_wane (fragP);
ee7fcc42 12026 return fragP->fr_fix - old_fr_fix;
252b5132 12027 }
93c2a809 12028
93c2a809
AM
12029 /* Guess size depending on current relax state. Initially the relax
12030 state will correspond to a short jump and we return 1, because
12031 the variable part of the frag (the branch offset) is one byte
12032 long. However, we can relax a section more than once and in that
12033 case we must either set fr_subtype back to the unrelaxed state,
12034 or return the value for the appropriate branch. */
12035 return md_relax_table[fragP->fr_subtype].rlx_length;
ee7fcc42
AM
12036}
12037
47926f60
KH
12038/* Called after relax() is finished.
12039
12040 In: Address of frag.
12041 fr_type == rs_machine_dependent.
12042 fr_subtype is what the address relaxed to.
12043
12044 Out: Any fixSs and constants are set up.
12045 Caller will turn frag into a ".space 0". */
12046
252b5132 12047void
7016a5d5
TG
12048md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12049 fragS *fragP)
252b5132 12050{
29b0f896 12051 unsigned char *opcode;
252b5132 12052 unsigned char *where_to_put_displacement = NULL;
847f7ad4
AM
12053 offsetT target_address;
12054 offsetT opcode_address;
252b5132 12055 unsigned int extension = 0;
847f7ad4 12056 offsetT displacement_from_opcode_start;
252b5132 12057
e379e5f3
L
12058 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12059 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12060 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12061 {
12062 /* Generate nop padding. */
12063 unsigned int size = fragP->tc_frag_data.length;
12064 if (size)
12065 {
12066 if (size > fragP->tc_frag_data.max_bytes)
12067 abort ();
12068
12069 if (flag_debug)
12070 {
12071 const char *msg;
12072 const char *branch = "branch";
12073 const char *prefix = "";
12074 fragS *padding_fragP;
12075 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12076 == BRANCH_PREFIX)
12077 {
12078 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12079 switch (fragP->tc_frag_data.default_prefix)
12080 {
12081 default:
12082 abort ();
12083 break;
12084 case CS_PREFIX_OPCODE:
12085 prefix = " cs";
12086 break;
12087 case DS_PREFIX_OPCODE:
12088 prefix = " ds";
12089 break;
12090 case ES_PREFIX_OPCODE:
12091 prefix = " es";
12092 break;
12093 case FS_PREFIX_OPCODE:
12094 prefix = " fs";
12095 break;
12096 case GS_PREFIX_OPCODE:
12097 prefix = " gs";
12098 break;
12099 case SS_PREFIX_OPCODE:
12100 prefix = " ss";
12101 break;
12102 }
12103 if (padding_fragP)
12104 msg = _("%s:%u: add %d%s at 0x%llx to align "
12105 "%s within %d-byte boundary\n");
12106 else
12107 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12108 "align %s within %d-byte boundary\n");
12109 }
12110 else
12111 {
12112 padding_fragP = fragP;
12113 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12114 "%s within %d-byte boundary\n");
12115 }
12116
12117 if (padding_fragP)
12118 switch (padding_fragP->tc_frag_data.branch_type)
12119 {
12120 case align_branch_jcc:
12121 branch = "jcc";
12122 break;
12123 case align_branch_fused:
12124 branch = "fused jcc";
12125 break;
12126 case align_branch_jmp:
12127 branch = "jmp";
12128 break;
12129 case align_branch_call:
12130 branch = "call";
12131 break;
12132 case align_branch_indirect:
12133 branch = "indiret branch";
12134 break;
12135 case align_branch_ret:
12136 branch = "ret";
12137 break;
12138 default:
12139 break;
12140 }
12141
12142 fprintf (stdout, msg,
12143 fragP->fr_file, fragP->fr_line, size, prefix,
12144 (long long) fragP->fr_address, branch,
12145 1 << align_branch_power);
12146 }
12147 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12148 memset (fragP->fr_opcode,
12149 fragP->tc_frag_data.default_prefix, size);
12150 else
12151 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12152 size, 0);
12153 fragP->fr_fix += size;
12154 }
12155 return;
12156 }
12157
252b5132
RH
12158 opcode = (unsigned char *) fragP->fr_opcode;
12159
47926f60 12160 /* Address we want to reach in file space. */
252b5132 12161 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
252b5132 12162
47926f60 12163 /* Address opcode resides at in file space. */
252b5132
RH
12164 opcode_address = fragP->fr_address + fragP->fr_fix;
12165
47926f60 12166 /* Displacement from opcode start to fill into instruction. */
252b5132
RH
12167 displacement_from_opcode_start = target_address - opcode_address;
12168
fddf5b5b 12169 if ((fragP->fr_subtype & BIG) == 0)
252b5132 12170 {
47926f60
KH
12171 /* Don't have to change opcode. */
12172 extension = 1; /* 1 opcode + 1 displacement */
252b5132 12173 where_to_put_displacement = &opcode[1];
fddf5b5b
AM
12174 }
12175 else
12176 {
12177 if (no_cond_jump_promotion
12178 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
4eed87de
AM
12179 as_warn_where (fragP->fr_file, fragP->fr_line,
12180 _("long jump required"));
252b5132 12181
fddf5b5b
AM
12182 switch (fragP->fr_subtype)
12183 {
12184 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12185 extension = 4; /* 1 opcode + 4 displacement */
12186 opcode[0] = 0xe9;
12187 where_to_put_displacement = &opcode[1];
12188 break;
252b5132 12189
fddf5b5b
AM
12190 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12191 extension = 2; /* 1 opcode + 2 displacement */
12192 opcode[0] = 0xe9;
12193 where_to_put_displacement = &opcode[1];
12194 break;
252b5132 12195
fddf5b5b
AM
12196 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12197 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12198 extension = 5; /* 2 opcode + 4 displacement */
12199 opcode[1] = opcode[0] + 0x10;
12200 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12201 where_to_put_displacement = &opcode[2];
12202 break;
252b5132 12203
fddf5b5b
AM
12204 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12205 extension = 3; /* 2 opcode + 2 displacement */
12206 opcode[1] = opcode[0] + 0x10;
12207 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12208 where_to_put_displacement = &opcode[2];
12209 break;
252b5132 12210
fddf5b5b
AM
12211 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12212 extension = 4;
12213 opcode[0] ^= 1;
12214 opcode[1] = 3;
12215 opcode[2] = 0xe9;
12216 where_to_put_displacement = &opcode[3];
12217 break;
12218
12219 default:
12220 BAD_CASE (fragP->fr_subtype);
12221 break;
12222 }
252b5132 12223 }
fddf5b5b 12224
7b81dfbb
AJ
12225 /* If size if less then four we are sure that the operand fits,
12226 but if it's 4, then it could be that the displacement is larger
12227 then -/+ 2GB. */
12228 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12229 && object_64bit
12230 && ((addressT) (displacement_from_opcode_start - extension
4eed87de
AM
12231 + ((addressT) 1 << 31))
12232 > (((addressT) 2 << 31) - 1)))
7b81dfbb
AJ
12233 {
12234 as_bad_where (fragP->fr_file, fragP->fr_line,
12235 _("jump target out of range"));
12236 /* Make us emit 0. */
12237 displacement_from_opcode_start = extension;
12238 }
47926f60 12239 /* Now put displacement after opcode. */
252b5132
RH
12240 md_number_to_chars ((char *) where_to_put_displacement,
12241 (valueT) (displacement_from_opcode_start - extension),
fddf5b5b 12242 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
252b5132
RH
12243 fragP->fr_fix += extension;
12244}
12245\f
7016a5d5 12246/* Apply a fixup (fixP) to segment data, once it has been determined
252b5132
RH
12247 by our caller that we have all the info we need to fix it up.
12248
7016a5d5
TG
12249 Parameter valP is the pointer to the value of the bits.
12250
252b5132
RH
12251 On the 386, immediates, displacements, and data pointers are all in
12252 the same (little-endian) format, so we don't need to care about which
12253 we are handling. */
12254
94f592af 12255void
7016a5d5 12256md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
252b5132 12257{
94f592af 12258 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
c6682705 12259 valueT value = *valP;
252b5132 12260
f86103b7 12261#if !defined (TE_Mach)
93382f6d
AM
12262 if (fixP->fx_pcrel)
12263 {
12264 switch (fixP->fx_r_type)
12265 {
5865bb77
ILT
12266 default:
12267 break;
12268
d6ab8113
JB
12269 case BFD_RELOC_64:
12270 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12271 break;
93382f6d 12272 case BFD_RELOC_32:
ae8887b5 12273 case BFD_RELOC_X86_64_32S:
93382f6d
AM
12274 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12275 break;
12276 case BFD_RELOC_16:
12277 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12278 break;
12279 case BFD_RELOC_8:
12280 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12281 break;
12282 }
12283 }
252b5132 12284
a161fe53 12285 if (fixP->fx_addsy != NULL
31312f95 12286 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
d6ab8113 12287 || fixP->fx_r_type == BFD_RELOC_64_PCREL
31312f95 12288 || fixP->fx_r_type == BFD_RELOC_16_PCREL
d258b828 12289 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
31312f95 12290 && !use_rela_relocations)
252b5132 12291 {
31312f95
AM
12292 /* This is a hack. There should be a better way to handle this.
12293 This covers for the fact that bfd_install_relocation will
12294 subtract the current location (for partial_inplace, PC relative
12295 relocations); see more below. */
252b5132 12296#ifndef OBJ_AOUT
718ddfc0 12297 if (IS_ELF
252b5132
RH
12298#ifdef TE_PE
12299 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12300#endif
12301 )
12302 value += fixP->fx_where + fixP->fx_frag->fr_address;
12303#endif
12304#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12305 if (IS_ELF)
252b5132 12306 {
6539b54b 12307 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
2f66722d 12308
6539b54b 12309 if ((sym_seg == seg
2f66722d 12310 || (symbol_section_p (fixP->fx_addsy)
6539b54b 12311 && sym_seg != absolute_section))
af65af87 12312 && !generic_force_reloc (fixP))
2f66722d
AM
12313 {
12314 /* Yes, we add the values in twice. This is because
6539b54b
AM
12315 bfd_install_relocation subtracts them out again. I think
12316 bfd_install_relocation is broken, but I don't dare change
2f66722d
AM
12317 it. FIXME. */
12318 value += fixP->fx_where + fixP->fx_frag->fr_address;
12319 }
252b5132
RH
12320 }
12321#endif
12322#if defined (OBJ_COFF) && defined (TE_PE)
977cdf5a
NC
12323 /* For some reason, the PE format does not store a
12324 section address offset for a PC relative symbol. */
12325 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
7be1c489 12326 || S_IS_WEAK (fixP->fx_addsy))
252b5132
RH
12327 value += md_pcrel_from (fixP);
12328#endif
12329 }
fbeb56a4 12330#if defined (OBJ_COFF) && defined (TE_PE)
f01c1a09
NC
12331 if (fixP->fx_addsy != NULL
12332 && S_IS_WEAK (fixP->fx_addsy)
12333 /* PR 16858: Do not modify weak function references. */
12334 && ! fixP->fx_pcrel)
fbeb56a4 12335 {
296a8689
NC
12336#if !defined (TE_PEP)
12337 /* For x86 PE weak function symbols are neither PC-relative
12338 nor do they set S_IS_FUNCTION. So the only reliable way
12339 to detect them is to check the flags of their containing
12340 section. */
12341 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12342 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12343 ;
12344 else
12345#endif
fbeb56a4
DK
12346 value -= S_GET_VALUE (fixP->fx_addsy);
12347 }
12348#endif
252b5132
RH
12349
12350 /* Fix a few things - the dynamic linker expects certain values here,
0234cb7c 12351 and we must not disappoint it. */
252b5132 12352#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
718ddfc0 12353 if (IS_ELF && fixP->fx_addsy)
47926f60
KH
12354 switch (fixP->fx_r_type)
12355 {
12356 case BFD_RELOC_386_PLT32:
3e73aa7c 12357 case BFD_RELOC_X86_64_PLT32:
b9519cfe
L
12358 /* Make the jump instruction point to the address of the operand.
12359 At runtime we merely add the offset to the actual PLT entry.
12360 NB: Subtract the offset size only for jump instructions. */
12361 if (fixP->fx_pcrel)
12362 value = -4;
47926f60 12363 break;
31312f95 12364
13ae64f3
JJ
12365 case BFD_RELOC_386_TLS_GD:
12366 case BFD_RELOC_386_TLS_LDM:
13ae64f3 12367 case BFD_RELOC_386_TLS_IE_32:
37e55690
JJ
12368 case BFD_RELOC_386_TLS_IE:
12369 case BFD_RELOC_386_TLS_GOTIE:
67a4f2b7 12370 case BFD_RELOC_386_TLS_GOTDESC:
bffbf940
JJ
12371 case BFD_RELOC_X86_64_TLSGD:
12372 case BFD_RELOC_X86_64_TLSLD:
12373 case BFD_RELOC_X86_64_GOTTPOFF:
67a4f2b7 12374 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
00f7efb6
JJ
12375 value = 0; /* Fully resolved at runtime. No addend. */
12376 /* Fallthrough */
12377 case BFD_RELOC_386_TLS_LE:
12378 case BFD_RELOC_386_TLS_LDO_32:
12379 case BFD_RELOC_386_TLS_LE_32:
12380 case BFD_RELOC_X86_64_DTPOFF32:
d6ab8113 12381 case BFD_RELOC_X86_64_DTPOFF64:
00f7efb6 12382 case BFD_RELOC_X86_64_TPOFF32:
d6ab8113 12383 case BFD_RELOC_X86_64_TPOFF64:
00f7efb6
JJ
12384 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12385 break;
12386
67a4f2b7
AO
12387 case BFD_RELOC_386_TLS_DESC_CALL:
12388 case BFD_RELOC_X86_64_TLSDESC_CALL:
12389 value = 0; /* Fully resolved at runtime. No addend. */
12390 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12391 fixP->fx_done = 0;
12392 return;
12393
47926f60
KH
12394 case BFD_RELOC_VTABLE_INHERIT:
12395 case BFD_RELOC_VTABLE_ENTRY:
12396 fixP->fx_done = 0;
94f592af 12397 return;
47926f60
KH
12398
12399 default:
12400 break;
12401 }
12402#endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
c6682705 12403 *valP = value;
f86103b7 12404#endif /* !defined (TE_Mach) */
3e73aa7c 12405
3e73aa7c 12406 /* Are we finished with this relocation now? */
c6682705 12407 if (fixP->fx_addsy == NULL)
3e73aa7c 12408 fixP->fx_done = 1;
fbeb56a4
DK
12409#if defined (OBJ_COFF) && defined (TE_PE)
12410 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12411 {
12412 fixP->fx_done = 0;
12413 /* Remember value for tc_gen_reloc. */
12414 fixP->fx_addnumber = value;
12415 /* Clear out the frag for now. */
12416 value = 0;
12417 }
12418#endif
3e73aa7c
JH
12419 else if (use_rela_relocations)
12420 {
12421 fixP->fx_no_overflow = 1;
062cd5e7
AS
12422 /* Remember value for tc_gen_reloc. */
12423 fixP->fx_addnumber = value;
3e73aa7c
JH
12424 value = 0;
12425 }
f86103b7 12426
94f592af 12427 md_number_to_chars (p, value, fixP->fx_size);
252b5132 12428}
252b5132 12429\f
6d4af3c2 12430const char *
499ac353 12431md_atof (int type, char *litP, int *sizeP)
252b5132 12432{
499ac353
NC
12433 /* This outputs the LITTLENUMs in REVERSE order;
12434 in accord with the bigendian 386. */
12435 return ieee_md_atof (type, litP, sizeP, FALSE);
252b5132
RH
12436}
12437\f
2d545b82 12438static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
252b5132 12439
252b5132 12440static char *
e3bb37b5 12441output_invalid (int c)
252b5132 12442{
3882b010 12443 if (ISPRINT (c))
f9f21a03
L
12444 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12445 "'%c'", c);
252b5132 12446 else
f9f21a03 12447 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
2d545b82 12448 "(0x%x)", (unsigned char) c);
252b5132
RH
12449 return output_invalid_buf;
12450}
12451
8a6fb3f9
JB
12452/* Verify that @r can be used in the current context. */
12453
12454static bfd_boolean check_register (const reg_entry *r)
12455{
12456 if (allow_pseudo_reg)
12457 return TRUE;
12458
12459 if (operand_type_all_zero (&r->reg_type))
12460 return FALSE;
12461
12462 if ((r->reg_type.bitfield.dword
12463 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12464 || r->reg_type.bitfield.class == RegCR
22e00a3f 12465 || r->reg_type.bitfield.class == RegDR)
8a6fb3f9
JB
12466 && !cpu_arch_flags.bitfield.cpui386)
12467 return FALSE;
12468
22e00a3f
JB
12469 if (r->reg_type.bitfield.class == RegTR
12470 && (flag_code == CODE_64BIT
12471 || !cpu_arch_flags.bitfield.cpui386
12472 || cpu_arch_isa_flags.bitfield.cpui586
12473 || cpu_arch_isa_flags.bitfield.cpui686))
12474 return FALSE;
12475
8a6fb3f9
JB
12476 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12477 return FALSE;
12478
12479 if (!cpu_arch_flags.bitfield.cpuavx512f)
12480 {
12481 if (r->reg_type.bitfield.zmmword
12482 || r->reg_type.bitfield.class == RegMask)
12483 return FALSE;
12484
12485 if (!cpu_arch_flags.bitfield.cpuavx)
12486 {
12487 if (r->reg_type.bitfield.ymmword)
12488 return FALSE;
12489
12490 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12491 return FALSE;
12492 }
12493 }
12494
260cd341
LC
12495 if (r->reg_type.bitfield.tmmword
12496 && (!cpu_arch_flags.bitfield.cpuamx_tile
12497 || flag_code != CODE_64BIT))
12498 return FALSE;
12499
8a6fb3f9
JB
12500 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12501 return FALSE;
12502
12503 /* Don't allow fake index register unless allow_index_reg isn't 0. */
12504 if (!allow_index_reg && r->reg_num == RegIZ)
12505 return FALSE;
12506
12507 /* Upper 16 vector registers are only available with VREX in 64bit
12508 mode, and require EVEX encoding. */
12509 if (r->reg_flags & RegVRex)
12510 {
12511 if (!cpu_arch_flags.bitfield.cpuavx512f
12512 || flag_code != CODE_64BIT)
12513 return FALSE;
12514
da4977e0
JB
12515 if (i.vec_encoding == vex_encoding_default)
12516 i.vec_encoding = vex_encoding_evex;
12517 else if (i.vec_encoding != vex_encoding_evex)
12518 i.vec_encoding = vex_encoding_error;
8a6fb3f9
JB
12519 }
12520
12521 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12522 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12523 && flag_code != CODE_64BIT)
12524 return FALSE;
12525
12526 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12527 && !intel_syntax)
12528 return FALSE;
12529
12530 return TRUE;
12531}
12532
af6bdddf 12533/* REG_STRING starts *before* REGISTER_PREFIX. */
252b5132
RH
12534
12535static const reg_entry *
4d1bb795 12536parse_real_register (char *reg_string, char **end_op)
252b5132 12537{
af6bdddf
AM
12538 char *s = reg_string;
12539 char *p;
252b5132
RH
12540 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12541 const reg_entry *r;
12542
12543 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12544 if (*s == REGISTER_PREFIX)
12545 ++s;
12546
12547 if (is_space_char (*s))
12548 ++s;
12549
12550 p = reg_name_given;
af6bdddf 12551 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
252b5132
RH
12552 {
12553 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
af6bdddf
AM
12554 return (const reg_entry *) NULL;
12555 s++;
252b5132
RH
12556 }
12557
6588847e
DN
12558 /* For naked regs, make sure that we are not dealing with an identifier.
12559 This prevents confusing an identifier like `eax_var' with register
12560 `eax'. */
12561 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12562 return (const reg_entry *) NULL;
12563
af6bdddf 12564 *end_op = s;
252b5132
RH
12565
12566 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
12567
5f47d35b 12568 /* Handle floating point regs, allowing spaces in the (i) part. */
47926f60 12569 if (r == i386_regtab /* %st is first entry of table */)
5f47d35b 12570 {
0e0eea78
JB
12571 if (!cpu_arch_flags.bitfield.cpu8087
12572 && !cpu_arch_flags.bitfield.cpu287
af32b722
JB
12573 && !cpu_arch_flags.bitfield.cpu387
12574 && !allow_pseudo_reg)
0e0eea78
JB
12575 return (const reg_entry *) NULL;
12576
5f47d35b
AM
12577 if (is_space_char (*s))
12578 ++s;
12579 if (*s == '(')
12580 {
af6bdddf 12581 ++s;
5f47d35b
AM
12582 if (is_space_char (*s))
12583 ++s;
12584 if (*s >= '0' && *s <= '7')
12585 {
db557034 12586 int fpr = *s - '0';
af6bdddf 12587 ++s;
5f47d35b
AM
12588 if (is_space_char (*s))
12589 ++s;
12590 if (*s == ')')
12591 {
12592 *end_op = s + 1;
1e9cc1c2 12593 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
db557034
AM
12594 know (r);
12595 return r + fpr;
5f47d35b 12596 }
5f47d35b 12597 }
47926f60 12598 /* We have "%st(" then garbage. */
5f47d35b
AM
12599 return (const reg_entry *) NULL;
12600 }
12601 }
12602
8a6fb3f9 12603 return r && check_register (r) ? r : NULL;
252b5132 12604}
4d1bb795
JB
12605
12606/* REG_STRING starts *before* REGISTER_PREFIX. */
12607
12608static const reg_entry *
12609parse_register (char *reg_string, char **end_op)
12610{
12611 const reg_entry *r;
12612
12613 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12614 r = parse_real_register (reg_string, end_op);
12615 else
12616 r = NULL;
12617 if (!r)
12618 {
12619 char *save = input_line_pointer;
12620 char c;
12621 symbolS *symbolP;
12622
12623 input_line_pointer = reg_string;
d02603dc 12624 c = get_symbol_name (&reg_string);
4d1bb795
JB
12625 symbolP = symbol_find (reg_string);
12626 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12627 {
12628 const expressionS *e = symbol_get_value_expression (symbolP);
12629
0398aac5 12630 know (e->X_op == O_register);
4eed87de 12631 know (e->X_add_number >= 0
c3fe08fa 12632 && (valueT) e->X_add_number < i386_regtab_size);
4d1bb795 12633 r = i386_regtab + e->X_add_number;
8a6fb3f9
JB
12634 if (!check_register (r))
12635 {
12636 as_bad (_("register '%s%s' cannot be used here"),
12637 register_prefix, r->reg_name);
12638 r = &bad_reg;
12639 }
4d1bb795
JB
12640 *end_op = input_line_pointer;
12641 }
12642 *input_line_pointer = c;
12643 input_line_pointer = save;
12644 }
12645 return r;
12646}
12647
12648int
12649i386_parse_name (char *name, expressionS *e, char *nextcharP)
12650{
12651 const reg_entry *r;
12652 char *end = input_line_pointer;
12653
12654 *end = *nextcharP;
12655 r = parse_register (name, &input_line_pointer);
12656 if (r && end <= input_line_pointer)
12657 {
12658 *nextcharP = *input_line_pointer;
12659 *input_line_pointer = 0;
8a6fb3f9
JB
12660 if (r != &bad_reg)
12661 {
12662 e->X_op = O_register;
12663 e->X_add_number = r - i386_regtab;
12664 }
12665 else
12666 e->X_op = O_illegal;
4d1bb795
JB
12667 return 1;
12668 }
12669 input_line_pointer = end;
12670 *end = 0;
ee86248c 12671 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
4d1bb795
JB
12672}
12673
12674void
12675md_operand (expressionS *e)
12676{
ee86248c
JB
12677 char *end;
12678 const reg_entry *r;
4d1bb795 12679
ee86248c
JB
12680 switch (*input_line_pointer)
12681 {
12682 case REGISTER_PREFIX:
12683 r = parse_real_register (input_line_pointer, &end);
4d1bb795
JB
12684 if (r)
12685 {
12686 e->X_op = O_register;
12687 e->X_add_number = r - i386_regtab;
12688 input_line_pointer = end;
12689 }
ee86248c
JB
12690 break;
12691
12692 case '[':
9c2799c2 12693 gas_assert (intel_syntax);
ee86248c
JB
12694 end = input_line_pointer++;
12695 expression (e);
12696 if (*input_line_pointer == ']')
12697 {
12698 ++input_line_pointer;
12699 e->X_op_symbol = make_expr_symbol (e);
12700 e->X_add_symbol = NULL;
12701 e->X_add_number = 0;
12702 e->X_op = O_index;
12703 }
12704 else
12705 {
12706 e->X_op = O_absent;
12707 input_line_pointer = end;
12708 }
12709 break;
4d1bb795
JB
12710 }
12711}
12712
252b5132 12713\f
4cc782b5 12714#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
b6f8c7c4 12715const char *md_shortopts = "kVQ:sqnO::";
252b5132 12716#else
b6f8c7c4 12717const char *md_shortopts = "qnO::";
252b5132 12718#endif
6e0b89ee 12719
3e73aa7c 12720#define OPTION_32 (OPTION_MD_BASE + 0)
b3b91714
AM
12721#define OPTION_64 (OPTION_MD_BASE + 1)
12722#define OPTION_DIVIDE (OPTION_MD_BASE + 2)
9103f4f4
L
12723#define OPTION_MARCH (OPTION_MD_BASE + 3)
12724#define OPTION_MTUNE (OPTION_MD_BASE + 4)
1efbbeb4
L
12725#define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12726#define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12727#define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12728#define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
bd5dea88 12729#define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
c0f3af97 12730#define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
daf50ae7 12731#define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
7bab8ab5
JB
12732#define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12733#define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12734#define OPTION_X32 (OPTION_MD_BASE + 14)
7e8b059b 12735#define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
43234a1e
L
12736#define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12737#define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
167ad85b 12738#define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
d1982f93 12739#define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
d3d3c6db 12740#define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
8dcea932 12741#define OPTION_MSHARED (OPTION_MD_BASE + 21)
5db04b09
L
12742#define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12743#define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
e4e00185 12744#define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
b4a3a7b4 12745#define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
03751133 12746#define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
e379e5f3
L
12747#define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12748#define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12749#define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
76cf450b 12750#define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
ae531041
L
12751#define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12752#define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12753#define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
b3b91714 12754
99ad8390
NC
12755struct option md_longopts[] =
12756{
3e73aa7c 12757 {"32", no_argument, NULL, OPTION_32},
321098a5 12758#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
d382c579 12759 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
3e73aa7c 12760 {"64", no_argument, NULL, OPTION_64},
351f65ca
L
12761#endif
12762#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
570561f7 12763 {"x32", no_argument, NULL, OPTION_X32},
8dcea932 12764 {"mshared", no_argument, NULL, OPTION_MSHARED},
b4a3a7b4 12765 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
6e0b89ee 12766#endif
b3b91714 12767 {"divide", no_argument, NULL, OPTION_DIVIDE},
9103f4f4
L
12768 {"march", required_argument, NULL, OPTION_MARCH},
12769 {"mtune", required_argument, NULL, OPTION_MTUNE},
1efbbeb4
L
12770 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12771 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12772 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12773 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
c0f3af97 12774 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
daf50ae7 12775 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
7bab8ab5 12776 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
539f890d 12777 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
03751133 12778 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
7e8b059b 12779 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
43234a1e
L
12780 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12781 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
167ad85b
TG
12782# if defined (TE_PE) || defined (TE_PEP)
12783 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12784#endif
d1982f93 12785 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
e4e00185 12786 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
0cb4071e 12787 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
d3d3c6db 12788 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
e379e5f3
L
12789 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12790 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12791 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
76cf450b 12792 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
ae531041
L
12793 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12794 {"mlfence-before-indirect-branch", required_argument, NULL,
12795 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12796 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
5db04b09
L
12797 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12798 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
252b5132
RH
12799 {NULL, no_argument, NULL, 0}
12800};
12801size_t md_longopts_size = sizeof (md_longopts);
12802
12803int
17b9d67d 12804md_parse_option (int c, const char *arg)
252b5132 12805{
91d6fa6a 12806 unsigned int j;
e379e5f3 12807 char *arch, *next, *saved, *type;
9103f4f4 12808
252b5132
RH
12809 switch (c)
12810 {
12b55ccc
L
12811 case 'n':
12812 optimize_align_code = 0;
12813 break;
12814
a38cf1db
AM
12815 case 'q':
12816 quiet_warnings = 1;
252b5132
RH
12817 break;
12818
12819#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
a38cf1db
AM
12820 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12821 should be emitted or not. FIXME: Not implemented. */
12822 case 'Q':
d4693039
JB
12823 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12824 return 0;
252b5132
RH
12825 break;
12826
12827 /* -V: SVR4 argument to print version ID. */
12828 case 'V':
12829 print_version_id ();
12830 break;
12831
a38cf1db
AM
12832 /* -k: Ignore for FreeBSD compatibility. */
12833 case 'k':
252b5132 12834 break;
4cc782b5
ILT
12835
12836 case 's':
12837 /* -s: On i386 Solaris, this tells the native assembler to use
29b0f896 12838 .stab instead of .stab.excl. We always use .stab anyhow. */
4cc782b5 12839 break;
8dcea932
L
12840
12841 case OPTION_MSHARED:
12842 shared = 1;
12843 break;
b4a3a7b4
L
12844
12845 case OPTION_X86_USED_NOTE:
12846 if (strcasecmp (arg, "yes") == 0)
12847 x86_used_note = 1;
12848 else if (strcasecmp (arg, "no") == 0)
12849 x86_used_note = 0;
12850 else
12851 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12852 break;
12853
12854
99ad8390 12855#endif
321098a5 12856#if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
d382c579 12857 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
3e73aa7c
JH
12858 case OPTION_64:
12859 {
12860 const char **list, **l;
12861
3e73aa7c
JH
12862 list = bfd_target_list ();
12863 for (l = list; *l != NULL; l++)
8620418b 12864 if (CONST_STRNEQ (*l, "elf64-x86-64")
99ad8390
NC
12865 || strcmp (*l, "coff-x86-64") == 0
12866 || strcmp (*l, "pe-x86-64") == 0
d382c579
TG
12867 || strcmp (*l, "pei-x86-64") == 0
12868 || strcmp (*l, "mach-o-x86-64") == 0)
6e0b89ee
AM
12869 {
12870 default_arch = "x86_64";
12871 break;
12872 }
3e73aa7c 12873 if (*l == NULL)
2b5d6a91 12874 as_fatal (_("no compiled in support for x86_64"));
3e73aa7c
JH
12875 free (list);
12876 }
12877 break;
12878#endif
252b5132 12879
351f65ca 12880#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
570561f7 12881 case OPTION_X32:
351f65ca
L
12882 if (IS_ELF)
12883 {
12884 const char **list, **l;
12885
12886 list = bfd_target_list ();
12887 for (l = list; *l != NULL; l++)
12888 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12889 {
12890 default_arch = "x86_64:32";
12891 break;
12892 }
12893 if (*l == NULL)
2b5d6a91 12894 as_fatal (_("no compiled in support for 32bit x86_64"));
351f65ca
L
12895 free (list);
12896 }
12897 else
12898 as_fatal (_("32bit x86_64 is only supported for ELF"));
12899 break;
12900#endif
12901
6e0b89ee
AM
12902 case OPTION_32:
12903 default_arch = "i386";
12904 break;
12905
b3b91714
AM
12906 case OPTION_DIVIDE:
12907#ifdef SVR4_COMMENT_CHARS
12908 {
12909 char *n, *t;
12910 const char *s;
12911
add39d23 12912 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
b3b91714
AM
12913 t = n;
12914 for (s = i386_comment_chars; *s != '\0'; s++)
12915 if (*s != '/')
12916 *t++ = *s;
12917 *t = '\0';
12918 i386_comment_chars = n;
12919 }
12920#endif
12921 break;
12922
9103f4f4 12923 case OPTION_MARCH:
293f5f65
L
12924 saved = xstrdup (arg);
12925 arch = saved;
12926 /* Allow -march=+nosse. */
12927 if (*arch == '+')
12928 arch++;
6305a203 12929 do
9103f4f4 12930 {
6305a203 12931 if (*arch == '.')
2b5d6a91 12932 as_fatal (_("invalid -march= option: `%s'"), arg);
6305a203
L
12933 next = strchr (arch, '+');
12934 if (next)
12935 *next++ = '\0';
91d6fa6a 12936 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9103f4f4 12937 {
91d6fa6a 12938 if (strcmp (arch, cpu_arch [j].name) == 0)
ccc9c027 12939 {
6305a203 12940 /* Processor. */
1ded5609
JB
12941 if (! cpu_arch[j].flags.bitfield.cpui386)
12942 continue;
12943
91d6fa6a 12944 cpu_arch_name = cpu_arch[j].name;
6305a203 12945 cpu_sub_arch_name = NULL;
91d6fa6a
NC
12946 cpu_arch_flags = cpu_arch[j].flags;
12947 cpu_arch_isa = cpu_arch[j].type;
12948 cpu_arch_isa_flags = cpu_arch[j].flags;
6305a203
L
12949 if (!cpu_arch_tune_set)
12950 {
12951 cpu_arch_tune = cpu_arch_isa;
12952 cpu_arch_tune_flags = cpu_arch_isa_flags;
12953 }
12954 break;
12955 }
91d6fa6a
NC
12956 else if (*cpu_arch [j].name == '.'
12957 && strcmp (arch, cpu_arch [j].name + 1) == 0)
6305a203 12958 {
33eaf5de 12959 /* ISA extension. */
6305a203 12960 i386_cpu_flags flags;
309d3373 12961
293f5f65
L
12962 flags = cpu_flags_or (cpu_arch_flags,
12963 cpu_arch[j].flags);
81486035 12964
5b64d091 12965 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
6305a203
L
12966 {
12967 if (cpu_sub_arch_name)
12968 {
12969 char *name = cpu_sub_arch_name;
12970 cpu_sub_arch_name = concat (name,
91d6fa6a 12971 cpu_arch[j].name,
1bf57e9f 12972 (const char *) NULL);
6305a203
L
12973 free (name);
12974 }
12975 else
91d6fa6a 12976 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
6305a203 12977 cpu_arch_flags = flags;
a586129e 12978 cpu_arch_isa_flags = flags;
6305a203 12979 }
0089dace
L
12980 else
12981 cpu_arch_isa_flags
12982 = cpu_flags_or (cpu_arch_isa_flags,
12983 cpu_arch[j].flags);
6305a203 12984 break;
ccc9c027 12985 }
9103f4f4 12986 }
6305a203 12987
293f5f65
L
12988 if (j >= ARRAY_SIZE (cpu_arch))
12989 {
33eaf5de 12990 /* Disable an ISA extension. */
293f5f65
L
12991 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12992 if (strcmp (arch, cpu_noarch [j].name) == 0)
12993 {
12994 i386_cpu_flags flags;
12995
12996 flags = cpu_flags_and_not (cpu_arch_flags,
12997 cpu_noarch[j].flags);
12998 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12999 {
13000 if (cpu_sub_arch_name)
13001 {
13002 char *name = cpu_sub_arch_name;
13003 cpu_sub_arch_name = concat (arch,
13004 (const char *) NULL);
13005 free (name);
13006 }
13007 else
13008 cpu_sub_arch_name = xstrdup (arch);
13009 cpu_arch_flags = flags;
13010 cpu_arch_isa_flags = flags;
13011 }
13012 break;
13013 }
13014
13015 if (j >= ARRAY_SIZE (cpu_noarch))
13016 j = ARRAY_SIZE (cpu_arch);
13017 }
13018
91d6fa6a 13019 if (j >= ARRAY_SIZE (cpu_arch))
2b5d6a91 13020 as_fatal (_("invalid -march= option: `%s'"), arg);
6305a203
L
13021
13022 arch = next;
9103f4f4 13023 }
293f5f65
L
13024 while (next != NULL);
13025 free (saved);
9103f4f4
L
13026 break;
13027
13028 case OPTION_MTUNE:
13029 if (*arg == '.')
2b5d6a91 13030 as_fatal (_("invalid -mtune= option: `%s'"), arg);
91d6fa6a 13031 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9103f4f4 13032 {
91d6fa6a 13033 if (strcmp (arg, cpu_arch [j].name) == 0)
9103f4f4 13034 {
ccc9c027 13035 cpu_arch_tune_set = 1;
91d6fa6a
NC
13036 cpu_arch_tune = cpu_arch [j].type;
13037 cpu_arch_tune_flags = cpu_arch[j].flags;
9103f4f4
L
13038 break;
13039 }
13040 }
91d6fa6a 13041 if (j >= ARRAY_SIZE (cpu_arch))
2b5d6a91 13042 as_fatal (_("invalid -mtune= option: `%s'"), arg);
9103f4f4
L
13043 break;
13044
1efbbeb4
L
13045 case OPTION_MMNEMONIC:
13046 if (strcasecmp (arg, "att") == 0)
13047 intel_mnemonic = 0;
13048 else if (strcasecmp (arg, "intel") == 0)
13049 intel_mnemonic = 1;
13050 else
2b5d6a91 13051 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
1efbbeb4
L
13052 break;
13053
13054 case OPTION_MSYNTAX:
13055 if (strcasecmp (arg, "att") == 0)
13056 intel_syntax = 0;
13057 else if (strcasecmp (arg, "intel") == 0)
13058 intel_syntax = 1;
13059 else
2b5d6a91 13060 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
1efbbeb4
L
13061 break;
13062
13063 case OPTION_MINDEX_REG:
13064 allow_index_reg = 1;
13065 break;
13066
13067 case OPTION_MNAKED_REG:
13068 allow_naked_reg = 1;
13069 break;
13070
c0f3af97
L
13071 case OPTION_MSSE2AVX:
13072 sse2avx = 1;
13073 break;
13074
daf50ae7
L
13075 case OPTION_MSSE_CHECK:
13076 if (strcasecmp (arg, "error") == 0)
7bab8ab5 13077 sse_check = check_error;
daf50ae7 13078 else if (strcasecmp (arg, "warning") == 0)
7bab8ab5 13079 sse_check = check_warning;
daf50ae7 13080 else if (strcasecmp (arg, "none") == 0)
7bab8ab5 13081 sse_check = check_none;
daf50ae7 13082 else
2b5d6a91 13083 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
daf50ae7
L
13084 break;
13085
7bab8ab5
JB
13086 case OPTION_MOPERAND_CHECK:
13087 if (strcasecmp (arg, "error") == 0)
13088 operand_check = check_error;
13089 else if (strcasecmp (arg, "warning") == 0)
13090 operand_check = check_warning;
13091 else if (strcasecmp (arg, "none") == 0)
13092 operand_check = check_none;
13093 else
13094 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13095 break;
13096
539f890d
L
13097 case OPTION_MAVXSCALAR:
13098 if (strcasecmp (arg, "128") == 0)
13099 avxscalar = vex128;
13100 else if (strcasecmp (arg, "256") == 0)
13101 avxscalar = vex256;
13102 else
2b5d6a91 13103 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
539f890d
L
13104 break;
13105
03751133
L
13106 case OPTION_MVEXWIG:
13107 if (strcmp (arg, "0") == 0)
40c9c8de 13108 vexwig = vexw0;
03751133 13109 else if (strcmp (arg, "1") == 0)
40c9c8de 13110 vexwig = vexw1;
03751133
L
13111 else
13112 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13113 break;
13114
7e8b059b
L
13115 case OPTION_MADD_BND_PREFIX:
13116 add_bnd_prefix = 1;
13117 break;
13118
43234a1e
L
13119 case OPTION_MEVEXLIG:
13120 if (strcmp (arg, "128") == 0)
13121 evexlig = evexl128;
13122 else if (strcmp (arg, "256") == 0)
13123 evexlig = evexl256;
13124 else if (strcmp (arg, "512") == 0)
13125 evexlig = evexl512;
13126 else
13127 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13128 break;
13129
d3d3c6db
IT
13130 case OPTION_MEVEXRCIG:
13131 if (strcmp (arg, "rne") == 0)
13132 evexrcig = rne;
13133 else if (strcmp (arg, "rd") == 0)
13134 evexrcig = rd;
13135 else if (strcmp (arg, "ru") == 0)
13136 evexrcig = ru;
13137 else if (strcmp (arg, "rz") == 0)
13138 evexrcig = rz;
13139 else
13140 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13141 break;
13142
43234a1e
L
13143 case OPTION_MEVEXWIG:
13144 if (strcmp (arg, "0") == 0)
13145 evexwig = evexw0;
13146 else if (strcmp (arg, "1") == 0)
13147 evexwig = evexw1;
13148 else
13149 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13150 break;
13151
167ad85b
TG
13152# if defined (TE_PE) || defined (TE_PEP)
13153 case OPTION_MBIG_OBJ:
13154 use_big_obj = 1;
13155 break;
13156#endif
13157
d1982f93 13158 case OPTION_MOMIT_LOCK_PREFIX:
d022bddd
IT
13159 if (strcasecmp (arg, "yes") == 0)
13160 omit_lock_prefix = 1;
13161 else if (strcasecmp (arg, "no") == 0)
13162 omit_lock_prefix = 0;
13163 else
13164 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13165 break;
13166
e4e00185
AS
13167 case OPTION_MFENCE_AS_LOCK_ADD:
13168 if (strcasecmp (arg, "yes") == 0)
13169 avoid_fence = 1;
13170 else if (strcasecmp (arg, "no") == 0)
13171 avoid_fence = 0;
13172 else
13173 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13174 break;
13175
ae531041
L
13176 case OPTION_MLFENCE_AFTER_LOAD:
13177 if (strcasecmp (arg, "yes") == 0)
13178 lfence_after_load = 1;
13179 else if (strcasecmp (arg, "no") == 0)
13180 lfence_after_load = 0;
13181 else
13182 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13183 break;
13184
13185 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13186 if (strcasecmp (arg, "all") == 0)
a09f656b 13187 {
13188 lfence_before_indirect_branch = lfence_branch_all;
13189 if (lfence_before_ret == lfence_before_ret_none)
13190 lfence_before_ret = lfence_before_ret_shl;
13191 }
ae531041
L
13192 else if (strcasecmp (arg, "memory") == 0)
13193 lfence_before_indirect_branch = lfence_branch_memory;
13194 else if (strcasecmp (arg, "register") == 0)
13195 lfence_before_indirect_branch = lfence_branch_register;
13196 else if (strcasecmp (arg, "none") == 0)
13197 lfence_before_indirect_branch = lfence_branch_none;
13198 else
13199 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13200 arg);
13201 break;
13202
13203 case OPTION_MLFENCE_BEFORE_RET:
13204 if (strcasecmp (arg, "or") == 0)
13205 lfence_before_ret = lfence_before_ret_or;
13206 else if (strcasecmp (arg, "not") == 0)
13207 lfence_before_ret = lfence_before_ret_not;
a09f656b 13208 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13209 lfence_before_ret = lfence_before_ret_shl;
ae531041
L
13210 else if (strcasecmp (arg, "none") == 0)
13211 lfence_before_ret = lfence_before_ret_none;
13212 else
13213 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13214 arg);
13215 break;
13216
0cb4071e
L
13217 case OPTION_MRELAX_RELOCATIONS:
13218 if (strcasecmp (arg, "yes") == 0)
13219 generate_relax_relocations = 1;
13220 else if (strcasecmp (arg, "no") == 0)
13221 generate_relax_relocations = 0;
13222 else
13223 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13224 break;
13225
e379e5f3
L
13226 case OPTION_MALIGN_BRANCH_BOUNDARY:
13227 {
13228 char *end;
13229 long int align = strtoul (arg, &end, 0);
13230 if (*end == '\0')
13231 {
13232 if (align == 0)
13233 {
13234 align_branch_power = 0;
13235 break;
13236 }
13237 else if (align >= 16)
13238 {
13239 int align_power;
13240 for (align_power = 0;
13241 (align & 1) == 0;
13242 align >>= 1, align_power++)
13243 continue;
13244 /* Limit alignment power to 31. */
13245 if (align == 1 && align_power < 32)
13246 {
13247 align_branch_power = align_power;
13248 break;
13249 }
13250 }
13251 }
13252 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13253 }
13254 break;
13255
13256 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13257 {
13258 char *end;
13259 int align = strtoul (arg, &end, 0);
13260 /* Some processors only support 5 prefixes. */
13261 if (*end == '\0' && align >= 0 && align < 6)
13262 {
13263 align_branch_prefix_size = align;
13264 break;
13265 }
13266 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13267 arg);
13268 }
13269 break;
13270
13271 case OPTION_MALIGN_BRANCH:
13272 align_branch = 0;
13273 saved = xstrdup (arg);
13274 type = saved;
13275 do
13276 {
13277 next = strchr (type, '+');
13278 if (next)
13279 *next++ = '\0';
13280 if (strcasecmp (type, "jcc") == 0)
13281 align_branch |= align_branch_jcc_bit;
13282 else if (strcasecmp (type, "fused") == 0)
13283 align_branch |= align_branch_fused_bit;
13284 else if (strcasecmp (type, "jmp") == 0)
13285 align_branch |= align_branch_jmp_bit;
13286 else if (strcasecmp (type, "call") == 0)
13287 align_branch |= align_branch_call_bit;
13288 else if (strcasecmp (type, "ret") == 0)
13289 align_branch |= align_branch_ret_bit;
13290 else if (strcasecmp (type, "indirect") == 0)
13291 align_branch |= align_branch_indirect_bit;
13292 else
13293 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13294 type = next;
13295 }
13296 while (next != NULL);
13297 free (saved);
13298 break;
13299
76cf450b
L
13300 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13301 align_branch_power = 5;
13302 align_branch_prefix_size = 5;
13303 align_branch = (align_branch_jcc_bit
13304 | align_branch_fused_bit
13305 | align_branch_jmp_bit);
13306 break;
13307
5db04b09 13308 case OPTION_MAMD64:
4b5aaf5f 13309 isa64 = amd64;
5db04b09
L
13310 break;
13311
13312 case OPTION_MINTEL64:
4b5aaf5f 13313 isa64 = intel64;
5db04b09
L
13314 break;
13315
b6f8c7c4
L
13316 case 'O':
13317 if (arg == NULL)
13318 {
13319 optimize = 1;
13320 /* Turn off -Os. */
13321 optimize_for_space = 0;
13322 }
13323 else if (*arg == 's')
13324 {
13325 optimize_for_space = 1;
13326 /* Turn on all encoding optimizations. */
41fd2579 13327 optimize = INT_MAX;
b6f8c7c4
L
13328 }
13329 else
13330 {
13331 optimize = atoi (arg);
13332 /* Turn off -Os. */
13333 optimize_for_space = 0;
13334 }
13335 break;
13336
252b5132
RH
13337 default:
13338 return 0;
13339 }
13340 return 1;
13341}
13342
8a2c8fef
L
13343#define MESSAGE_TEMPLATE \
13344" "
13345
293f5f65
L
13346static char *
13347output_message (FILE *stream, char *p, char *message, char *start,
13348 int *left_p, const char *name, int len)
13349{
13350 int size = sizeof (MESSAGE_TEMPLATE);
13351 int left = *left_p;
13352
13353 /* Reserve 2 spaces for ", " or ",\0" */
13354 left -= len + 2;
13355
13356 /* Check if there is any room. */
13357 if (left >= 0)
13358 {
13359 if (p != start)
13360 {
13361 *p++ = ',';
13362 *p++ = ' ';
13363 }
13364 p = mempcpy (p, name, len);
13365 }
13366 else
13367 {
13368 /* Output the current message now and start a new one. */
13369 *p++ = ',';
13370 *p = '\0';
13371 fprintf (stream, "%s\n", message);
13372 p = start;
13373 left = size - (start - message) - len - 2;
13374
13375 gas_assert (left >= 0);
13376
13377 p = mempcpy (p, name, len);
13378 }
13379
13380 *left_p = left;
13381 return p;
13382}
13383
8a2c8fef 13384static void
1ded5609 13385show_arch (FILE *stream, int ext, int check)
8a2c8fef
L
13386{
13387 static char message[] = MESSAGE_TEMPLATE;
13388 char *start = message + 27;
13389 char *p;
13390 int size = sizeof (MESSAGE_TEMPLATE);
13391 int left;
13392 const char *name;
13393 int len;
13394 unsigned int j;
13395
13396 p = start;
13397 left = size - (start - message);
13398 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13399 {
13400 /* Should it be skipped? */
13401 if (cpu_arch [j].skip)
13402 continue;
13403
13404 name = cpu_arch [j].name;
13405 len = cpu_arch [j].len;
13406 if (*name == '.')
13407 {
13408 /* It is an extension. Skip if we aren't asked to show it. */
13409 if (ext)
13410 {
13411 name++;
13412 len--;
13413 }
13414 else
13415 continue;
13416 }
13417 else if (ext)
13418 {
13419 /* It is an processor. Skip if we show only extension. */
13420 continue;
13421 }
1ded5609
JB
13422 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13423 {
13424 /* It is an impossible processor - skip. */
13425 continue;
13426 }
8a2c8fef 13427
293f5f65 13428 p = output_message (stream, p, message, start, &left, name, len);
8a2c8fef
L
13429 }
13430
293f5f65
L
13431 /* Display disabled extensions. */
13432 if (ext)
13433 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13434 {
13435 name = cpu_noarch [j].name;
13436 len = cpu_noarch [j].len;
13437 p = output_message (stream, p, message, start, &left, name,
13438 len);
13439 }
13440
8a2c8fef
L
13441 *p = '\0';
13442 fprintf (stream, "%s\n", message);
13443}
13444
252b5132 13445void
8a2c8fef 13446md_show_usage (FILE *stream)
252b5132 13447{
4cc782b5
ILT
13448#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13449 fprintf (stream, _("\
d4693039 13450 -Qy, -Qn ignored\n\
a38cf1db 13451 -V print assembler version number\n\
b3b91714
AM
13452 -k ignored\n"));
13453#endif
13454 fprintf (stream, _("\
12b55ccc 13455 -n Do not optimize code alignment\n\
b3b91714
AM
13456 -q quieten some warnings\n"));
13457#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13458 fprintf (stream, _("\
a38cf1db 13459 -s ignored\n"));
b3b91714 13460#endif
d7f449c0
L
13461#if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13462 || defined (TE_PE) || defined (TE_PEP))
751d281c 13463 fprintf (stream, _("\
570561f7 13464 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
751d281c 13465#endif
b3b91714
AM
13466#ifdef SVR4_COMMENT_CHARS
13467 fprintf (stream, _("\
13468 --divide do not treat `/' as a comment character\n"));
a38cf1db
AM
13469#else
13470 fprintf (stream, _("\
b3b91714 13471 --divide ignored\n"));
4cc782b5 13472#endif
9103f4f4 13473 fprintf (stream, _("\
6305a203 13474 -march=CPU[,+EXTENSION...]\n\
8a2c8fef 13475 generate code for CPU and EXTENSION, CPU is one of:\n"));
1ded5609 13476 show_arch (stream, 0, 1);
8a2c8fef
L
13477 fprintf (stream, _("\
13478 EXTENSION is combination of:\n"));
1ded5609 13479 show_arch (stream, 1, 0);
6305a203 13480 fprintf (stream, _("\
8a2c8fef 13481 -mtune=CPU optimize for CPU, CPU is one of:\n"));
1ded5609 13482 show_arch (stream, 0, 0);
ba104c83 13483 fprintf (stream, _("\
c0f3af97
L
13484 -msse2avx encode SSE instructions with VEX prefix\n"));
13485 fprintf (stream, _("\
7c5c05ef 13486 -msse-check=[none|error|warning] (default: warning)\n\
daf50ae7
L
13487 check SSE instructions\n"));
13488 fprintf (stream, _("\
7c5c05ef 13489 -moperand-check=[none|error|warning] (default: warning)\n\
7bab8ab5
JB
13490 check operand combinations for validity\n"));
13491 fprintf (stream, _("\
7c5c05ef
L
13492 -mavxscalar=[128|256] (default: 128)\n\
13493 encode scalar AVX instructions with specific vector\n\
539f890d
L
13494 length\n"));
13495 fprintf (stream, _("\
03751133
L
13496 -mvexwig=[0|1] (default: 0)\n\
13497 encode VEX instructions with specific VEX.W value\n\
13498 for VEX.W bit ignored instructions\n"));
13499 fprintf (stream, _("\
7c5c05ef
L
13500 -mevexlig=[128|256|512] (default: 128)\n\
13501 encode scalar EVEX instructions with specific vector\n\
43234a1e
L
13502 length\n"));
13503 fprintf (stream, _("\
7c5c05ef
L
13504 -mevexwig=[0|1] (default: 0)\n\
13505 encode EVEX instructions with specific EVEX.W value\n\
43234a1e
L
13506 for EVEX.W bit ignored instructions\n"));
13507 fprintf (stream, _("\
7c5c05ef 13508 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
d3d3c6db
IT
13509 encode EVEX instructions with specific EVEX.RC value\n\
13510 for SAE-only ignored instructions\n"));
13511 fprintf (stream, _("\
7c5c05ef
L
13512 -mmnemonic=[att|intel] "));
13513 if (SYSV386_COMPAT)
13514 fprintf (stream, _("(default: att)\n"));
13515 else
13516 fprintf (stream, _("(default: intel)\n"));
13517 fprintf (stream, _("\
13518 use AT&T/Intel mnemonic\n"));
ba104c83 13519 fprintf (stream, _("\
7c5c05ef
L
13520 -msyntax=[att|intel] (default: att)\n\
13521 use AT&T/Intel syntax\n"));
ba104c83
L
13522 fprintf (stream, _("\
13523 -mindex-reg support pseudo index registers\n"));
13524 fprintf (stream, _("\
13525 -mnaked-reg don't require `%%' prefix for registers\n"));
13526 fprintf (stream, _("\
7e8b059b 13527 -madd-bnd-prefix add BND prefix for all valid branches\n"));
b4a3a7b4 13528#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8dcea932
L
13529 fprintf (stream, _("\
13530 -mshared disable branch optimization for shared code\n"));
b4a3a7b4
L
13531 fprintf (stream, _("\
13532 -mx86-used-note=[no|yes] "));
13533 if (DEFAULT_X86_USED_NOTE)
13534 fprintf (stream, _("(default: yes)\n"));
13535 else
13536 fprintf (stream, _("(default: no)\n"));
13537 fprintf (stream, _("\
13538 generate x86 used ISA and feature properties\n"));
13539#endif
13540#if defined (TE_PE) || defined (TE_PEP)
167ad85b
TG
13541 fprintf (stream, _("\
13542 -mbig-obj generate big object files\n"));
13543#endif
d022bddd 13544 fprintf (stream, _("\
7c5c05ef 13545 -momit-lock-prefix=[no|yes] (default: no)\n\
d022bddd 13546 strip all lock prefixes\n"));
5db04b09 13547 fprintf (stream, _("\
7c5c05ef 13548 -mfence-as-lock-add=[no|yes] (default: no)\n\
e4e00185
AS
13549 encode lfence, mfence and sfence as\n\
13550 lock addl $0x0, (%%{re}sp)\n"));
13551 fprintf (stream, _("\
7c5c05ef
L
13552 -mrelax-relocations=[no|yes] "));
13553 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13554 fprintf (stream, _("(default: yes)\n"));
13555 else
13556 fprintf (stream, _("(default: no)\n"));
13557 fprintf (stream, _("\
0cb4071e
L
13558 generate relax relocations\n"));
13559 fprintf (stream, _("\
e379e5f3
L
13560 -malign-branch-boundary=NUM (default: 0)\n\
13561 align branches within NUM byte boundary\n"));
13562 fprintf (stream, _("\
13563 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13564 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13565 indirect\n\
13566 specify types of branches to align\n"));
13567 fprintf (stream, _("\
13568 -malign-branch-prefix-size=NUM (default: 5)\n\
13569 align branches with NUM prefixes per instruction\n"));
13570 fprintf (stream, _("\
76cf450b
L
13571 -mbranches-within-32B-boundaries\n\
13572 align branches within 32 byte boundary\n"));
13573 fprintf (stream, _("\
ae531041
L
13574 -mlfence-after-load=[no|yes] (default: no)\n\
13575 generate lfence after load\n"));
13576 fprintf (stream, _("\
13577 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13578 generate lfence before indirect near branch\n"));
13579 fprintf (stream, _("\
a09f656b 13580 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
ae531041
L
13581 generate lfence before ret\n"));
13582 fprintf (stream, _("\
7c5c05ef 13583 -mamd64 accept only AMD64 ISA [default]\n"));
5db04b09
L
13584 fprintf (stream, _("\
13585 -mintel64 accept only Intel64 ISA\n"));
252b5132
RH
13586}
13587
3e73aa7c 13588#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
321098a5 13589 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
e57f8c65 13590 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
252b5132
RH
13591
13592/* Pick the target format to use. */
13593
47926f60 13594const char *
e3bb37b5 13595i386_target_format (void)
252b5132 13596{
351f65ca
L
13597 if (!strncmp (default_arch, "x86_64", 6))
13598 {
13599 update_code_flag (CODE_64BIT, 1);
13600 if (default_arch[6] == '\0')
7f56bc95 13601 x86_elf_abi = X86_64_ABI;
351f65ca 13602 else
7f56bc95 13603 x86_elf_abi = X86_64_X32_ABI;
351f65ca 13604 }
3e73aa7c 13605 else if (!strcmp (default_arch, "i386"))
78f12dd3 13606 update_code_flag (CODE_32BIT, 1);
5197d474
L
13607 else if (!strcmp (default_arch, "iamcu"))
13608 {
13609 update_code_flag (CODE_32BIT, 1);
13610 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13611 {
13612 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13613 cpu_arch_name = "iamcu";
13614 cpu_sub_arch_name = NULL;
13615 cpu_arch_flags = iamcu_flags;
13616 cpu_arch_isa = PROCESSOR_IAMCU;
13617 cpu_arch_isa_flags = iamcu_flags;
13618 if (!cpu_arch_tune_set)
13619 {
13620 cpu_arch_tune = cpu_arch_isa;
13621 cpu_arch_tune_flags = cpu_arch_isa_flags;
13622 }
13623 }
8d471ec1 13624 else if (cpu_arch_isa != PROCESSOR_IAMCU)
5197d474
L
13625 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13626 cpu_arch_name);
13627 }
3e73aa7c 13628 else
2b5d6a91 13629 as_fatal (_("unknown architecture"));
89507696
JB
13630
13631 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13632 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13633 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13634 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13635
252b5132
RH
13636 switch (OUTPUT_FLAVOR)
13637 {
9384f2ff 13638#if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
4c63da97 13639 case bfd_target_aout_flavour:
47926f60 13640 return AOUT_TARGET_FORMAT;
4c63da97 13641#endif
9384f2ff
AM
13642#if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13643# if defined (TE_PE) || defined (TE_PEP)
13644 case bfd_target_coff_flavour:
167ad85b
TG
13645 if (flag_code == CODE_64BIT)
13646 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13647 else
251dae91 13648 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
9384f2ff 13649# elif defined (TE_GO32)
0561d57c
JK
13650 case bfd_target_coff_flavour:
13651 return "coff-go32";
9384f2ff 13652# else
252b5132
RH
13653 case bfd_target_coff_flavour:
13654 return "coff-i386";
9384f2ff 13655# endif
4c63da97 13656#endif
3e73aa7c 13657#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
252b5132 13658 case bfd_target_elf_flavour:
3e73aa7c 13659 {
351f65ca
L
13660 const char *format;
13661
13662 switch (x86_elf_abi)
4fa24527 13663 {
351f65ca
L
13664 default:
13665 format = ELF_TARGET_FORMAT;
e379e5f3
L
13666#ifndef TE_SOLARIS
13667 tls_get_addr = "___tls_get_addr";
13668#endif
351f65ca 13669 break;
7f56bc95 13670 case X86_64_ABI:
351f65ca 13671 use_rela_relocations = 1;
4fa24527 13672 object_64bit = 1;
e379e5f3
L
13673#ifndef TE_SOLARIS
13674 tls_get_addr = "__tls_get_addr";
13675#endif
351f65ca
L
13676 format = ELF_TARGET_FORMAT64;
13677 break;
7f56bc95 13678 case X86_64_X32_ABI:
4fa24527 13679 use_rela_relocations = 1;
351f65ca 13680 object_64bit = 1;
e379e5f3
L
13681#ifndef TE_SOLARIS
13682 tls_get_addr = "__tls_get_addr";
13683#endif
862be3fb 13684 disallow_64bit_reloc = 1;
351f65ca
L
13685 format = ELF_TARGET_FORMAT32;
13686 break;
4fa24527 13687 }
3632d14b 13688 if (cpu_arch_isa == PROCESSOR_L1OM)
8a9036a4 13689 {
7f56bc95 13690 if (x86_elf_abi != X86_64_ABI)
8a9036a4
L
13691 as_fatal (_("Intel L1OM is 64bit only"));
13692 return ELF_TARGET_L1OM_FORMAT;
13693 }
b49f93f6 13694 else if (cpu_arch_isa == PROCESSOR_K1OM)
7a9068fe
L
13695 {
13696 if (x86_elf_abi != X86_64_ABI)
13697 as_fatal (_("Intel K1OM is 64bit only"));
13698 return ELF_TARGET_K1OM_FORMAT;
13699 }
81486035
L
13700 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13701 {
13702 if (x86_elf_abi != I386_ABI)
13703 as_fatal (_("Intel MCU is 32bit only"));
13704 return ELF_TARGET_IAMCU_FORMAT;
13705 }
8a9036a4 13706 else
351f65ca 13707 return format;
3e73aa7c 13708 }
e57f8c65
TG
13709#endif
13710#if defined (OBJ_MACH_O)
13711 case bfd_target_mach_o_flavour:
d382c579
TG
13712 if (flag_code == CODE_64BIT)
13713 {
13714 use_rela_relocations = 1;
13715 object_64bit = 1;
13716 return "mach-o-x86-64";
13717 }
13718 else
13719 return "mach-o-i386";
4c63da97 13720#endif
252b5132
RH
13721 default:
13722 abort ();
13723 return NULL;
13724 }
13725}
13726
47926f60 13727#endif /* OBJ_MAYBE_ more than one */
252b5132 13728\f
252b5132 13729symbolS *
7016a5d5 13730md_undefined_symbol (char *name)
252b5132 13731{
18dc2407
ILT
13732 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13733 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13734 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13735 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
24eab124
AM
13736 {
13737 if (!GOT_symbol)
13738 {
13739 if (symbol_find (name))
13740 as_bad (_("GOT already in symbol table"));
13741 GOT_symbol = symbol_new (name, undefined_section,
13742 (valueT) 0, &zero_address_frag);
13743 };
13744 return GOT_symbol;
13745 }
252b5132
RH
13746 return 0;
13747}
13748
13749/* Round up a section size to the appropriate boundary. */
47926f60 13750
252b5132 13751valueT
7016a5d5 13752md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
252b5132 13753{
4c63da97
AM
13754#if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13755 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13756 {
13757 /* For a.out, force the section size to be aligned. If we don't do
13758 this, BFD will align it for us, but it will not write out the
13759 final bytes of the section. This may be a bug in BFD, but it is
13760 easier to fix it here since that is how the other a.out targets
13761 work. */
13762 int align;
13763
fd361982 13764 align = bfd_section_alignment (segment);
8d3842cd 13765 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
4c63da97 13766 }
252b5132
RH
13767#endif
13768
13769 return size;
13770}
13771
13772/* On the i386, PC-relative offsets are relative to the start of the
13773 next instruction. That is, the address of the offset, plus its
13774 size, since the offset is always the last part of the insn. */
13775
13776long
e3bb37b5 13777md_pcrel_from (fixS *fixP)
252b5132
RH
13778{
13779 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13780}
13781
13782#ifndef I386COFF
13783
13784static void
e3bb37b5 13785s_bss (int ignore ATTRIBUTE_UNUSED)
252b5132 13786{
29b0f896 13787 int temp;
252b5132 13788
8a75718c
JB
13789#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13790 if (IS_ELF)
13791 obj_elf_section_change_hook ();
13792#endif
252b5132
RH
13793 temp = get_absolute_expression ();
13794 subseg_set (bss_section, (subsegT) temp);
13795 demand_empty_rest_of_line ();
13796}
13797
13798#endif
13799
e379e5f3
L
13800/* Remember constant directive. */
13801
13802void
13803i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13804{
13805 if (last_insn.kind != last_insn_directive
13806 && (bfd_section_flags (now_seg) & SEC_CODE))
13807 {
13808 last_insn.seg = now_seg;
13809 last_insn.kind = last_insn_directive;
13810 last_insn.name = "constant directive";
13811 last_insn.file = as_where (&last_insn.line);
ae531041
L
13812 if (lfence_before_ret != lfence_before_ret_none)
13813 {
13814 if (lfence_before_indirect_branch != lfence_branch_none)
13815 as_warn (_("constant directive skips -mlfence-before-ret "
13816 "and -mlfence-before-indirect-branch"));
13817 else
13818 as_warn (_("constant directive skips -mlfence-before-ret"));
13819 }
13820 else if (lfence_before_indirect_branch != lfence_branch_none)
13821 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
e379e5f3
L
13822 }
13823}
13824
252b5132 13825void
e3bb37b5 13826i386_validate_fix (fixS *fixp)
252b5132 13827{
02a86693 13828 if (fixp->fx_subsy)
252b5132 13829 {
02a86693 13830 if (fixp->fx_subsy == GOT_symbol)
23df1078 13831 {
02a86693
L
13832 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13833 {
13834 if (!object_64bit)
13835 abort ();
13836#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13837 if (fixp->fx_tcbit2)
56ceb5b5
L
13838 fixp->fx_r_type = (fixp->fx_tcbit
13839 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13840 : BFD_RELOC_X86_64_GOTPCRELX);
02a86693
L
13841 else
13842#endif
13843 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13844 }
d6ab8113 13845 else
02a86693
L
13846 {
13847 if (!object_64bit)
13848 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13849 else
13850 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13851 }
13852 fixp->fx_subsy = 0;
23df1078 13853 }
252b5132 13854 }
02a86693
L
13855#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13856 else if (!object_64bit)
13857 {
13858 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13859 && fixp->fx_tcbit2)
13860 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13861 }
13862#endif
252b5132
RH
13863}
13864
252b5132 13865arelent *
7016a5d5 13866tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
252b5132
RH
13867{
13868 arelent *rel;
13869 bfd_reloc_code_real_type code;
13870
13871 switch (fixp->fx_r_type)
13872 {
8ce3d284 13873#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8fd4256d
L
13874 case BFD_RELOC_SIZE32:
13875 case BFD_RELOC_SIZE64:
13876 if (S_IS_DEFINED (fixp->fx_addsy)
13877 && !S_IS_EXTERNAL (fixp->fx_addsy))
13878 {
13879 /* Resolve size relocation against local symbol to size of
13880 the symbol plus addend. */
13881 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13882 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13883 && !fits_in_unsigned_long (value))
13884 as_bad_where (fixp->fx_file, fixp->fx_line,
13885 _("symbol size computation overflow"));
13886 fixp->fx_addsy = NULL;
13887 fixp->fx_subsy = NULL;
13888 md_apply_fix (fixp, (valueT *) &value, NULL);
13889 return NULL;
13890 }
8ce3d284 13891#endif
1a0670f3 13892 /* Fall through. */
8fd4256d 13893
3e73aa7c
JH
13894 case BFD_RELOC_X86_64_PLT32:
13895 case BFD_RELOC_X86_64_GOT32:
13896 case BFD_RELOC_X86_64_GOTPCREL:
56ceb5b5
L
13897 case BFD_RELOC_X86_64_GOTPCRELX:
13898 case BFD_RELOC_X86_64_REX_GOTPCRELX:
252b5132
RH
13899 case BFD_RELOC_386_PLT32:
13900 case BFD_RELOC_386_GOT32:
02a86693 13901 case BFD_RELOC_386_GOT32X:
252b5132
RH
13902 case BFD_RELOC_386_GOTOFF:
13903 case BFD_RELOC_386_GOTPC:
13ae64f3
JJ
13904 case BFD_RELOC_386_TLS_GD:
13905 case BFD_RELOC_386_TLS_LDM:
13906 case BFD_RELOC_386_TLS_LDO_32:
13907 case BFD_RELOC_386_TLS_IE_32:
37e55690
JJ
13908 case BFD_RELOC_386_TLS_IE:
13909 case BFD_RELOC_386_TLS_GOTIE:
13ae64f3
JJ
13910 case BFD_RELOC_386_TLS_LE_32:
13911 case BFD_RELOC_386_TLS_LE:
67a4f2b7
AO
13912 case BFD_RELOC_386_TLS_GOTDESC:
13913 case BFD_RELOC_386_TLS_DESC_CALL:
bffbf940
JJ
13914 case BFD_RELOC_X86_64_TLSGD:
13915 case BFD_RELOC_X86_64_TLSLD:
13916 case BFD_RELOC_X86_64_DTPOFF32:
d6ab8113 13917 case BFD_RELOC_X86_64_DTPOFF64:
bffbf940
JJ
13918 case BFD_RELOC_X86_64_GOTTPOFF:
13919 case BFD_RELOC_X86_64_TPOFF32:
d6ab8113
JB
13920 case BFD_RELOC_X86_64_TPOFF64:
13921 case BFD_RELOC_X86_64_GOTOFF64:
13922 case BFD_RELOC_X86_64_GOTPC32:
7b81dfbb
AJ
13923 case BFD_RELOC_X86_64_GOT64:
13924 case BFD_RELOC_X86_64_GOTPCREL64:
13925 case BFD_RELOC_X86_64_GOTPC64:
13926 case BFD_RELOC_X86_64_GOTPLT64:
13927 case BFD_RELOC_X86_64_PLTOFF64:
67a4f2b7
AO
13928 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13929 case BFD_RELOC_X86_64_TLSDESC_CALL:
252b5132
RH
13930 case BFD_RELOC_RVA:
13931 case BFD_RELOC_VTABLE_ENTRY:
13932 case BFD_RELOC_VTABLE_INHERIT:
6482c264
NC
13933#ifdef TE_PE
13934 case BFD_RELOC_32_SECREL:
13935#endif
252b5132
RH
13936 code = fixp->fx_r_type;
13937 break;
dbbaec26
L
13938 case BFD_RELOC_X86_64_32S:
13939 if (!fixp->fx_pcrel)
13940 {
13941 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13942 code = fixp->fx_r_type;
13943 break;
13944 }
1a0670f3 13945 /* Fall through. */
252b5132 13946 default:
93382f6d 13947 if (fixp->fx_pcrel)
252b5132 13948 {
93382f6d
AM
13949 switch (fixp->fx_size)
13950 {
13951 default:
b091f402
AM
13952 as_bad_where (fixp->fx_file, fixp->fx_line,
13953 _("can not do %d byte pc-relative relocation"),
13954 fixp->fx_size);
93382f6d
AM
13955 code = BFD_RELOC_32_PCREL;
13956 break;
13957 case 1: code = BFD_RELOC_8_PCREL; break;
13958 case 2: code = BFD_RELOC_16_PCREL; break;
d258b828 13959 case 4: code = BFD_RELOC_32_PCREL; break;
d6ab8113
JB
13960#ifdef BFD64
13961 case 8: code = BFD_RELOC_64_PCREL; break;
13962#endif
93382f6d
AM
13963 }
13964 }
13965 else
13966 {
13967 switch (fixp->fx_size)
13968 {
13969 default:
b091f402
AM
13970 as_bad_where (fixp->fx_file, fixp->fx_line,
13971 _("can not do %d byte relocation"),
13972 fixp->fx_size);
93382f6d
AM
13973 code = BFD_RELOC_32;
13974 break;
13975 case 1: code = BFD_RELOC_8; break;
13976 case 2: code = BFD_RELOC_16; break;
13977 case 4: code = BFD_RELOC_32; break;
937149dd 13978#ifdef BFD64
3e73aa7c 13979 case 8: code = BFD_RELOC_64; break;
937149dd 13980#endif
93382f6d 13981 }
252b5132
RH
13982 }
13983 break;
13984 }
252b5132 13985
d182319b
JB
13986 if ((code == BFD_RELOC_32
13987 || code == BFD_RELOC_32_PCREL
13988 || code == BFD_RELOC_X86_64_32S)
252b5132
RH
13989 && GOT_symbol
13990 && fixp->fx_addsy == GOT_symbol)
3e73aa7c 13991 {
4fa24527 13992 if (!object_64bit)
d6ab8113
JB
13993 code = BFD_RELOC_386_GOTPC;
13994 else
13995 code = BFD_RELOC_X86_64_GOTPC32;
3e73aa7c 13996 }
7b81dfbb
AJ
13997 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13998 && GOT_symbol
13999 && fixp->fx_addsy == GOT_symbol)
14000 {
14001 code = BFD_RELOC_X86_64_GOTPC64;
14002 }
252b5132 14003
add39d23
TS
14004 rel = XNEW (arelent);
14005 rel->sym_ptr_ptr = XNEW (asymbol *);
49309057 14006 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
252b5132
RH
14007
14008 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
c87db184 14009
3e73aa7c
JH
14010 if (!use_rela_relocations)
14011 {
14012 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14013 vtable entry to be used in the relocation's section offset. */
14014 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14015 rel->address = fixp->fx_offset;
fbeb56a4
DK
14016#if defined (OBJ_COFF) && defined (TE_PE)
14017 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14018 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14019 else
14020#endif
c6682705 14021 rel->addend = 0;
3e73aa7c
JH
14022 }
14023 /* Use the rela in 64bit mode. */
252b5132 14024 else
3e73aa7c 14025 {
862be3fb
L
14026 if (disallow_64bit_reloc)
14027 switch (code)
14028 {
862be3fb
L
14029 case BFD_RELOC_X86_64_DTPOFF64:
14030 case BFD_RELOC_X86_64_TPOFF64:
14031 case BFD_RELOC_64_PCREL:
14032 case BFD_RELOC_X86_64_GOTOFF64:
14033 case BFD_RELOC_X86_64_GOT64:
14034 case BFD_RELOC_X86_64_GOTPCREL64:
14035 case BFD_RELOC_X86_64_GOTPC64:
14036 case BFD_RELOC_X86_64_GOTPLT64:
14037 case BFD_RELOC_X86_64_PLTOFF64:
14038 as_bad_where (fixp->fx_file, fixp->fx_line,
14039 _("cannot represent relocation type %s in x32 mode"),
14040 bfd_get_reloc_code_name (code));
14041 break;
14042 default:
14043 break;
14044 }
14045
062cd5e7
AS
14046 if (!fixp->fx_pcrel)
14047 rel->addend = fixp->fx_offset;
14048 else
14049 switch (code)
14050 {
14051 case BFD_RELOC_X86_64_PLT32:
14052 case BFD_RELOC_X86_64_GOT32:
14053 case BFD_RELOC_X86_64_GOTPCREL:
56ceb5b5
L
14054 case BFD_RELOC_X86_64_GOTPCRELX:
14055 case BFD_RELOC_X86_64_REX_GOTPCRELX:
bffbf940
JJ
14056 case BFD_RELOC_X86_64_TLSGD:
14057 case BFD_RELOC_X86_64_TLSLD:
14058 case BFD_RELOC_X86_64_GOTTPOFF:
67a4f2b7
AO
14059 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14060 case BFD_RELOC_X86_64_TLSDESC_CALL:
062cd5e7
AS
14061 rel->addend = fixp->fx_offset - fixp->fx_size;
14062 break;
14063 default:
14064 rel->addend = (section->vma
14065 - fixp->fx_size
14066 + fixp->fx_addnumber
14067 + md_pcrel_from (fixp));
14068 break;
14069 }
3e73aa7c
JH
14070 }
14071
252b5132
RH
14072 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14073 if (rel->howto == NULL)
14074 {
14075 as_bad_where (fixp->fx_file, fixp->fx_line,
d0b47220 14076 _("cannot represent relocation type %s"),
252b5132
RH
14077 bfd_get_reloc_code_name (code));
14078 /* Set howto to a garbage value so that we can keep going. */
14079 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
9c2799c2 14080 gas_assert (rel->howto != NULL);
252b5132
RH
14081 }
14082
14083 return rel;
14084}
14085
ee86248c 14086#include "tc-i386-intel.c"
54cfded0 14087
a60de03c
JB
14088void
14089tc_x86_parse_to_dw2regnum (expressionS *exp)
54cfded0 14090{
a60de03c
JB
14091 int saved_naked_reg;
14092 char saved_register_dot;
54cfded0 14093
a60de03c
JB
14094 saved_naked_reg = allow_naked_reg;
14095 allow_naked_reg = 1;
14096 saved_register_dot = register_chars['.'];
14097 register_chars['.'] = '.';
14098 allow_pseudo_reg = 1;
14099 expression_and_evaluate (exp);
14100 allow_pseudo_reg = 0;
14101 register_chars['.'] = saved_register_dot;
14102 allow_naked_reg = saved_naked_reg;
14103
e96d56a1 14104 if (exp->X_op == O_register && exp->X_add_number >= 0)
54cfded0 14105 {
a60de03c
JB
14106 if ((addressT) exp->X_add_number < i386_regtab_size)
14107 {
14108 exp->X_op = O_constant;
14109 exp->X_add_number = i386_regtab[exp->X_add_number]
14110 .dw2_regnum[flag_code >> 1];
14111 }
14112 else
14113 exp->X_op = O_illegal;
54cfded0 14114 }
54cfded0
AM
14115}
14116
14117void
14118tc_x86_frame_initial_instructions (void)
14119{
a60de03c
JB
14120 static unsigned int sp_regno[2];
14121
14122 if (!sp_regno[flag_code >> 1])
14123 {
14124 char *saved_input = input_line_pointer;
14125 char sp[][4] = {"esp", "rsp"};
14126 expressionS exp;
a4447b93 14127
a60de03c
JB
14128 input_line_pointer = sp[flag_code >> 1];
14129 tc_x86_parse_to_dw2regnum (&exp);
9c2799c2 14130 gas_assert (exp.X_op == O_constant);
a60de03c
JB
14131 sp_regno[flag_code >> 1] = exp.X_add_number;
14132 input_line_pointer = saved_input;
14133 }
a4447b93 14134
61ff971f
L
14135 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14136 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
54cfded0 14137}
d2b2c203 14138
d7921315
L
14139int
14140x86_dwarf2_addr_size (void)
14141{
14142#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14143 if (x86_elf_abi == X86_64_X32_ABI)
14144 return 4;
14145#endif
14146 return bfd_arch_bits_per_address (stdoutput) / 8;
14147}
14148
d2b2c203
DJ
14149int
14150i386_elf_section_type (const char *str, size_t len)
14151{
14152 if (flag_code == CODE_64BIT
14153 && len == sizeof ("unwind") - 1
14154 && strncmp (str, "unwind", 6) == 0)
14155 return SHT_X86_64_UNWIND;
14156
14157 return -1;
14158}
bb41ade5 14159
ad5fec3b
EB
14160#ifdef TE_SOLARIS
14161void
14162i386_solaris_fix_up_eh_frame (segT sec)
14163{
14164 if (flag_code == CODE_64BIT)
14165 elf_section_type (sec) = SHT_X86_64_UNWIND;
14166}
14167#endif
14168
bb41ade5
AM
14169#ifdef TE_PE
14170void
14171tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14172{
91d6fa6a 14173 expressionS exp;
bb41ade5 14174
91d6fa6a
NC
14175 exp.X_op = O_secrel;
14176 exp.X_add_symbol = symbol;
14177 exp.X_add_number = 0;
14178 emit_expr (&exp, size);
bb41ade5
AM
14179}
14180#endif
3b22753a
L
14181
14182#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14183/* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14184
01e1a5bc 14185bfd_vma
6d4af3c2 14186x86_64_section_letter (int letter, const char **ptr_msg)
3b22753a
L
14187{
14188 if (flag_code == CODE_64BIT)
14189 {
14190 if (letter == 'l')
14191 return SHF_X86_64_LARGE;
14192
8f3bae45 14193 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
64e74474 14194 }
3b22753a 14195 else
8f3bae45 14196 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
3b22753a
L
14197 return -1;
14198}
14199
01e1a5bc 14200bfd_vma
3b22753a
L
14201x86_64_section_word (char *str, size_t len)
14202{
8620418b 14203 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
3b22753a
L
14204 return SHF_X86_64_LARGE;
14205
14206 return -1;
14207}
14208
14209static void
14210handle_large_common (int small ATTRIBUTE_UNUSED)
14211{
14212 if (flag_code != CODE_64BIT)
14213 {
14214 s_comm_internal (0, elf_common_parse);
14215 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14216 }
14217 else
14218 {
14219 static segT lbss_section;
14220 asection *saved_com_section_ptr = elf_com_section_ptr;
14221 asection *saved_bss_section = bss_section;
14222
14223 if (lbss_section == NULL)
14224 {
14225 flagword applicable;
14226 segT seg = now_seg;
14227 subsegT subseg = now_subseg;
14228
14229 /* The .lbss section is for local .largecomm symbols. */
14230 lbss_section = subseg_new (".lbss", 0);
14231 applicable = bfd_applicable_section_flags (stdoutput);
fd361982 14232 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
3b22753a
L
14233 seg_info (lbss_section)->bss = 1;
14234
14235 subseg_set (seg, subseg);
14236 }
14237
14238 elf_com_section_ptr = &_bfd_elf_large_com_section;
14239 bss_section = lbss_section;
14240
14241 s_comm_internal (0, elf_common_parse);
14242
14243 elf_com_section_ptr = saved_com_section_ptr;
14244 bss_section = saved_bss_section;
14245 }
14246}
14247#endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 2.489683 seconds and 4 git commands to generate.