147acdfa36c73343ac692d122640c6c60b0daf89
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
3 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011,
4 2012, 2013, 2014
5 Free Software Foundation, Inc.
6
7 This file is part of GAS, the GNU Assembler.
8
9 GAS is free software; you can redistribute it and/or modify
10 it under the terms of the GNU General Public License as published by
11 the Free Software Foundation; either version 3, or (at your option)
12 any later version.
13
14 GAS is distributed in the hope that it will be useful,
15 but WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 GNU General Public License for more details.
18
19 You should have received a copy of the GNU General Public License
20 along with GAS; see the file COPYING. If not, write to the Free
21 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
22 02110-1301, USA. */
23
24 /* Intel 80386 machine specific gas.
25 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
26 x86_64 support by Jan Hubicka (jh@suse.cz)
27 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
28 Bugs & suggestions are completely welcome. This is free software.
29 Please help us make it better. */
30
31 #include "as.h"
32 #include "safe-ctype.h"
33 #include "subsegs.h"
34 #include "dwarf2dbg.h"
35 #include "dw2gencfi.h"
36 #include "elf/x86-64.h"
37 #include "opcodes/i386-init.h"
38
39 #ifndef REGISTER_WARNINGS
40 #define REGISTER_WARNINGS 1
41 #endif
42
43 #ifndef INFER_ADDR_PREFIX
44 #define INFER_ADDR_PREFIX 1
45 #endif
46
47 #ifndef DEFAULT_ARCH
48 #define DEFAULT_ARCH "i386"
49 #endif
50
51 #ifndef INLINE
52 #if __GNUC__ >= 2
53 #define INLINE __inline__
54 #else
55 #define INLINE
56 #endif
57 #endif
58
59 /* Prefixes will be emitted in the order defined below.
60 WAIT_PREFIX must be the first prefix since FWAIT is really is an
61 instruction, and so must come before any prefixes.
62 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
63 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
64 #define WAIT_PREFIX 0
65 #define SEG_PREFIX 1
66 #define ADDR_PREFIX 2
67 #define DATA_PREFIX 3
68 #define REP_PREFIX 4
69 #define HLE_PREFIX REP_PREFIX
70 #define BND_PREFIX REP_PREFIX
71 #define LOCK_PREFIX 5
72 #define REX_PREFIX 6 /* must come last. */
73 #define MAX_PREFIXES 7 /* max prefixes per opcode */
74
75 /* we define the syntax here (modulo base,index,scale syntax) */
76 #define REGISTER_PREFIX '%'
77 #define IMMEDIATE_PREFIX '$'
78 #define ABSOLUTE_PREFIX '*'
79
80 /* these are the instruction mnemonic suffixes in AT&T syntax or
81 memory operand size in Intel syntax. */
82 #define WORD_MNEM_SUFFIX 'w'
83 #define BYTE_MNEM_SUFFIX 'b'
84 #define SHORT_MNEM_SUFFIX 's'
85 #define LONG_MNEM_SUFFIX 'l'
86 #define QWORD_MNEM_SUFFIX 'q'
87 #define XMMWORD_MNEM_SUFFIX 'x'
88 #define YMMWORD_MNEM_SUFFIX 'y'
89 #define ZMMWORD_MNEM_SUFFIX 'z'
90 /* Intel Syntax. Use a non-ascii letter since since it never appears
91 in instructions. */
92 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
93
94 #define END_OF_INSN '\0'
95
96 /*
97 'templates' is for grouping together 'template' structures for opcodes
98 of the same name. This is only used for storing the insns in the grand
99 ole hash table of insns.
100 The templates themselves start at START and range up to (but not including)
101 END.
102 */
103 typedef struct
104 {
105 const insn_template *start;
106 const insn_template *end;
107 }
108 templates;
109
110 /* 386 operand encoding bytes: see 386 book for details of this. */
111 typedef struct
112 {
113 unsigned int regmem; /* codes register or memory operand */
114 unsigned int reg; /* codes register operand (or extended opcode) */
115 unsigned int mode; /* how to interpret regmem & reg */
116 }
117 modrm_byte;
118
119 /* x86-64 extension prefix. */
120 typedef int rex_byte;
121
122 /* 386 opcode byte to code indirect addressing. */
123 typedef struct
124 {
125 unsigned base;
126 unsigned index;
127 unsigned scale;
128 }
129 sib_byte;
130
131 /* x86 arch names, types and features */
132 typedef struct
133 {
134 const char *name; /* arch name */
135 unsigned int len; /* arch string length */
136 enum processor_type type; /* arch type */
137 i386_cpu_flags flags; /* cpu feature flags */
138 unsigned int skip; /* show_arch should skip this. */
139 unsigned int negated; /* turn off indicated flags. */
140 }
141 arch_entry;
142
143 static void update_code_flag (int, int);
144 static void set_code_flag (int);
145 static void set_16bit_gcc_code_flag (int);
146 static void set_intel_syntax (int);
147 static void set_intel_mnemonic (int);
148 static void set_allow_index_reg (int);
149 static void set_check (int);
150 static void set_cpu_arch (int);
151 #ifdef TE_PE
152 static void pe_directive_secrel (int);
153 #endif
154 static void signed_cons (int);
155 static char *output_invalid (int c);
156 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
157 const char *);
158 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
159 const char *);
160 static int i386_att_operand (char *);
161 static int i386_intel_operand (char *, int);
162 static int i386_intel_simplify (expressionS *);
163 static int i386_intel_parse_name (const char *, expressionS *);
164 static const reg_entry *parse_register (char *, char **);
165 static char *parse_insn (char *, char *);
166 static char *parse_operands (char *, const char *);
167 static void swap_operands (void);
168 static void swap_2_operands (int, int);
169 static void optimize_imm (void);
170 static void optimize_disp (void);
171 static const insn_template *match_template (void);
172 static int check_string (void);
173 static int process_suffix (void);
174 static int check_byte_reg (void);
175 static int check_long_reg (void);
176 static int check_qword_reg (void);
177 static int check_word_reg (void);
178 static int finalize_imm (void);
179 static int process_operands (void);
180 static const seg_entry *build_modrm_byte (void);
181 static void output_insn (void);
182 static void output_imm (fragS *, offsetT);
183 static void output_disp (fragS *, offsetT);
184 #ifndef I386COFF
185 static void s_bss (int);
186 #endif
187 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
188 static void handle_large_common (int small ATTRIBUTE_UNUSED);
189 #endif
190
191 static const char *default_arch = DEFAULT_ARCH;
192
193 /* This struct describes rounding control and SAE in the instruction. */
194 struct RC_Operation
195 {
196 enum rc_type
197 {
198 rne = 0,
199 rd,
200 ru,
201 rz,
202 saeonly
203 } type;
204 int operand;
205 };
206
207 static struct RC_Operation rc_op;
208
209 /* The struct describes masking, applied to OPERAND in the instruction.
210 MASK is a pointer to the corresponding mask register. ZEROING tells
211 whether merging or zeroing mask is used. */
212 struct Mask_Operation
213 {
214 const reg_entry *mask;
215 unsigned int zeroing;
216 /* The operand where this operation is associated. */
217 int operand;
218 };
219
220 static struct Mask_Operation mask_op;
221
222 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
223 broadcast factor. */
224 struct Broadcast_Operation
225 {
226 /* Type of broadcast: no broadcast, {1to8}, or {1to16}. */
227 int type;
228
229 /* Index of broadcasted operand. */
230 int operand;
231 };
232
233 static struct Broadcast_Operation broadcast_op;
234
235 /* VEX prefix. */
236 typedef struct
237 {
238 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
239 unsigned char bytes[4];
240 unsigned int length;
241 /* Destination or source register specifier. */
242 const reg_entry *register_specifier;
243 } vex_prefix;
244
245 /* 'md_assemble ()' gathers together information and puts it into a
246 i386_insn. */
247
248 union i386_op
249 {
250 expressionS *disps;
251 expressionS *imms;
252 const reg_entry *regs;
253 };
254
255 enum i386_error
256 {
257 operand_size_mismatch,
258 operand_type_mismatch,
259 register_type_mismatch,
260 number_of_operands_mismatch,
261 invalid_instruction_suffix,
262 bad_imm4,
263 old_gcc_only,
264 unsupported_with_intel_mnemonic,
265 unsupported_syntax,
266 unsupported,
267 invalid_vsib_address,
268 invalid_vector_register_set,
269 unsupported_vector_index_register,
270 unsupported_broadcast,
271 broadcast_not_on_src_operand,
272 broadcast_needed,
273 unsupported_masking,
274 mask_not_on_destination,
275 no_default_mask,
276 unsupported_rc_sae,
277 rc_sae_operand_not_last_imm,
278 invalid_register_operand,
279 try_vector_disp8
280 };
281
282 struct _i386_insn
283 {
284 /* TM holds the template for the insn were currently assembling. */
285 insn_template tm;
286
287 /* SUFFIX holds the instruction size suffix for byte, word, dword
288 or qword, if given. */
289 char suffix;
290
291 /* OPERANDS gives the number of given operands. */
292 unsigned int operands;
293
294 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
295 of given register, displacement, memory operands and immediate
296 operands. */
297 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
298
299 /* TYPES [i] is the type (see above #defines) which tells us how to
300 use OP[i] for the corresponding operand. */
301 i386_operand_type types[MAX_OPERANDS];
302
303 /* Displacement expression, immediate expression, or register for each
304 operand. */
305 union i386_op op[MAX_OPERANDS];
306
307 /* Flags for operands. */
308 unsigned int flags[MAX_OPERANDS];
309 #define Operand_PCrel 1
310
311 /* Relocation type for operand */
312 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
313
314 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
315 the base index byte below. */
316 const reg_entry *base_reg;
317 const reg_entry *index_reg;
318 unsigned int log2_scale_factor;
319
320 /* SEG gives the seg_entries of this insn. They are zero unless
321 explicit segment overrides are given. */
322 const seg_entry *seg[2];
323
324 /* PREFIX holds all the given prefix opcodes (usually null).
325 PREFIXES is the number of prefix opcodes. */
326 unsigned int prefixes;
327 unsigned char prefix[MAX_PREFIXES];
328
329 /* RM and SIB are the modrm byte and the sib byte where the
330 addressing modes of this insn are encoded. */
331 modrm_byte rm;
332 rex_byte rex;
333 rex_byte vrex;
334 sib_byte sib;
335 vex_prefix vex;
336
337 /* Masking attributes. */
338 struct Mask_Operation *mask;
339
340 /* Rounding control and SAE attributes. */
341 struct RC_Operation *rounding;
342
343 /* Broadcasting attributes. */
344 struct Broadcast_Operation *broadcast;
345
346 /* Compressed disp8*N attribute. */
347 unsigned int memshift;
348
349 /* Swap operand in encoding. */
350 unsigned int swap_operand;
351
352 /* Prefer 8bit or 32bit displacement in encoding. */
353 enum
354 {
355 disp_encoding_default = 0,
356 disp_encoding_8bit,
357 disp_encoding_32bit
358 } disp_encoding;
359
360 /* REP prefix. */
361 const char *rep_prefix;
362
363 /* HLE prefix. */
364 const char *hle_prefix;
365
366 /* Have BND prefix. */
367 const char *bnd_prefix;
368
369 /* Need VREX to support upper 16 registers. */
370 int need_vrex;
371
372 /* Error message. */
373 enum i386_error error;
374 };
375
376 typedef struct _i386_insn i386_insn;
377
378 /* Link RC type with corresponding string, that'll be looked for in
379 asm. */
380 struct RC_name
381 {
382 enum rc_type type;
383 const char *name;
384 unsigned int len;
385 };
386
387 static const struct RC_name RC_NamesTable[] =
388 {
389 { rne, STRING_COMMA_LEN ("rn-sae") },
390 { rd, STRING_COMMA_LEN ("rd-sae") },
391 { ru, STRING_COMMA_LEN ("ru-sae") },
392 { rz, STRING_COMMA_LEN ("rz-sae") },
393 { saeonly, STRING_COMMA_LEN ("sae") },
394 };
395
396 /* List of chars besides those in app.c:symbol_chars that can start an
397 operand. Used to prevent the scrubber eating vital white-space. */
398 const char extra_symbol_chars[] = "*%-([{"
399 #ifdef LEX_AT
400 "@"
401 #endif
402 #ifdef LEX_QM
403 "?"
404 #endif
405 ;
406
407 #if (defined (TE_I386AIX) \
408 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
409 && !defined (TE_GNU) \
410 && !defined (TE_LINUX) \
411 && !defined (TE_NACL) \
412 && !defined (TE_NETWARE) \
413 && !defined (TE_FreeBSD) \
414 && !defined (TE_DragonFly) \
415 && !defined (TE_NetBSD)))
416 /* This array holds the chars that always start a comment. If the
417 pre-processor is disabled, these aren't very useful. The option
418 --divide will remove '/' from this list. */
419 const char *i386_comment_chars = "#/";
420 #define SVR4_COMMENT_CHARS 1
421 #define PREFIX_SEPARATOR '\\'
422
423 #else
424 const char *i386_comment_chars = "#";
425 #define PREFIX_SEPARATOR '/'
426 #endif
427
428 /* This array holds the chars that only start a comment at the beginning of
429 a line. If the line seems to have the form '# 123 filename'
430 .line and .file directives will appear in the pre-processed output.
431 Note that input_file.c hand checks for '#' at the beginning of the
432 first line of the input file. This is because the compiler outputs
433 #NO_APP at the beginning of its output.
434 Also note that comments started like this one will always work if
435 '/' isn't otherwise defined. */
436 const char line_comment_chars[] = "#/";
437
438 const char line_separator_chars[] = ";";
439
440 /* Chars that can be used to separate mant from exp in floating point
441 nums. */
442 const char EXP_CHARS[] = "eE";
443
444 /* Chars that mean this number is a floating point constant
445 As in 0f12.456
446 or 0d1.2345e12. */
447 const char FLT_CHARS[] = "fFdDxX";
448
449 /* Tables for lexical analysis. */
450 static char mnemonic_chars[256];
451 static char register_chars[256];
452 static char operand_chars[256];
453 static char identifier_chars[256];
454 static char digit_chars[256];
455
456 /* Lexical macros. */
457 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
458 #define is_operand_char(x) (operand_chars[(unsigned char) x])
459 #define is_register_char(x) (register_chars[(unsigned char) x])
460 #define is_space_char(x) ((x) == ' ')
461 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
462 #define is_digit_char(x) (digit_chars[(unsigned char) x])
463
464 /* All non-digit non-letter characters that may occur in an operand. */
465 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
466
467 /* md_assemble() always leaves the strings it's passed unaltered. To
468 effect this we maintain a stack of saved characters that we've smashed
469 with '\0's (indicating end of strings for various sub-fields of the
470 assembler instruction). */
471 static char save_stack[32];
472 static char *save_stack_p;
473 #define END_STRING_AND_SAVE(s) \
474 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
475 #define RESTORE_END_STRING(s) \
476 do { *(s) = *--save_stack_p; } while (0)
477
478 /* The instruction we're assembling. */
479 static i386_insn i;
480
481 /* Possible templates for current insn. */
482 static const templates *current_templates;
483
484 /* Per instruction expressionS buffers: max displacements & immediates. */
485 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
486 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
487
488 /* Current operand we are working on. */
489 static int this_operand = -1;
490
491 /* We support four different modes. FLAG_CODE variable is used to distinguish
492 these. */
493
494 enum flag_code {
495 CODE_32BIT,
496 CODE_16BIT,
497 CODE_64BIT };
498
499 static enum flag_code flag_code;
500 static unsigned int object_64bit;
501 static unsigned int disallow_64bit_reloc;
502 static int use_rela_relocations = 0;
503
504 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
505 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
506 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
507
508 /* The ELF ABI to use. */
509 enum x86_elf_abi
510 {
511 I386_ABI,
512 X86_64_ABI,
513 X86_64_X32_ABI
514 };
515
516 static enum x86_elf_abi x86_elf_abi = I386_ABI;
517 #endif
518
519 /* 1 for intel syntax,
520 0 if att syntax. */
521 static int intel_syntax = 0;
522
523 /* 1 for intel mnemonic,
524 0 if att mnemonic. */
525 static int intel_mnemonic = !SYSV386_COMPAT;
526
527 /* 1 if support old (<= 2.8.1) versions of gcc. */
528 static int old_gcc = OLDGCC_COMPAT;
529
530 /* 1 if pseudo registers are permitted. */
531 static int allow_pseudo_reg = 0;
532
533 /* 1 if register prefix % not required. */
534 static int allow_naked_reg = 0;
535
536 /* 1 if the assembler should add BND prefix for all control-tranferring
537 instructions supporting it, even if this prefix wasn't specified
538 explicitly. */
539 static int add_bnd_prefix = 0;
540
541 /* 1 if pseudo index register, eiz/riz, is allowed . */
542 static int allow_index_reg = 0;
543
544 static enum check_kind
545 {
546 check_none = 0,
547 check_warning,
548 check_error
549 }
550 sse_check, operand_check = check_warning;
551
552 /* Register prefix used for error message. */
553 static const char *register_prefix = "%";
554
555 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
556 leave, push, and pop instructions so that gcc has the same stack
557 frame as in 32 bit mode. */
558 static char stackop_size = '\0';
559
560 /* Non-zero to optimize code alignment. */
561 int optimize_align_code = 1;
562
563 /* Non-zero to quieten some warnings. */
564 static int quiet_warnings = 0;
565
566 /* CPU name. */
567 static const char *cpu_arch_name = NULL;
568 static char *cpu_sub_arch_name = NULL;
569
570 /* CPU feature flags. */
571 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
572
573 /* If we have selected a cpu we are generating instructions for. */
574 static int cpu_arch_tune_set = 0;
575
576 /* Cpu we are generating instructions for. */
577 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
578
579 /* CPU feature flags of cpu we are generating instructions for. */
580 static i386_cpu_flags cpu_arch_tune_flags;
581
582 /* CPU instruction set architecture used. */
583 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
584
585 /* CPU feature flags of instruction set architecture used. */
586 i386_cpu_flags cpu_arch_isa_flags;
587
588 /* If set, conditional jumps are not automatically promoted to handle
589 larger than a byte offset. */
590 static unsigned int no_cond_jump_promotion = 0;
591
592 /* Encode SSE instructions with VEX prefix. */
593 static unsigned int sse2avx;
594
595 /* Encode scalar AVX instructions with specific vector length. */
596 static enum
597 {
598 vex128 = 0,
599 vex256
600 } avxscalar;
601
602 /* Encode scalar EVEX LIG instructions with specific vector length. */
603 static enum
604 {
605 evexl128 = 0,
606 evexl256,
607 evexl512
608 } evexlig;
609
610 /* Encode EVEX WIG instructions with specific evex.w. */
611 static enum
612 {
613 evexw0 = 0,
614 evexw1
615 } evexwig;
616
617 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
618 static symbolS *GOT_symbol;
619
620 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
621 unsigned int x86_dwarf2_return_column;
622
623 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
624 int x86_cie_data_alignment;
625
626 /* Interface to relax_segment.
627 There are 3 major relax states for 386 jump insns because the
628 different types of jumps add different sizes to frags when we're
629 figuring out what sort of jump to choose to reach a given label. */
630
631 /* Types. */
632 #define UNCOND_JUMP 0
633 #define COND_JUMP 1
634 #define COND_JUMP86 2
635
636 /* Sizes. */
637 #define CODE16 1
638 #define SMALL 0
639 #define SMALL16 (SMALL | CODE16)
640 #define BIG 2
641 #define BIG16 (BIG | CODE16)
642
643 #ifndef INLINE
644 #ifdef __GNUC__
645 #define INLINE __inline__
646 #else
647 #define INLINE
648 #endif
649 #endif
650
651 #define ENCODE_RELAX_STATE(type, size) \
652 ((relax_substateT) (((type) << 2) | (size)))
653 #define TYPE_FROM_RELAX_STATE(s) \
654 ((s) >> 2)
655 #define DISP_SIZE_FROM_RELAX_STATE(s) \
656 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
657
658 /* This table is used by relax_frag to promote short jumps to long
659 ones where necessary. SMALL (short) jumps may be promoted to BIG
660 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
661 don't allow a short jump in a 32 bit code segment to be promoted to
662 a 16 bit offset jump because it's slower (requires data size
663 prefix), and doesn't work, unless the destination is in the bottom
664 64k of the code segment (The top 16 bits of eip are zeroed). */
665
666 const relax_typeS md_relax_table[] =
667 {
668 /* The fields are:
669 1) most positive reach of this state,
670 2) most negative reach of this state,
671 3) how many bytes this mode will have in the variable part of the frag
672 4) which index into the table to try if we can't fit into this one. */
673
674 /* UNCOND_JUMP states. */
675 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
676 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
677 /* dword jmp adds 4 bytes to frag:
678 0 extra opcode bytes, 4 displacement bytes. */
679 {0, 0, 4, 0},
680 /* word jmp adds 2 byte2 to frag:
681 0 extra opcode bytes, 2 displacement bytes. */
682 {0, 0, 2, 0},
683
684 /* COND_JUMP states. */
685 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
686 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
687 /* dword conditionals adds 5 bytes to frag:
688 1 extra opcode byte, 4 displacement bytes. */
689 {0, 0, 5, 0},
690 /* word conditionals add 3 bytes to frag:
691 1 extra opcode byte, 2 displacement bytes. */
692 {0, 0, 3, 0},
693
694 /* COND_JUMP86 states. */
695 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
696 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
697 /* dword conditionals adds 5 bytes to frag:
698 1 extra opcode byte, 4 displacement bytes. */
699 {0, 0, 5, 0},
700 /* word conditionals add 4 bytes to frag:
701 1 displacement byte and a 3 byte long branch insn. */
702 {0, 0, 4, 0}
703 };
704
705 static const arch_entry cpu_arch[] =
706 {
707 /* Do not replace the first two entries - i386_target_format()
708 relies on them being there in this order. */
709 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
710 CPU_GENERIC32_FLAGS, 0, 0 },
711 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
712 CPU_GENERIC64_FLAGS, 0, 0 },
713 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
714 CPU_NONE_FLAGS, 0, 0 },
715 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
716 CPU_I186_FLAGS, 0, 0 },
717 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
718 CPU_I286_FLAGS, 0, 0 },
719 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
720 CPU_I386_FLAGS, 0, 0 },
721 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
722 CPU_I486_FLAGS, 0, 0 },
723 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
724 CPU_I586_FLAGS, 0, 0 },
725 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
726 CPU_I686_FLAGS, 0, 0 },
727 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
728 CPU_I586_FLAGS, 0, 0 },
729 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
730 CPU_PENTIUMPRO_FLAGS, 0, 0 },
731 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
732 CPU_P2_FLAGS, 0, 0 },
733 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
734 CPU_P3_FLAGS, 0, 0 },
735 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
736 CPU_P4_FLAGS, 0, 0 },
737 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
738 CPU_CORE_FLAGS, 0, 0 },
739 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
740 CPU_NOCONA_FLAGS, 0, 0 },
741 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
742 CPU_CORE_FLAGS, 1, 0 },
743 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
744 CPU_CORE_FLAGS, 0, 0 },
745 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
746 CPU_CORE2_FLAGS, 1, 0 },
747 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
748 CPU_CORE2_FLAGS, 0, 0 },
749 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
750 CPU_COREI7_FLAGS, 0, 0 },
751 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
752 CPU_L1OM_FLAGS, 0, 0 },
753 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
754 CPU_K1OM_FLAGS, 0, 0 },
755 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
756 CPU_K6_FLAGS, 0, 0 },
757 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
758 CPU_K6_2_FLAGS, 0, 0 },
759 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
760 CPU_ATHLON_FLAGS, 0, 0 },
761 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
762 CPU_K8_FLAGS, 1, 0 },
763 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
764 CPU_K8_FLAGS, 0, 0 },
765 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
766 CPU_K8_FLAGS, 0, 0 },
767 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
768 CPU_AMDFAM10_FLAGS, 0, 0 },
769 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
770 CPU_BDVER1_FLAGS, 0, 0 },
771 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
772 CPU_BDVER2_FLAGS, 0, 0 },
773 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
774 CPU_BDVER3_FLAGS, 0, 0 },
775 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
776 CPU_BDVER4_FLAGS, 0, 0 },
777 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
778 CPU_BTVER1_FLAGS, 0, 0 },
779 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
780 CPU_BTVER2_FLAGS, 0, 0 },
781 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
782 CPU_8087_FLAGS, 0, 0 },
783 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
784 CPU_287_FLAGS, 0, 0 },
785 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
786 CPU_387_FLAGS, 0, 0 },
787 { STRING_COMMA_LEN (".no87"), PROCESSOR_UNKNOWN,
788 CPU_ANY87_FLAGS, 0, 1 },
789 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
790 CPU_MMX_FLAGS, 0, 0 },
791 { STRING_COMMA_LEN (".nommx"), PROCESSOR_UNKNOWN,
792 CPU_3DNOWA_FLAGS, 0, 1 },
793 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
794 CPU_SSE_FLAGS, 0, 0 },
795 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
796 CPU_SSE2_FLAGS, 0, 0 },
797 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
798 CPU_SSE3_FLAGS, 0, 0 },
799 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
800 CPU_SSSE3_FLAGS, 0, 0 },
801 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
802 CPU_SSE4_1_FLAGS, 0, 0 },
803 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
804 CPU_SSE4_2_FLAGS, 0, 0 },
805 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
806 CPU_SSE4_2_FLAGS, 0, 0 },
807 { STRING_COMMA_LEN (".nosse"), PROCESSOR_UNKNOWN,
808 CPU_ANY_SSE_FLAGS, 0, 1 },
809 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
810 CPU_AVX_FLAGS, 0, 0 },
811 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
812 CPU_AVX2_FLAGS, 0, 0 },
813 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
814 CPU_AVX512F_FLAGS, 0, 0 },
815 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
816 CPU_AVX512CD_FLAGS, 0, 0 },
817 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
818 CPU_AVX512ER_FLAGS, 0, 0 },
819 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
820 CPU_AVX512PF_FLAGS, 0, 0 },
821 { STRING_COMMA_LEN (".noavx"), PROCESSOR_UNKNOWN,
822 CPU_ANY_AVX_FLAGS, 0, 1 },
823 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
824 CPU_VMX_FLAGS, 0, 0 },
825 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
826 CPU_VMFUNC_FLAGS, 0, 0 },
827 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
828 CPU_SMX_FLAGS, 0, 0 },
829 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
830 CPU_XSAVE_FLAGS, 0, 0 },
831 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
832 CPU_XSAVEOPT_FLAGS, 0, 0 },
833 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
834 CPU_AES_FLAGS, 0, 0 },
835 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
836 CPU_PCLMUL_FLAGS, 0, 0 },
837 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
838 CPU_PCLMUL_FLAGS, 1, 0 },
839 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
840 CPU_FSGSBASE_FLAGS, 0, 0 },
841 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
842 CPU_RDRND_FLAGS, 0, 0 },
843 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
844 CPU_F16C_FLAGS, 0, 0 },
845 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
846 CPU_BMI2_FLAGS, 0, 0 },
847 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
848 CPU_FMA_FLAGS, 0, 0 },
849 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
850 CPU_FMA4_FLAGS, 0, 0 },
851 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
852 CPU_XOP_FLAGS, 0, 0 },
853 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
854 CPU_LWP_FLAGS, 0, 0 },
855 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
856 CPU_MOVBE_FLAGS, 0, 0 },
857 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
858 CPU_CX16_FLAGS, 0, 0 },
859 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
860 CPU_EPT_FLAGS, 0, 0 },
861 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
862 CPU_LZCNT_FLAGS, 0, 0 },
863 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
864 CPU_HLE_FLAGS, 0, 0 },
865 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
866 CPU_RTM_FLAGS, 0, 0 },
867 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
868 CPU_INVPCID_FLAGS, 0, 0 },
869 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
870 CPU_CLFLUSH_FLAGS, 0, 0 },
871 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
872 CPU_NOP_FLAGS, 0, 0 },
873 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
874 CPU_SYSCALL_FLAGS, 0, 0 },
875 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
876 CPU_RDTSCP_FLAGS, 0, 0 },
877 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
878 CPU_3DNOW_FLAGS, 0, 0 },
879 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
880 CPU_3DNOWA_FLAGS, 0, 0 },
881 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
882 CPU_PADLOCK_FLAGS, 0, 0 },
883 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
884 CPU_SVME_FLAGS, 1, 0 },
885 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
886 CPU_SVME_FLAGS, 0, 0 },
887 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
888 CPU_SSE4A_FLAGS, 0, 0 },
889 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
890 CPU_ABM_FLAGS, 0, 0 },
891 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
892 CPU_BMI_FLAGS, 0, 0 },
893 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
894 CPU_TBM_FLAGS, 0, 0 },
895 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
896 CPU_ADX_FLAGS, 0, 0 },
897 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
898 CPU_RDSEED_FLAGS, 0, 0 },
899 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
900 CPU_PRFCHW_FLAGS, 0, 0 },
901 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
902 CPU_SMAP_FLAGS, 0, 0 },
903 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
904 CPU_MPX_FLAGS, 0, 0 },
905 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
906 CPU_SHA_FLAGS, 0, 0 },
907 };
908
909 #ifdef I386COFF
910 /* Like s_lcomm_internal in gas/read.c but the alignment string
911 is allowed to be optional. */
912
913 static symbolS *
914 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
915 {
916 addressT align = 0;
917
918 SKIP_WHITESPACE ();
919
920 if (needs_align
921 && *input_line_pointer == ',')
922 {
923 align = parse_align (needs_align - 1);
924
925 if (align == (addressT) -1)
926 return NULL;
927 }
928 else
929 {
930 if (size >= 8)
931 align = 3;
932 else if (size >= 4)
933 align = 2;
934 else if (size >= 2)
935 align = 1;
936 else
937 align = 0;
938 }
939
940 bss_alloc (symbolP, size, align);
941 return symbolP;
942 }
943
944 static void
945 pe_lcomm (int needs_align)
946 {
947 s_comm_internal (needs_align * 2, pe_lcomm_internal);
948 }
949 #endif
950
951 const pseudo_typeS md_pseudo_table[] =
952 {
953 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
954 {"align", s_align_bytes, 0},
955 #else
956 {"align", s_align_ptwo, 0},
957 #endif
958 {"arch", set_cpu_arch, 0},
959 #ifndef I386COFF
960 {"bss", s_bss, 0},
961 #else
962 {"lcomm", pe_lcomm, 1},
963 #endif
964 {"ffloat", float_cons, 'f'},
965 {"dfloat", float_cons, 'd'},
966 {"tfloat", float_cons, 'x'},
967 {"value", cons, 2},
968 {"slong", signed_cons, 4},
969 {"noopt", s_ignore, 0},
970 {"optim", s_ignore, 0},
971 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
972 {"code16", set_code_flag, CODE_16BIT},
973 {"code32", set_code_flag, CODE_32BIT},
974 {"code64", set_code_flag, CODE_64BIT},
975 {"intel_syntax", set_intel_syntax, 1},
976 {"att_syntax", set_intel_syntax, 0},
977 {"intel_mnemonic", set_intel_mnemonic, 1},
978 {"att_mnemonic", set_intel_mnemonic, 0},
979 {"allow_index_reg", set_allow_index_reg, 1},
980 {"disallow_index_reg", set_allow_index_reg, 0},
981 {"sse_check", set_check, 0},
982 {"operand_check", set_check, 1},
983 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
984 {"largecomm", handle_large_common, 0},
985 #else
986 {"file", (void (*) (int)) dwarf2_directive_file, 0},
987 {"loc", dwarf2_directive_loc, 0},
988 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
989 #endif
990 #ifdef TE_PE
991 {"secrel32", pe_directive_secrel, 0},
992 #endif
993 {0, 0, 0}
994 };
995
996 /* For interface with expression (). */
997 extern char *input_line_pointer;
998
999 /* Hash table for instruction mnemonic lookup. */
1000 static struct hash_control *op_hash;
1001
1002 /* Hash table for register lookup. */
1003 static struct hash_control *reg_hash;
1004 \f
1005 void
1006 i386_align_code (fragS *fragP, int count)
1007 {
1008 /* Various efficient no-op patterns for aligning code labels.
1009 Note: Don't try to assemble the instructions in the comments.
1010 0L and 0w are not legal. */
1011 static const char f32_1[] =
1012 {0x90}; /* nop */
1013 static const char f32_2[] =
1014 {0x66,0x90}; /* xchg %ax,%ax */
1015 static const char f32_3[] =
1016 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1017 static const char f32_4[] =
1018 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1019 static const char f32_5[] =
1020 {0x90, /* nop */
1021 0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1022 static const char f32_6[] =
1023 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1024 static const char f32_7[] =
1025 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1026 static const char f32_8[] =
1027 {0x90, /* nop */
1028 0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1029 static const char f32_9[] =
1030 {0x89,0xf6, /* movl %esi,%esi */
1031 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1032 static const char f32_10[] =
1033 {0x8d,0x76,0x00, /* leal 0(%esi),%esi */
1034 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1035 static const char f32_11[] =
1036 {0x8d,0x74,0x26,0x00, /* leal 0(%esi,1),%esi */
1037 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1038 static const char f32_12[] =
1039 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
1040 0x8d,0xbf,0x00,0x00,0x00,0x00}; /* leal 0L(%edi),%edi */
1041 static const char f32_13[] =
1042 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
1043 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1044 static const char f32_14[] =
1045 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00, /* leal 0L(%esi,1),%esi */
1046 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1047 static const char f16_3[] =
1048 {0x8d,0x74,0x00}; /* lea 0(%esi),%esi */
1049 static const char f16_4[] =
1050 {0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
1051 static const char f16_5[] =
1052 {0x90, /* nop */
1053 0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
1054 static const char f16_6[] =
1055 {0x89,0xf6, /* mov %si,%si */
1056 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
1057 static const char f16_7[] =
1058 {0x8d,0x74,0x00, /* lea 0(%si),%si */
1059 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
1060 static const char f16_8[] =
1061 {0x8d,0xb4,0x00,0x00, /* lea 0w(%si),%si */
1062 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
1063 static const char jump_31[] =
1064 {0xeb,0x1d,0x90,0x90,0x90,0x90,0x90, /* jmp .+31; lotsa nops */
1065 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
1066 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
1067 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
1068 static const char *const f32_patt[] = {
1069 f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
1070 f32_9, f32_10, f32_11, f32_12, f32_13, f32_14
1071 };
1072 static const char *const f16_patt[] = {
1073 f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8
1074 };
1075 /* nopl (%[re]ax) */
1076 static const char alt_3[] =
1077 {0x0f,0x1f,0x00};
1078 /* nopl 0(%[re]ax) */
1079 static const char alt_4[] =
1080 {0x0f,0x1f,0x40,0x00};
1081 /* nopl 0(%[re]ax,%[re]ax,1) */
1082 static const char alt_5[] =
1083 {0x0f,0x1f,0x44,0x00,0x00};
1084 /* nopw 0(%[re]ax,%[re]ax,1) */
1085 static const char alt_6[] =
1086 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1087 /* nopl 0L(%[re]ax) */
1088 static const char alt_7[] =
1089 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1090 /* nopl 0L(%[re]ax,%[re]ax,1) */
1091 static const char alt_8[] =
1092 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1093 /* nopw 0L(%[re]ax,%[re]ax,1) */
1094 static const char alt_9[] =
1095 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1096 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1097 static const char alt_10[] =
1098 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1099 /* data16
1100 nopw %cs:0L(%[re]ax,%[re]ax,1) */
1101 static const char alt_long_11[] =
1102 {0x66,
1103 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1104 /* data16
1105 data16
1106 nopw %cs:0L(%[re]ax,%[re]ax,1) */
1107 static const char alt_long_12[] =
1108 {0x66,
1109 0x66,
1110 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1111 /* data16
1112 data16
1113 data16
1114 nopw %cs:0L(%[re]ax,%[re]ax,1) */
1115 static const char alt_long_13[] =
1116 {0x66,
1117 0x66,
1118 0x66,
1119 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1120 /* data16
1121 data16
1122 data16
1123 data16
1124 nopw %cs:0L(%[re]ax,%[re]ax,1) */
1125 static const char alt_long_14[] =
1126 {0x66,
1127 0x66,
1128 0x66,
1129 0x66,
1130 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1131 /* data16
1132 data16
1133 data16
1134 data16
1135 data16
1136 nopw %cs:0L(%[re]ax,%[re]ax,1) */
1137 static const char alt_long_15[] =
1138 {0x66,
1139 0x66,
1140 0x66,
1141 0x66,
1142 0x66,
1143 0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1144 /* nopl 0(%[re]ax,%[re]ax,1)
1145 nopw 0(%[re]ax,%[re]ax,1) */
1146 static const char alt_short_11[] =
1147 {0x0f,0x1f,0x44,0x00,0x00,
1148 0x66,0x0f,0x1f,0x44,0x00,0x00};
1149 /* nopw 0(%[re]ax,%[re]ax,1)
1150 nopw 0(%[re]ax,%[re]ax,1) */
1151 static const char alt_short_12[] =
1152 {0x66,0x0f,0x1f,0x44,0x00,0x00,
1153 0x66,0x0f,0x1f,0x44,0x00,0x00};
1154 /* nopw 0(%[re]ax,%[re]ax,1)
1155 nopl 0L(%[re]ax) */
1156 static const char alt_short_13[] =
1157 {0x66,0x0f,0x1f,0x44,0x00,0x00,
1158 0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1159 /* nopl 0L(%[re]ax)
1160 nopl 0L(%[re]ax) */
1161 static const char alt_short_14[] =
1162 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00,
1163 0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1164 /* nopl 0L(%[re]ax)
1165 nopl 0L(%[re]ax,%[re]ax,1) */
1166 static const char alt_short_15[] =
1167 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00,
1168 0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1169 static const char *const alt_short_patt[] = {
1170 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1171 alt_9, alt_10, alt_short_11, alt_short_12, alt_short_13,
1172 alt_short_14, alt_short_15
1173 };
1174 static const char *const alt_long_patt[] = {
1175 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1176 alt_9, alt_10, alt_long_11, alt_long_12, alt_long_13,
1177 alt_long_14, alt_long_15
1178 };
1179
1180 /* Only align for at least a positive non-zero boundary. */
1181 if (count <= 0 || count > MAX_MEM_FOR_RS_ALIGN_CODE)
1182 return;
1183
1184 /* We need to decide which NOP sequence to use for 32bit and
1185 64bit. When -mtune= is used:
1186
1187 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1188 PROCESSOR_GENERIC32, f32_patt will be used.
1189 2. For PROCESSOR_PENTIUMPRO, PROCESSOR_PENTIUM4, PROCESSOR_NOCONA,
1190 PROCESSOR_CORE, PROCESSOR_CORE2, PROCESSOR_COREI7, and
1191 PROCESSOR_GENERIC64, alt_long_patt will be used.
1192 3. For PROCESSOR_ATHLON, PROCESSOR_K6, PROCESSOR_K8 and
1193 PROCESSOR_AMDFAM10, PROCESSOR_BD and PROCESSOR_BT, alt_short_patt
1194 will be used.
1195
1196 When -mtune= isn't used, alt_long_patt will be used if
1197 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1198 be used.
1199
1200 When -march= or .arch is used, we can't use anything beyond
1201 cpu_arch_isa_flags. */
1202
1203 if (flag_code == CODE_16BIT)
1204 {
1205 if (count > 8)
1206 {
1207 memcpy (fragP->fr_literal + fragP->fr_fix,
1208 jump_31, count);
1209 /* Adjust jump offset. */
1210 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1211 }
1212 else
1213 memcpy (fragP->fr_literal + fragP->fr_fix,
1214 f16_patt[count - 1], count);
1215 }
1216 else
1217 {
1218 const char *const *patt = NULL;
1219
1220 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1221 {
1222 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1223 switch (cpu_arch_tune)
1224 {
1225 case PROCESSOR_UNKNOWN:
1226 /* We use cpu_arch_isa_flags to check if we SHOULD
1227 optimize with nops. */
1228 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1229 patt = alt_long_patt;
1230 else
1231 patt = f32_patt;
1232 break;
1233 case PROCESSOR_PENTIUM4:
1234 case PROCESSOR_NOCONA:
1235 case PROCESSOR_CORE:
1236 case PROCESSOR_CORE2:
1237 case PROCESSOR_COREI7:
1238 case PROCESSOR_L1OM:
1239 case PROCESSOR_K1OM:
1240 case PROCESSOR_GENERIC64:
1241 patt = alt_long_patt;
1242 break;
1243 case PROCESSOR_K6:
1244 case PROCESSOR_ATHLON:
1245 case PROCESSOR_K8:
1246 case PROCESSOR_AMDFAM10:
1247 case PROCESSOR_BD:
1248 case PROCESSOR_BT:
1249 patt = alt_short_patt;
1250 break;
1251 case PROCESSOR_I386:
1252 case PROCESSOR_I486:
1253 case PROCESSOR_PENTIUM:
1254 case PROCESSOR_PENTIUMPRO:
1255 case PROCESSOR_GENERIC32:
1256 patt = f32_patt;
1257 break;
1258 }
1259 }
1260 else
1261 {
1262 switch (fragP->tc_frag_data.tune)
1263 {
1264 case PROCESSOR_UNKNOWN:
1265 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1266 PROCESSOR_UNKNOWN. */
1267 abort ();
1268 break;
1269
1270 case PROCESSOR_I386:
1271 case PROCESSOR_I486:
1272 case PROCESSOR_PENTIUM:
1273 case PROCESSOR_K6:
1274 case PROCESSOR_ATHLON:
1275 case PROCESSOR_K8:
1276 case PROCESSOR_AMDFAM10:
1277 case PROCESSOR_BD:
1278 case PROCESSOR_BT:
1279 case PROCESSOR_GENERIC32:
1280 /* We use cpu_arch_isa_flags to check if we CAN optimize
1281 with nops. */
1282 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1283 patt = alt_short_patt;
1284 else
1285 patt = f32_patt;
1286 break;
1287 case PROCESSOR_PENTIUMPRO:
1288 case PROCESSOR_PENTIUM4:
1289 case PROCESSOR_NOCONA:
1290 case PROCESSOR_CORE:
1291 case PROCESSOR_CORE2:
1292 case PROCESSOR_COREI7:
1293 case PROCESSOR_L1OM:
1294 case PROCESSOR_K1OM:
1295 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1296 patt = alt_long_patt;
1297 else
1298 patt = f32_patt;
1299 break;
1300 case PROCESSOR_GENERIC64:
1301 patt = alt_long_patt;
1302 break;
1303 }
1304 }
1305
1306 if (patt == f32_patt)
1307 {
1308 /* If the padding is less than 15 bytes, we use the normal
1309 ones. Otherwise, we use a jump instruction and adjust
1310 its offset. */
1311 int limit;
1312
1313 /* For 64bit, the limit is 3 bytes. */
1314 if (flag_code == CODE_64BIT
1315 && fragP->tc_frag_data.isa_flags.bitfield.cpulm)
1316 limit = 3;
1317 else
1318 limit = 15;
1319 if (count < limit)
1320 memcpy (fragP->fr_literal + fragP->fr_fix,
1321 patt[count - 1], count);
1322 else
1323 {
1324 memcpy (fragP->fr_literal + fragP->fr_fix,
1325 jump_31, count);
1326 /* Adjust jump offset. */
1327 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1328 }
1329 }
1330 else
1331 {
1332 /* Maximum length of an instruction is 15 byte. If the
1333 padding is greater than 15 bytes and we don't use jump,
1334 we have to break it into smaller pieces. */
1335 int padding = count;
1336 while (padding > 15)
1337 {
1338 padding -= 15;
1339 memcpy (fragP->fr_literal + fragP->fr_fix + padding,
1340 patt [14], 15);
1341 }
1342
1343 if (padding)
1344 memcpy (fragP->fr_literal + fragP->fr_fix,
1345 patt [padding - 1], padding);
1346 }
1347 }
1348 fragP->fr_var = count;
1349 }
1350
1351 static INLINE int
1352 operand_type_all_zero (const union i386_operand_type *x)
1353 {
1354 switch (ARRAY_SIZE(x->array))
1355 {
1356 case 3:
1357 if (x->array[2])
1358 return 0;
1359 case 2:
1360 if (x->array[1])
1361 return 0;
1362 case 1:
1363 return !x->array[0];
1364 default:
1365 abort ();
1366 }
1367 }
1368
1369 static INLINE void
1370 operand_type_set (union i386_operand_type *x, unsigned int v)
1371 {
1372 switch (ARRAY_SIZE(x->array))
1373 {
1374 case 3:
1375 x->array[2] = v;
1376 case 2:
1377 x->array[1] = v;
1378 case 1:
1379 x->array[0] = v;
1380 break;
1381 default:
1382 abort ();
1383 }
1384 }
1385
1386 static INLINE int
1387 operand_type_equal (const union i386_operand_type *x,
1388 const union i386_operand_type *y)
1389 {
1390 switch (ARRAY_SIZE(x->array))
1391 {
1392 case 3:
1393 if (x->array[2] != y->array[2])
1394 return 0;
1395 case 2:
1396 if (x->array[1] != y->array[1])
1397 return 0;
1398 case 1:
1399 return x->array[0] == y->array[0];
1400 break;
1401 default:
1402 abort ();
1403 }
1404 }
1405
1406 static INLINE int
1407 cpu_flags_all_zero (const union i386_cpu_flags *x)
1408 {
1409 switch (ARRAY_SIZE(x->array))
1410 {
1411 case 3:
1412 if (x->array[2])
1413 return 0;
1414 case 2:
1415 if (x->array[1])
1416 return 0;
1417 case 1:
1418 return !x->array[0];
1419 default:
1420 abort ();
1421 }
1422 }
1423
1424 static INLINE void
1425 cpu_flags_set (union i386_cpu_flags *x, unsigned int v)
1426 {
1427 switch (ARRAY_SIZE(x->array))
1428 {
1429 case 3:
1430 x->array[2] = v;
1431 case 2:
1432 x->array[1] = v;
1433 case 1:
1434 x->array[0] = v;
1435 break;
1436 default:
1437 abort ();
1438 }
1439 }
1440
1441 static INLINE int
1442 cpu_flags_equal (const union i386_cpu_flags *x,
1443 const union i386_cpu_flags *y)
1444 {
1445 switch (ARRAY_SIZE(x->array))
1446 {
1447 case 3:
1448 if (x->array[2] != y->array[2])
1449 return 0;
1450 case 2:
1451 if (x->array[1] != y->array[1])
1452 return 0;
1453 case 1:
1454 return x->array[0] == y->array[0];
1455 break;
1456 default:
1457 abort ();
1458 }
1459 }
1460
1461 static INLINE int
1462 cpu_flags_check_cpu64 (i386_cpu_flags f)
1463 {
1464 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1465 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1466 }
1467
1468 static INLINE i386_cpu_flags
1469 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1470 {
1471 switch (ARRAY_SIZE (x.array))
1472 {
1473 case 3:
1474 x.array [2] &= y.array [2];
1475 case 2:
1476 x.array [1] &= y.array [1];
1477 case 1:
1478 x.array [0] &= y.array [0];
1479 break;
1480 default:
1481 abort ();
1482 }
1483 return x;
1484 }
1485
1486 static INLINE i386_cpu_flags
1487 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1488 {
1489 switch (ARRAY_SIZE (x.array))
1490 {
1491 case 3:
1492 x.array [2] |= y.array [2];
1493 case 2:
1494 x.array [1] |= y.array [1];
1495 case 1:
1496 x.array [0] |= y.array [0];
1497 break;
1498 default:
1499 abort ();
1500 }
1501 return x;
1502 }
1503
1504 static INLINE i386_cpu_flags
1505 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1506 {
1507 switch (ARRAY_SIZE (x.array))
1508 {
1509 case 3:
1510 x.array [2] &= ~y.array [2];
1511 case 2:
1512 x.array [1] &= ~y.array [1];
1513 case 1:
1514 x.array [0] &= ~y.array [0];
1515 break;
1516 default:
1517 abort ();
1518 }
1519 return x;
1520 }
1521
1522 #define CPU_FLAGS_ARCH_MATCH 0x1
1523 #define CPU_FLAGS_64BIT_MATCH 0x2
1524 #define CPU_FLAGS_AES_MATCH 0x4
1525 #define CPU_FLAGS_PCLMUL_MATCH 0x8
1526 #define CPU_FLAGS_AVX_MATCH 0x10
1527
1528 #define CPU_FLAGS_32BIT_MATCH \
1529 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_AES_MATCH \
1530 | CPU_FLAGS_PCLMUL_MATCH | CPU_FLAGS_AVX_MATCH)
1531 #define CPU_FLAGS_PERFECT_MATCH \
1532 (CPU_FLAGS_32BIT_MATCH | CPU_FLAGS_64BIT_MATCH)
1533
1534 /* Return CPU flags match bits. */
1535
1536 static int
1537 cpu_flags_match (const insn_template *t)
1538 {
1539 i386_cpu_flags x = t->cpu_flags;
1540 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1541
1542 x.bitfield.cpu64 = 0;
1543 x.bitfield.cpuno64 = 0;
1544
1545 if (cpu_flags_all_zero (&x))
1546 {
1547 /* This instruction is available on all archs. */
1548 match |= CPU_FLAGS_32BIT_MATCH;
1549 }
1550 else
1551 {
1552 /* This instruction is available only on some archs. */
1553 i386_cpu_flags cpu = cpu_arch_flags;
1554
1555 cpu.bitfield.cpu64 = 0;
1556 cpu.bitfield.cpuno64 = 0;
1557 cpu = cpu_flags_and (x, cpu);
1558 if (!cpu_flags_all_zero (&cpu))
1559 {
1560 if (x.bitfield.cpuavx)
1561 {
1562 /* We only need to check AES/PCLMUL/SSE2AVX with AVX. */
1563 if (cpu.bitfield.cpuavx)
1564 {
1565 /* Check SSE2AVX. */
1566 if (!t->opcode_modifier.sse2avx|| sse2avx)
1567 {
1568 match |= (CPU_FLAGS_ARCH_MATCH
1569 | CPU_FLAGS_AVX_MATCH);
1570 /* Check AES. */
1571 if (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1572 match |= CPU_FLAGS_AES_MATCH;
1573 /* Check PCLMUL. */
1574 if (!x.bitfield.cpupclmul
1575 || cpu.bitfield.cpupclmul)
1576 match |= CPU_FLAGS_PCLMUL_MATCH;
1577 }
1578 }
1579 else
1580 match |= CPU_FLAGS_ARCH_MATCH;
1581 }
1582 else
1583 match |= CPU_FLAGS_32BIT_MATCH;
1584 }
1585 }
1586 return match;
1587 }
1588
1589 static INLINE i386_operand_type
1590 operand_type_and (i386_operand_type x, i386_operand_type y)
1591 {
1592 switch (ARRAY_SIZE (x.array))
1593 {
1594 case 3:
1595 x.array [2] &= y.array [2];
1596 case 2:
1597 x.array [1] &= y.array [1];
1598 case 1:
1599 x.array [0] &= y.array [0];
1600 break;
1601 default:
1602 abort ();
1603 }
1604 return x;
1605 }
1606
1607 static INLINE i386_operand_type
1608 operand_type_or (i386_operand_type x, i386_operand_type y)
1609 {
1610 switch (ARRAY_SIZE (x.array))
1611 {
1612 case 3:
1613 x.array [2] |= y.array [2];
1614 case 2:
1615 x.array [1] |= y.array [1];
1616 case 1:
1617 x.array [0] |= y.array [0];
1618 break;
1619 default:
1620 abort ();
1621 }
1622 return x;
1623 }
1624
1625 static INLINE i386_operand_type
1626 operand_type_xor (i386_operand_type x, i386_operand_type y)
1627 {
1628 switch (ARRAY_SIZE (x.array))
1629 {
1630 case 3:
1631 x.array [2] ^= y.array [2];
1632 case 2:
1633 x.array [1] ^= y.array [1];
1634 case 1:
1635 x.array [0] ^= y.array [0];
1636 break;
1637 default:
1638 abort ();
1639 }
1640 return x;
1641 }
1642
1643 static const i386_operand_type acc32 = OPERAND_TYPE_ACC32;
1644 static const i386_operand_type acc64 = OPERAND_TYPE_ACC64;
1645 static const i386_operand_type control = OPERAND_TYPE_CONTROL;
1646 static const i386_operand_type inoutportreg
1647 = OPERAND_TYPE_INOUTPORTREG;
1648 static const i386_operand_type reg16_inoutportreg
1649 = OPERAND_TYPE_REG16_INOUTPORTREG;
1650 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1651 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1652 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1653 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1654 static const i386_operand_type anydisp
1655 = OPERAND_TYPE_ANYDISP;
1656 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1657 static const i386_operand_type regymm = OPERAND_TYPE_REGYMM;
1658 static const i386_operand_type regzmm = OPERAND_TYPE_REGZMM;
1659 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1660 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1661 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1662 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1663 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1664 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1665 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1666 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1667 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1668 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1669 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
1670
1671 enum operand_type
1672 {
1673 reg,
1674 imm,
1675 disp,
1676 anymem
1677 };
1678
1679 static INLINE int
1680 operand_type_check (i386_operand_type t, enum operand_type c)
1681 {
1682 switch (c)
1683 {
1684 case reg:
1685 return (t.bitfield.reg8
1686 || t.bitfield.reg16
1687 || t.bitfield.reg32
1688 || t.bitfield.reg64);
1689
1690 case imm:
1691 return (t.bitfield.imm8
1692 || t.bitfield.imm8s
1693 || t.bitfield.imm16
1694 || t.bitfield.imm32
1695 || t.bitfield.imm32s
1696 || t.bitfield.imm64);
1697
1698 case disp:
1699 return (t.bitfield.disp8
1700 || t.bitfield.disp16
1701 || t.bitfield.disp32
1702 || t.bitfield.disp32s
1703 || t.bitfield.disp64);
1704
1705 case anymem:
1706 return (t.bitfield.disp8
1707 || t.bitfield.disp16
1708 || t.bitfield.disp32
1709 || t.bitfield.disp32s
1710 || t.bitfield.disp64
1711 || t.bitfield.baseindex);
1712
1713 default:
1714 abort ();
1715 }
1716
1717 return 0;
1718 }
1719
1720 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit on
1721 operand J for instruction template T. */
1722
1723 static INLINE int
1724 match_reg_size (const insn_template *t, unsigned int j)
1725 {
1726 return !((i.types[j].bitfield.byte
1727 && !t->operand_types[j].bitfield.byte)
1728 || (i.types[j].bitfield.word
1729 && !t->operand_types[j].bitfield.word)
1730 || (i.types[j].bitfield.dword
1731 && !t->operand_types[j].bitfield.dword)
1732 || (i.types[j].bitfield.qword
1733 && !t->operand_types[j].bitfield.qword));
1734 }
1735
1736 /* Return 1 if there is no conflict in any size on operand J for
1737 instruction template T. */
1738
1739 static INLINE int
1740 match_mem_size (const insn_template *t, unsigned int j)
1741 {
1742 return (match_reg_size (t, j)
1743 && !((i.types[j].bitfield.unspecified
1744 && !t->operand_types[j].bitfield.unspecified)
1745 || (i.types[j].bitfield.fword
1746 && !t->operand_types[j].bitfield.fword)
1747 || (i.types[j].bitfield.tbyte
1748 && !t->operand_types[j].bitfield.tbyte)
1749 || (i.types[j].bitfield.xmmword
1750 && !t->operand_types[j].bitfield.xmmword)
1751 || (i.types[j].bitfield.ymmword
1752 && !t->operand_types[j].bitfield.ymmword)
1753 || (i.types[j].bitfield.zmmword
1754 && !t->operand_types[j].bitfield.zmmword)));
1755 }
1756
1757 /* Return 1 if there is no size conflict on any operands for
1758 instruction template T. */
1759
1760 static INLINE int
1761 operand_size_match (const insn_template *t)
1762 {
1763 unsigned int j;
1764 int match = 1;
1765
1766 /* Don't check jump instructions. */
1767 if (t->opcode_modifier.jump
1768 || t->opcode_modifier.jumpbyte
1769 || t->opcode_modifier.jumpdword
1770 || t->opcode_modifier.jumpintersegment)
1771 return match;
1772
1773 /* Check memory and accumulator operand size. */
1774 for (j = 0; j < i.operands; j++)
1775 {
1776 if (t->operand_types[j].bitfield.anysize)
1777 continue;
1778
1779 if (t->operand_types[j].bitfield.acc && !match_reg_size (t, j))
1780 {
1781 match = 0;
1782 break;
1783 }
1784
1785 if (i.types[j].bitfield.mem && !match_mem_size (t, j))
1786 {
1787 match = 0;
1788 break;
1789 }
1790 }
1791
1792 if (match)
1793 return match;
1794 else if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
1795 {
1796 mismatch:
1797 i.error = operand_size_mismatch;
1798 return 0;
1799 }
1800
1801 /* Check reverse. */
1802 gas_assert (i.operands == 2);
1803
1804 match = 1;
1805 for (j = 0; j < 2; j++)
1806 {
1807 if (t->operand_types[j].bitfield.acc
1808 && !match_reg_size (t, j ? 0 : 1))
1809 goto mismatch;
1810
1811 if (i.types[j].bitfield.mem
1812 && !match_mem_size (t, j ? 0 : 1))
1813 goto mismatch;
1814 }
1815
1816 return match;
1817 }
1818
1819 static INLINE int
1820 operand_type_match (i386_operand_type overlap,
1821 i386_operand_type given)
1822 {
1823 i386_operand_type temp = overlap;
1824
1825 temp.bitfield.jumpabsolute = 0;
1826 temp.bitfield.unspecified = 0;
1827 temp.bitfield.byte = 0;
1828 temp.bitfield.word = 0;
1829 temp.bitfield.dword = 0;
1830 temp.bitfield.fword = 0;
1831 temp.bitfield.qword = 0;
1832 temp.bitfield.tbyte = 0;
1833 temp.bitfield.xmmword = 0;
1834 temp.bitfield.ymmword = 0;
1835 temp.bitfield.zmmword = 0;
1836 if (operand_type_all_zero (&temp))
1837 goto mismatch;
1838
1839 if (given.bitfield.baseindex == overlap.bitfield.baseindex
1840 && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
1841 return 1;
1842
1843 mismatch:
1844 i.error = operand_type_mismatch;
1845 return 0;
1846 }
1847
1848 /* If given types g0 and g1 are registers they must be of the same type
1849 unless the expected operand type register overlap is null.
1850 Note that Acc in a template matches every size of reg. */
1851
1852 static INLINE int
1853 operand_type_register_match (i386_operand_type m0,
1854 i386_operand_type g0,
1855 i386_operand_type t0,
1856 i386_operand_type m1,
1857 i386_operand_type g1,
1858 i386_operand_type t1)
1859 {
1860 if (!operand_type_check (g0, reg))
1861 return 1;
1862
1863 if (!operand_type_check (g1, reg))
1864 return 1;
1865
1866 if (g0.bitfield.reg8 == g1.bitfield.reg8
1867 && g0.bitfield.reg16 == g1.bitfield.reg16
1868 && g0.bitfield.reg32 == g1.bitfield.reg32
1869 && g0.bitfield.reg64 == g1.bitfield.reg64)
1870 return 1;
1871
1872 if (m0.bitfield.acc)
1873 {
1874 t0.bitfield.reg8 = 1;
1875 t0.bitfield.reg16 = 1;
1876 t0.bitfield.reg32 = 1;
1877 t0.bitfield.reg64 = 1;
1878 }
1879
1880 if (m1.bitfield.acc)
1881 {
1882 t1.bitfield.reg8 = 1;
1883 t1.bitfield.reg16 = 1;
1884 t1.bitfield.reg32 = 1;
1885 t1.bitfield.reg64 = 1;
1886 }
1887
1888 if (!(t0.bitfield.reg8 & t1.bitfield.reg8)
1889 && !(t0.bitfield.reg16 & t1.bitfield.reg16)
1890 && !(t0.bitfield.reg32 & t1.bitfield.reg32)
1891 && !(t0.bitfield.reg64 & t1.bitfield.reg64))
1892 return 1;
1893
1894 i.error = register_type_mismatch;
1895
1896 return 0;
1897 }
1898
1899 static INLINE unsigned int
1900 register_number (const reg_entry *r)
1901 {
1902 unsigned int nr = r->reg_num;
1903
1904 if (r->reg_flags & RegRex)
1905 nr += 8;
1906
1907 return nr;
1908 }
1909
1910 static INLINE unsigned int
1911 mode_from_disp_size (i386_operand_type t)
1912 {
1913 if (t.bitfield.disp8 || t.bitfield.vec_disp8)
1914 return 1;
1915 else if (t.bitfield.disp16
1916 || t.bitfield.disp32
1917 || t.bitfield.disp32s)
1918 return 2;
1919 else
1920 return 0;
1921 }
1922
1923 static INLINE int
1924 fits_in_signed_byte (offsetT num)
1925 {
1926 return (num >= -128) && (num <= 127);
1927 }
1928
1929 static INLINE int
1930 fits_in_unsigned_byte (offsetT num)
1931 {
1932 return (num & 0xff) == num;
1933 }
1934
1935 static INLINE int
1936 fits_in_unsigned_word (offsetT num)
1937 {
1938 return (num & 0xffff) == num;
1939 }
1940
1941 static INLINE int
1942 fits_in_signed_word (offsetT num)
1943 {
1944 return (-32768 <= num) && (num <= 32767);
1945 }
1946
1947 static INLINE int
1948 fits_in_signed_long (offsetT num ATTRIBUTE_UNUSED)
1949 {
1950 #ifndef BFD64
1951 return 1;
1952 #else
1953 return (!(((offsetT) -1 << 31) & num)
1954 || (((offsetT) -1 << 31) & num) == ((offsetT) -1 << 31));
1955 #endif
1956 } /* fits_in_signed_long() */
1957
1958 static INLINE int
1959 fits_in_unsigned_long (offsetT num ATTRIBUTE_UNUSED)
1960 {
1961 #ifndef BFD64
1962 return 1;
1963 #else
1964 return (num & (((offsetT) 2 << 31) - 1)) == num;
1965 #endif
1966 } /* fits_in_unsigned_long() */
1967
1968 static INLINE int
1969 fits_in_vec_disp8 (offsetT num)
1970 {
1971 int shift = i.memshift;
1972 unsigned int mask;
1973
1974 if (shift == -1)
1975 abort ();
1976
1977 mask = (1 << shift) - 1;
1978
1979 /* Return 0 if NUM isn't properly aligned. */
1980 if ((num & mask))
1981 return 0;
1982
1983 /* Check if NUM will fit in 8bit after shift. */
1984 return fits_in_signed_byte (num >> shift);
1985 }
1986
1987 static INLINE int
1988 fits_in_imm4 (offsetT num)
1989 {
1990 return (num & 0xf) == num;
1991 }
1992
1993 static i386_operand_type
1994 smallest_imm_type (offsetT num)
1995 {
1996 i386_operand_type t;
1997
1998 operand_type_set (&t, 0);
1999 t.bitfield.imm64 = 1;
2000
2001 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2002 {
2003 /* This code is disabled on the 486 because all the Imm1 forms
2004 in the opcode table are slower on the i486. They're the
2005 versions with the implicitly specified single-position
2006 displacement, which has another syntax if you really want to
2007 use that form. */
2008 t.bitfield.imm1 = 1;
2009 t.bitfield.imm8 = 1;
2010 t.bitfield.imm8s = 1;
2011 t.bitfield.imm16 = 1;
2012 t.bitfield.imm32 = 1;
2013 t.bitfield.imm32s = 1;
2014 }
2015 else if (fits_in_signed_byte (num))
2016 {
2017 t.bitfield.imm8 = 1;
2018 t.bitfield.imm8s = 1;
2019 t.bitfield.imm16 = 1;
2020 t.bitfield.imm32 = 1;
2021 t.bitfield.imm32s = 1;
2022 }
2023 else if (fits_in_unsigned_byte (num))
2024 {
2025 t.bitfield.imm8 = 1;
2026 t.bitfield.imm16 = 1;
2027 t.bitfield.imm32 = 1;
2028 t.bitfield.imm32s = 1;
2029 }
2030 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2031 {
2032 t.bitfield.imm16 = 1;
2033 t.bitfield.imm32 = 1;
2034 t.bitfield.imm32s = 1;
2035 }
2036 else if (fits_in_signed_long (num))
2037 {
2038 t.bitfield.imm32 = 1;
2039 t.bitfield.imm32s = 1;
2040 }
2041 else if (fits_in_unsigned_long (num))
2042 t.bitfield.imm32 = 1;
2043
2044 return t;
2045 }
2046
2047 static offsetT
2048 offset_in_range (offsetT val, int size)
2049 {
2050 addressT mask;
2051
2052 switch (size)
2053 {
2054 case 1: mask = ((addressT) 1 << 8) - 1; break;
2055 case 2: mask = ((addressT) 1 << 16) - 1; break;
2056 case 4: mask = ((addressT) 2 << 31) - 1; break;
2057 #ifdef BFD64
2058 case 8: mask = ((addressT) 2 << 63) - 1; break;
2059 #endif
2060 default: abort ();
2061 }
2062
2063 #ifdef BFD64
2064 /* If BFD64, sign extend val for 32bit address mode. */
2065 if (flag_code != CODE_64BIT
2066 || i.prefix[ADDR_PREFIX])
2067 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2068 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2069 #endif
2070
2071 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2072 {
2073 char buf1[40], buf2[40];
2074
2075 sprint_value (buf1, val);
2076 sprint_value (buf2, val & mask);
2077 as_warn (_("%s shortened to %s"), buf1, buf2);
2078 }
2079 return val & mask;
2080 }
2081
2082 enum PREFIX_GROUP
2083 {
2084 PREFIX_EXIST = 0,
2085 PREFIX_LOCK,
2086 PREFIX_REP,
2087 PREFIX_OTHER
2088 };
2089
2090 /* Returns
2091 a. PREFIX_EXIST if attempting to add a prefix where one from the
2092 same class already exists.
2093 b. PREFIX_LOCK if lock prefix is added.
2094 c. PREFIX_REP if rep/repne prefix is added.
2095 d. PREFIX_OTHER if other prefix is added.
2096 */
2097
2098 static enum PREFIX_GROUP
2099 add_prefix (unsigned int prefix)
2100 {
2101 enum PREFIX_GROUP ret = PREFIX_OTHER;
2102 unsigned int q;
2103
2104 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2105 && flag_code == CODE_64BIT)
2106 {
2107 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2108 || ((i.prefix[REX_PREFIX] & (REX_R | REX_X | REX_B))
2109 && (prefix & (REX_R | REX_X | REX_B))))
2110 ret = PREFIX_EXIST;
2111 q = REX_PREFIX;
2112 }
2113 else
2114 {
2115 switch (prefix)
2116 {
2117 default:
2118 abort ();
2119
2120 case CS_PREFIX_OPCODE:
2121 case DS_PREFIX_OPCODE:
2122 case ES_PREFIX_OPCODE:
2123 case FS_PREFIX_OPCODE:
2124 case GS_PREFIX_OPCODE:
2125 case SS_PREFIX_OPCODE:
2126 q = SEG_PREFIX;
2127 break;
2128
2129 case REPNE_PREFIX_OPCODE:
2130 case REPE_PREFIX_OPCODE:
2131 q = REP_PREFIX;
2132 ret = PREFIX_REP;
2133 break;
2134
2135 case LOCK_PREFIX_OPCODE:
2136 q = LOCK_PREFIX;
2137 ret = PREFIX_LOCK;
2138 break;
2139
2140 case FWAIT_OPCODE:
2141 q = WAIT_PREFIX;
2142 break;
2143
2144 case ADDR_PREFIX_OPCODE:
2145 q = ADDR_PREFIX;
2146 break;
2147
2148 case DATA_PREFIX_OPCODE:
2149 q = DATA_PREFIX;
2150 break;
2151 }
2152 if (i.prefix[q] != 0)
2153 ret = PREFIX_EXIST;
2154 }
2155
2156 if (ret)
2157 {
2158 if (!i.prefix[q])
2159 ++i.prefixes;
2160 i.prefix[q] |= prefix;
2161 }
2162 else
2163 as_bad (_("same type of prefix used twice"));
2164
2165 return ret;
2166 }
2167
2168 static void
2169 update_code_flag (int value, int check)
2170 {
2171 PRINTF_LIKE ((*as_error));
2172
2173 flag_code = (enum flag_code) value;
2174 if (flag_code == CODE_64BIT)
2175 {
2176 cpu_arch_flags.bitfield.cpu64 = 1;
2177 cpu_arch_flags.bitfield.cpuno64 = 0;
2178 }
2179 else
2180 {
2181 cpu_arch_flags.bitfield.cpu64 = 0;
2182 cpu_arch_flags.bitfield.cpuno64 = 1;
2183 }
2184 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2185 {
2186 if (check)
2187 as_error = as_fatal;
2188 else
2189 as_error = as_bad;
2190 (*as_error) (_("64bit mode not supported on `%s'."),
2191 cpu_arch_name ? cpu_arch_name : default_arch);
2192 }
2193 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2194 {
2195 if (check)
2196 as_error = as_fatal;
2197 else
2198 as_error = as_bad;
2199 (*as_error) (_("32bit mode not supported on `%s'."),
2200 cpu_arch_name ? cpu_arch_name : default_arch);
2201 }
2202 stackop_size = '\0';
2203 }
2204
2205 static void
2206 set_code_flag (int value)
2207 {
2208 update_code_flag (value, 0);
2209 }
2210
2211 static void
2212 set_16bit_gcc_code_flag (int new_code_flag)
2213 {
2214 flag_code = (enum flag_code) new_code_flag;
2215 if (flag_code != CODE_16BIT)
2216 abort ();
2217 cpu_arch_flags.bitfield.cpu64 = 0;
2218 cpu_arch_flags.bitfield.cpuno64 = 1;
2219 stackop_size = LONG_MNEM_SUFFIX;
2220 }
2221
2222 static void
2223 set_intel_syntax (int syntax_flag)
2224 {
2225 /* Find out if register prefixing is specified. */
2226 int ask_naked_reg = 0;
2227
2228 SKIP_WHITESPACE ();
2229 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2230 {
2231 char *string = input_line_pointer;
2232 int e = get_symbol_end ();
2233
2234 if (strcmp (string, "prefix") == 0)
2235 ask_naked_reg = 1;
2236 else if (strcmp (string, "noprefix") == 0)
2237 ask_naked_reg = -1;
2238 else
2239 as_bad (_("bad argument to syntax directive."));
2240 *input_line_pointer = e;
2241 }
2242 demand_empty_rest_of_line ();
2243
2244 intel_syntax = syntax_flag;
2245
2246 if (ask_naked_reg == 0)
2247 allow_naked_reg = (intel_syntax
2248 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2249 else
2250 allow_naked_reg = (ask_naked_reg < 0);
2251
2252 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2253
2254 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2255 identifier_chars['$'] = intel_syntax ? '$' : 0;
2256 register_prefix = allow_naked_reg ? "" : "%";
2257 }
2258
2259 static void
2260 set_intel_mnemonic (int mnemonic_flag)
2261 {
2262 intel_mnemonic = mnemonic_flag;
2263 }
2264
2265 static void
2266 set_allow_index_reg (int flag)
2267 {
2268 allow_index_reg = flag;
2269 }
2270
2271 static void
2272 set_check (int what)
2273 {
2274 enum check_kind *kind;
2275 const char *str;
2276
2277 if (what)
2278 {
2279 kind = &operand_check;
2280 str = "operand";
2281 }
2282 else
2283 {
2284 kind = &sse_check;
2285 str = "sse";
2286 }
2287
2288 SKIP_WHITESPACE ();
2289
2290 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2291 {
2292 char *string = input_line_pointer;
2293 int e = get_symbol_end ();
2294
2295 if (strcmp (string, "none") == 0)
2296 *kind = check_none;
2297 else if (strcmp (string, "warning") == 0)
2298 *kind = check_warning;
2299 else if (strcmp (string, "error") == 0)
2300 *kind = check_error;
2301 else
2302 as_bad (_("bad argument to %s_check directive."), str);
2303 *input_line_pointer = e;
2304 }
2305 else
2306 as_bad (_("missing argument for %s_check directive"), str);
2307
2308 demand_empty_rest_of_line ();
2309 }
2310
2311 static void
2312 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2313 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2314 {
2315 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2316 static const char *arch;
2317
2318 /* Intel LIOM is only supported on ELF. */
2319 if (!IS_ELF)
2320 return;
2321
2322 if (!arch)
2323 {
2324 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2325 use default_arch. */
2326 arch = cpu_arch_name;
2327 if (!arch)
2328 arch = default_arch;
2329 }
2330
2331 /* If we are targeting Intel L1OM, we must enable it. */
2332 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2333 || new_flag.bitfield.cpul1om)
2334 return;
2335
2336 /* If we are targeting Intel K1OM, we must enable it. */
2337 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2338 || new_flag.bitfield.cpuk1om)
2339 return;
2340
2341 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2342 #endif
2343 }
2344
2345 static void
2346 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2347 {
2348 SKIP_WHITESPACE ();
2349
2350 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2351 {
2352 char *string = input_line_pointer;
2353 int e = get_symbol_end ();
2354 unsigned int j;
2355 i386_cpu_flags flags;
2356
2357 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2358 {
2359 if (strcmp (string, cpu_arch[j].name) == 0)
2360 {
2361 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2362
2363 if (*string != '.')
2364 {
2365 cpu_arch_name = cpu_arch[j].name;
2366 cpu_sub_arch_name = NULL;
2367 cpu_arch_flags = cpu_arch[j].flags;
2368 if (flag_code == CODE_64BIT)
2369 {
2370 cpu_arch_flags.bitfield.cpu64 = 1;
2371 cpu_arch_flags.bitfield.cpuno64 = 0;
2372 }
2373 else
2374 {
2375 cpu_arch_flags.bitfield.cpu64 = 0;
2376 cpu_arch_flags.bitfield.cpuno64 = 1;
2377 }
2378 cpu_arch_isa = cpu_arch[j].type;
2379 cpu_arch_isa_flags = cpu_arch[j].flags;
2380 if (!cpu_arch_tune_set)
2381 {
2382 cpu_arch_tune = cpu_arch_isa;
2383 cpu_arch_tune_flags = cpu_arch_isa_flags;
2384 }
2385 break;
2386 }
2387
2388 if (!cpu_arch[j].negated)
2389 flags = cpu_flags_or (cpu_arch_flags,
2390 cpu_arch[j].flags);
2391 else
2392 flags = cpu_flags_and_not (cpu_arch_flags,
2393 cpu_arch[j].flags);
2394 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2395 {
2396 if (cpu_sub_arch_name)
2397 {
2398 char *name = cpu_sub_arch_name;
2399 cpu_sub_arch_name = concat (name,
2400 cpu_arch[j].name,
2401 (const char *) NULL);
2402 free (name);
2403 }
2404 else
2405 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2406 cpu_arch_flags = flags;
2407 cpu_arch_isa_flags = flags;
2408 }
2409 *input_line_pointer = e;
2410 demand_empty_rest_of_line ();
2411 return;
2412 }
2413 }
2414 if (j >= ARRAY_SIZE (cpu_arch))
2415 as_bad (_("no such architecture: `%s'"), string);
2416
2417 *input_line_pointer = e;
2418 }
2419 else
2420 as_bad (_("missing cpu architecture"));
2421
2422 no_cond_jump_promotion = 0;
2423 if (*input_line_pointer == ','
2424 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2425 {
2426 char *string = ++input_line_pointer;
2427 int e = get_symbol_end ();
2428
2429 if (strcmp (string, "nojumps") == 0)
2430 no_cond_jump_promotion = 1;
2431 else if (strcmp (string, "jumps") == 0)
2432 ;
2433 else
2434 as_bad (_("no such architecture modifier: `%s'"), string);
2435
2436 *input_line_pointer = e;
2437 }
2438
2439 demand_empty_rest_of_line ();
2440 }
2441
2442 enum bfd_architecture
2443 i386_arch (void)
2444 {
2445 if (cpu_arch_isa == PROCESSOR_L1OM)
2446 {
2447 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2448 || flag_code != CODE_64BIT)
2449 as_fatal (_("Intel L1OM is 64bit ELF only"));
2450 return bfd_arch_l1om;
2451 }
2452 else if (cpu_arch_isa == PROCESSOR_K1OM)
2453 {
2454 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2455 || flag_code != CODE_64BIT)
2456 as_fatal (_("Intel K1OM is 64bit ELF only"));
2457 return bfd_arch_k1om;
2458 }
2459 else
2460 return bfd_arch_i386;
2461 }
2462
2463 unsigned long
2464 i386_mach (void)
2465 {
2466 if (!strncmp (default_arch, "x86_64", 6))
2467 {
2468 if (cpu_arch_isa == PROCESSOR_L1OM)
2469 {
2470 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2471 || default_arch[6] != '\0')
2472 as_fatal (_("Intel L1OM is 64bit ELF only"));
2473 return bfd_mach_l1om;
2474 }
2475 else if (cpu_arch_isa == PROCESSOR_K1OM)
2476 {
2477 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2478 || default_arch[6] != '\0')
2479 as_fatal (_("Intel K1OM is 64bit ELF only"));
2480 return bfd_mach_k1om;
2481 }
2482 else if (default_arch[6] == '\0')
2483 return bfd_mach_x86_64;
2484 else
2485 return bfd_mach_x64_32;
2486 }
2487 else if (!strcmp (default_arch, "i386"))
2488 return bfd_mach_i386_i386;
2489 else
2490 as_fatal (_("unknown architecture"));
2491 }
2492 \f
2493 void
2494 md_begin (void)
2495 {
2496 const char *hash_err;
2497
2498 /* Initialize op_hash hash table. */
2499 op_hash = hash_new ();
2500
2501 {
2502 const insn_template *optab;
2503 templates *core_optab;
2504
2505 /* Setup for loop. */
2506 optab = i386_optab;
2507 core_optab = (templates *) xmalloc (sizeof (templates));
2508 core_optab->start = optab;
2509
2510 while (1)
2511 {
2512 ++optab;
2513 if (optab->name == NULL
2514 || strcmp (optab->name, (optab - 1)->name) != 0)
2515 {
2516 /* different name --> ship out current template list;
2517 add to hash table; & begin anew. */
2518 core_optab->end = optab;
2519 hash_err = hash_insert (op_hash,
2520 (optab - 1)->name,
2521 (void *) core_optab);
2522 if (hash_err)
2523 {
2524 as_fatal (_("can't hash %s: %s"),
2525 (optab - 1)->name,
2526 hash_err);
2527 }
2528 if (optab->name == NULL)
2529 break;
2530 core_optab = (templates *) xmalloc (sizeof (templates));
2531 core_optab->start = optab;
2532 }
2533 }
2534 }
2535
2536 /* Initialize reg_hash hash table. */
2537 reg_hash = hash_new ();
2538 {
2539 const reg_entry *regtab;
2540 unsigned int regtab_size = i386_regtab_size;
2541
2542 for (regtab = i386_regtab; regtab_size--; regtab++)
2543 {
2544 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2545 if (hash_err)
2546 as_fatal (_("can't hash %s: %s"),
2547 regtab->reg_name,
2548 hash_err);
2549 }
2550 }
2551
2552 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
2553 {
2554 int c;
2555 char *p;
2556
2557 for (c = 0; c < 256; c++)
2558 {
2559 if (ISDIGIT (c))
2560 {
2561 digit_chars[c] = c;
2562 mnemonic_chars[c] = c;
2563 register_chars[c] = c;
2564 operand_chars[c] = c;
2565 }
2566 else if (ISLOWER (c))
2567 {
2568 mnemonic_chars[c] = c;
2569 register_chars[c] = c;
2570 operand_chars[c] = c;
2571 }
2572 else if (ISUPPER (c))
2573 {
2574 mnemonic_chars[c] = TOLOWER (c);
2575 register_chars[c] = mnemonic_chars[c];
2576 operand_chars[c] = c;
2577 }
2578 else if (c == '{' || c == '}')
2579 operand_chars[c] = c;
2580
2581 if (ISALPHA (c) || ISDIGIT (c))
2582 identifier_chars[c] = c;
2583 else if (c >= 128)
2584 {
2585 identifier_chars[c] = c;
2586 operand_chars[c] = c;
2587 }
2588 }
2589
2590 #ifdef LEX_AT
2591 identifier_chars['@'] = '@';
2592 #endif
2593 #ifdef LEX_QM
2594 identifier_chars['?'] = '?';
2595 operand_chars['?'] = '?';
2596 #endif
2597 digit_chars['-'] = '-';
2598 mnemonic_chars['_'] = '_';
2599 mnemonic_chars['-'] = '-';
2600 mnemonic_chars['.'] = '.';
2601 identifier_chars['_'] = '_';
2602 identifier_chars['.'] = '.';
2603
2604 for (p = operand_special_chars; *p != '\0'; p++)
2605 operand_chars[(unsigned char) *p] = *p;
2606 }
2607
2608 if (flag_code == CODE_64BIT)
2609 {
2610 #if defined (OBJ_COFF) && defined (TE_PE)
2611 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2612 ? 32 : 16);
2613 #else
2614 x86_dwarf2_return_column = 16;
2615 #endif
2616 x86_cie_data_alignment = -8;
2617 }
2618 else
2619 {
2620 x86_dwarf2_return_column = 8;
2621 x86_cie_data_alignment = -4;
2622 }
2623 }
2624
2625 void
2626 i386_print_statistics (FILE *file)
2627 {
2628 hash_print_statistics (file, "i386 opcode", op_hash);
2629 hash_print_statistics (file, "i386 register", reg_hash);
2630 }
2631 \f
2632 #ifdef DEBUG386
2633
2634 /* Debugging routines for md_assemble. */
2635 static void pte (insn_template *);
2636 static void pt (i386_operand_type);
2637 static void pe (expressionS *);
2638 static void ps (symbolS *);
2639
2640 static void
2641 pi (char *line, i386_insn *x)
2642 {
2643 unsigned int j;
2644
2645 fprintf (stdout, "%s: template ", line);
2646 pte (&x->tm);
2647 fprintf (stdout, " address: base %s index %s scale %x\n",
2648 x->base_reg ? x->base_reg->reg_name : "none",
2649 x->index_reg ? x->index_reg->reg_name : "none",
2650 x->log2_scale_factor);
2651 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
2652 x->rm.mode, x->rm.reg, x->rm.regmem);
2653 fprintf (stdout, " sib: base %x index %x scale %x\n",
2654 x->sib.base, x->sib.index, x->sib.scale);
2655 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
2656 (x->rex & REX_W) != 0,
2657 (x->rex & REX_R) != 0,
2658 (x->rex & REX_X) != 0,
2659 (x->rex & REX_B) != 0);
2660 for (j = 0; j < x->operands; j++)
2661 {
2662 fprintf (stdout, " #%d: ", j + 1);
2663 pt (x->types[j]);
2664 fprintf (stdout, "\n");
2665 if (x->types[j].bitfield.reg8
2666 || x->types[j].bitfield.reg16
2667 || x->types[j].bitfield.reg32
2668 || x->types[j].bitfield.reg64
2669 || x->types[j].bitfield.regmmx
2670 || x->types[j].bitfield.regxmm
2671 || x->types[j].bitfield.regymm
2672 || x->types[j].bitfield.regzmm
2673 || x->types[j].bitfield.sreg2
2674 || x->types[j].bitfield.sreg3
2675 || x->types[j].bitfield.control
2676 || x->types[j].bitfield.debug
2677 || x->types[j].bitfield.test)
2678 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
2679 if (operand_type_check (x->types[j], imm))
2680 pe (x->op[j].imms);
2681 if (operand_type_check (x->types[j], disp))
2682 pe (x->op[j].disps);
2683 }
2684 }
2685
2686 static void
2687 pte (insn_template *t)
2688 {
2689 unsigned int j;
2690 fprintf (stdout, " %d operands ", t->operands);
2691 fprintf (stdout, "opcode %x ", t->base_opcode);
2692 if (t->extension_opcode != None)
2693 fprintf (stdout, "ext %x ", t->extension_opcode);
2694 if (t->opcode_modifier.d)
2695 fprintf (stdout, "D");
2696 if (t->opcode_modifier.w)
2697 fprintf (stdout, "W");
2698 fprintf (stdout, "\n");
2699 for (j = 0; j < t->operands; j++)
2700 {
2701 fprintf (stdout, " #%d type ", j + 1);
2702 pt (t->operand_types[j]);
2703 fprintf (stdout, "\n");
2704 }
2705 }
2706
2707 static void
2708 pe (expressionS *e)
2709 {
2710 fprintf (stdout, " operation %d\n", e->X_op);
2711 fprintf (stdout, " add_number %ld (%lx)\n",
2712 (long) e->X_add_number, (long) e->X_add_number);
2713 if (e->X_add_symbol)
2714 {
2715 fprintf (stdout, " add_symbol ");
2716 ps (e->X_add_symbol);
2717 fprintf (stdout, "\n");
2718 }
2719 if (e->X_op_symbol)
2720 {
2721 fprintf (stdout, " op_symbol ");
2722 ps (e->X_op_symbol);
2723 fprintf (stdout, "\n");
2724 }
2725 }
2726
2727 static void
2728 ps (symbolS *s)
2729 {
2730 fprintf (stdout, "%s type %s%s",
2731 S_GET_NAME (s),
2732 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
2733 segment_name (S_GET_SEGMENT (s)));
2734 }
2735
2736 static struct type_name
2737 {
2738 i386_operand_type mask;
2739 const char *name;
2740 }
2741 const type_names[] =
2742 {
2743 { OPERAND_TYPE_REG8, "r8" },
2744 { OPERAND_TYPE_REG16, "r16" },
2745 { OPERAND_TYPE_REG32, "r32" },
2746 { OPERAND_TYPE_REG64, "r64" },
2747 { OPERAND_TYPE_IMM8, "i8" },
2748 { OPERAND_TYPE_IMM8, "i8s" },
2749 { OPERAND_TYPE_IMM16, "i16" },
2750 { OPERAND_TYPE_IMM32, "i32" },
2751 { OPERAND_TYPE_IMM32S, "i32s" },
2752 { OPERAND_TYPE_IMM64, "i64" },
2753 { OPERAND_TYPE_IMM1, "i1" },
2754 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
2755 { OPERAND_TYPE_DISP8, "d8" },
2756 { OPERAND_TYPE_DISP16, "d16" },
2757 { OPERAND_TYPE_DISP32, "d32" },
2758 { OPERAND_TYPE_DISP32S, "d32s" },
2759 { OPERAND_TYPE_DISP64, "d64" },
2760 { OPERAND_TYPE_VEC_DISP8, "Vector d8" },
2761 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
2762 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
2763 { OPERAND_TYPE_CONTROL, "control reg" },
2764 { OPERAND_TYPE_TEST, "test reg" },
2765 { OPERAND_TYPE_DEBUG, "debug reg" },
2766 { OPERAND_TYPE_FLOATREG, "FReg" },
2767 { OPERAND_TYPE_FLOATACC, "FAcc" },
2768 { OPERAND_TYPE_SREG2, "SReg2" },
2769 { OPERAND_TYPE_SREG3, "SReg3" },
2770 { OPERAND_TYPE_ACC, "Acc" },
2771 { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
2772 { OPERAND_TYPE_REGMMX, "rMMX" },
2773 { OPERAND_TYPE_REGXMM, "rXMM" },
2774 { OPERAND_TYPE_REGYMM, "rYMM" },
2775 { OPERAND_TYPE_REGZMM, "rZMM" },
2776 { OPERAND_TYPE_REGMASK, "Mask reg" },
2777 { OPERAND_TYPE_ESSEG, "es" },
2778 };
2779
2780 static void
2781 pt (i386_operand_type t)
2782 {
2783 unsigned int j;
2784 i386_operand_type a;
2785
2786 for (j = 0; j < ARRAY_SIZE (type_names); j++)
2787 {
2788 a = operand_type_and (t, type_names[j].mask);
2789 if (!operand_type_all_zero (&a))
2790 fprintf (stdout, "%s, ", type_names[j].name);
2791 }
2792 fflush (stdout);
2793 }
2794
2795 #endif /* DEBUG386 */
2796 \f
2797 static bfd_reloc_code_real_type
2798 reloc (unsigned int size,
2799 int pcrel,
2800 int sign,
2801 int bnd_prefix,
2802 bfd_reloc_code_real_type other)
2803 {
2804 if (other != NO_RELOC)
2805 {
2806 reloc_howto_type *rel;
2807
2808 if (size == 8)
2809 switch (other)
2810 {
2811 case BFD_RELOC_X86_64_GOT32:
2812 return BFD_RELOC_X86_64_GOT64;
2813 break;
2814 case BFD_RELOC_X86_64_PLTOFF64:
2815 return BFD_RELOC_X86_64_PLTOFF64;
2816 break;
2817 case BFD_RELOC_X86_64_GOTPC32:
2818 other = BFD_RELOC_X86_64_GOTPC64;
2819 break;
2820 case BFD_RELOC_X86_64_GOTPCREL:
2821 other = BFD_RELOC_X86_64_GOTPCREL64;
2822 break;
2823 case BFD_RELOC_X86_64_TPOFF32:
2824 other = BFD_RELOC_X86_64_TPOFF64;
2825 break;
2826 case BFD_RELOC_X86_64_DTPOFF32:
2827 other = BFD_RELOC_X86_64_DTPOFF64;
2828 break;
2829 default:
2830 break;
2831 }
2832
2833 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2834 if (other == BFD_RELOC_SIZE32)
2835 {
2836 if (size == 8)
2837 return BFD_RELOC_SIZE64;
2838 if (pcrel)
2839 as_bad (_("there are no pc-relative size relocations"));
2840 }
2841 #endif
2842
2843 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
2844 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
2845 sign = -1;
2846
2847 rel = bfd_reloc_type_lookup (stdoutput, other);
2848 if (!rel)
2849 as_bad (_("unknown relocation (%u)"), other);
2850 else if (size != bfd_get_reloc_size (rel))
2851 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
2852 bfd_get_reloc_size (rel),
2853 size);
2854 else if (pcrel && !rel->pc_relative)
2855 as_bad (_("non-pc-relative relocation for pc-relative field"));
2856 else if ((rel->complain_on_overflow == complain_overflow_signed
2857 && !sign)
2858 || (rel->complain_on_overflow == complain_overflow_unsigned
2859 && sign > 0))
2860 as_bad (_("relocated field and relocation type differ in signedness"));
2861 else
2862 return other;
2863 return NO_RELOC;
2864 }
2865
2866 if (pcrel)
2867 {
2868 if (!sign)
2869 as_bad (_("there are no unsigned pc-relative relocations"));
2870 switch (size)
2871 {
2872 case 1: return BFD_RELOC_8_PCREL;
2873 case 2: return BFD_RELOC_16_PCREL;
2874 case 4: return (bnd_prefix && object_64bit
2875 ? BFD_RELOC_X86_64_PC32_BND
2876 : BFD_RELOC_32_PCREL);
2877 case 8: return BFD_RELOC_64_PCREL;
2878 }
2879 as_bad (_("cannot do %u byte pc-relative relocation"), size);
2880 }
2881 else
2882 {
2883 if (sign > 0)
2884 switch (size)
2885 {
2886 case 4: return BFD_RELOC_X86_64_32S;
2887 }
2888 else
2889 switch (size)
2890 {
2891 case 1: return BFD_RELOC_8;
2892 case 2: return BFD_RELOC_16;
2893 case 4: return BFD_RELOC_32;
2894 case 8: return BFD_RELOC_64;
2895 }
2896 as_bad (_("cannot do %s %u byte relocation"),
2897 sign > 0 ? "signed" : "unsigned", size);
2898 }
2899
2900 return NO_RELOC;
2901 }
2902
2903 /* Here we decide which fixups can be adjusted to make them relative to
2904 the beginning of the section instead of the symbol. Basically we need
2905 to make sure that the dynamic relocations are done correctly, so in
2906 some cases we force the original symbol to be used. */
2907
2908 int
2909 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
2910 {
2911 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2912 if (!IS_ELF)
2913 return 1;
2914
2915 /* Don't adjust pc-relative references to merge sections in 64-bit
2916 mode. */
2917 if (use_rela_relocations
2918 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
2919 && fixP->fx_pcrel)
2920 return 0;
2921
2922 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
2923 and changed later by validate_fix. */
2924 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
2925 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
2926 return 0;
2927
2928 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
2929 for size relocations. */
2930 if (fixP->fx_r_type == BFD_RELOC_SIZE32
2931 || fixP->fx_r_type == BFD_RELOC_SIZE64
2932 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
2933 || fixP->fx_r_type == BFD_RELOC_386_PLT32
2934 || fixP->fx_r_type == BFD_RELOC_386_GOT32
2935 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
2936 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
2937 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
2938 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
2939 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
2940 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
2941 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
2942 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
2943 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
2944 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
2945 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
2946 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
2947 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
2948 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
2949 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
2950 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
2951 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
2952 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
2953 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
2954 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
2955 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
2956 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
2957 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
2958 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
2959 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
2960 return 0;
2961 #endif
2962 return 1;
2963 }
2964
2965 static int
2966 intel_float_operand (const char *mnemonic)
2967 {
2968 /* Note that the value returned is meaningful only for opcodes with (memory)
2969 operands, hence the code here is free to improperly handle opcodes that
2970 have no operands (for better performance and smaller code). */
2971
2972 if (mnemonic[0] != 'f')
2973 return 0; /* non-math */
2974
2975 switch (mnemonic[1])
2976 {
2977 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
2978 the fs segment override prefix not currently handled because no
2979 call path can make opcodes without operands get here */
2980 case 'i':
2981 return 2 /* integer op */;
2982 case 'l':
2983 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
2984 return 3; /* fldcw/fldenv */
2985 break;
2986 case 'n':
2987 if (mnemonic[2] != 'o' /* fnop */)
2988 return 3; /* non-waiting control op */
2989 break;
2990 case 'r':
2991 if (mnemonic[2] == 's')
2992 return 3; /* frstor/frstpm */
2993 break;
2994 case 's':
2995 if (mnemonic[2] == 'a')
2996 return 3; /* fsave */
2997 if (mnemonic[2] == 't')
2998 {
2999 switch (mnemonic[3])
3000 {
3001 case 'c': /* fstcw */
3002 case 'd': /* fstdw */
3003 case 'e': /* fstenv */
3004 case 's': /* fsts[gw] */
3005 return 3;
3006 }
3007 }
3008 break;
3009 case 'x':
3010 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3011 return 0; /* fxsave/fxrstor are not really math ops */
3012 break;
3013 }
3014
3015 return 1;
3016 }
3017
3018 /* Build the VEX prefix. */
3019
3020 static void
3021 build_vex_prefix (const insn_template *t)
3022 {
3023 unsigned int register_specifier;
3024 unsigned int implied_prefix;
3025 unsigned int vector_length;
3026
3027 /* Check register specifier. */
3028 if (i.vex.register_specifier)
3029 {
3030 register_specifier =
3031 ~register_number (i.vex.register_specifier) & 0xf;
3032 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3033 }
3034 else
3035 register_specifier = 0xf;
3036
3037 /* Use 2-byte VEX prefix by swappping destination and source
3038 operand. */
3039 if (!i.swap_operand
3040 && i.operands == i.reg_operands
3041 && i.tm.opcode_modifier.vexopcode == VEX0F
3042 && i.tm.opcode_modifier.s
3043 && i.rex == REX_B)
3044 {
3045 unsigned int xchg = i.operands - 1;
3046 union i386_op temp_op;
3047 i386_operand_type temp_type;
3048
3049 temp_type = i.types[xchg];
3050 i.types[xchg] = i.types[0];
3051 i.types[0] = temp_type;
3052 temp_op = i.op[xchg];
3053 i.op[xchg] = i.op[0];
3054 i.op[0] = temp_op;
3055
3056 gas_assert (i.rm.mode == 3);
3057
3058 i.rex = REX_R;
3059 xchg = i.rm.regmem;
3060 i.rm.regmem = i.rm.reg;
3061 i.rm.reg = xchg;
3062
3063 /* Use the next insn. */
3064 i.tm = t[1];
3065 }
3066
3067 if (i.tm.opcode_modifier.vex == VEXScalar)
3068 vector_length = avxscalar;
3069 else
3070 vector_length = i.tm.opcode_modifier.vex == VEX256 ? 1 : 0;
3071
3072 switch ((i.tm.base_opcode >> 8) & 0xff)
3073 {
3074 case 0:
3075 implied_prefix = 0;
3076 break;
3077 case DATA_PREFIX_OPCODE:
3078 implied_prefix = 1;
3079 break;
3080 case REPE_PREFIX_OPCODE:
3081 implied_prefix = 2;
3082 break;
3083 case REPNE_PREFIX_OPCODE:
3084 implied_prefix = 3;
3085 break;
3086 default:
3087 abort ();
3088 }
3089
3090 /* Use 2-byte VEX prefix if possible. */
3091 if (i.tm.opcode_modifier.vexopcode == VEX0F
3092 && i.tm.opcode_modifier.vexw != VEXW1
3093 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3094 {
3095 /* 2-byte VEX prefix. */
3096 unsigned int r;
3097
3098 i.vex.length = 2;
3099 i.vex.bytes[0] = 0xc5;
3100
3101 /* Check the REX.R bit. */
3102 r = (i.rex & REX_R) ? 0 : 1;
3103 i.vex.bytes[1] = (r << 7
3104 | register_specifier << 3
3105 | vector_length << 2
3106 | implied_prefix);
3107 }
3108 else
3109 {
3110 /* 3-byte VEX prefix. */
3111 unsigned int m, w;
3112
3113 i.vex.length = 3;
3114
3115 switch (i.tm.opcode_modifier.vexopcode)
3116 {
3117 case VEX0F:
3118 m = 0x1;
3119 i.vex.bytes[0] = 0xc4;
3120 break;
3121 case VEX0F38:
3122 m = 0x2;
3123 i.vex.bytes[0] = 0xc4;
3124 break;
3125 case VEX0F3A:
3126 m = 0x3;
3127 i.vex.bytes[0] = 0xc4;
3128 break;
3129 case XOP08:
3130 m = 0x8;
3131 i.vex.bytes[0] = 0x8f;
3132 break;
3133 case XOP09:
3134 m = 0x9;
3135 i.vex.bytes[0] = 0x8f;
3136 break;
3137 case XOP0A:
3138 m = 0xa;
3139 i.vex.bytes[0] = 0x8f;
3140 break;
3141 default:
3142 abort ();
3143 }
3144
3145 /* The high 3 bits of the second VEX byte are 1's compliment
3146 of RXB bits from REX. */
3147 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3148
3149 /* Check the REX.W bit. */
3150 w = (i.rex & REX_W) ? 1 : 0;
3151 if (i.tm.opcode_modifier.vexw)
3152 {
3153 if (w)
3154 abort ();
3155
3156 if (i.tm.opcode_modifier.vexw == VEXW1)
3157 w = 1;
3158 }
3159
3160 i.vex.bytes[2] = (w << 7
3161 | register_specifier << 3
3162 | vector_length << 2
3163 | implied_prefix);
3164 }
3165 }
3166
3167 /* Build the EVEX prefix. */
3168
3169 static void
3170 build_evex_prefix (void)
3171 {
3172 unsigned int register_specifier;
3173 unsigned int implied_prefix;
3174 unsigned int m, w;
3175 rex_byte vrex_used = 0;
3176
3177 /* Check register specifier. */
3178 if (i.vex.register_specifier)
3179 {
3180 gas_assert ((i.vrex & REX_X) == 0);
3181
3182 register_specifier = i.vex.register_specifier->reg_num;
3183 if ((i.vex.register_specifier->reg_flags & RegRex))
3184 register_specifier += 8;
3185 /* The upper 16 registers are encoded in the fourth byte of the
3186 EVEX prefix. */
3187 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3188 i.vex.bytes[3] = 0x8;
3189 register_specifier = ~register_specifier & 0xf;
3190 }
3191 else
3192 {
3193 register_specifier = 0xf;
3194
3195 /* Encode upper 16 vector index register in the fourth byte of
3196 the EVEX prefix. */
3197 if (!(i.vrex & REX_X))
3198 i.vex.bytes[3] = 0x8;
3199 else
3200 vrex_used |= REX_X;
3201 }
3202
3203 switch ((i.tm.base_opcode >> 8) & 0xff)
3204 {
3205 case 0:
3206 implied_prefix = 0;
3207 break;
3208 case DATA_PREFIX_OPCODE:
3209 implied_prefix = 1;
3210 break;
3211 case REPE_PREFIX_OPCODE:
3212 implied_prefix = 2;
3213 break;
3214 case REPNE_PREFIX_OPCODE:
3215 implied_prefix = 3;
3216 break;
3217 default:
3218 abort ();
3219 }
3220
3221 /* 4 byte EVEX prefix. */
3222 i.vex.length = 4;
3223 i.vex.bytes[0] = 0x62;
3224
3225 /* mmmm bits. */
3226 switch (i.tm.opcode_modifier.vexopcode)
3227 {
3228 case VEX0F:
3229 m = 1;
3230 break;
3231 case VEX0F38:
3232 m = 2;
3233 break;
3234 case VEX0F3A:
3235 m = 3;
3236 break;
3237 default:
3238 abort ();
3239 break;
3240 }
3241
3242 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3243 bits from REX. */
3244 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3245
3246 /* The fifth bit of the second EVEX byte is 1's compliment of the
3247 REX_R bit in VREX. */
3248 if (!(i.vrex & REX_R))
3249 i.vex.bytes[1] |= 0x10;
3250 else
3251 vrex_used |= REX_R;
3252
3253 if ((i.reg_operands + i.imm_operands) == i.operands)
3254 {
3255 /* When all operands are registers, the REX_X bit in REX is not
3256 used. We reuse it to encode the upper 16 registers, which is
3257 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3258 as 1's compliment. */
3259 if ((i.vrex & REX_B))
3260 {
3261 vrex_used |= REX_B;
3262 i.vex.bytes[1] &= ~0x40;
3263 }
3264 }
3265
3266 /* EVEX instructions shouldn't need the REX prefix. */
3267 i.vrex &= ~vrex_used;
3268 gas_assert (i.vrex == 0);
3269
3270 /* Check the REX.W bit. */
3271 w = (i.rex & REX_W) ? 1 : 0;
3272 if (i.tm.opcode_modifier.vexw)
3273 {
3274 if (i.tm.opcode_modifier.vexw == VEXW1)
3275 w = 1;
3276 }
3277 /* If w is not set it means we are dealing with WIG instruction. */
3278 else if (!w)
3279 {
3280 if (evexwig == evexw1)
3281 w = 1;
3282 }
3283
3284 /* Encode the U bit. */
3285 implied_prefix |= 0x4;
3286
3287 /* The third byte of the EVEX prefix. */
3288 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3289
3290 /* The fourth byte of the EVEX prefix. */
3291 /* The zeroing-masking bit. */
3292 if (i.mask && i.mask->zeroing)
3293 i.vex.bytes[3] |= 0x80;
3294
3295 /* Don't always set the broadcast bit if there is no RC. */
3296 if (!i.rounding)
3297 {
3298 /* Encode the vector length. */
3299 unsigned int vec_length;
3300
3301 switch (i.tm.opcode_modifier.evex)
3302 {
3303 case EVEXLIG: /* LL' is ignored */
3304 vec_length = evexlig << 5;
3305 break;
3306 case EVEX128:
3307 vec_length = 0 << 5;
3308 break;
3309 case EVEX256:
3310 vec_length = 1 << 5;
3311 break;
3312 case EVEX512:
3313 vec_length = 2 << 5;
3314 break;
3315 default:
3316 abort ();
3317 break;
3318 }
3319 i.vex.bytes[3] |= vec_length;
3320 /* Encode the broadcast bit. */
3321 if (i.broadcast)
3322 i.vex.bytes[3] |= 0x10;
3323 }
3324 else
3325 {
3326 if (i.rounding->type != saeonly)
3327 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3328 else
3329 i.vex.bytes[3] |= 0x10;
3330 }
3331
3332 if (i.mask && i.mask->mask)
3333 i.vex.bytes[3] |= i.mask->mask->reg_num;
3334 }
3335
3336 static void
3337 process_immext (void)
3338 {
3339 expressionS *exp;
3340
3341 if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3342 && i.operands > 0)
3343 {
3344 /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3345 with an opcode suffix which is coded in the same place as an
3346 8-bit immediate field would be.
3347 Here we check those operands and remove them afterwards. */
3348 unsigned int x;
3349
3350 for (x = 0; x < i.operands; x++)
3351 if (register_number (i.op[x].regs) != x)
3352 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3353 register_prefix, i.op[x].regs->reg_name, x + 1,
3354 i.tm.name);
3355
3356 i.operands = 0;
3357 }
3358
3359 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3360 which is coded in the same place as an 8-bit immediate field
3361 would be. Here we fake an 8-bit immediate operand from the
3362 opcode suffix stored in tm.extension_opcode.
3363
3364 AVX instructions also use this encoding, for some of
3365 3 argument instructions. */
3366
3367 gas_assert (i.imm_operands <= 1
3368 && (i.operands <= 2
3369 || ((i.tm.opcode_modifier.vex
3370 || i.tm.opcode_modifier.evex)
3371 && i.operands <= 4)));
3372
3373 exp = &im_expressions[i.imm_operands++];
3374 i.op[i.operands].imms = exp;
3375 i.types[i.operands] = imm8;
3376 i.operands++;
3377 exp->X_op = O_constant;
3378 exp->X_add_number = i.tm.extension_opcode;
3379 i.tm.extension_opcode = None;
3380 }
3381
3382
3383 static int
3384 check_hle (void)
3385 {
3386 switch (i.tm.opcode_modifier.hleprefixok)
3387 {
3388 default:
3389 abort ();
3390 case HLEPrefixNone:
3391 as_bad (_("invalid instruction `%s' after `%s'"),
3392 i.tm.name, i.hle_prefix);
3393 return 0;
3394 case HLEPrefixLock:
3395 if (i.prefix[LOCK_PREFIX])
3396 return 1;
3397 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3398 return 0;
3399 case HLEPrefixAny:
3400 return 1;
3401 case HLEPrefixRelease:
3402 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3403 {
3404 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3405 i.tm.name);
3406 return 0;
3407 }
3408 if (i.mem_operands == 0
3409 || !operand_type_check (i.types[i.operands - 1], anymem))
3410 {
3411 as_bad (_("memory destination needed for instruction `%s'"
3412 " after `xrelease'"), i.tm.name);
3413 return 0;
3414 }
3415 return 1;
3416 }
3417 }
3418
3419 /* This is the guts of the machine-dependent assembler. LINE points to a
3420 machine dependent instruction. This function is supposed to emit
3421 the frags/bytes it assembles to. */
3422
3423 void
3424 md_assemble (char *line)
3425 {
3426 unsigned int j;
3427 char mnemonic[MAX_MNEM_SIZE];
3428 const insn_template *t;
3429
3430 /* Initialize globals. */
3431 memset (&i, '\0', sizeof (i));
3432 for (j = 0; j < MAX_OPERANDS; j++)
3433 i.reloc[j] = NO_RELOC;
3434 memset (disp_expressions, '\0', sizeof (disp_expressions));
3435 memset (im_expressions, '\0', sizeof (im_expressions));
3436 save_stack_p = save_stack;
3437
3438 /* First parse an instruction mnemonic & call i386_operand for the operands.
3439 We assume that the scrubber has arranged it so that line[0] is the valid
3440 start of a (possibly prefixed) mnemonic. */
3441
3442 line = parse_insn (line, mnemonic);
3443 if (line == NULL)
3444 return;
3445
3446 line = parse_operands (line, mnemonic);
3447 this_operand = -1;
3448 if (line == NULL)
3449 return;
3450
3451 /* Now we've parsed the mnemonic into a set of templates, and have the
3452 operands at hand. */
3453
3454 /* All intel opcodes have reversed operands except for "bound" and
3455 "enter". We also don't reverse intersegment "jmp" and "call"
3456 instructions with 2 immediate operands so that the immediate segment
3457 precedes the offset, as it does when in AT&T mode. */
3458 if (intel_syntax
3459 && i.operands > 1
3460 && (strcmp (mnemonic, "bound") != 0)
3461 && (strcmp (mnemonic, "invlpga") != 0)
3462 && !(operand_type_check (i.types[0], imm)
3463 && operand_type_check (i.types[1], imm)))
3464 swap_operands ();
3465
3466 /* The order of the immediates should be reversed
3467 for 2 immediates extrq and insertq instructions */
3468 if (i.imm_operands == 2
3469 && (strcmp (mnemonic, "extrq") == 0
3470 || strcmp (mnemonic, "insertq") == 0))
3471 swap_2_operands (0, 1);
3472
3473 if (i.imm_operands)
3474 optimize_imm ();
3475
3476 /* Don't optimize displacement for movabs since it only takes 64bit
3477 displacement. */
3478 if (i.disp_operands
3479 && i.disp_encoding != disp_encoding_32bit
3480 && (flag_code != CODE_64BIT
3481 || strcmp (mnemonic, "movabs") != 0))
3482 optimize_disp ();
3483
3484 /* Next, we find a template that matches the given insn,
3485 making sure the overlap of the given operands types is consistent
3486 with the template operand types. */
3487
3488 if (!(t = match_template ()))
3489 return;
3490
3491 if (sse_check != check_none
3492 && !i.tm.opcode_modifier.noavx
3493 && (i.tm.cpu_flags.bitfield.cpusse
3494 || i.tm.cpu_flags.bitfield.cpusse2
3495 || i.tm.cpu_flags.bitfield.cpusse3
3496 || i.tm.cpu_flags.bitfield.cpussse3
3497 || i.tm.cpu_flags.bitfield.cpusse4_1
3498 || i.tm.cpu_flags.bitfield.cpusse4_2))
3499 {
3500 (sse_check == check_warning
3501 ? as_warn
3502 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
3503 }
3504
3505 /* Zap movzx and movsx suffix. The suffix has been set from
3506 "word ptr" or "byte ptr" on the source operand in Intel syntax
3507 or extracted from mnemonic in AT&T syntax. But we'll use
3508 the destination register to choose the suffix for encoding. */
3509 if ((i.tm.base_opcode & ~9) == 0x0fb6)
3510 {
3511 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
3512 there is no suffix, the default will be byte extension. */
3513 if (i.reg_operands != 2
3514 && !i.suffix
3515 && intel_syntax)
3516 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
3517
3518 i.suffix = 0;
3519 }
3520
3521 if (i.tm.opcode_modifier.fwait)
3522 if (!add_prefix (FWAIT_OPCODE))
3523 return;
3524
3525 /* Check if REP prefix is OK. */
3526 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
3527 {
3528 as_bad (_("invalid instruction `%s' after `%s'"),
3529 i.tm.name, i.rep_prefix);
3530 return;
3531 }
3532
3533 /* Check for lock without a lockable instruction. Destination operand
3534 must be memory unless it is xchg (0x86). */
3535 if (i.prefix[LOCK_PREFIX]
3536 && (!i.tm.opcode_modifier.islockable
3537 || i.mem_operands == 0
3538 || (i.tm.base_opcode != 0x86
3539 && !operand_type_check (i.types[i.operands - 1], anymem))))
3540 {
3541 as_bad (_("expecting lockable instruction after `lock'"));
3542 return;
3543 }
3544
3545 /* Check if HLE prefix is OK. */
3546 if (i.hle_prefix && !check_hle ())
3547 return;
3548
3549 /* Check BND prefix. */
3550 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
3551 as_bad (_("expecting valid branch instruction after `bnd'"));
3552
3553 if (i.tm.cpu_flags.bitfield.cpumpx
3554 && flag_code == CODE_64BIT
3555 && i.prefix[ADDR_PREFIX])
3556 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
3557
3558 /* Insert BND prefix. */
3559 if (add_bnd_prefix
3560 && i.tm.opcode_modifier.bndprefixok
3561 && !i.prefix[BND_PREFIX])
3562 add_prefix (BND_PREFIX_OPCODE);
3563
3564 /* Check string instruction segment overrides. */
3565 if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
3566 {
3567 if (!check_string ())
3568 return;
3569 i.disp_operands = 0;
3570 }
3571
3572 if (!process_suffix ())
3573 return;
3574
3575 /* Update operand types. */
3576 for (j = 0; j < i.operands; j++)
3577 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
3578
3579 /* Make still unresolved immediate matches conform to size of immediate
3580 given in i.suffix. */
3581 if (!finalize_imm ())
3582 return;
3583
3584 if (i.types[0].bitfield.imm1)
3585 i.imm_operands = 0; /* kludge for shift insns. */
3586
3587 /* We only need to check those implicit registers for instructions
3588 with 3 operands or less. */
3589 if (i.operands <= 3)
3590 for (j = 0; j < i.operands; j++)
3591 if (i.types[j].bitfield.inoutportreg
3592 || i.types[j].bitfield.shiftcount
3593 || i.types[j].bitfield.acc
3594 || i.types[j].bitfield.floatacc)
3595 i.reg_operands--;
3596
3597 /* ImmExt should be processed after SSE2AVX. */
3598 if (!i.tm.opcode_modifier.sse2avx
3599 && i.tm.opcode_modifier.immext)
3600 process_immext ();
3601
3602 /* For insns with operands there are more diddles to do to the opcode. */
3603 if (i.operands)
3604 {
3605 if (!process_operands ())
3606 return;
3607 }
3608 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
3609 {
3610 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
3611 as_warn (_("translating to `%sp'"), i.tm.name);
3612 }
3613
3614 if (i.tm.opcode_modifier.vex)
3615 build_vex_prefix (t);
3616
3617 if (i.tm.opcode_modifier.evex)
3618 build_evex_prefix ();
3619
3620 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
3621 instructions may define INT_OPCODE as well, so avoid this corner
3622 case for those instructions that use MODRM. */
3623 if (i.tm.base_opcode == INT_OPCODE
3624 && !i.tm.opcode_modifier.modrm
3625 && i.op[0].imms->X_add_number == 3)
3626 {
3627 i.tm.base_opcode = INT3_OPCODE;
3628 i.imm_operands = 0;
3629 }
3630
3631 if ((i.tm.opcode_modifier.jump
3632 || i.tm.opcode_modifier.jumpbyte
3633 || i.tm.opcode_modifier.jumpdword)
3634 && i.op[0].disps->X_op == O_constant)
3635 {
3636 /* Convert "jmp constant" (and "call constant") to a jump (call) to
3637 the absolute address given by the constant. Since ix86 jumps and
3638 calls are pc relative, we need to generate a reloc. */
3639 i.op[0].disps->X_add_symbol = &abs_symbol;
3640 i.op[0].disps->X_op = O_symbol;
3641 }
3642
3643 if (i.tm.opcode_modifier.rex64)
3644 i.rex |= REX_W;
3645
3646 /* For 8 bit registers we need an empty rex prefix. Also if the
3647 instruction already has a prefix, we need to convert old
3648 registers to new ones. */
3649
3650 if ((i.types[0].bitfield.reg8
3651 && (i.op[0].regs->reg_flags & RegRex64) != 0)
3652 || (i.types[1].bitfield.reg8
3653 && (i.op[1].regs->reg_flags & RegRex64) != 0)
3654 || ((i.types[0].bitfield.reg8
3655 || i.types[1].bitfield.reg8)
3656 && i.rex != 0))
3657 {
3658 int x;
3659
3660 i.rex |= REX_OPCODE;
3661 for (x = 0; x < 2; x++)
3662 {
3663 /* Look for 8 bit operand that uses old registers. */
3664 if (i.types[x].bitfield.reg8
3665 && (i.op[x].regs->reg_flags & RegRex64) == 0)
3666 {
3667 /* In case it is "hi" register, give up. */
3668 if (i.op[x].regs->reg_num > 3)
3669 as_bad (_("can't encode register '%s%s' in an "
3670 "instruction requiring REX prefix."),
3671 register_prefix, i.op[x].regs->reg_name);
3672
3673 /* Otherwise it is equivalent to the extended register.
3674 Since the encoding doesn't change this is merely
3675 cosmetic cleanup for debug output. */
3676
3677 i.op[x].regs = i.op[x].regs + 8;
3678 }
3679 }
3680 }
3681
3682 if (i.rex != 0)
3683 add_prefix (REX_OPCODE | i.rex);
3684
3685 /* We are ready to output the insn. */
3686 output_insn ();
3687 }
3688
3689 static char *
3690 parse_insn (char *line, char *mnemonic)
3691 {
3692 char *l = line;
3693 char *token_start = l;
3694 char *mnem_p;
3695 int supported;
3696 const insn_template *t;
3697 char *dot_p = NULL;
3698
3699 while (1)
3700 {
3701 mnem_p = mnemonic;
3702 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
3703 {
3704 if (*mnem_p == '.')
3705 dot_p = mnem_p;
3706 mnem_p++;
3707 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
3708 {
3709 as_bad (_("no such instruction: `%s'"), token_start);
3710 return NULL;
3711 }
3712 l++;
3713 }
3714 if (!is_space_char (*l)
3715 && *l != END_OF_INSN
3716 && (intel_syntax
3717 || (*l != PREFIX_SEPARATOR
3718 && *l != ',')))
3719 {
3720 as_bad (_("invalid character %s in mnemonic"),
3721 output_invalid (*l));
3722 return NULL;
3723 }
3724 if (token_start == l)
3725 {
3726 if (!intel_syntax && *l == PREFIX_SEPARATOR)
3727 as_bad (_("expecting prefix; got nothing"));
3728 else
3729 as_bad (_("expecting mnemonic; got nothing"));
3730 return NULL;
3731 }
3732
3733 /* Look up instruction (or prefix) via hash table. */
3734 current_templates = (const templates *) hash_find (op_hash, mnemonic);
3735
3736 if (*l != END_OF_INSN
3737 && (!is_space_char (*l) || l[1] != END_OF_INSN)
3738 && current_templates
3739 && current_templates->start->opcode_modifier.isprefix)
3740 {
3741 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
3742 {
3743 as_bad ((flag_code != CODE_64BIT
3744 ? _("`%s' is only supported in 64-bit mode")
3745 : _("`%s' is not supported in 64-bit mode")),
3746 current_templates->start->name);
3747 return NULL;
3748 }
3749 /* If we are in 16-bit mode, do not allow addr16 or data16.
3750 Similarly, in 32-bit mode, do not allow addr32 or data32. */
3751 if ((current_templates->start->opcode_modifier.size16
3752 || current_templates->start->opcode_modifier.size32)
3753 && flag_code != CODE_64BIT
3754 && (current_templates->start->opcode_modifier.size32
3755 ^ (flag_code == CODE_16BIT)))
3756 {
3757 as_bad (_("redundant %s prefix"),
3758 current_templates->start->name);
3759 return NULL;
3760 }
3761 /* Add prefix, checking for repeated prefixes. */
3762 switch (add_prefix (current_templates->start->base_opcode))
3763 {
3764 case PREFIX_EXIST:
3765 return NULL;
3766 case PREFIX_REP:
3767 if (current_templates->start->cpu_flags.bitfield.cpuhle)
3768 i.hle_prefix = current_templates->start->name;
3769 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
3770 i.bnd_prefix = current_templates->start->name;
3771 else
3772 i.rep_prefix = current_templates->start->name;
3773 break;
3774 default:
3775 break;
3776 }
3777 /* Skip past PREFIX_SEPARATOR and reset token_start. */
3778 token_start = ++l;
3779 }
3780 else
3781 break;
3782 }
3783
3784 if (!current_templates)
3785 {
3786 /* Check if we should swap operand or force 32bit displacement in
3787 encoding. */
3788 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
3789 i.swap_operand = 1;
3790 else if (mnem_p - 3 == dot_p
3791 && dot_p[1] == 'd'
3792 && dot_p[2] == '8')
3793 i.disp_encoding = disp_encoding_8bit;
3794 else if (mnem_p - 4 == dot_p
3795 && dot_p[1] == 'd'
3796 && dot_p[2] == '3'
3797 && dot_p[3] == '2')
3798 i.disp_encoding = disp_encoding_32bit;
3799 else
3800 goto check_suffix;
3801 mnem_p = dot_p;
3802 *dot_p = '\0';
3803 current_templates = (const templates *) hash_find (op_hash, mnemonic);
3804 }
3805
3806 if (!current_templates)
3807 {
3808 check_suffix:
3809 /* See if we can get a match by trimming off a suffix. */
3810 switch (mnem_p[-1])
3811 {
3812 case WORD_MNEM_SUFFIX:
3813 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
3814 i.suffix = SHORT_MNEM_SUFFIX;
3815 else
3816 case BYTE_MNEM_SUFFIX:
3817 case QWORD_MNEM_SUFFIX:
3818 i.suffix = mnem_p[-1];
3819 mnem_p[-1] = '\0';
3820 current_templates = (const templates *) hash_find (op_hash,
3821 mnemonic);
3822 break;
3823 case SHORT_MNEM_SUFFIX:
3824 case LONG_MNEM_SUFFIX:
3825 if (!intel_syntax)
3826 {
3827 i.suffix = mnem_p[-1];
3828 mnem_p[-1] = '\0';
3829 current_templates = (const templates *) hash_find (op_hash,
3830 mnemonic);
3831 }
3832 break;
3833
3834 /* Intel Syntax. */
3835 case 'd':
3836 if (intel_syntax)
3837 {
3838 if (intel_float_operand (mnemonic) == 1)
3839 i.suffix = SHORT_MNEM_SUFFIX;
3840 else
3841 i.suffix = LONG_MNEM_SUFFIX;
3842 mnem_p[-1] = '\0';
3843 current_templates = (const templates *) hash_find (op_hash,
3844 mnemonic);
3845 }
3846 break;
3847 }
3848 if (!current_templates)
3849 {
3850 as_bad (_("no such instruction: `%s'"), token_start);
3851 return NULL;
3852 }
3853 }
3854
3855 if (current_templates->start->opcode_modifier.jump
3856 || current_templates->start->opcode_modifier.jumpbyte)
3857 {
3858 /* Check for a branch hint. We allow ",pt" and ",pn" for
3859 predict taken and predict not taken respectively.
3860 I'm not sure that branch hints actually do anything on loop
3861 and jcxz insns (JumpByte) for current Pentium4 chips. They
3862 may work in the future and it doesn't hurt to accept them
3863 now. */
3864 if (l[0] == ',' && l[1] == 'p')
3865 {
3866 if (l[2] == 't')
3867 {
3868 if (!add_prefix (DS_PREFIX_OPCODE))
3869 return NULL;
3870 l += 3;
3871 }
3872 else if (l[2] == 'n')
3873 {
3874 if (!add_prefix (CS_PREFIX_OPCODE))
3875 return NULL;
3876 l += 3;
3877 }
3878 }
3879 }
3880 /* Any other comma loses. */
3881 if (*l == ',')
3882 {
3883 as_bad (_("invalid character %s in mnemonic"),
3884 output_invalid (*l));
3885 return NULL;
3886 }
3887
3888 /* Check if instruction is supported on specified architecture. */
3889 supported = 0;
3890 for (t = current_templates->start; t < current_templates->end; ++t)
3891 {
3892 supported |= cpu_flags_match (t);
3893 if (supported == CPU_FLAGS_PERFECT_MATCH)
3894 goto skip;
3895 }
3896
3897 if (!(supported & CPU_FLAGS_64BIT_MATCH))
3898 {
3899 as_bad (flag_code == CODE_64BIT
3900 ? _("`%s' is not supported in 64-bit mode")
3901 : _("`%s' is only supported in 64-bit mode"),
3902 current_templates->start->name);
3903 return NULL;
3904 }
3905 if (supported != CPU_FLAGS_PERFECT_MATCH)
3906 {
3907 as_bad (_("`%s' is not supported on `%s%s'"),
3908 current_templates->start->name,
3909 cpu_arch_name ? cpu_arch_name : default_arch,
3910 cpu_sub_arch_name ? cpu_sub_arch_name : "");
3911 return NULL;
3912 }
3913
3914 skip:
3915 if (!cpu_arch_flags.bitfield.cpui386
3916 && (flag_code != CODE_16BIT))
3917 {
3918 as_warn (_("use .code16 to ensure correct addressing mode"));
3919 }
3920
3921 return l;
3922 }
3923
3924 static char *
3925 parse_operands (char *l, const char *mnemonic)
3926 {
3927 char *token_start;
3928
3929 /* 1 if operand is pending after ','. */
3930 unsigned int expecting_operand = 0;
3931
3932 /* Non-zero if operand parens not balanced. */
3933 unsigned int paren_not_balanced;
3934
3935 while (*l != END_OF_INSN)
3936 {
3937 /* Skip optional white space before operand. */
3938 if (is_space_char (*l))
3939 ++l;
3940 if (!is_operand_char (*l) && *l != END_OF_INSN)
3941 {
3942 as_bad (_("invalid character %s before operand %d"),
3943 output_invalid (*l),
3944 i.operands + 1);
3945 return NULL;
3946 }
3947 token_start = l; /* after white space */
3948 paren_not_balanced = 0;
3949 while (paren_not_balanced || *l != ',')
3950 {
3951 if (*l == END_OF_INSN)
3952 {
3953 if (paren_not_balanced)
3954 {
3955 if (!intel_syntax)
3956 as_bad (_("unbalanced parenthesis in operand %d."),
3957 i.operands + 1);
3958 else
3959 as_bad (_("unbalanced brackets in operand %d."),
3960 i.operands + 1);
3961 return NULL;
3962 }
3963 else
3964 break; /* we are done */
3965 }
3966 else if (!is_operand_char (*l) && !is_space_char (*l))
3967 {
3968 as_bad (_("invalid character %s in operand %d"),
3969 output_invalid (*l),
3970 i.operands + 1);
3971 return NULL;
3972 }
3973 if (!intel_syntax)
3974 {
3975 if (*l == '(')
3976 ++paren_not_balanced;
3977 if (*l == ')')
3978 --paren_not_balanced;
3979 }
3980 else
3981 {
3982 if (*l == '[')
3983 ++paren_not_balanced;
3984 if (*l == ']')
3985 --paren_not_balanced;
3986 }
3987 l++;
3988 }
3989 if (l != token_start)
3990 { /* Yes, we've read in another operand. */
3991 unsigned int operand_ok;
3992 this_operand = i.operands++;
3993 i.types[this_operand].bitfield.unspecified = 1;
3994 if (i.operands > MAX_OPERANDS)
3995 {
3996 as_bad (_("spurious operands; (%d operands/instruction max)"),
3997 MAX_OPERANDS);
3998 return NULL;
3999 }
4000 /* Now parse operand adding info to 'i' as we go along. */
4001 END_STRING_AND_SAVE (l);
4002
4003 if (intel_syntax)
4004 operand_ok =
4005 i386_intel_operand (token_start,
4006 intel_float_operand (mnemonic));
4007 else
4008 operand_ok = i386_att_operand (token_start);
4009
4010 RESTORE_END_STRING (l);
4011 if (!operand_ok)
4012 return NULL;
4013 }
4014 else
4015 {
4016 if (expecting_operand)
4017 {
4018 expecting_operand_after_comma:
4019 as_bad (_("expecting operand after ','; got nothing"));
4020 return NULL;
4021 }
4022 if (*l == ',')
4023 {
4024 as_bad (_("expecting operand before ','; got nothing"));
4025 return NULL;
4026 }
4027 }
4028
4029 /* Now *l must be either ',' or END_OF_INSN. */
4030 if (*l == ',')
4031 {
4032 if (*++l == END_OF_INSN)
4033 {
4034 /* Just skip it, if it's \n complain. */
4035 goto expecting_operand_after_comma;
4036 }
4037 expecting_operand = 1;
4038 }
4039 }
4040 return l;
4041 }
4042
4043 static void
4044 swap_2_operands (int xchg1, int xchg2)
4045 {
4046 union i386_op temp_op;
4047 i386_operand_type temp_type;
4048 enum bfd_reloc_code_real temp_reloc;
4049
4050 temp_type = i.types[xchg2];
4051 i.types[xchg2] = i.types[xchg1];
4052 i.types[xchg1] = temp_type;
4053 temp_op = i.op[xchg2];
4054 i.op[xchg2] = i.op[xchg1];
4055 i.op[xchg1] = temp_op;
4056 temp_reloc = i.reloc[xchg2];
4057 i.reloc[xchg2] = i.reloc[xchg1];
4058 i.reloc[xchg1] = temp_reloc;
4059
4060 if (i.mask)
4061 {
4062 if (i.mask->operand == xchg1)
4063 i.mask->operand = xchg2;
4064 else if (i.mask->operand == xchg2)
4065 i.mask->operand = xchg1;
4066 }
4067 if (i.broadcast)
4068 {
4069 if (i.broadcast->operand == xchg1)
4070 i.broadcast->operand = xchg2;
4071 else if (i.broadcast->operand == xchg2)
4072 i.broadcast->operand = xchg1;
4073 }
4074 if (i.rounding)
4075 {
4076 if (i.rounding->operand == xchg1)
4077 i.rounding->operand = xchg2;
4078 else if (i.rounding->operand == xchg2)
4079 i.rounding->operand = xchg1;
4080 }
4081 }
4082
4083 static void
4084 swap_operands (void)
4085 {
4086 switch (i.operands)
4087 {
4088 case 5:
4089 case 4:
4090 swap_2_operands (1, i.operands - 2);
4091 case 3:
4092 case 2:
4093 swap_2_operands (0, i.operands - 1);
4094 break;
4095 default:
4096 abort ();
4097 }
4098
4099 if (i.mem_operands == 2)
4100 {
4101 const seg_entry *temp_seg;
4102 temp_seg = i.seg[0];
4103 i.seg[0] = i.seg[1];
4104 i.seg[1] = temp_seg;
4105 }
4106 }
4107
4108 /* Try to ensure constant immediates are represented in the smallest
4109 opcode possible. */
4110 static void
4111 optimize_imm (void)
4112 {
4113 char guess_suffix = 0;
4114 int op;
4115
4116 if (i.suffix)
4117 guess_suffix = i.suffix;
4118 else if (i.reg_operands)
4119 {
4120 /* Figure out a suffix from the last register operand specified.
4121 We can't do this properly yet, ie. excluding InOutPortReg,
4122 but the following works for instructions with immediates.
4123 In any case, we can't set i.suffix yet. */
4124 for (op = i.operands; --op >= 0;)
4125 if (i.types[op].bitfield.reg8)
4126 {
4127 guess_suffix = BYTE_MNEM_SUFFIX;
4128 break;
4129 }
4130 else if (i.types[op].bitfield.reg16)
4131 {
4132 guess_suffix = WORD_MNEM_SUFFIX;
4133 break;
4134 }
4135 else if (i.types[op].bitfield.reg32)
4136 {
4137 guess_suffix = LONG_MNEM_SUFFIX;
4138 break;
4139 }
4140 else if (i.types[op].bitfield.reg64)
4141 {
4142 guess_suffix = QWORD_MNEM_SUFFIX;
4143 break;
4144 }
4145 }
4146 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
4147 guess_suffix = WORD_MNEM_SUFFIX;
4148
4149 for (op = i.operands; --op >= 0;)
4150 if (operand_type_check (i.types[op], imm))
4151 {
4152 switch (i.op[op].imms->X_op)
4153 {
4154 case O_constant:
4155 /* If a suffix is given, this operand may be shortened. */
4156 switch (guess_suffix)
4157 {
4158 case LONG_MNEM_SUFFIX:
4159 i.types[op].bitfield.imm32 = 1;
4160 i.types[op].bitfield.imm64 = 1;
4161 break;
4162 case WORD_MNEM_SUFFIX:
4163 i.types[op].bitfield.imm16 = 1;
4164 i.types[op].bitfield.imm32 = 1;
4165 i.types[op].bitfield.imm32s = 1;
4166 i.types[op].bitfield.imm64 = 1;
4167 break;
4168 case BYTE_MNEM_SUFFIX:
4169 i.types[op].bitfield.imm8 = 1;
4170 i.types[op].bitfield.imm8s = 1;
4171 i.types[op].bitfield.imm16 = 1;
4172 i.types[op].bitfield.imm32 = 1;
4173 i.types[op].bitfield.imm32s = 1;
4174 i.types[op].bitfield.imm64 = 1;
4175 break;
4176 }
4177
4178 /* If this operand is at most 16 bits, convert it
4179 to a signed 16 bit number before trying to see
4180 whether it will fit in an even smaller size.
4181 This allows a 16-bit operand such as $0xffe0 to
4182 be recognised as within Imm8S range. */
4183 if ((i.types[op].bitfield.imm16)
4184 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
4185 {
4186 i.op[op].imms->X_add_number =
4187 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
4188 }
4189 if ((i.types[op].bitfield.imm32)
4190 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
4191 == 0))
4192 {
4193 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
4194 ^ ((offsetT) 1 << 31))
4195 - ((offsetT) 1 << 31));
4196 }
4197 i.types[op]
4198 = operand_type_or (i.types[op],
4199 smallest_imm_type (i.op[op].imms->X_add_number));
4200
4201 /* We must avoid matching of Imm32 templates when 64bit
4202 only immediate is available. */
4203 if (guess_suffix == QWORD_MNEM_SUFFIX)
4204 i.types[op].bitfield.imm32 = 0;
4205 break;
4206
4207 case O_absent:
4208 case O_register:
4209 abort ();
4210
4211 /* Symbols and expressions. */
4212 default:
4213 /* Convert symbolic operand to proper sizes for matching, but don't
4214 prevent matching a set of insns that only supports sizes other
4215 than those matching the insn suffix. */
4216 {
4217 i386_operand_type mask, allowed;
4218 const insn_template *t;
4219
4220 operand_type_set (&mask, 0);
4221 operand_type_set (&allowed, 0);
4222
4223 for (t = current_templates->start;
4224 t < current_templates->end;
4225 ++t)
4226 allowed = operand_type_or (allowed,
4227 t->operand_types[op]);
4228 switch (guess_suffix)
4229 {
4230 case QWORD_MNEM_SUFFIX:
4231 mask.bitfield.imm64 = 1;
4232 mask.bitfield.imm32s = 1;
4233 break;
4234 case LONG_MNEM_SUFFIX:
4235 mask.bitfield.imm32 = 1;
4236 break;
4237 case WORD_MNEM_SUFFIX:
4238 mask.bitfield.imm16 = 1;
4239 break;
4240 case BYTE_MNEM_SUFFIX:
4241 mask.bitfield.imm8 = 1;
4242 break;
4243 default:
4244 break;
4245 }
4246 allowed = operand_type_and (mask, allowed);
4247 if (!operand_type_all_zero (&allowed))
4248 i.types[op] = operand_type_and (i.types[op], mask);
4249 }
4250 break;
4251 }
4252 }
4253 }
4254
4255 /* Try to use the smallest displacement type too. */
4256 static void
4257 optimize_disp (void)
4258 {
4259 int op;
4260
4261 for (op = i.operands; --op >= 0;)
4262 if (operand_type_check (i.types[op], disp))
4263 {
4264 if (i.op[op].disps->X_op == O_constant)
4265 {
4266 offsetT op_disp = i.op[op].disps->X_add_number;
4267
4268 if (i.types[op].bitfield.disp16
4269 && (op_disp & ~(offsetT) 0xffff) == 0)
4270 {
4271 /* If this operand is at most 16 bits, convert
4272 to a signed 16 bit number and don't use 64bit
4273 displacement. */
4274 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
4275 i.types[op].bitfield.disp64 = 0;
4276 }
4277 if (i.types[op].bitfield.disp32
4278 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
4279 {
4280 /* If this operand is at most 32 bits, convert
4281 to a signed 32 bit number and don't use 64bit
4282 displacement. */
4283 op_disp &= (((offsetT) 2 << 31) - 1);
4284 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
4285 i.types[op].bitfield.disp64 = 0;
4286 }
4287 if (!op_disp && i.types[op].bitfield.baseindex)
4288 {
4289 i.types[op].bitfield.disp8 = 0;
4290 i.types[op].bitfield.disp16 = 0;
4291 i.types[op].bitfield.disp32 = 0;
4292 i.types[op].bitfield.disp32s = 0;
4293 i.types[op].bitfield.disp64 = 0;
4294 i.op[op].disps = 0;
4295 i.disp_operands--;
4296 }
4297 else if (flag_code == CODE_64BIT)
4298 {
4299 if (fits_in_signed_long (op_disp))
4300 {
4301 i.types[op].bitfield.disp64 = 0;
4302 i.types[op].bitfield.disp32s = 1;
4303 }
4304 if (i.prefix[ADDR_PREFIX]
4305 && fits_in_unsigned_long (op_disp))
4306 i.types[op].bitfield.disp32 = 1;
4307 }
4308 if ((i.types[op].bitfield.disp32
4309 || i.types[op].bitfield.disp32s
4310 || i.types[op].bitfield.disp16)
4311 && fits_in_signed_byte (op_disp))
4312 i.types[op].bitfield.disp8 = 1;
4313 }
4314 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
4315 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
4316 {
4317 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
4318 i.op[op].disps, 0, i.reloc[op]);
4319 i.types[op].bitfield.disp8 = 0;
4320 i.types[op].bitfield.disp16 = 0;
4321 i.types[op].bitfield.disp32 = 0;
4322 i.types[op].bitfield.disp32s = 0;
4323 i.types[op].bitfield.disp64 = 0;
4324 }
4325 else
4326 /* We only support 64bit displacement on constants. */
4327 i.types[op].bitfield.disp64 = 0;
4328 }
4329 }
4330
4331 /* Check if operands are valid for the instruction. */
4332
4333 static int
4334 check_VecOperands (const insn_template *t)
4335 {
4336 unsigned int op;
4337
4338 /* Without VSIB byte, we can't have a vector register for index. */
4339 if (!t->opcode_modifier.vecsib
4340 && i.index_reg
4341 && (i.index_reg->reg_type.bitfield.regxmm
4342 || i.index_reg->reg_type.bitfield.regymm
4343 || i.index_reg->reg_type.bitfield.regzmm))
4344 {
4345 i.error = unsupported_vector_index_register;
4346 return 1;
4347 }
4348
4349 /* Check if default mask is allowed. */
4350 if (t->opcode_modifier.nodefmask
4351 && (!i.mask || i.mask->mask->reg_num == 0))
4352 {
4353 i.error = no_default_mask;
4354 return 1;
4355 }
4356
4357 /* For VSIB byte, we need a vector register for index, and all vector
4358 registers must be distinct. */
4359 if (t->opcode_modifier.vecsib)
4360 {
4361 if (!i.index_reg
4362 || !((t->opcode_modifier.vecsib == VecSIB128
4363 && i.index_reg->reg_type.bitfield.regxmm)
4364 || (t->opcode_modifier.vecsib == VecSIB256
4365 && i.index_reg->reg_type.bitfield.regymm)
4366 || (t->opcode_modifier.vecsib == VecSIB512
4367 && i.index_reg->reg_type.bitfield.regzmm)))
4368 {
4369 i.error = invalid_vsib_address;
4370 return 1;
4371 }
4372
4373 gas_assert (i.reg_operands == 2 || i.mask);
4374 if (i.reg_operands == 2 && !i.mask)
4375 {
4376 gas_assert (i.types[0].bitfield.regxmm
4377 || i.types[0].bitfield.regymm
4378 || i.types[0].bitfield.regzmm);
4379 gas_assert (i.types[2].bitfield.regxmm
4380 || i.types[2].bitfield.regymm
4381 || i.types[2].bitfield.regzmm);
4382 if (operand_check == check_none)
4383 return 0;
4384 if (register_number (i.op[0].regs)
4385 != register_number (i.index_reg)
4386 && register_number (i.op[2].regs)
4387 != register_number (i.index_reg)
4388 && register_number (i.op[0].regs)
4389 != register_number (i.op[2].regs))
4390 return 0;
4391 if (operand_check == check_error)
4392 {
4393 i.error = invalid_vector_register_set;
4394 return 1;
4395 }
4396 as_warn (_("mask, index, and destination registers should be distinct"));
4397 }
4398 }
4399
4400 /* Check if broadcast is supported by the instruction and is applied
4401 to the memory operand. */
4402 if (i.broadcast)
4403 {
4404 int broadcasted_opnd_size;
4405
4406 /* Check if specified broadcast is supported in this instruction,
4407 and it's applied to memory operand of DWORD or QWORD type,
4408 depending on VecESize. */
4409 if (i.broadcast->type != t->opcode_modifier.broadcast
4410 || !i.types[i.broadcast->operand].bitfield.mem
4411 || (t->opcode_modifier.vecesize == 0
4412 && !i.types[i.broadcast->operand].bitfield.dword
4413 && !i.types[i.broadcast->operand].bitfield.unspecified)
4414 || (t->opcode_modifier.vecesize == 1
4415 && !i.types[i.broadcast->operand].bitfield.qword
4416 && !i.types[i.broadcast->operand].bitfield.unspecified))
4417 goto bad_broadcast;
4418
4419 broadcasted_opnd_size = t->opcode_modifier.vecesize ? 64 : 32;
4420 if (i.broadcast->type == BROADCAST_1TO16)
4421 broadcasted_opnd_size <<= 4; /* Broadcast 1to16. */
4422 else if (i.broadcast->type == BROADCAST_1TO8)
4423 broadcasted_opnd_size <<= 3; /* Broadcast 1to8. */
4424 else
4425 goto bad_broadcast;
4426
4427 if ((broadcasted_opnd_size == 256
4428 && !t->operand_types[i.broadcast->operand].bitfield.ymmword)
4429 || (broadcasted_opnd_size == 512
4430 && !t->operand_types[i.broadcast->operand].bitfield.zmmword))
4431 {
4432 bad_broadcast:
4433 i.error = unsupported_broadcast;
4434 return 1;
4435 }
4436 }
4437 /* If broadcast is supported in this instruction, we need to check if
4438 operand of one-element size isn't specified without broadcast. */
4439 else if (t->opcode_modifier.broadcast && i.mem_operands)
4440 {
4441 /* Find memory operand. */
4442 for (op = 0; op < i.operands; op++)
4443 if (operand_type_check (i.types[op], anymem))
4444 break;
4445 gas_assert (op < i.operands);
4446 /* Check size of the memory operand. */
4447 if ((t->opcode_modifier.vecesize == 0
4448 && i.types[op].bitfield.dword)
4449 || (t->opcode_modifier.vecesize == 1
4450 && i.types[op].bitfield.qword))
4451 {
4452 i.error = broadcast_needed;
4453 return 1;
4454 }
4455 }
4456
4457 /* Check if requested masking is supported. */
4458 if (i.mask
4459 && (!t->opcode_modifier.masking
4460 || (i.mask->zeroing
4461 && t->opcode_modifier.masking == MERGING_MASKING)))
4462 {
4463 i.error = unsupported_masking;
4464 return 1;
4465 }
4466
4467 /* Check if masking is applied to dest operand. */
4468 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
4469 {
4470 i.error = mask_not_on_destination;
4471 return 1;
4472 }
4473
4474 /* Check RC/SAE. */
4475 if (i.rounding)
4476 {
4477 if ((i.rounding->type != saeonly
4478 && !t->opcode_modifier.staticrounding)
4479 || (i.rounding->type == saeonly
4480 && (t->opcode_modifier.staticrounding
4481 || !t->opcode_modifier.sae)))
4482 {
4483 i.error = unsupported_rc_sae;
4484 return 1;
4485 }
4486 /* If the instruction has several immediate operands and one of
4487 them is rounding, the rounding operand should be the last
4488 immediate operand. */
4489 if (i.imm_operands > 1
4490 && i.rounding->operand != (int) (i.imm_operands - 1))
4491 {
4492 i.error = rc_sae_operand_not_last_imm;
4493 return 1;
4494 }
4495 }
4496
4497 /* Check vector Disp8 operand. */
4498 if (t->opcode_modifier.disp8memshift)
4499 {
4500 if (i.broadcast)
4501 i.memshift = t->opcode_modifier.vecesize ? 3 : 2;
4502 else
4503 i.memshift = t->opcode_modifier.disp8memshift;
4504
4505 for (op = 0; op < i.operands; op++)
4506 if (operand_type_check (i.types[op], disp)
4507 && i.op[op].disps->X_op == O_constant)
4508 {
4509 offsetT value = i.op[op].disps->X_add_number;
4510 int vec_disp8_ok = fits_in_vec_disp8 (value);
4511 if (t->operand_types [op].bitfield.vec_disp8)
4512 {
4513 if (vec_disp8_ok)
4514 i.types[op].bitfield.vec_disp8 = 1;
4515 else
4516 {
4517 /* Vector insn can only have Vec_Disp8/Disp32 in
4518 32/64bit modes, and Vec_Disp8/Disp16 in 16bit
4519 mode. */
4520 i.types[op].bitfield.disp8 = 0;
4521 if (flag_code != CODE_16BIT)
4522 i.types[op].bitfield.disp16 = 0;
4523 }
4524 }
4525 else if (flag_code != CODE_16BIT)
4526 {
4527 /* One form of this instruction supports vector Disp8.
4528 Try vector Disp8 if we need to use Disp32. */
4529 if (vec_disp8_ok && !fits_in_signed_byte (value))
4530 {
4531 i.error = try_vector_disp8;
4532 return 1;
4533 }
4534 }
4535 }
4536 }
4537 else
4538 i.memshift = -1;
4539
4540 return 0;
4541 }
4542
4543 /* Check if operands are valid for the instruction. Update VEX
4544 operand types. */
4545
4546 static int
4547 VEX_check_operands (const insn_template *t)
4548 {
4549 /* VREX is only valid with EVEX prefix. */
4550 if (i.need_vrex && !t->opcode_modifier.evex)
4551 {
4552 i.error = invalid_register_operand;
4553 return 1;
4554 }
4555
4556 if (!t->opcode_modifier.vex)
4557 return 0;
4558
4559 /* Only check VEX_Imm4, which must be the first operand. */
4560 if (t->operand_types[0].bitfield.vec_imm4)
4561 {
4562 if (i.op[0].imms->X_op != O_constant
4563 || !fits_in_imm4 (i.op[0].imms->X_add_number))
4564 {
4565 i.error = bad_imm4;
4566 return 1;
4567 }
4568
4569 /* Turn off Imm8 so that update_imm won't complain. */
4570 i.types[0] = vec_imm4;
4571 }
4572
4573 return 0;
4574 }
4575
4576 static const insn_template *
4577 match_template (void)
4578 {
4579 /* Points to template once we've found it. */
4580 const insn_template *t;
4581 i386_operand_type overlap0, overlap1, overlap2, overlap3;
4582 i386_operand_type overlap4;
4583 unsigned int found_reverse_match;
4584 i386_opcode_modifier suffix_check;
4585 i386_operand_type operand_types [MAX_OPERANDS];
4586 int addr_prefix_disp;
4587 unsigned int j;
4588 unsigned int found_cpu_match;
4589 unsigned int check_register;
4590 enum i386_error specific_error = 0;
4591
4592 #if MAX_OPERANDS != 5
4593 # error "MAX_OPERANDS must be 5."
4594 #endif
4595
4596 found_reverse_match = 0;
4597 addr_prefix_disp = -1;
4598
4599 memset (&suffix_check, 0, sizeof (suffix_check));
4600 if (i.suffix == BYTE_MNEM_SUFFIX)
4601 suffix_check.no_bsuf = 1;
4602 else if (i.suffix == WORD_MNEM_SUFFIX)
4603 suffix_check.no_wsuf = 1;
4604 else if (i.suffix == SHORT_MNEM_SUFFIX)
4605 suffix_check.no_ssuf = 1;
4606 else if (i.suffix == LONG_MNEM_SUFFIX)
4607 suffix_check.no_lsuf = 1;
4608 else if (i.suffix == QWORD_MNEM_SUFFIX)
4609 suffix_check.no_qsuf = 1;
4610 else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
4611 suffix_check.no_ldsuf = 1;
4612
4613 /* Must have right number of operands. */
4614 i.error = number_of_operands_mismatch;
4615
4616 for (t = current_templates->start; t < current_templates->end; t++)
4617 {
4618 addr_prefix_disp = -1;
4619
4620 if (i.operands != t->operands)
4621 continue;
4622
4623 /* Check processor support. */
4624 i.error = unsupported;
4625 found_cpu_match = (cpu_flags_match (t)
4626 == CPU_FLAGS_PERFECT_MATCH);
4627 if (!found_cpu_match)
4628 continue;
4629
4630 /* Check old gcc support. */
4631 i.error = old_gcc_only;
4632 if (!old_gcc && t->opcode_modifier.oldgcc)
4633 continue;
4634
4635 /* Check AT&T mnemonic. */
4636 i.error = unsupported_with_intel_mnemonic;
4637 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
4638 continue;
4639
4640 /* Check AT&T/Intel syntax. */
4641 i.error = unsupported_syntax;
4642 if ((intel_syntax && t->opcode_modifier.attsyntax)
4643 || (!intel_syntax && t->opcode_modifier.intelsyntax))
4644 continue;
4645
4646 /* Check the suffix, except for some instructions in intel mode. */
4647 i.error = invalid_instruction_suffix;
4648 if ((!intel_syntax || !t->opcode_modifier.ignoresize)
4649 && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
4650 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
4651 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
4652 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
4653 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
4654 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
4655 continue;
4656
4657 if (!operand_size_match (t))
4658 continue;
4659
4660 for (j = 0; j < MAX_OPERANDS; j++)
4661 operand_types[j] = t->operand_types[j];
4662
4663 /* In general, don't allow 64-bit operands in 32-bit mode. */
4664 if (i.suffix == QWORD_MNEM_SUFFIX
4665 && flag_code != CODE_64BIT
4666 && (intel_syntax
4667 ? (!t->opcode_modifier.ignoresize
4668 && !intel_float_operand (t->name))
4669 : intel_float_operand (t->name) != 2)
4670 && ((!operand_types[0].bitfield.regmmx
4671 && !operand_types[0].bitfield.regxmm
4672 && !operand_types[0].bitfield.regymm
4673 && !operand_types[0].bitfield.regzmm)
4674 || (!operand_types[t->operands > 1].bitfield.regmmx
4675 && !!operand_types[t->operands > 1].bitfield.regxmm
4676 && !!operand_types[t->operands > 1].bitfield.regymm
4677 && !!operand_types[t->operands > 1].bitfield.regzmm))
4678 && (t->base_opcode != 0x0fc7
4679 || t->extension_opcode != 1 /* cmpxchg8b */))
4680 continue;
4681
4682 /* In general, don't allow 32-bit operands on pre-386. */
4683 else if (i.suffix == LONG_MNEM_SUFFIX
4684 && !cpu_arch_flags.bitfield.cpui386
4685 && (intel_syntax
4686 ? (!t->opcode_modifier.ignoresize
4687 && !intel_float_operand (t->name))
4688 : intel_float_operand (t->name) != 2)
4689 && ((!operand_types[0].bitfield.regmmx
4690 && !operand_types[0].bitfield.regxmm)
4691 || (!operand_types[t->operands > 1].bitfield.regmmx
4692 && !!operand_types[t->operands > 1].bitfield.regxmm)))
4693 continue;
4694
4695 /* Do not verify operands when there are none. */
4696 else
4697 {
4698 if (!t->operands)
4699 /* We've found a match; break out of loop. */
4700 break;
4701 }
4702
4703 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
4704 into Disp32/Disp16/Disp32 operand. */
4705 if (i.prefix[ADDR_PREFIX] != 0)
4706 {
4707 /* There should be only one Disp operand. */
4708 switch (flag_code)
4709 {
4710 case CODE_16BIT:
4711 for (j = 0; j < MAX_OPERANDS; j++)
4712 {
4713 if (operand_types[j].bitfield.disp16)
4714 {
4715 addr_prefix_disp = j;
4716 operand_types[j].bitfield.disp32 = 1;
4717 operand_types[j].bitfield.disp16 = 0;
4718 break;
4719 }
4720 }
4721 break;
4722 case CODE_32BIT:
4723 for (j = 0; j < MAX_OPERANDS; j++)
4724 {
4725 if (operand_types[j].bitfield.disp32)
4726 {
4727 addr_prefix_disp = j;
4728 operand_types[j].bitfield.disp32 = 0;
4729 operand_types[j].bitfield.disp16 = 1;
4730 break;
4731 }
4732 }
4733 break;
4734 case CODE_64BIT:
4735 for (j = 0; j < MAX_OPERANDS; j++)
4736 {
4737 if (operand_types[j].bitfield.disp64)
4738 {
4739 addr_prefix_disp = j;
4740 operand_types[j].bitfield.disp64 = 0;
4741 operand_types[j].bitfield.disp32 = 1;
4742 break;
4743 }
4744 }
4745 break;
4746 }
4747 }
4748
4749 /* We check register size if needed. */
4750 check_register = t->opcode_modifier.checkregsize;
4751 overlap0 = operand_type_and (i.types[0], operand_types[0]);
4752 switch (t->operands)
4753 {
4754 case 1:
4755 if (!operand_type_match (overlap0, i.types[0]))
4756 continue;
4757 break;
4758 case 2:
4759 /* xchg %eax, %eax is a special case. It is an aliase for nop
4760 only in 32bit mode and we can use opcode 0x90. In 64bit
4761 mode, we can't use 0x90 for xchg %eax, %eax since it should
4762 zero-extend %eax to %rax. */
4763 if (flag_code == CODE_64BIT
4764 && t->base_opcode == 0x90
4765 && operand_type_equal (&i.types [0], &acc32)
4766 && operand_type_equal (&i.types [1], &acc32))
4767 continue;
4768 if (i.swap_operand)
4769 {
4770 /* If we swap operand in encoding, we either match
4771 the next one or reverse direction of operands. */
4772 if (t->opcode_modifier.s)
4773 continue;
4774 else if (t->opcode_modifier.d)
4775 goto check_reverse;
4776 }
4777
4778 case 3:
4779 /* If we swap operand in encoding, we match the next one. */
4780 if (i.swap_operand && t->opcode_modifier.s)
4781 continue;
4782 case 4:
4783 case 5:
4784 overlap1 = operand_type_and (i.types[1], operand_types[1]);
4785 if (!operand_type_match (overlap0, i.types[0])
4786 || !operand_type_match (overlap1, i.types[1])
4787 || (check_register
4788 && !operand_type_register_match (overlap0, i.types[0],
4789 operand_types[0],
4790 overlap1, i.types[1],
4791 operand_types[1])))
4792 {
4793 /* Check if other direction is valid ... */
4794 if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
4795 continue;
4796
4797 check_reverse:
4798 /* Try reversing direction of operands. */
4799 overlap0 = operand_type_and (i.types[0], operand_types[1]);
4800 overlap1 = operand_type_and (i.types[1], operand_types[0]);
4801 if (!operand_type_match (overlap0, i.types[0])
4802 || !operand_type_match (overlap1, i.types[1])
4803 || (check_register
4804 && !operand_type_register_match (overlap0,
4805 i.types[0],
4806 operand_types[1],
4807 overlap1,
4808 i.types[1],
4809 operand_types[0])))
4810 {
4811 /* Does not match either direction. */
4812 continue;
4813 }
4814 /* found_reverse_match holds which of D or FloatDR
4815 we've found. */
4816 if (t->opcode_modifier.d)
4817 found_reverse_match = Opcode_D;
4818 else if (t->opcode_modifier.floatd)
4819 found_reverse_match = Opcode_FloatD;
4820 else
4821 found_reverse_match = 0;
4822 if (t->opcode_modifier.floatr)
4823 found_reverse_match |= Opcode_FloatR;
4824 }
4825 else
4826 {
4827 /* Found a forward 2 operand match here. */
4828 switch (t->operands)
4829 {
4830 case 5:
4831 overlap4 = operand_type_and (i.types[4],
4832 operand_types[4]);
4833 case 4:
4834 overlap3 = operand_type_and (i.types[3],
4835 operand_types[3]);
4836 case 3:
4837 overlap2 = operand_type_and (i.types[2],
4838 operand_types[2]);
4839 break;
4840 }
4841
4842 switch (t->operands)
4843 {
4844 case 5:
4845 if (!operand_type_match (overlap4, i.types[4])
4846 || !operand_type_register_match (overlap3,
4847 i.types[3],
4848 operand_types[3],
4849 overlap4,
4850 i.types[4],
4851 operand_types[4]))
4852 continue;
4853 case 4:
4854 if (!operand_type_match (overlap3, i.types[3])
4855 || (check_register
4856 && !operand_type_register_match (overlap2,
4857 i.types[2],
4858 operand_types[2],
4859 overlap3,
4860 i.types[3],
4861 operand_types[3])))
4862 continue;
4863 case 3:
4864 /* Here we make use of the fact that there are no
4865 reverse match 3 operand instructions, and all 3
4866 operand instructions only need to be checked for
4867 register consistency between operands 2 and 3. */
4868 if (!operand_type_match (overlap2, i.types[2])
4869 || (check_register
4870 && !operand_type_register_match (overlap1,
4871 i.types[1],
4872 operand_types[1],
4873 overlap2,
4874 i.types[2],
4875 operand_types[2])))
4876 continue;
4877 break;
4878 }
4879 }
4880 /* Found either forward/reverse 2, 3 or 4 operand match here:
4881 slip through to break. */
4882 }
4883 if (!found_cpu_match)
4884 {
4885 found_reverse_match = 0;
4886 continue;
4887 }
4888
4889 /* Check if vector and VEX operands are valid. */
4890 if (check_VecOperands (t) || VEX_check_operands (t))
4891 {
4892 specific_error = i.error;
4893 continue;
4894 }
4895
4896 /* We've found a match; break out of loop. */
4897 break;
4898 }
4899
4900 if (t == current_templates->end)
4901 {
4902 /* We found no match. */
4903 const char *err_msg;
4904 switch (specific_error ? specific_error : i.error)
4905 {
4906 default:
4907 abort ();
4908 case operand_size_mismatch:
4909 err_msg = _("operand size mismatch");
4910 break;
4911 case operand_type_mismatch:
4912 err_msg = _("operand type mismatch");
4913 break;
4914 case register_type_mismatch:
4915 err_msg = _("register type mismatch");
4916 break;
4917 case number_of_operands_mismatch:
4918 err_msg = _("number of operands mismatch");
4919 break;
4920 case invalid_instruction_suffix:
4921 err_msg = _("invalid instruction suffix");
4922 break;
4923 case bad_imm4:
4924 err_msg = _("constant doesn't fit in 4 bits");
4925 break;
4926 case old_gcc_only:
4927 err_msg = _("only supported with old gcc");
4928 break;
4929 case unsupported_with_intel_mnemonic:
4930 err_msg = _("unsupported with Intel mnemonic");
4931 break;
4932 case unsupported_syntax:
4933 err_msg = _("unsupported syntax");
4934 break;
4935 case unsupported:
4936 as_bad (_("unsupported instruction `%s'"),
4937 current_templates->start->name);
4938 return NULL;
4939 case invalid_vsib_address:
4940 err_msg = _("invalid VSIB address");
4941 break;
4942 case invalid_vector_register_set:
4943 err_msg = _("mask, index, and destination registers must be distinct");
4944 break;
4945 case unsupported_vector_index_register:
4946 err_msg = _("unsupported vector index register");
4947 break;
4948 case unsupported_broadcast:
4949 err_msg = _("unsupported broadcast");
4950 break;
4951 case broadcast_not_on_src_operand:
4952 err_msg = _("broadcast not on source memory operand");
4953 break;
4954 case broadcast_needed:
4955 err_msg = _("broadcast is needed for operand of such type");
4956 break;
4957 case unsupported_masking:
4958 err_msg = _("unsupported masking");
4959 break;
4960 case mask_not_on_destination:
4961 err_msg = _("mask not on destination operand");
4962 break;
4963 case no_default_mask:
4964 err_msg = _("default mask isn't allowed");
4965 break;
4966 case unsupported_rc_sae:
4967 err_msg = _("unsupported static rounding/sae");
4968 break;
4969 case rc_sae_operand_not_last_imm:
4970 if (intel_syntax)
4971 err_msg = _("RC/SAE operand must precede immediate operands");
4972 else
4973 err_msg = _("RC/SAE operand must follow immediate operands");
4974 break;
4975 case invalid_register_operand:
4976 err_msg = _("invalid register operand");
4977 break;
4978 }
4979 as_bad (_("%s for `%s'"), err_msg,
4980 current_templates->start->name);
4981 return NULL;
4982 }
4983
4984 if (!quiet_warnings)
4985 {
4986 if (!intel_syntax
4987 && (i.types[0].bitfield.jumpabsolute
4988 != operand_types[0].bitfield.jumpabsolute))
4989 {
4990 as_warn (_("indirect %s without `*'"), t->name);
4991 }
4992
4993 if (t->opcode_modifier.isprefix
4994 && t->opcode_modifier.ignoresize)
4995 {
4996 /* Warn them that a data or address size prefix doesn't
4997 affect assembly of the next line of code. */
4998 as_warn (_("stand-alone `%s' prefix"), t->name);
4999 }
5000 }
5001
5002 /* Copy the template we found. */
5003 i.tm = *t;
5004
5005 if (addr_prefix_disp != -1)
5006 i.tm.operand_types[addr_prefix_disp]
5007 = operand_types[addr_prefix_disp];
5008
5009 if (found_reverse_match)
5010 {
5011 /* If we found a reverse match we must alter the opcode
5012 direction bit. found_reverse_match holds bits to change
5013 (different for int & float insns). */
5014
5015 i.tm.base_opcode ^= found_reverse_match;
5016
5017 i.tm.operand_types[0] = operand_types[1];
5018 i.tm.operand_types[1] = operand_types[0];
5019 }
5020
5021 return t;
5022 }
5023
5024 static int
5025 check_string (void)
5026 {
5027 int mem_op = operand_type_check (i.types[0], anymem) ? 0 : 1;
5028 if (i.tm.operand_types[mem_op].bitfield.esseg)
5029 {
5030 if (i.seg[0] != NULL && i.seg[0] != &es)
5031 {
5032 as_bad (_("`%s' operand %d must use `%ses' segment"),
5033 i.tm.name,
5034 mem_op + 1,
5035 register_prefix);
5036 return 0;
5037 }
5038 /* There's only ever one segment override allowed per instruction.
5039 This instruction possibly has a legal segment override on the
5040 second operand, so copy the segment to where non-string
5041 instructions store it, allowing common code. */
5042 i.seg[0] = i.seg[1];
5043 }
5044 else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
5045 {
5046 if (i.seg[1] != NULL && i.seg[1] != &es)
5047 {
5048 as_bad (_("`%s' operand %d must use `%ses' segment"),
5049 i.tm.name,
5050 mem_op + 2,
5051 register_prefix);
5052 return 0;
5053 }
5054 }
5055 return 1;
5056 }
5057
5058 static int
5059 process_suffix (void)
5060 {
5061 /* If matched instruction specifies an explicit instruction mnemonic
5062 suffix, use it. */
5063 if (i.tm.opcode_modifier.size16)
5064 i.suffix = WORD_MNEM_SUFFIX;
5065 else if (i.tm.opcode_modifier.size32)
5066 i.suffix = LONG_MNEM_SUFFIX;
5067 else if (i.tm.opcode_modifier.size64)
5068 i.suffix = QWORD_MNEM_SUFFIX;
5069 else if (i.reg_operands)
5070 {
5071 /* If there's no instruction mnemonic suffix we try to invent one
5072 based on register operands. */
5073 if (!i.suffix)
5074 {
5075 /* We take i.suffix from the last register operand specified,
5076 Destination register type is more significant than source
5077 register type. crc32 in SSE4.2 prefers source register
5078 type. */
5079 if (i.tm.base_opcode == 0xf20f38f1)
5080 {
5081 if (i.types[0].bitfield.reg16)
5082 i.suffix = WORD_MNEM_SUFFIX;
5083 else if (i.types[0].bitfield.reg32)
5084 i.suffix = LONG_MNEM_SUFFIX;
5085 else if (i.types[0].bitfield.reg64)
5086 i.suffix = QWORD_MNEM_SUFFIX;
5087 }
5088 else if (i.tm.base_opcode == 0xf20f38f0)
5089 {
5090 if (i.types[0].bitfield.reg8)
5091 i.suffix = BYTE_MNEM_SUFFIX;
5092 }
5093
5094 if (!i.suffix)
5095 {
5096 int op;
5097
5098 if (i.tm.base_opcode == 0xf20f38f1
5099 || i.tm.base_opcode == 0xf20f38f0)
5100 {
5101 /* We have to know the operand size for crc32. */
5102 as_bad (_("ambiguous memory operand size for `%s`"),
5103 i.tm.name);
5104 return 0;
5105 }
5106
5107 for (op = i.operands; --op >= 0;)
5108 if (!i.tm.operand_types[op].bitfield.inoutportreg)
5109 {
5110 if (i.types[op].bitfield.reg8)
5111 {
5112 i.suffix = BYTE_MNEM_SUFFIX;
5113 break;
5114 }
5115 else if (i.types[op].bitfield.reg16)
5116 {
5117 i.suffix = WORD_MNEM_SUFFIX;
5118 break;
5119 }
5120 else if (i.types[op].bitfield.reg32)
5121 {
5122 i.suffix = LONG_MNEM_SUFFIX;
5123 break;
5124 }
5125 else if (i.types[op].bitfield.reg64)
5126 {
5127 i.suffix = QWORD_MNEM_SUFFIX;
5128 break;
5129 }
5130 }
5131 }
5132 }
5133 else if (i.suffix == BYTE_MNEM_SUFFIX)
5134 {
5135 if (intel_syntax
5136 && i.tm.opcode_modifier.ignoresize
5137 && i.tm.opcode_modifier.no_bsuf)
5138 i.suffix = 0;
5139 else if (!check_byte_reg ())
5140 return 0;
5141 }
5142 else if (i.suffix == LONG_MNEM_SUFFIX)
5143 {
5144 if (intel_syntax
5145 && i.tm.opcode_modifier.ignoresize
5146 && i.tm.opcode_modifier.no_lsuf)
5147 i.suffix = 0;
5148 else if (!check_long_reg ())
5149 return 0;
5150 }
5151 else if (i.suffix == QWORD_MNEM_SUFFIX)
5152 {
5153 if (intel_syntax
5154 && i.tm.opcode_modifier.ignoresize
5155 && i.tm.opcode_modifier.no_qsuf)
5156 i.suffix = 0;
5157 else if (!check_qword_reg ())
5158 return 0;
5159 }
5160 else if (i.suffix == WORD_MNEM_SUFFIX)
5161 {
5162 if (intel_syntax
5163 && i.tm.opcode_modifier.ignoresize
5164 && i.tm.opcode_modifier.no_wsuf)
5165 i.suffix = 0;
5166 else if (!check_word_reg ())
5167 return 0;
5168 }
5169 else if (i.suffix == XMMWORD_MNEM_SUFFIX
5170 || i.suffix == YMMWORD_MNEM_SUFFIX
5171 || i.suffix == ZMMWORD_MNEM_SUFFIX)
5172 {
5173 /* Skip if the instruction has x/y/z suffix. match_template
5174 should check if it is a valid suffix. */
5175 }
5176 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
5177 /* Do nothing if the instruction is going to ignore the prefix. */
5178 ;
5179 else
5180 abort ();
5181 }
5182 else if (i.tm.opcode_modifier.defaultsize
5183 && !i.suffix
5184 /* exclude fldenv/frstor/fsave/fstenv */
5185 && i.tm.opcode_modifier.no_ssuf)
5186 {
5187 i.suffix = stackop_size;
5188 }
5189 else if (intel_syntax
5190 && !i.suffix
5191 && (i.tm.operand_types[0].bitfield.jumpabsolute
5192 || i.tm.opcode_modifier.jumpbyte
5193 || i.tm.opcode_modifier.jumpintersegment
5194 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
5195 && i.tm.extension_opcode <= 3)))
5196 {
5197 switch (flag_code)
5198 {
5199 case CODE_64BIT:
5200 if (!i.tm.opcode_modifier.no_qsuf)
5201 {
5202 i.suffix = QWORD_MNEM_SUFFIX;
5203 break;
5204 }
5205 case CODE_32BIT:
5206 if (!i.tm.opcode_modifier.no_lsuf)
5207 i.suffix = LONG_MNEM_SUFFIX;
5208 break;
5209 case CODE_16BIT:
5210 if (!i.tm.opcode_modifier.no_wsuf)
5211 i.suffix = WORD_MNEM_SUFFIX;
5212 break;
5213 }
5214 }
5215
5216 if (!i.suffix)
5217 {
5218 if (!intel_syntax)
5219 {
5220 if (i.tm.opcode_modifier.w)
5221 {
5222 as_bad (_("no instruction mnemonic suffix given and "
5223 "no register operands; can't size instruction"));
5224 return 0;
5225 }
5226 }
5227 else
5228 {
5229 unsigned int suffixes;
5230
5231 suffixes = !i.tm.opcode_modifier.no_bsuf;
5232 if (!i.tm.opcode_modifier.no_wsuf)
5233 suffixes |= 1 << 1;
5234 if (!i.tm.opcode_modifier.no_lsuf)
5235 suffixes |= 1 << 2;
5236 if (!i.tm.opcode_modifier.no_ldsuf)
5237 suffixes |= 1 << 3;
5238 if (!i.tm.opcode_modifier.no_ssuf)
5239 suffixes |= 1 << 4;
5240 if (!i.tm.opcode_modifier.no_qsuf)
5241 suffixes |= 1 << 5;
5242
5243 /* There are more than suffix matches. */
5244 if (i.tm.opcode_modifier.w
5245 || ((suffixes & (suffixes - 1))
5246 && !i.tm.opcode_modifier.defaultsize
5247 && !i.tm.opcode_modifier.ignoresize))
5248 {
5249 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
5250 return 0;
5251 }
5252 }
5253 }
5254
5255 /* Change the opcode based on the operand size given by i.suffix;
5256 We don't need to change things for byte insns. */
5257
5258 if (i.suffix
5259 && i.suffix != BYTE_MNEM_SUFFIX
5260 && i.suffix != XMMWORD_MNEM_SUFFIX
5261 && i.suffix != YMMWORD_MNEM_SUFFIX
5262 && i.suffix != ZMMWORD_MNEM_SUFFIX)
5263 {
5264 /* It's not a byte, select word/dword operation. */
5265 if (i.tm.opcode_modifier.w)
5266 {
5267 if (i.tm.opcode_modifier.shortform)
5268 i.tm.base_opcode |= 8;
5269 else
5270 i.tm.base_opcode |= 1;
5271 }
5272
5273 /* Now select between word & dword operations via the operand
5274 size prefix, except for instructions that will ignore this
5275 prefix anyway. */
5276 if (i.tm.opcode_modifier.addrprefixop0)
5277 {
5278 /* The address size override prefix changes the size of the
5279 first operand. */
5280 if ((flag_code == CODE_32BIT
5281 && i.op->regs[0].reg_type.bitfield.reg16)
5282 || (flag_code != CODE_32BIT
5283 && i.op->regs[0].reg_type.bitfield.reg32))
5284 if (!add_prefix (ADDR_PREFIX_OPCODE))
5285 return 0;
5286 }
5287 else if (i.suffix != QWORD_MNEM_SUFFIX
5288 && i.suffix != LONG_DOUBLE_MNEM_SUFFIX
5289 && !i.tm.opcode_modifier.ignoresize
5290 && !i.tm.opcode_modifier.floatmf
5291 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
5292 || (flag_code == CODE_64BIT
5293 && i.tm.opcode_modifier.jumpbyte)))
5294 {
5295 unsigned int prefix = DATA_PREFIX_OPCODE;
5296
5297 if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
5298 prefix = ADDR_PREFIX_OPCODE;
5299
5300 if (!add_prefix (prefix))
5301 return 0;
5302 }
5303
5304 /* Set mode64 for an operand. */
5305 if (i.suffix == QWORD_MNEM_SUFFIX
5306 && flag_code == CODE_64BIT
5307 && !i.tm.opcode_modifier.norex64)
5308 {
5309 /* Special case for xchg %rax,%rax. It is NOP and doesn't
5310 need rex64. cmpxchg8b is also a special case. */
5311 if (! (i.operands == 2
5312 && i.tm.base_opcode == 0x90
5313 && i.tm.extension_opcode == None
5314 && operand_type_equal (&i.types [0], &acc64)
5315 && operand_type_equal (&i.types [1], &acc64))
5316 && ! (i.operands == 1
5317 && i.tm.base_opcode == 0xfc7
5318 && i.tm.extension_opcode == 1
5319 && !operand_type_check (i.types [0], reg)
5320 && operand_type_check (i.types [0], anymem)))
5321 i.rex |= REX_W;
5322 }
5323
5324 /* Size floating point instruction. */
5325 if (i.suffix == LONG_MNEM_SUFFIX)
5326 if (i.tm.opcode_modifier.floatmf)
5327 i.tm.base_opcode ^= 4;
5328 }
5329
5330 return 1;
5331 }
5332
5333 static int
5334 check_byte_reg (void)
5335 {
5336 int op;
5337
5338 for (op = i.operands; --op >= 0;)
5339 {
5340 /* If this is an eight bit register, it's OK. If it's the 16 or
5341 32 bit version of an eight bit register, we will just use the
5342 low portion, and that's OK too. */
5343 if (i.types[op].bitfield.reg8)
5344 continue;
5345
5346 /* I/O port address operands are OK too. */
5347 if (i.tm.operand_types[op].bitfield.inoutportreg)
5348 continue;
5349
5350 /* crc32 doesn't generate this warning. */
5351 if (i.tm.base_opcode == 0xf20f38f0)
5352 continue;
5353
5354 if ((i.types[op].bitfield.reg16
5355 || i.types[op].bitfield.reg32
5356 || i.types[op].bitfield.reg64)
5357 && i.op[op].regs->reg_num < 4
5358 /* Prohibit these changes in 64bit mode, since the lowering
5359 would be more complicated. */
5360 && flag_code != CODE_64BIT)
5361 {
5362 #if REGISTER_WARNINGS
5363 if (!quiet_warnings)
5364 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5365 register_prefix,
5366 (i.op[op].regs + (i.types[op].bitfield.reg16
5367 ? REGNAM_AL - REGNAM_AX
5368 : REGNAM_AL - REGNAM_EAX))->reg_name,
5369 register_prefix,
5370 i.op[op].regs->reg_name,
5371 i.suffix);
5372 #endif
5373 continue;
5374 }
5375 /* Any other register is bad. */
5376 if (i.types[op].bitfield.reg16
5377 || i.types[op].bitfield.reg32
5378 || i.types[op].bitfield.reg64
5379 || i.types[op].bitfield.regmmx
5380 || i.types[op].bitfield.regxmm
5381 || i.types[op].bitfield.regymm
5382 || i.types[op].bitfield.regzmm
5383 || i.types[op].bitfield.sreg2
5384 || i.types[op].bitfield.sreg3
5385 || i.types[op].bitfield.control
5386 || i.types[op].bitfield.debug
5387 || i.types[op].bitfield.test
5388 || i.types[op].bitfield.floatreg
5389 || i.types[op].bitfield.floatacc)
5390 {
5391 as_bad (_("`%s%s' not allowed with `%s%c'"),
5392 register_prefix,
5393 i.op[op].regs->reg_name,
5394 i.tm.name,
5395 i.suffix);
5396 return 0;
5397 }
5398 }
5399 return 1;
5400 }
5401
5402 static int
5403 check_long_reg (void)
5404 {
5405 int op;
5406
5407 for (op = i.operands; --op >= 0;)
5408 /* Reject eight bit registers, except where the template requires
5409 them. (eg. movzb) */
5410 if (i.types[op].bitfield.reg8
5411 && (i.tm.operand_types[op].bitfield.reg16
5412 || i.tm.operand_types[op].bitfield.reg32
5413 || i.tm.operand_types[op].bitfield.acc))
5414 {
5415 as_bad (_("`%s%s' not allowed with `%s%c'"),
5416 register_prefix,
5417 i.op[op].regs->reg_name,
5418 i.tm.name,
5419 i.suffix);
5420 return 0;
5421 }
5422 /* Warn if the e prefix on a general reg is missing. */
5423 else if ((!quiet_warnings || flag_code == CODE_64BIT)
5424 && i.types[op].bitfield.reg16
5425 && (i.tm.operand_types[op].bitfield.reg32
5426 || i.tm.operand_types[op].bitfield.acc))
5427 {
5428 /* Prohibit these changes in the 64bit mode, since the
5429 lowering is more complicated. */
5430 if (flag_code == CODE_64BIT)
5431 {
5432 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5433 register_prefix, i.op[op].regs->reg_name,
5434 i.suffix);
5435 return 0;
5436 }
5437 #if REGISTER_WARNINGS
5438 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5439 register_prefix,
5440 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
5441 register_prefix, i.op[op].regs->reg_name, i.suffix);
5442 #endif
5443 }
5444 /* Warn if the r prefix on a general reg is present. */
5445 else if (i.types[op].bitfield.reg64
5446 && (i.tm.operand_types[op].bitfield.reg32
5447 || i.tm.operand_types[op].bitfield.acc))
5448 {
5449 if (intel_syntax
5450 && i.tm.opcode_modifier.toqword
5451 && !i.types[0].bitfield.regxmm)
5452 {
5453 /* Convert to QWORD. We want REX byte. */
5454 i.suffix = QWORD_MNEM_SUFFIX;
5455 }
5456 else
5457 {
5458 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5459 register_prefix, i.op[op].regs->reg_name,
5460 i.suffix);
5461 return 0;
5462 }
5463 }
5464 return 1;
5465 }
5466
5467 static int
5468 check_qword_reg (void)
5469 {
5470 int op;
5471
5472 for (op = i.operands; --op >= 0; )
5473 /* Reject eight bit registers, except where the template requires
5474 them. (eg. movzb) */
5475 if (i.types[op].bitfield.reg8
5476 && (i.tm.operand_types[op].bitfield.reg16
5477 || i.tm.operand_types[op].bitfield.reg32
5478 || i.tm.operand_types[op].bitfield.acc))
5479 {
5480 as_bad (_("`%s%s' not allowed with `%s%c'"),
5481 register_prefix,
5482 i.op[op].regs->reg_name,
5483 i.tm.name,
5484 i.suffix);
5485 return 0;
5486 }
5487 /* Warn if the r prefix on a general reg is missing. */
5488 else if ((i.types[op].bitfield.reg16
5489 || i.types[op].bitfield.reg32)
5490 && (i.tm.operand_types[op].bitfield.reg32
5491 || i.tm.operand_types[op].bitfield.acc))
5492 {
5493 /* Prohibit these changes in the 64bit mode, since the
5494 lowering is more complicated. */
5495 if (intel_syntax
5496 && i.tm.opcode_modifier.todword
5497 && !i.types[0].bitfield.regxmm)
5498 {
5499 /* Convert to DWORD. We don't want REX byte. */
5500 i.suffix = LONG_MNEM_SUFFIX;
5501 }
5502 else
5503 {
5504 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5505 register_prefix, i.op[op].regs->reg_name,
5506 i.suffix);
5507 return 0;
5508 }
5509 }
5510 return 1;
5511 }
5512
5513 static int
5514 check_word_reg (void)
5515 {
5516 int op;
5517 for (op = i.operands; --op >= 0;)
5518 /* Reject eight bit registers, except where the template requires
5519 them. (eg. movzb) */
5520 if (i.types[op].bitfield.reg8
5521 && (i.tm.operand_types[op].bitfield.reg16
5522 || i.tm.operand_types[op].bitfield.reg32
5523 || i.tm.operand_types[op].bitfield.acc))
5524 {
5525 as_bad (_("`%s%s' not allowed with `%s%c'"),
5526 register_prefix,
5527 i.op[op].regs->reg_name,
5528 i.tm.name,
5529 i.suffix);
5530 return 0;
5531 }
5532 /* Warn if the e or r prefix on a general reg is present. */
5533 else if ((!quiet_warnings || flag_code == CODE_64BIT)
5534 && (i.types[op].bitfield.reg32
5535 || i.types[op].bitfield.reg64)
5536 && (i.tm.operand_types[op].bitfield.reg16
5537 || i.tm.operand_types[op].bitfield.acc))
5538 {
5539 /* Prohibit these changes in the 64bit mode, since the
5540 lowering is more complicated. */
5541 if (flag_code == CODE_64BIT)
5542 {
5543 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5544 register_prefix, i.op[op].regs->reg_name,
5545 i.suffix);
5546 return 0;
5547 }
5548 #if REGISTER_WARNINGS
5549 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5550 register_prefix,
5551 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
5552 register_prefix, i.op[op].regs->reg_name, i.suffix);
5553 #endif
5554 }
5555 return 1;
5556 }
5557
5558 static int
5559 update_imm (unsigned int j)
5560 {
5561 i386_operand_type overlap = i.types[j];
5562 if ((overlap.bitfield.imm8
5563 || overlap.bitfield.imm8s
5564 || overlap.bitfield.imm16
5565 || overlap.bitfield.imm32
5566 || overlap.bitfield.imm32s
5567 || overlap.bitfield.imm64)
5568 && !operand_type_equal (&overlap, &imm8)
5569 && !operand_type_equal (&overlap, &imm8s)
5570 && !operand_type_equal (&overlap, &imm16)
5571 && !operand_type_equal (&overlap, &imm32)
5572 && !operand_type_equal (&overlap, &imm32s)
5573 && !operand_type_equal (&overlap, &imm64))
5574 {
5575 if (i.suffix)
5576 {
5577 i386_operand_type temp;
5578
5579 operand_type_set (&temp, 0);
5580 if (i.suffix == BYTE_MNEM_SUFFIX)
5581 {
5582 temp.bitfield.imm8 = overlap.bitfield.imm8;
5583 temp.bitfield.imm8s = overlap.bitfield.imm8s;
5584 }
5585 else if (i.suffix == WORD_MNEM_SUFFIX)
5586 temp.bitfield.imm16 = overlap.bitfield.imm16;
5587 else if (i.suffix == QWORD_MNEM_SUFFIX)
5588 {
5589 temp.bitfield.imm64 = overlap.bitfield.imm64;
5590 temp.bitfield.imm32s = overlap.bitfield.imm32s;
5591 }
5592 else
5593 temp.bitfield.imm32 = overlap.bitfield.imm32;
5594 overlap = temp;
5595 }
5596 else if (operand_type_equal (&overlap, &imm16_32_32s)
5597 || operand_type_equal (&overlap, &imm16_32)
5598 || operand_type_equal (&overlap, &imm16_32s))
5599 {
5600 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5601 overlap = imm16;
5602 else
5603 overlap = imm32s;
5604 }
5605 if (!operand_type_equal (&overlap, &imm8)
5606 && !operand_type_equal (&overlap, &imm8s)
5607 && !operand_type_equal (&overlap, &imm16)
5608 && !operand_type_equal (&overlap, &imm32)
5609 && !operand_type_equal (&overlap, &imm32s)
5610 && !operand_type_equal (&overlap, &imm64))
5611 {
5612 as_bad (_("no instruction mnemonic suffix given; "
5613 "can't determine immediate size"));
5614 return 0;
5615 }
5616 }
5617 i.types[j] = overlap;
5618
5619 return 1;
5620 }
5621
5622 static int
5623 finalize_imm (void)
5624 {
5625 unsigned int j, n;
5626
5627 /* Update the first 2 immediate operands. */
5628 n = i.operands > 2 ? 2 : i.operands;
5629 if (n)
5630 {
5631 for (j = 0; j < n; j++)
5632 if (update_imm (j) == 0)
5633 return 0;
5634
5635 /* The 3rd operand can't be immediate operand. */
5636 gas_assert (operand_type_check (i.types[2], imm) == 0);
5637 }
5638
5639 return 1;
5640 }
5641
5642 static int
5643 bad_implicit_operand (int xmm)
5644 {
5645 const char *ireg = xmm ? "xmm0" : "ymm0";
5646
5647 if (intel_syntax)
5648 as_bad (_("the last operand of `%s' must be `%s%s'"),
5649 i.tm.name, register_prefix, ireg);
5650 else
5651 as_bad (_("the first operand of `%s' must be `%s%s'"),
5652 i.tm.name, register_prefix, ireg);
5653 return 0;
5654 }
5655
5656 static int
5657 process_operands (void)
5658 {
5659 /* Default segment register this instruction will use for memory
5660 accesses. 0 means unknown. This is only for optimizing out
5661 unnecessary segment overrides. */
5662 const seg_entry *default_seg = 0;
5663
5664 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
5665 {
5666 unsigned int dupl = i.operands;
5667 unsigned int dest = dupl - 1;
5668 unsigned int j;
5669
5670 /* The destination must be an xmm register. */
5671 gas_assert (i.reg_operands
5672 && MAX_OPERANDS > dupl
5673 && operand_type_equal (&i.types[dest], &regxmm));
5674
5675 if (i.tm.opcode_modifier.firstxmm0)
5676 {
5677 /* The first operand is implicit and must be xmm0. */
5678 gas_assert (operand_type_equal (&i.types[0], &regxmm));
5679 if (register_number (i.op[0].regs) != 0)
5680 return bad_implicit_operand (1);
5681
5682 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
5683 {
5684 /* Keep xmm0 for instructions with VEX prefix and 3
5685 sources. */
5686 goto duplicate;
5687 }
5688 else
5689 {
5690 /* We remove the first xmm0 and keep the number of
5691 operands unchanged, which in fact duplicates the
5692 destination. */
5693 for (j = 1; j < i.operands; j++)
5694 {
5695 i.op[j - 1] = i.op[j];
5696 i.types[j - 1] = i.types[j];
5697 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
5698 }
5699 }
5700 }
5701 else if (i.tm.opcode_modifier.implicit1stxmm0)
5702 {
5703 gas_assert ((MAX_OPERANDS - 1) > dupl
5704 && (i.tm.opcode_modifier.vexsources
5705 == VEX3SOURCES));
5706
5707 /* Add the implicit xmm0 for instructions with VEX prefix
5708 and 3 sources. */
5709 for (j = i.operands; j > 0; j--)
5710 {
5711 i.op[j] = i.op[j - 1];
5712 i.types[j] = i.types[j - 1];
5713 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
5714 }
5715 i.op[0].regs
5716 = (const reg_entry *) hash_find (reg_hash, "xmm0");
5717 i.types[0] = regxmm;
5718 i.tm.operand_types[0] = regxmm;
5719
5720 i.operands += 2;
5721 i.reg_operands += 2;
5722 i.tm.operands += 2;
5723
5724 dupl++;
5725 dest++;
5726 i.op[dupl] = i.op[dest];
5727 i.types[dupl] = i.types[dest];
5728 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
5729 }
5730 else
5731 {
5732 duplicate:
5733 i.operands++;
5734 i.reg_operands++;
5735 i.tm.operands++;
5736
5737 i.op[dupl] = i.op[dest];
5738 i.types[dupl] = i.types[dest];
5739 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
5740 }
5741
5742 if (i.tm.opcode_modifier.immext)
5743 process_immext ();
5744 }
5745 else if (i.tm.opcode_modifier.firstxmm0)
5746 {
5747 unsigned int j;
5748
5749 /* The first operand is implicit and must be xmm0/ymm0/zmm0. */
5750 gas_assert (i.reg_operands
5751 && (operand_type_equal (&i.types[0], &regxmm)
5752 || operand_type_equal (&i.types[0], &regymm)
5753 || operand_type_equal (&i.types[0], &regzmm)));
5754 if (register_number (i.op[0].regs) != 0)
5755 return bad_implicit_operand (i.types[0].bitfield.regxmm);
5756
5757 for (j = 1; j < i.operands; j++)
5758 {
5759 i.op[j - 1] = i.op[j];
5760 i.types[j - 1] = i.types[j];
5761
5762 /* We need to adjust fields in i.tm since they are used by
5763 build_modrm_byte. */
5764 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
5765 }
5766
5767 i.operands--;
5768 i.reg_operands--;
5769 i.tm.operands--;
5770 }
5771 else if (i.tm.opcode_modifier.regkludge)
5772 {
5773 /* The imul $imm, %reg instruction is converted into
5774 imul $imm, %reg, %reg, and the clr %reg instruction
5775 is converted into xor %reg, %reg. */
5776
5777 unsigned int first_reg_op;
5778
5779 if (operand_type_check (i.types[0], reg))
5780 first_reg_op = 0;
5781 else
5782 first_reg_op = 1;
5783 /* Pretend we saw the extra register operand. */
5784 gas_assert (i.reg_operands == 1
5785 && i.op[first_reg_op + 1].regs == 0);
5786 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
5787 i.types[first_reg_op + 1] = i.types[first_reg_op];
5788 i.operands++;
5789 i.reg_operands++;
5790 }
5791
5792 if (i.tm.opcode_modifier.shortform)
5793 {
5794 if (i.types[0].bitfield.sreg2
5795 || i.types[0].bitfield.sreg3)
5796 {
5797 if (i.tm.base_opcode == POP_SEG_SHORT
5798 && i.op[0].regs->reg_num == 1)
5799 {
5800 as_bad (_("you can't `pop %scs'"), register_prefix);
5801 return 0;
5802 }
5803 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
5804 if ((i.op[0].regs->reg_flags & RegRex) != 0)
5805 i.rex |= REX_B;
5806 }
5807 else
5808 {
5809 /* The register or float register operand is in operand
5810 0 or 1. */
5811 unsigned int op;
5812
5813 if (i.types[0].bitfield.floatreg
5814 || operand_type_check (i.types[0], reg))
5815 op = 0;
5816 else
5817 op = 1;
5818 /* Register goes in low 3 bits of opcode. */
5819 i.tm.base_opcode |= i.op[op].regs->reg_num;
5820 if ((i.op[op].regs->reg_flags & RegRex) != 0)
5821 i.rex |= REX_B;
5822 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
5823 {
5824 /* Warn about some common errors, but press on regardless.
5825 The first case can be generated by gcc (<= 2.8.1). */
5826 if (i.operands == 2)
5827 {
5828 /* Reversed arguments on faddp, fsubp, etc. */
5829 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
5830 register_prefix, i.op[!intel_syntax].regs->reg_name,
5831 register_prefix, i.op[intel_syntax].regs->reg_name);
5832 }
5833 else
5834 {
5835 /* Extraneous `l' suffix on fp insn. */
5836 as_warn (_("translating to `%s %s%s'"), i.tm.name,
5837 register_prefix, i.op[0].regs->reg_name);
5838 }
5839 }
5840 }
5841 }
5842 else if (i.tm.opcode_modifier.modrm)
5843 {
5844 /* The opcode is completed (modulo i.tm.extension_opcode which
5845 must be put into the modrm byte). Now, we make the modrm and
5846 index base bytes based on all the info we've collected. */
5847
5848 default_seg = build_modrm_byte ();
5849 }
5850 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
5851 {
5852 default_seg = &ds;
5853 }
5854 else if (i.tm.opcode_modifier.isstring)
5855 {
5856 /* For the string instructions that allow a segment override
5857 on one of their operands, the default segment is ds. */
5858 default_seg = &ds;
5859 }
5860
5861 if (i.tm.base_opcode == 0x8d /* lea */
5862 && i.seg[0]
5863 && !quiet_warnings)
5864 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
5865
5866 /* If a segment was explicitly specified, and the specified segment
5867 is not the default, use an opcode prefix to select it. If we
5868 never figured out what the default segment is, then default_seg
5869 will be zero at this point, and the specified segment prefix will
5870 always be used. */
5871 if ((i.seg[0]) && (i.seg[0] != default_seg))
5872 {
5873 if (!add_prefix (i.seg[0]->seg_prefix))
5874 return 0;
5875 }
5876 return 1;
5877 }
5878
5879 static const seg_entry *
5880 build_modrm_byte (void)
5881 {
5882 const seg_entry *default_seg = 0;
5883 unsigned int source, dest;
5884 int vex_3_sources;
5885
5886 /* The first operand of instructions with VEX prefix and 3 sources
5887 must be VEX_Imm4. */
5888 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
5889 if (vex_3_sources)
5890 {
5891 unsigned int nds, reg_slot;
5892 expressionS *exp;
5893
5894 if (i.tm.opcode_modifier.veximmext
5895 && i.tm.opcode_modifier.immext)
5896 {
5897 dest = i.operands - 2;
5898 gas_assert (dest == 3);
5899 }
5900 else
5901 dest = i.operands - 1;
5902 nds = dest - 1;
5903
5904 /* There are 2 kinds of instructions:
5905 1. 5 operands: 4 register operands or 3 register operands
5906 plus 1 memory operand plus one Vec_Imm4 operand, VexXDS, and
5907 VexW0 or VexW1. The destination must be either XMM, YMM or
5908 ZMM register.
5909 2. 4 operands: 4 register operands or 3 register operands
5910 plus 1 memory operand, VexXDS, and VexImmExt */
5911 gas_assert ((i.reg_operands == 4
5912 || (i.reg_operands == 3 && i.mem_operands == 1))
5913 && i.tm.opcode_modifier.vexvvvv == VEXXDS
5914 && (i.tm.opcode_modifier.veximmext
5915 || (i.imm_operands == 1
5916 && i.types[0].bitfield.vec_imm4
5917 && (i.tm.opcode_modifier.vexw == VEXW0
5918 || i.tm.opcode_modifier.vexw == VEXW1)
5919 && (operand_type_equal (&i.tm.operand_types[dest], &regxmm)
5920 || operand_type_equal (&i.tm.operand_types[dest], &regymm)
5921 || operand_type_equal (&i.tm.operand_types[dest], &regzmm)))));
5922
5923 if (i.imm_operands == 0)
5924 {
5925 /* When there is no immediate operand, generate an 8bit
5926 immediate operand to encode the first operand. */
5927 exp = &im_expressions[i.imm_operands++];
5928 i.op[i.operands].imms = exp;
5929 i.types[i.operands] = imm8;
5930 i.operands++;
5931 /* If VexW1 is set, the first operand is the source and
5932 the second operand is encoded in the immediate operand. */
5933 if (i.tm.opcode_modifier.vexw == VEXW1)
5934 {
5935 source = 0;
5936 reg_slot = 1;
5937 }
5938 else
5939 {
5940 source = 1;
5941 reg_slot = 0;
5942 }
5943
5944 /* FMA swaps REG and NDS. */
5945 if (i.tm.cpu_flags.bitfield.cpufma)
5946 {
5947 unsigned int tmp;
5948 tmp = reg_slot;
5949 reg_slot = nds;
5950 nds = tmp;
5951 }
5952
5953 gas_assert (operand_type_equal (&i.tm.operand_types[reg_slot],
5954 &regxmm)
5955 || operand_type_equal (&i.tm.operand_types[reg_slot],
5956 &regymm)
5957 || operand_type_equal (&i.tm.operand_types[reg_slot],
5958 &regzmm));
5959 exp->X_op = O_constant;
5960 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
5961 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
5962 }
5963 else
5964 {
5965 unsigned int imm_slot;
5966
5967 if (i.tm.opcode_modifier.vexw == VEXW0)
5968 {
5969 /* If VexW0 is set, the third operand is the source and
5970 the second operand is encoded in the immediate
5971 operand. */
5972 source = 2;
5973 reg_slot = 1;
5974 }
5975 else
5976 {
5977 /* VexW1 is set, the second operand is the source and
5978 the third operand is encoded in the immediate
5979 operand. */
5980 source = 1;
5981 reg_slot = 2;
5982 }
5983
5984 if (i.tm.opcode_modifier.immext)
5985 {
5986 /* When ImmExt is set, the immdiate byte is the last
5987 operand. */
5988 imm_slot = i.operands - 1;
5989 source--;
5990 reg_slot--;
5991 }
5992 else
5993 {
5994 imm_slot = 0;
5995
5996 /* Turn on Imm8 so that output_imm will generate it. */
5997 i.types[imm_slot].bitfield.imm8 = 1;
5998 }
5999
6000 gas_assert (operand_type_equal (&i.tm.operand_types[reg_slot],
6001 &regxmm)
6002 || operand_type_equal (&i.tm.operand_types[reg_slot],
6003 &regymm)
6004 || operand_type_equal (&i.tm.operand_types[reg_slot],
6005 &regzmm));
6006 i.op[imm_slot].imms->X_add_number
6007 |= register_number (i.op[reg_slot].regs) << 4;
6008 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6009 }
6010
6011 gas_assert (operand_type_equal (&i.tm.operand_types[nds], &regxmm)
6012 || operand_type_equal (&i.tm.operand_types[nds],
6013 &regymm)
6014 || operand_type_equal (&i.tm.operand_types[nds],
6015 &regzmm));
6016 i.vex.register_specifier = i.op[nds].regs;
6017 }
6018 else
6019 source = dest = 0;
6020
6021 /* i.reg_operands MUST be the number of real register operands;
6022 implicit registers do not count. If there are 3 register
6023 operands, it must be a instruction with VexNDS. For a
6024 instruction with VexNDD, the destination register is encoded
6025 in VEX prefix. If there are 4 register operands, it must be
6026 a instruction with VEX prefix and 3 sources. */
6027 if (i.mem_operands == 0
6028 && ((i.reg_operands == 2
6029 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
6030 || (i.reg_operands == 3
6031 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
6032 || (i.reg_operands == 4 && vex_3_sources)))
6033 {
6034 switch (i.operands)
6035 {
6036 case 2:
6037 source = 0;
6038 break;
6039 case 3:
6040 /* When there are 3 operands, one of them may be immediate,
6041 which may be the first or the last operand. Otherwise,
6042 the first operand must be shift count register (cl) or it
6043 is an instruction with VexNDS. */
6044 gas_assert (i.imm_operands == 1
6045 || (i.imm_operands == 0
6046 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
6047 || i.types[0].bitfield.shiftcount)));
6048 if (operand_type_check (i.types[0], imm)
6049 || i.types[0].bitfield.shiftcount)
6050 source = 1;
6051 else
6052 source = 0;
6053 break;
6054 case 4:
6055 /* When there are 4 operands, the first two must be 8bit
6056 immediate operands. The source operand will be the 3rd
6057 one.
6058
6059 For instructions with VexNDS, if the first operand
6060 an imm8, the source operand is the 2nd one. If the last
6061 operand is imm8, the source operand is the first one. */
6062 gas_assert ((i.imm_operands == 2
6063 && i.types[0].bitfield.imm8
6064 && i.types[1].bitfield.imm8)
6065 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
6066 && i.imm_operands == 1
6067 && (i.types[0].bitfield.imm8
6068 || i.types[i.operands - 1].bitfield.imm8
6069 || i.rounding)));
6070 if (i.imm_operands == 2)
6071 source = 2;
6072 else
6073 {
6074 if (i.types[0].bitfield.imm8)
6075 source = 1;
6076 else
6077 source = 0;
6078 }
6079 break;
6080 case 5:
6081 if (i.tm.opcode_modifier.evex)
6082 {
6083 /* For EVEX instructions, when there are 5 operands, the
6084 first one must be immediate operand. If the second one
6085 is immediate operand, the source operand is the 3th
6086 one. If the last one is immediate operand, the source
6087 operand is the 2nd one. */
6088 gas_assert (i.imm_operands == 2
6089 && i.tm.opcode_modifier.sae
6090 && operand_type_check (i.types[0], imm));
6091 if (operand_type_check (i.types[1], imm))
6092 source = 2;
6093 else if (operand_type_check (i.types[4], imm))
6094 source = 1;
6095 else
6096 abort ();
6097 }
6098 break;
6099 default:
6100 abort ();
6101 }
6102
6103 if (!vex_3_sources)
6104 {
6105 dest = source + 1;
6106
6107 /* RC/SAE operand could be between DEST and SRC. That happens
6108 when one operand is GPR and the other one is XMM/YMM/ZMM
6109 register. */
6110 if (i.rounding && i.rounding->operand == (int) dest)
6111 dest++;
6112
6113 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6114 {
6115 /* For instructions with VexNDS, the register-only source
6116 operand must be 32/64bit integer, XMM, YMM or ZMM
6117 register. It is encoded in VEX prefix. We need to
6118 clear RegMem bit before calling operand_type_equal. */
6119
6120 i386_operand_type op;
6121 unsigned int vvvv;
6122
6123 /* Check register-only source operand when two source
6124 operands are swapped. */
6125 if (!i.tm.operand_types[source].bitfield.baseindex
6126 && i.tm.operand_types[dest].bitfield.baseindex)
6127 {
6128 vvvv = source;
6129 source = dest;
6130 }
6131 else
6132 vvvv = dest;
6133
6134 op = i.tm.operand_types[vvvv];
6135 op.bitfield.regmem = 0;
6136 if ((dest + 1) >= i.operands
6137 || (op.bitfield.reg32 != 1
6138 && !op.bitfield.reg64 != 1
6139 && !operand_type_equal (&op, &regxmm)
6140 && !operand_type_equal (&op, &regymm)
6141 && !operand_type_equal (&op, &regzmm)
6142 && !operand_type_equal (&op, &regmask)))
6143 abort ();
6144 i.vex.register_specifier = i.op[vvvv].regs;
6145 dest++;
6146 }
6147 }
6148
6149 i.rm.mode = 3;
6150 /* One of the register operands will be encoded in the i.tm.reg
6151 field, the other in the combined i.tm.mode and i.tm.regmem
6152 fields. If no form of this instruction supports a memory
6153 destination operand, then we assume the source operand may
6154 sometimes be a memory operand and so we need to store the
6155 destination in the i.rm.reg field. */
6156 if (!i.tm.operand_types[dest].bitfield.regmem
6157 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
6158 {
6159 i.rm.reg = i.op[dest].regs->reg_num;
6160 i.rm.regmem = i.op[source].regs->reg_num;
6161 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6162 i.rex |= REX_R;
6163 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6164 i.vrex |= REX_R;
6165 if ((i.op[source].regs->reg_flags & RegRex) != 0)
6166 i.rex |= REX_B;
6167 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6168 i.vrex |= REX_B;
6169 }
6170 else
6171 {
6172 i.rm.reg = i.op[source].regs->reg_num;
6173 i.rm.regmem = i.op[dest].regs->reg_num;
6174 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6175 i.rex |= REX_B;
6176 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6177 i.vrex |= REX_B;
6178 if ((i.op[source].regs->reg_flags & RegRex) != 0)
6179 i.rex |= REX_R;
6180 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6181 i.vrex |= REX_R;
6182 }
6183 if (flag_code != CODE_64BIT && (i.rex & (REX_R | REX_B)))
6184 {
6185 if (!i.types[0].bitfield.control
6186 && !i.types[1].bitfield.control)
6187 abort ();
6188 i.rex &= ~(REX_R | REX_B);
6189 add_prefix (LOCK_PREFIX_OPCODE);
6190 }
6191 }
6192 else
6193 { /* If it's not 2 reg operands... */
6194 unsigned int mem;
6195
6196 if (i.mem_operands)
6197 {
6198 unsigned int fake_zero_displacement = 0;
6199 unsigned int op;
6200
6201 for (op = 0; op < i.operands; op++)
6202 if (operand_type_check (i.types[op], anymem))
6203 break;
6204 gas_assert (op < i.operands);
6205
6206 if (i.tm.opcode_modifier.vecsib)
6207 {
6208 if (i.index_reg->reg_num == RegEiz
6209 || i.index_reg->reg_num == RegRiz)
6210 abort ();
6211
6212 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6213 if (!i.base_reg)
6214 {
6215 i.sib.base = NO_BASE_REGISTER;
6216 i.sib.scale = i.log2_scale_factor;
6217 /* No Vec_Disp8 if there is no base. */
6218 i.types[op].bitfield.vec_disp8 = 0;
6219 i.types[op].bitfield.disp8 = 0;
6220 i.types[op].bitfield.disp16 = 0;
6221 i.types[op].bitfield.disp64 = 0;
6222 if (flag_code != CODE_64BIT)
6223 {
6224 /* Must be 32 bit */
6225 i.types[op].bitfield.disp32 = 1;
6226 i.types[op].bitfield.disp32s = 0;
6227 }
6228 else
6229 {
6230 i.types[op].bitfield.disp32 = 0;
6231 i.types[op].bitfield.disp32s = 1;
6232 }
6233 }
6234 i.sib.index = i.index_reg->reg_num;
6235 if ((i.index_reg->reg_flags & RegRex) != 0)
6236 i.rex |= REX_X;
6237 if ((i.index_reg->reg_flags & RegVRex) != 0)
6238 i.vrex |= REX_X;
6239 }
6240
6241 default_seg = &ds;
6242
6243 if (i.base_reg == 0)
6244 {
6245 i.rm.mode = 0;
6246 if (!i.disp_operands)
6247 {
6248 fake_zero_displacement = 1;
6249 /* Instructions with VSIB byte need 32bit displacement
6250 if there is no base register. */
6251 if (i.tm.opcode_modifier.vecsib)
6252 i.types[op].bitfield.disp32 = 1;
6253 }
6254 if (i.index_reg == 0)
6255 {
6256 gas_assert (!i.tm.opcode_modifier.vecsib);
6257 /* Operand is just <disp> */
6258 if (flag_code == CODE_64BIT)
6259 {
6260 /* 64bit mode overwrites the 32bit absolute
6261 addressing by RIP relative addressing and
6262 absolute addressing is encoded by one of the
6263 redundant SIB forms. */
6264 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6265 i.sib.base = NO_BASE_REGISTER;
6266 i.sib.index = NO_INDEX_REGISTER;
6267 i.types[op] = ((i.prefix[ADDR_PREFIX] == 0)
6268 ? disp32s : disp32);
6269 }
6270 else if ((flag_code == CODE_16BIT)
6271 ^ (i.prefix[ADDR_PREFIX] != 0))
6272 {
6273 i.rm.regmem = NO_BASE_REGISTER_16;
6274 i.types[op] = disp16;
6275 }
6276 else
6277 {
6278 i.rm.regmem = NO_BASE_REGISTER;
6279 i.types[op] = disp32;
6280 }
6281 }
6282 else if (!i.tm.opcode_modifier.vecsib)
6283 {
6284 /* !i.base_reg && i.index_reg */
6285 if (i.index_reg->reg_num == RegEiz
6286 || i.index_reg->reg_num == RegRiz)
6287 i.sib.index = NO_INDEX_REGISTER;
6288 else
6289 i.sib.index = i.index_reg->reg_num;
6290 i.sib.base = NO_BASE_REGISTER;
6291 i.sib.scale = i.log2_scale_factor;
6292 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6293 /* No Vec_Disp8 if there is no base. */
6294 i.types[op].bitfield.vec_disp8 = 0;
6295 i.types[op].bitfield.disp8 = 0;
6296 i.types[op].bitfield.disp16 = 0;
6297 i.types[op].bitfield.disp64 = 0;
6298 if (flag_code != CODE_64BIT)
6299 {
6300 /* Must be 32 bit */
6301 i.types[op].bitfield.disp32 = 1;
6302 i.types[op].bitfield.disp32s = 0;
6303 }
6304 else
6305 {
6306 i.types[op].bitfield.disp32 = 0;
6307 i.types[op].bitfield.disp32s = 1;
6308 }
6309 if ((i.index_reg->reg_flags & RegRex) != 0)
6310 i.rex |= REX_X;
6311 }
6312 }
6313 /* RIP addressing for 64bit mode. */
6314 else if (i.base_reg->reg_num == RegRip ||
6315 i.base_reg->reg_num == RegEip)
6316 {
6317 gas_assert (!i.tm.opcode_modifier.vecsib);
6318 i.rm.regmem = NO_BASE_REGISTER;
6319 i.types[op].bitfield.disp8 = 0;
6320 i.types[op].bitfield.disp16 = 0;
6321 i.types[op].bitfield.disp32 = 0;
6322 i.types[op].bitfield.disp32s = 1;
6323 i.types[op].bitfield.disp64 = 0;
6324 i.types[op].bitfield.vec_disp8 = 0;
6325 i.flags[op] |= Operand_PCrel;
6326 if (! i.disp_operands)
6327 fake_zero_displacement = 1;
6328 }
6329 else if (i.base_reg->reg_type.bitfield.reg16)
6330 {
6331 gas_assert (!i.tm.opcode_modifier.vecsib);
6332 switch (i.base_reg->reg_num)
6333 {
6334 case 3: /* (%bx) */
6335 if (i.index_reg == 0)
6336 i.rm.regmem = 7;
6337 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
6338 i.rm.regmem = i.index_reg->reg_num - 6;
6339 break;
6340 case 5: /* (%bp) */
6341 default_seg = &ss;
6342 if (i.index_reg == 0)
6343 {
6344 i.rm.regmem = 6;
6345 if (operand_type_check (i.types[op], disp) == 0)
6346 {
6347 /* fake (%bp) into 0(%bp) */
6348 if (i.tm.operand_types[op].bitfield.vec_disp8)
6349 i.types[op].bitfield.vec_disp8 = 1;
6350 else
6351 i.types[op].bitfield.disp8 = 1;
6352 fake_zero_displacement = 1;
6353 }
6354 }
6355 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
6356 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
6357 break;
6358 default: /* (%si) -> 4 or (%di) -> 5 */
6359 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
6360 }
6361 i.rm.mode = mode_from_disp_size (i.types[op]);
6362 }
6363 else /* i.base_reg and 32/64 bit mode */
6364 {
6365 if (flag_code == CODE_64BIT
6366 && operand_type_check (i.types[op], disp))
6367 {
6368 i386_operand_type temp;
6369 operand_type_set (&temp, 0);
6370 temp.bitfield.disp8 = i.types[op].bitfield.disp8;
6371 temp.bitfield.vec_disp8
6372 = i.types[op].bitfield.vec_disp8;
6373 i.types[op] = temp;
6374 if (i.prefix[ADDR_PREFIX] == 0)
6375 i.types[op].bitfield.disp32s = 1;
6376 else
6377 i.types[op].bitfield.disp32 = 1;
6378 }
6379
6380 if (!i.tm.opcode_modifier.vecsib)
6381 i.rm.regmem = i.base_reg->reg_num;
6382 if ((i.base_reg->reg_flags & RegRex) != 0)
6383 i.rex |= REX_B;
6384 i.sib.base = i.base_reg->reg_num;
6385 /* x86-64 ignores REX prefix bit here to avoid decoder
6386 complications. */
6387 if (!(i.base_reg->reg_flags & RegRex)
6388 && (i.base_reg->reg_num == EBP_REG_NUM
6389 || i.base_reg->reg_num == ESP_REG_NUM))
6390 default_seg = &ss;
6391 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
6392 {
6393 fake_zero_displacement = 1;
6394 if (i.tm.operand_types [op].bitfield.vec_disp8)
6395 i.types[op].bitfield.vec_disp8 = 1;
6396 else
6397 i.types[op].bitfield.disp8 = 1;
6398 }
6399 i.sib.scale = i.log2_scale_factor;
6400 if (i.index_reg == 0)
6401 {
6402 gas_assert (!i.tm.opcode_modifier.vecsib);
6403 /* <disp>(%esp) becomes two byte modrm with no index
6404 register. We've already stored the code for esp
6405 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
6406 Any base register besides %esp will not use the
6407 extra modrm byte. */
6408 i.sib.index = NO_INDEX_REGISTER;
6409 }
6410 else if (!i.tm.opcode_modifier.vecsib)
6411 {
6412 if (i.index_reg->reg_num == RegEiz
6413 || i.index_reg->reg_num == RegRiz)
6414 i.sib.index = NO_INDEX_REGISTER;
6415 else
6416 i.sib.index = i.index_reg->reg_num;
6417 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6418 if ((i.index_reg->reg_flags & RegRex) != 0)
6419 i.rex |= REX_X;
6420 }
6421
6422 if (i.disp_operands
6423 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
6424 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
6425 i.rm.mode = 0;
6426 else
6427 {
6428 if (!fake_zero_displacement
6429 && !i.disp_operands
6430 && i.disp_encoding)
6431 {
6432 fake_zero_displacement = 1;
6433 if (i.disp_encoding == disp_encoding_8bit)
6434 i.types[op].bitfield.disp8 = 1;
6435 else
6436 i.types[op].bitfield.disp32 = 1;
6437 }
6438 i.rm.mode = mode_from_disp_size (i.types[op]);
6439 }
6440 }
6441
6442 if (fake_zero_displacement)
6443 {
6444 /* Fakes a zero displacement assuming that i.types[op]
6445 holds the correct displacement size. */
6446 expressionS *exp;
6447
6448 gas_assert (i.op[op].disps == 0);
6449 exp = &disp_expressions[i.disp_operands++];
6450 i.op[op].disps = exp;
6451 exp->X_op = O_constant;
6452 exp->X_add_number = 0;
6453 exp->X_add_symbol = (symbolS *) 0;
6454 exp->X_op_symbol = (symbolS *) 0;
6455 }
6456
6457 mem = op;
6458 }
6459 else
6460 mem = ~0;
6461
6462 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
6463 {
6464 if (operand_type_check (i.types[0], imm))
6465 i.vex.register_specifier = NULL;
6466 else
6467 {
6468 /* VEX.vvvv encodes one of the sources when the first
6469 operand is not an immediate. */
6470 if (i.tm.opcode_modifier.vexw == VEXW0)
6471 i.vex.register_specifier = i.op[0].regs;
6472 else
6473 i.vex.register_specifier = i.op[1].regs;
6474 }
6475
6476 /* Destination is a XMM register encoded in the ModRM.reg
6477 and VEX.R bit. */
6478 i.rm.reg = i.op[2].regs->reg_num;
6479 if ((i.op[2].regs->reg_flags & RegRex) != 0)
6480 i.rex |= REX_R;
6481
6482 /* ModRM.rm and VEX.B encodes the other source. */
6483 if (!i.mem_operands)
6484 {
6485 i.rm.mode = 3;
6486
6487 if (i.tm.opcode_modifier.vexw == VEXW0)
6488 i.rm.regmem = i.op[1].regs->reg_num;
6489 else
6490 i.rm.regmem = i.op[0].regs->reg_num;
6491
6492 if ((i.op[1].regs->reg_flags & RegRex) != 0)
6493 i.rex |= REX_B;
6494 }
6495 }
6496 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
6497 {
6498 i.vex.register_specifier = i.op[2].regs;
6499 if (!i.mem_operands)
6500 {
6501 i.rm.mode = 3;
6502 i.rm.regmem = i.op[1].regs->reg_num;
6503 if ((i.op[1].regs->reg_flags & RegRex) != 0)
6504 i.rex |= REX_B;
6505 }
6506 }
6507 /* Fill in i.rm.reg or i.rm.regmem field with register operand
6508 (if any) based on i.tm.extension_opcode. Again, we must be
6509 careful to make sure that segment/control/debug/test/MMX
6510 registers are coded into the i.rm.reg field. */
6511 else if (i.reg_operands)
6512 {
6513 unsigned int op;
6514 unsigned int vex_reg = ~0;
6515
6516 for (op = 0; op < i.operands; op++)
6517 if (i.types[op].bitfield.reg8
6518 || i.types[op].bitfield.reg16
6519 || i.types[op].bitfield.reg32
6520 || i.types[op].bitfield.reg64
6521 || i.types[op].bitfield.regmmx
6522 || i.types[op].bitfield.regxmm
6523 || i.types[op].bitfield.regymm
6524 || i.types[op].bitfield.regbnd
6525 || i.types[op].bitfield.regzmm
6526 || i.types[op].bitfield.regmask
6527 || i.types[op].bitfield.sreg2
6528 || i.types[op].bitfield.sreg3
6529 || i.types[op].bitfield.control
6530 || i.types[op].bitfield.debug
6531 || i.types[op].bitfield.test)
6532 break;
6533
6534 if (vex_3_sources)
6535 op = dest;
6536 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6537 {
6538 /* For instructions with VexNDS, the register-only
6539 source operand is encoded in VEX prefix. */
6540 gas_assert (mem != (unsigned int) ~0);
6541
6542 if (op > mem)
6543 {
6544 vex_reg = op++;
6545 gas_assert (op < i.operands);
6546 }
6547 else
6548 {
6549 /* Check register-only source operand when two source
6550 operands are swapped. */
6551 if (!i.tm.operand_types[op].bitfield.baseindex
6552 && i.tm.operand_types[op + 1].bitfield.baseindex)
6553 {
6554 vex_reg = op;
6555 op += 2;
6556 gas_assert (mem == (vex_reg + 1)
6557 && op < i.operands);
6558 }
6559 else
6560 {
6561 vex_reg = op + 1;
6562 gas_assert (vex_reg < i.operands);
6563 }
6564 }
6565 }
6566 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
6567 {
6568 /* For instructions with VexNDD, the register destination
6569 is encoded in VEX prefix. */
6570 if (i.mem_operands == 0)
6571 {
6572 /* There is no memory operand. */
6573 gas_assert ((op + 2) == i.operands);
6574 vex_reg = op + 1;
6575 }
6576 else
6577 {
6578 /* There are only 2 operands. */
6579 gas_assert (op < 2 && i.operands == 2);
6580 vex_reg = 1;
6581 }
6582 }
6583 else
6584 gas_assert (op < i.operands);
6585
6586 if (vex_reg != (unsigned int) ~0)
6587 {
6588 i386_operand_type *type = &i.tm.operand_types[vex_reg];
6589
6590 if (type->bitfield.reg32 != 1
6591 && type->bitfield.reg64 != 1
6592 && !operand_type_equal (type, &regxmm)
6593 && !operand_type_equal (type, &regymm)
6594 && !operand_type_equal (type, &regzmm)
6595 && !operand_type_equal (type, &regmask))
6596 abort ();
6597
6598 i.vex.register_specifier = i.op[vex_reg].regs;
6599 }
6600
6601 /* Don't set OP operand twice. */
6602 if (vex_reg != op)
6603 {
6604 /* If there is an extension opcode to put here, the
6605 register number must be put into the regmem field. */
6606 if (i.tm.extension_opcode != None)
6607 {
6608 i.rm.regmem = i.op[op].regs->reg_num;
6609 if ((i.op[op].regs->reg_flags & RegRex) != 0)
6610 i.rex |= REX_B;
6611 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
6612 i.vrex |= REX_B;
6613 }
6614 else
6615 {
6616 i.rm.reg = i.op[op].regs->reg_num;
6617 if ((i.op[op].regs->reg_flags & RegRex) != 0)
6618 i.rex |= REX_R;
6619 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
6620 i.vrex |= REX_R;
6621 }
6622 }
6623
6624 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
6625 must set it to 3 to indicate this is a register operand
6626 in the regmem field. */
6627 if (!i.mem_operands)
6628 i.rm.mode = 3;
6629 }
6630
6631 /* Fill in i.rm.reg field with extension opcode (if any). */
6632 if (i.tm.extension_opcode != None)
6633 i.rm.reg = i.tm.extension_opcode;
6634 }
6635 return default_seg;
6636 }
6637
6638 static void
6639 output_branch (void)
6640 {
6641 char *p;
6642 int size;
6643 int code16;
6644 int prefix;
6645 relax_substateT subtype;
6646 symbolS *sym;
6647 offsetT off;
6648
6649 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
6650 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
6651
6652 prefix = 0;
6653 if (i.prefix[DATA_PREFIX] != 0)
6654 {
6655 prefix = 1;
6656 i.prefixes -= 1;
6657 code16 ^= CODE16;
6658 }
6659 /* Pentium4 branch hints. */
6660 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
6661 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
6662 {
6663 prefix++;
6664 i.prefixes--;
6665 }
6666 if (i.prefix[REX_PREFIX] != 0)
6667 {
6668 prefix++;
6669 i.prefixes--;
6670 }
6671
6672 /* BND prefixed jump. */
6673 if (i.prefix[BND_PREFIX] != 0)
6674 {
6675 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
6676 i.prefixes -= 1;
6677 }
6678
6679 if (i.prefixes != 0 && !intel_syntax)
6680 as_warn (_("skipping prefixes on this instruction"));
6681
6682 /* It's always a symbol; End frag & setup for relax.
6683 Make sure there is enough room in this frag for the largest
6684 instruction we may generate in md_convert_frag. This is 2
6685 bytes for the opcode and room for the prefix and largest
6686 displacement. */
6687 frag_grow (prefix + 2 + 4);
6688 /* Prefix and 1 opcode byte go in fr_fix. */
6689 p = frag_more (prefix + 1);
6690 if (i.prefix[DATA_PREFIX] != 0)
6691 *p++ = DATA_PREFIX_OPCODE;
6692 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
6693 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
6694 *p++ = i.prefix[SEG_PREFIX];
6695 if (i.prefix[REX_PREFIX] != 0)
6696 *p++ = i.prefix[REX_PREFIX];
6697 *p = i.tm.base_opcode;
6698
6699 if ((unsigned char) *p == JUMP_PC_RELATIVE)
6700 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
6701 else if (cpu_arch_flags.bitfield.cpui386)
6702 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
6703 else
6704 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
6705 subtype |= code16;
6706
6707 sym = i.op[0].disps->X_add_symbol;
6708 off = i.op[0].disps->X_add_number;
6709
6710 if (i.op[0].disps->X_op != O_constant
6711 && i.op[0].disps->X_op != O_symbol)
6712 {
6713 /* Handle complex expressions. */
6714 sym = make_expr_symbol (i.op[0].disps);
6715 off = 0;
6716 }
6717
6718 /* 1 possible extra opcode + 4 byte displacement go in var part.
6719 Pass reloc in fr_var. */
6720 frag_var (rs_machine_dependent, 5,
6721 ((!object_64bit
6722 || i.reloc[0] != NO_RELOC
6723 || (i.bnd_prefix == NULL && !add_bnd_prefix))
6724 ? i.reloc[0]
6725 : BFD_RELOC_X86_64_PC32_BND),
6726 subtype, sym, off, p);
6727 }
6728
6729 static void
6730 output_jump (void)
6731 {
6732 char *p;
6733 int size;
6734 fixS *fixP;
6735
6736 if (i.tm.opcode_modifier.jumpbyte)
6737 {
6738 /* This is a loop or jecxz type instruction. */
6739 size = 1;
6740 if (i.prefix[ADDR_PREFIX] != 0)
6741 {
6742 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
6743 i.prefixes -= 1;
6744 }
6745 /* Pentium4 branch hints. */
6746 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
6747 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
6748 {
6749 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
6750 i.prefixes--;
6751 }
6752 }
6753 else
6754 {
6755 int code16;
6756
6757 code16 = 0;
6758 if (flag_code == CODE_16BIT)
6759 code16 = CODE16;
6760
6761 if (i.prefix[DATA_PREFIX] != 0)
6762 {
6763 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
6764 i.prefixes -= 1;
6765 code16 ^= CODE16;
6766 }
6767
6768 size = 4;
6769 if (code16)
6770 size = 2;
6771 }
6772
6773 if (i.prefix[REX_PREFIX] != 0)
6774 {
6775 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
6776 i.prefixes -= 1;
6777 }
6778
6779 /* BND prefixed jump. */
6780 if (i.prefix[BND_PREFIX] != 0)
6781 {
6782 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
6783 i.prefixes -= 1;
6784 }
6785
6786 if (i.prefixes != 0 && !intel_syntax)
6787 as_warn (_("skipping prefixes on this instruction"));
6788
6789 p = frag_more (i.tm.opcode_length + size);
6790 switch (i.tm.opcode_length)
6791 {
6792 case 2:
6793 *p++ = i.tm.base_opcode >> 8;
6794 case 1:
6795 *p++ = i.tm.base_opcode;
6796 break;
6797 default:
6798 abort ();
6799 }
6800
6801 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
6802 i.op[0].disps, 1, reloc (size, 1, 1,
6803 (i.bnd_prefix != NULL
6804 || add_bnd_prefix),
6805 i.reloc[0]));
6806
6807 /* All jumps handled here are signed, but don't use a signed limit
6808 check for 32 and 16 bit jumps as we want to allow wrap around at
6809 4G and 64k respectively. */
6810 if (size == 1)
6811 fixP->fx_signed = 1;
6812 }
6813
6814 static void
6815 output_interseg_jump (void)
6816 {
6817 char *p;
6818 int size;
6819 int prefix;
6820 int code16;
6821
6822 code16 = 0;
6823 if (flag_code == CODE_16BIT)
6824 code16 = CODE16;
6825
6826 prefix = 0;
6827 if (i.prefix[DATA_PREFIX] != 0)
6828 {
6829 prefix = 1;
6830 i.prefixes -= 1;
6831 code16 ^= CODE16;
6832 }
6833 if (i.prefix[REX_PREFIX] != 0)
6834 {
6835 prefix++;
6836 i.prefixes -= 1;
6837 }
6838
6839 size = 4;
6840 if (code16)
6841 size = 2;
6842
6843 if (i.prefixes != 0 && !intel_syntax)
6844 as_warn (_("skipping prefixes on this instruction"));
6845
6846 /* 1 opcode; 2 segment; offset */
6847 p = frag_more (prefix + 1 + 2 + size);
6848
6849 if (i.prefix[DATA_PREFIX] != 0)
6850 *p++ = DATA_PREFIX_OPCODE;
6851
6852 if (i.prefix[REX_PREFIX] != 0)
6853 *p++ = i.prefix[REX_PREFIX];
6854
6855 *p++ = i.tm.base_opcode;
6856 if (i.op[1].imms->X_op == O_constant)
6857 {
6858 offsetT n = i.op[1].imms->X_add_number;
6859
6860 if (size == 2
6861 && !fits_in_unsigned_word (n)
6862 && !fits_in_signed_word (n))
6863 {
6864 as_bad (_("16-bit jump out of range"));
6865 return;
6866 }
6867 md_number_to_chars (p, n, size);
6868 }
6869 else
6870 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
6871 i.op[1].imms, 0, reloc (size, 0, 0, 0, i.reloc[1]));
6872 if (i.op[0].imms->X_op != O_constant)
6873 as_bad (_("can't handle non absolute segment in `%s'"),
6874 i.tm.name);
6875 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
6876 }
6877
6878 static void
6879 output_insn (void)
6880 {
6881 fragS *insn_start_frag;
6882 offsetT insn_start_off;
6883
6884 /* Tie dwarf2 debug info to the address at the start of the insn.
6885 We can't do this after the insn has been output as the current
6886 frag may have been closed off. eg. by frag_var. */
6887 dwarf2_emit_insn (0);
6888
6889 insn_start_frag = frag_now;
6890 insn_start_off = frag_now_fix ();
6891
6892 /* Output jumps. */
6893 if (i.tm.opcode_modifier.jump)
6894 output_branch ();
6895 else if (i.tm.opcode_modifier.jumpbyte
6896 || i.tm.opcode_modifier.jumpdword)
6897 output_jump ();
6898 else if (i.tm.opcode_modifier.jumpintersegment)
6899 output_interseg_jump ();
6900 else
6901 {
6902 /* Output normal instructions here. */
6903 char *p;
6904 unsigned char *q;
6905 unsigned int j;
6906 unsigned int prefix;
6907
6908 /* Since the VEX/EVEX prefix contains the implicit prefix, we
6909 don't need the explicit prefix. */
6910 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
6911 {
6912 switch (i.tm.opcode_length)
6913 {
6914 case 3:
6915 if (i.tm.base_opcode & 0xff000000)
6916 {
6917 prefix = (i.tm.base_opcode >> 24) & 0xff;
6918 goto check_prefix;
6919 }
6920 break;
6921 case 2:
6922 if ((i.tm.base_opcode & 0xff0000) != 0)
6923 {
6924 prefix = (i.tm.base_opcode >> 16) & 0xff;
6925 if (i.tm.cpu_flags.bitfield.cpupadlock)
6926 {
6927 check_prefix:
6928 if (prefix != REPE_PREFIX_OPCODE
6929 || (i.prefix[REP_PREFIX]
6930 != REPE_PREFIX_OPCODE))
6931 add_prefix (prefix);
6932 }
6933 else
6934 add_prefix (prefix);
6935 }
6936 break;
6937 case 1:
6938 break;
6939 default:
6940 abort ();
6941 }
6942
6943 /* The prefix bytes. */
6944 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
6945 if (*q)
6946 FRAG_APPEND_1_CHAR (*q);
6947 }
6948 else
6949 {
6950 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
6951 if (*q)
6952 switch (j)
6953 {
6954 case REX_PREFIX:
6955 /* REX byte is encoded in VEX prefix. */
6956 break;
6957 case SEG_PREFIX:
6958 case ADDR_PREFIX:
6959 FRAG_APPEND_1_CHAR (*q);
6960 break;
6961 default:
6962 /* There should be no other prefixes for instructions
6963 with VEX prefix. */
6964 abort ();
6965 }
6966
6967 /* For EVEX instructions i.vrex should become 0 after
6968 build_evex_prefix. For VEX instructions upper 16 registers
6969 aren't available, so VREX should be 0. */
6970 if (i.vrex)
6971 abort ();
6972 /* Now the VEX prefix. */
6973 p = frag_more (i.vex.length);
6974 for (j = 0; j < i.vex.length; j++)
6975 p[j] = i.vex.bytes[j];
6976 }
6977
6978 /* Now the opcode; be careful about word order here! */
6979 if (i.tm.opcode_length == 1)
6980 {
6981 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
6982 }
6983 else
6984 {
6985 switch (i.tm.opcode_length)
6986 {
6987 case 4:
6988 p = frag_more (4);
6989 *p++ = (i.tm.base_opcode >> 24) & 0xff;
6990 *p++ = (i.tm.base_opcode >> 16) & 0xff;
6991 break;
6992 case 3:
6993 p = frag_more (3);
6994 *p++ = (i.tm.base_opcode >> 16) & 0xff;
6995 break;
6996 case 2:
6997 p = frag_more (2);
6998 break;
6999 default:
7000 abort ();
7001 break;
7002 }
7003
7004 /* Put out high byte first: can't use md_number_to_chars! */
7005 *p++ = (i.tm.base_opcode >> 8) & 0xff;
7006 *p = i.tm.base_opcode & 0xff;
7007 }
7008
7009 /* Now the modrm byte and sib byte (if present). */
7010 if (i.tm.opcode_modifier.modrm)
7011 {
7012 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
7013 | i.rm.reg << 3
7014 | i.rm.mode << 6));
7015 /* If i.rm.regmem == ESP (4)
7016 && i.rm.mode != (Register mode)
7017 && not 16 bit
7018 ==> need second modrm byte. */
7019 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
7020 && i.rm.mode != 3
7021 && !(i.base_reg && i.base_reg->reg_type.bitfield.reg16))
7022 FRAG_APPEND_1_CHAR ((i.sib.base << 0
7023 | i.sib.index << 3
7024 | i.sib.scale << 6));
7025 }
7026
7027 if (i.disp_operands)
7028 output_disp (insn_start_frag, insn_start_off);
7029
7030 if (i.imm_operands)
7031 output_imm (insn_start_frag, insn_start_off);
7032 }
7033
7034 #ifdef DEBUG386
7035 if (flag_debug)
7036 {
7037 pi ("" /*line*/, &i);
7038 }
7039 #endif /* DEBUG386 */
7040 }
7041
7042 /* Return the size of the displacement operand N. */
7043
7044 static int
7045 disp_size (unsigned int n)
7046 {
7047 int size = 4;
7048
7049 /* Vec_Disp8 has to be 8bit. */
7050 if (i.types[n].bitfield.vec_disp8)
7051 size = 1;
7052 else if (i.types[n].bitfield.disp64)
7053 size = 8;
7054 else if (i.types[n].bitfield.disp8)
7055 size = 1;
7056 else if (i.types[n].bitfield.disp16)
7057 size = 2;
7058 return size;
7059 }
7060
7061 /* Return the size of the immediate operand N. */
7062
7063 static int
7064 imm_size (unsigned int n)
7065 {
7066 int size = 4;
7067 if (i.types[n].bitfield.imm64)
7068 size = 8;
7069 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
7070 size = 1;
7071 else if (i.types[n].bitfield.imm16)
7072 size = 2;
7073 return size;
7074 }
7075
7076 static void
7077 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
7078 {
7079 char *p;
7080 unsigned int n;
7081
7082 for (n = 0; n < i.operands; n++)
7083 {
7084 if (i.types[n].bitfield.vec_disp8
7085 || operand_type_check (i.types[n], disp))
7086 {
7087 if (i.op[n].disps->X_op == O_constant)
7088 {
7089 int size = disp_size (n);
7090 offsetT val = i.op[n].disps->X_add_number;
7091
7092 if (i.types[n].bitfield.vec_disp8)
7093 val >>= i.memshift;
7094 val = offset_in_range (val, size);
7095 p = frag_more (size);
7096 md_number_to_chars (p, val, size);
7097 }
7098 else
7099 {
7100 enum bfd_reloc_code_real reloc_type;
7101 int size = disp_size (n);
7102 int sign = i.types[n].bitfield.disp32s;
7103 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
7104
7105 /* We can't have 8 bit displacement here. */
7106 gas_assert (!i.types[n].bitfield.disp8);
7107
7108 /* The PC relative address is computed relative
7109 to the instruction boundary, so in case immediate
7110 fields follows, we need to adjust the value. */
7111 if (pcrel && i.imm_operands)
7112 {
7113 unsigned int n1;
7114 int sz = 0;
7115
7116 for (n1 = 0; n1 < i.operands; n1++)
7117 if (operand_type_check (i.types[n1], imm))
7118 {
7119 /* Only one immediate is allowed for PC
7120 relative address. */
7121 gas_assert (sz == 0);
7122 sz = imm_size (n1);
7123 i.op[n].disps->X_add_number -= sz;
7124 }
7125 /* We should find the immediate. */
7126 gas_assert (sz != 0);
7127 }
7128
7129 p = frag_more (size);
7130 reloc_type = reloc (size, pcrel, sign,
7131 (i.bnd_prefix != NULL
7132 || add_bnd_prefix),
7133 i.reloc[n]);
7134 if (GOT_symbol
7135 && GOT_symbol == i.op[n].disps->X_add_symbol
7136 && (((reloc_type == BFD_RELOC_32
7137 || reloc_type == BFD_RELOC_X86_64_32S
7138 || (reloc_type == BFD_RELOC_64
7139 && object_64bit))
7140 && (i.op[n].disps->X_op == O_symbol
7141 || (i.op[n].disps->X_op == O_add
7142 && ((symbol_get_value_expression
7143 (i.op[n].disps->X_op_symbol)->X_op)
7144 == O_subtract))))
7145 || reloc_type == BFD_RELOC_32_PCREL))
7146 {
7147 offsetT add;
7148
7149 if (insn_start_frag == frag_now)
7150 add = (p - frag_now->fr_literal) - insn_start_off;
7151 else
7152 {
7153 fragS *fr;
7154
7155 add = insn_start_frag->fr_fix - insn_start_off;
7156 for (fr = insn_start_frag->fr_next;
7157 fr && fr != frag_now; fr = fr->fr_next)
7158 add += fr->fr_fix;
7159 add += p - frag_now->fr_literal;
7160 }
7161
7162 if (!object_64bit)
7163 {
7164 reloc_type = BFD_RELOC_386_GOTPC;
7165 i.op[n].imms->X_add_number += add;
7166 }
7167 else if (reloc_type == BFD_RELOC_64)
7168 reloc_type = BFD_RELOC_X86_64_GOTPC64;
7169 else
7170 /* Don't do the adjustment for x86-64, as there
7171 the pcrel addressing is relative to the _next_
7172 insn, and that is taken care of in other code. */
7173 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7174 }
7175 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7176 i.op[n].disps, pcrel, reloc_type);
7177 }
7178 }
7179 }
7180 }
7181
7182 static void
7183 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
7184 {
7185 char *p;
7186 unsigned int n;
7187
7188 for (n = 0; n < i.operands; n++)
7189 {
7190 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
7191 if (i.rounding && (int) n == i.rounding->operand)
7192 continue;
7193
7194 if (operand_type_check (i.types[n], imm))
7195 {
7196 if (i.op[n].imms->X_op == O_constant)
7197 {
7198 int size = imm_size (n);
7199 offsetT val;
7200
7201 val = offset_in_range (i.op[n].imms->X_add_number,
7202 size);
7203 p = frag_more (size);
7204 md_number_to_chars (p, val, size);
7205 }
7206 else
7207 {
7208 /* Not absolute_section.
7209 Need a 32-bit fixup (don't support 8bit
7210 non-absolute imms). Try to support other
7211 sizes ... */
7212 enum bfd_reloc_code_real reloc_type;
7213 int size = imm_size (n);
7214 int sign;
7215
7216 if (i.types[n].bitfield.imm32s
7217 && (i.suffix == QWORD_MNEM_SUFFIX
7218 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
7219 sign = 1;
7220 else
7221 sign = 0;
7222
7223 p = frag_more (size);
7224 reloc_type = reloc (size, 0, sign, 0, i.reloc[n]);
7225
7226 /* This is tough to explain. We end up with this one if we
7227 * have operands that look like
7228 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
7229 * obtain the absolute address of the GOT, and it is strongly
7230 * preferable from a performance point of view to avoid using
7231 * a runtime relocation for this. The actual sequence of
7232 * instructions often look something like:
7233 *
7234 * call .L66
7235 * .L66:
7236 * popl %ebx
7237 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
7238 *
7239 * The call and pop essentially return the absolute address
7240 * of the label .L66 and store it in %ebx. The linker itself
7241 * will ultimately change the first operand of the addl so
7242 * that %ebx points to the GOT, but to keep things simple, the
7243 * .o file must have this operand set so that it generates not
7244 * the absolute address of .L66, but the absolute address of
7245 * itself. This allows the linker itself simply treat a GOTPC
7246 * relocation as asking for a pcrel offset to the GOT to be
7247 * added in, and the addend of the relocation is stored in the
7248 * operand field for the instruction itself.
7249 *
7250 * Our job here is to fix the operand so that it would add
7251 * the correct offset so that %ebx would point to itself. The
7252 * thing that is tricky is that .-.L66 will point to the
7253 * beginning of the instruction, so we need to further modify
7254 * the operand so that it will point to itself. There are
7255 * other cases where you have something like:
7256 *
7257 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
7258 *
7259 * and here no correction would be required. Internally in
7260 * the assembler we treat operands of this form as not being
7261 * pcrel since the '.' is explicitly mentioned, and I wonder
7262 * whether it would simplify matters to do it this way. Who
7263 * knows. In earlier versions of the PIC patches, the
7264 * pcrel_adjust field was used to store the correction, but
7265 * since the expression is not pcrel, I felt it would be
7266 * confusing to do it this way. */
7267
7268 if ((reloc_type == BFD_RELOC_32
7269 || reloc_type == BFD_RELOC_X86_64_32S
7270 || reloc_type == BFD_RELOC_64)
7271 && GOT_symbol
7272 && GOT_symbol == i.op[n].imms->X_add_symbol
7273 && (i.op[n].imms->X_op == O_symbol
7274 || (i.op[n].imms->X_op == O_add
7275 && ((symbol_get_value_expression
7276 (i.op[n].imms->X_op_symbol)->X_op)
7277 == O_subtract))))
7278 {
7279 offsetT add;
7280
7281 if (insn_start_frag == frag_now)
7282 add = (p - frag_now->fr_literal) - insn_start_off;
7283 else
7284 {
7285 fragS *fr;
7286
7287 add = insn_start_frag->fr_fix - insn_start_off;
7288 for (fr = insn_start_frag->fr_next;
7289 fr && fr != frag_now; fr = fr->fr_next)
7290 add += fr->fr_fix;
7291 add += p - frag_now->fr_literal;
7292 }
7293
7294 if (!object_64bit)
7295 reloc_type = BFD_RELOC_386_GOTPC;
7296 else if (size == 4)
7297 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7298 else if (size == 8)
7299 reloc_type = BFD_RELOC_X86_64_GOTPC64;
7300 i.op[n].imms->X_add_number += add;
7301 }
7302 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7303 i.op[n].imms, 0, reloc_type);
7304 }
7305 }
7306 }
7307 }
7308 \f
7309 /* x86_cons_fix_new is called via the expression parsing code when a
7310 reloc is needed. We use this hook to get the correct .got reloc. */
7311 static enum bfd_reloc_code_real got_reloc = NO_RELOC;
7312 static int cons_sign = -1;
7313
7314 void
7315 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
7316 expressionS *exp)
7317 {
7318 enum bfd_reloc_code_real r = reloc (len, 0, cons_sign, 0, got_reloc);
7319
7320 got_reloc = NO_RELOC;
7321
7322 #ifdef TE_PE
7323 if (exp->X_op == O_secrel)
7324 {
7325 exp->X_op = O_symbol;
7326 r = BFD_RELOC_32_SECREL;
7327 }
7328 #endif
7329
7330 fix_new_exp (frag, off, len, exp, 0, r);
7331 }
7332
7333 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
7334 purpose of the `.dc.a' internal pseudo-op. */
7335
7336 int
7337 x86_address_bytes (void)
7338 {
7339 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
7340 return 4;
7341 return stdoutput->arch_info->bits_per_address / 8;
7342 }
7343
7344 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
7345 || defined (LEX_AT)
7346 # define lex_got(reloc, adjust, types, bnd_prefix) NULL
7347 #else
7348 /* Parse operands of the form
7349 <symbol>@GOTOFF+<nnn>
7350 and similar .plt or .got references.
7351
7352 If we find one, set up the correct relocation in RELOC and copy the
7353 input string, minus the `@GOTOFF' into a malloc'd buffer for
7354 parsing by the calling routine. Return this buffer, and if ADJUST
7355 is non-null set it to the length of the string we removed from the
7356 input line. Otherwise return NULL. */
7357 static char *
7358 lex_got (enum bfd_reloc_code_real *rel,
7359 int *adjust,
7360 i386_operand_type *types,
7361 int bnd_prefix)
7362 {
7363 /* Some of the relocations depend on the size of what field is to
7364 be relocated. But in our callers i386_immediate and i386_displacement
7365 we don't yet know the operand size (this will be set by insn
7366 matching). Hence we record the word32 relocation here,
7367 and adjust the reloc according to the real size in reloc(). */
7368 static const struct {
7369 const char *str;
7370 int len;
7371 const enum bfd_reloc_code_real rel[2];
7372 const i386_operand_type types64;
7373 } gotrel[] = {
7374 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7375 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
7376 BFD_RELOC_SIZE32 },
7377 OPERAND_TYPE_IMM32_64 },
7378 #endif
7379 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
7380 BFD_RELOC_X86_64_PLTOFF64 },
7381 OPERAND_TYPE_IMM64 },
7382 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
7383 BFD_RELOC_X86_64_PLT32 },
7384 OPERAND_TYPE_IMM32_32S_DISP32 },
7385 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
7386 BFD_RELOC_X86_64_GOTPLT64 },
7387 OPERAND_TYPE_IMM64_DISP64 },
7388 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
7389 BFD_RELOC_X86_64_GOTOFF64 },
7390 OPERAND_TYPE_IMM64_DISP64 },
7391 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
7392 BFD_RELOC_X86_64_GOTPCREL },
7393 OPERAND_TYPE_IMM32_32S_DISP32 },
7394 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
7395 BFD_RELOC_X86_64_TLSGD },
7396 OPERAND_TYPE_IMM32_32S_DISP32 },
7397 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
7398 _dummy_first_bfd_reloc_code_real },
7399 OPERAND_TYPE_NONE },
7400 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
7401 BFD_RELOC_X86_64_TLSLD },
7402 OPERAND_TYPE_IMM32_32S_DISP32 },
7403 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
7404 BFD_RELOC_X86_64_GOTTPOFF },
7405 OPERAND_TYPE_IMM32_32S_DISP32 },
7406 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
7407 BFD_RELOC_X86_64_TPOFF32 },
7408 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7409 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
7410 _dummy_first_bfd_reloc_code_real },
7411 OPERAND_TYPE_NONE },
7412 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
7413 BFD_RELOC_X86_64_DTPOFF32 },
7414 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7415 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
7416 _dummy_first_bfd_reloc_code_real },
7417 OPERAND_TYPE_NONE },
7418 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
7419 _dummy_first_bfd_reloc_code_real },
7420 OPERAND_TYPE_NONE },
7421 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
7422 BFD_RELOC_X86_64_GOT32 },
7423 OPERAND_TYPE_IMM32_32S_64_DISP32 },
7424 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
7425 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
7426 OPERAND_TYPE_IMM32_32S_DISP32 },
7427 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
7428 BFD_RELOC_X86_64_TLSDESC_CALL },
7429 OPERAND_TYPE_IMM32_32S_DISP32 },
7430 };
7431 char *cp;
7432 unsigned int j;
7433
7434 #if defined (OBJ_MAYBE_ELF)
7435 if (!IS_ELF)
7436 return NULL;
7437 #endif
7438
7439 for (cp = input_line_pointer; *cp != '@'; cp++)
7440 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
7441 return NULL;
7442
7443 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
7444 {
7445 int len = gotrel[j].len;
7446 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
7447 {
7448 if (gotrel[j].rel[object_64bit] != 0)
7449 {
7450 int first, second;
7451 char *tmpbuf, *past_reloc;
7452
7453 *rel = gotrel[j].rel[object_64bit];
7454
7455 if (types)
7456 {
7457 if (flag_code != CODE_64BIT)
7458 {
7459 types->bitfield.imm32 = 1;
7460 types->bitfield.disp32 = 1;
7461 }
7462 else
7463 *types = gotrel[j].types64;
7464 }
7465
7466 if (j != 0 && GOT_symbol == NULL)
7467 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
7468
7469 /* The length of the first part of our input line. */
7470 first = cp - input_line_pointer;
7471
7472 /* The second part goes from after the reloc token until
7473 (and including) an end_of_line char or comma. */
7474 past_reloc = cp + 1 + len;
7475 cp = past_reloc;
7476 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
7477 ++cp;
7478 second = cp + 1 - past_reloc;
7479
7480 /* Allocate and copy string. The trailing NUL shouldn't
7481 be necessary, but be safe. */
7482 tmpbuf = (char *) xmalloc (first + second + 2);
7483 memcpy (tmpbuf, input_line_pointer, first);
7484 if (second != 0 && *past_reloc != ' ')
7485 /* Replace the relocation token with ' ', so that
7486 errors like foo@GOTOFF1 will be detected. */
7487 tmpbuf[first++] = ' ';
7488 else
7489 /* Increment length by 1 if the relocation token is
7490 removed. */
7491 len++;
7492 if (adjust)
7493 *adjust = len;
7494 memcpy (tmpbuf + first, past_reloc, second);
7495 tmpbuf[first + second] = '\0';
7496 if (bnd_prefix && *rel == BFD_RELOC_X86_64_PLT32)
7497 *rel = BFD_RELOC_X86_64_PLT32_BND;
7498 return tmpbuf;
7499 }
7500
7501 as_bad (_("@%s reloc is not supported with %d-bit output format"),
7502 gotrel[j].str, 1 << (5 + object_64bit));
7503 return NULL;
7504 }
7505 }
7506
7507 /* Might be a symbol version string. Don't as_bad here. */
7508 return NULL;
7509 }
7510 #endif
7511
7512 #ifdef TE_PE
7513 #ifdef lex_got
7514 #undef lex_got
7515 #endif
7516 /* Parse operands of the form
7517 <symbol>@SECREL32+<nnn>
7518
7519 If we find one, set up the correct relocation in RELOC and copy the
7520 input string, minus the `@SECREL32' into a malloc'd buffer for
7521 parsing by the calling routine. Return this buffer, and if ADJUST
7522 is non-null set it to the length of the string we removed from the
7523 input line. Otherwise return NULL.
7524
7525 This function is copied from the ELF version above adjusted for PE targets. */
7526
7527 static char *
7528 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
7529 int *adjust ATTRIBUTE_UNUSED,
7530 i386_operand_type *types,
7531 int bnd_prefix ATTRIBUTE_UNUSED)
7532 {
7533 static const struct
7534 {
7535 const char *str;
7536 int len;
7537 const enum bfd_reloc_code_real rel[2];
7538 const i386_operand_type types64;
7539 }
7540 gotrel[] =
7541 {
7542 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
7543 BFD_RELOC_32_SECREL },
7544 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7545 };
7546
7547 char *cp;
7548 unsigned j;
7549
7550 for (cp = input_line_pointer; *cp != '@'; cp++)
7551 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
7552 return NULL;
7553
7554 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
7555 {
7556 int len = gotrel[j].len;
7557
7558 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
7559 {
7560 if (gotrel[j].rel[object_64bit] != 0)
7561 {
7562 int first, second;
7563 char *tmpbuf, *past_reloc;
7564
7565 *rel = gotrel[j].rel[object_64bit];
7566 if (adjust)
7567 *adjust = len;
7568
7569 if (types)
7570 {
7571 if (flag_code != CODE_64BIT)
7572 {
7573 types->bitfield.imm32 = 1;
7574 types->bitfield.disp32 = 1;
7575 }
7576 else
7577 *types = gotrel[j].types64;
7578 }
7579
7580 /* The length of the first part of our input line. */
7581 first = cp - input_line_pointer;
7582
7583 /* The second part goes from after the reloc token until
7584 (and including) an end_of_line char or comma. */
7585 past_reloc = cp + 1 + len;
7586 cp = past_reloc;
7587 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
7588 ++cp;
7589 second = cp + 1 - past_reloc;
7590
7591 /* Allocate and copy string. The trailing NUL shouldn't
7592 be necessary, but be safe. */
7593 tmpbuf = (char *) xmalloc (first + second + 2);
7594 memcpy (tmpbuf, input_line_pointer, first);
7595 if (second != 0 && *past_reloc != ' ')
7596 /* Replace the relocation token with ' ', so that
7597 errors like foo@SECLREL321 will be detected. */
7598 tmpbuf[first++] = ' ';
7599 memcpy (tmpbuf + first, past_reloc, second);
7600 tmpbuf[first + second] = '\0';
7601 return tmpbuf;
7602 }
7603
7604 as_bad (_("@%s reloc is not supported with %d-bit output format"),
7605 gotrel[j].str, 1 << (5 + object_64bit));
7606 return NULL;
7607 }
7608 }
7609
7610 /* Might be a symbol version string. Don't as_bad here. */
7611 return NULL;
7612 }
7613
7614 #endif /* TE_PE */
7615
7616 void
7617 x86_cons (expressionS *exp, int size)
7618 {
7619 intel_syntax = -intel_syntax;
7620
7621 exp->X_md = 0;
7622 if (size == 4 || (object_64bit && size == 8))
7623 {
7624 /* Handle @GOTOFF and the like in an expression. */
7625 char *save;
7626 char *gotfree_input_line;
7627 int adjust = 0;
7628
7629 save = input_line_pointer;
7630 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL, 0);
7631 if (gotfree_input_line)
7632 input_line_pointer = gotfree_input_line;
7633
7634 expression (exp);
7635
7636 if (gotfree_input_line)
7637 {
7638 /* expression () has merrily parsed up to the end of line,
7639 or a comma - in the wrong buffer. Transfer how far
7640 input_line_pointer has moved to the right buffer. */
7641 input_line_pointer = (save
7642 + (input_line_pointer - gotfree_input_line)
7643 + adjust);
7644 free (gotfree_input_line);
7645 if (exp->X_op == O_constant
7646 || exp->X_op == O_absent
7647 || exp->X_op == O_illegal
7648 || exp->X_op == O_register
7649 || exp->X_op == O_big)
7650 {
7651 char c = *input_line_pointer;
7652 *input_line_pointer = 0;
7653 as_bad (_("missing or invalid expression `%s'"), save);
7654 *input_line_pointer = c;
7655 }
7656 }
7657 }
7658 else
7659 expression (exp);
7660
7661 intel_syntax = -intel_syntax;
7662
7663 if (intel_syntax)
7664 i386_intel_simplify (exp);
7665 }
7666
7667 static void
7668 signed_cons (int size)
7669 {
7670 if (flag_code == CODE_64BIT)
7671 cons_sign = 1;
7672 cons (size);
7673 cons_sign = -1;
7674 }
7675
7676 #ifdef TE_PE
7677 static void
7678 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
7679 {
7680 expressionS exp;
7681
7682 do
7683 {
7684 expression (&exp);
7685 if (exp.X_op == O_symbol)
7686 exp.X_op = O_secrel;
7687
7688 emit_expr (&exp, 4);
7689 }
7690 while (*input_line_pointer++ == ',');
7691
7692 input_line_pointer--;
7693 demand_empty_rest_of_line ();
7694 }
7695 #endif
7696
7697 /* Handle Vector operations. */
7698
7699 static char *
7700 check_VecOperations (char *op_string, char *op_end)
7701 {
7702 const reg_entry *mask;
7703 const char *saved;
7704 char *end_op;
7705
7706 while (*op_string
7707 && (op_end == NULL || op_string < op_end))
7708 {
7709 saved = op_string;
7710 if (*op_string == '{')
7711 {
7712 op_string++;
7713
7714 /* Check broadcasts. */
7715 if (strncmp (op_string, "1to", 3) == 0)
7716 {
7717 int bcst_type;
7718
7719 if (i.broadcast)
7720 goto duplicated_vec_op;
7721
7722 op_string += 3;
7723 if (*op_string == '8')
7724 bcst_type = BROADCAST_1TO8;
7725 else if (*op_string == '1'
7726 && *(op_string+1) == '6')
7727 {
7728 bcst_type = BROADCAST_1TO16;
7729 op_string++;
7730 }
7731 else
7732 {
7733 as_bad (_("Unsupported broadcast: `%s'"), saved);
7734 return NULL;
7735 }
7736 op_string++;
7737
7738 broadcast_op.type = bcst_type;
7739 broadcast_op.operand = this_operand;
7740 i.broadcast = &broadcast_op;
7741 }
7742 /* Check masking operation. */
7743 else if ((mask = parse_register (op_string, &end_op)) != NULL)
7744 {
7745 /* k0 can't be used for write mask. */
7746 if (mask->reg_num == 0)
7747 {
7748 as_bad (_("`%s' can't be used for write mask"),
7749 op_string);
7750 return NULL;
7751 }
7752
7753 if (!i.mask)
7754 {
7755 mask_op.mask = mask;
7756 mask_op.zeroing = 0;
7757 mask_op.operand = this_operand;
7758 i.mask = &mask_op;
7759 }
7760 else
7761 {
7762 if (i.mask->mask)
7763 goto duplicated_vec_op;
7764
7765 i.mask->mask = mask;
7766
7767 /* Only "{z}" is allowed here. No need to check
7768 zeroing mask explicitly. */
7769 if (i.mask->operand != this_operand)
7770 {
7771 as_bad (_("invalid write mask `%s'"), saved);
7772 return NULL;
7773 }
7774 }
7775
7776 op_string = end_op;
7777 }
7778 /* Check zeroing-flag for masking operation. */
7779 else if (*op_string == 'z')
7780 {
7781 if (!i.mask)
7782 {
7783 mask_op.mask = NULL;
7784 mask_op.zeroing = 1;
7785 mask_op.operand = this_operand;
7786 i.mask = &mask_op;
7787 }
7788 else
7789 {
7790 if (i.mask->zeroing)
7791 {
7792 duplicated_vec_op:
7793 as_bad (_("duplicated `%s'"), saved);
7794 return NULL;
7795 }
7796
7797 i.mask->zeroing = 1;
7798
7799 /* Only "{%k}" is allowed here. No need to check mask
7800 register explicitly. */
7801 if (i.mask->operand != this_operand)
7802 {
7803 as_bad (_("invalid zeroing-masking `%s'"),
7804 saved);
7805 return NULL;
7806 }
7807 }
7808
7809 op_string++;
7810 }
7811 else
7812 goto unknown_vec_op;
7813
7814 if (*op_string != '}')
7815 {
7816 as_bad (_("missing `}' in `%s'"), saved);
7817 return NULL;
7818 }
7819 op_string++;
7820 continue;
7821 }
7822 unknown_vec_op:
7823 /* We don't know this one. */
7824 as_bad (_("unknown vector operation: `%s'"), saved);
7825 return NULL;
7826 }
7827
7828 return op_string;
7829 }
7830
7831 static int
7832 i386_immediate (char *imm_start)
7833 {
7834 char *save_input_line_pointer;
7835 char *gotfree_input_line;
7836 segT exp_seg = 0;
7837 expressionS *exp;
7838 i386_operand_type types;
7839
7840 operand_type_set (&types, ~0);
7841
7842 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
7843 {
7844 as_bad (_("at most %d immediate operands are allowed"),
7845 MAX_IMMEDIATE_OPERANDS);
7846 return 0;
7847 }
7848
7849 exp = &im_expressions[i.imm_operands++];
7850 i.op[this_operand].imms = exp;
7851
7852 if (is_space_char (*imm_start))
7853 ++imm_start;
7854
7855 save_input_line_pointer = input_line_pointer;
7856 input_line_pointer = imm_start;
7857
7858 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types,
7859 (i.bnd_prefix != NULL
7860 || add_bnd_prefix));
7861 if (gotfree_input_line)
7862 input_line_pointer = gotfree_input_line;
7863
7864 exp_seg = expression (exp);
7865
7866 SKIP_WHITESPACE ();
7867
7868 /* Handle vector operations. */
7869 if (*input_line_pointer == '{')
7870 {
7871 input_line_pointer = check_VecOperations (input_line_pointer,
7872 NULL);
7873 if (input_line_pointer == NULL)
7874 return 0;
7875 }
7876
7877 if (*input_line_pointer)
7878 as_bad (_("junk `%s' after expression"), input_line_pointer);
7879
7880 input_line_pointer = save_input_line_pointer;
7881 if (gotfree_input_line)
7882 {
7883 free (gotfree_input_line);
7884
7885 if (exp->X_op == O_constant || exp->X_op == O_register)
7886 exp->X_op = O_illegal;
7887 }
7888
7889 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
7890 }
7891
7892 static int
7893 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
7894 i386_operand_type types, const char *imm_start)
7895 {
7896 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
7897 {
7898 if (imm_start)
7899 as_bad (_("missing or invalid immediate expression `%s'"),
7900 imm_start);
7901 return 0;
7902 }
7903 else if (exp->X_op == O_constant)
7904 {
7905 /* Size it properly later. */
7906 i.types[this_operand].bitfield.imm64 = 1;
7907 /* If not 64bit, sign extend val. */
7908 if (flag_code != CODE_64BIT
7909 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
7910 exp->X_add_number
7911 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
7912 }
7913 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
7914 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
7915 && exp_seg != absolute_section
7916 && exp_seg != text_section
7917 && exp_seg != data_section
7918 && exp_seg != bss_section
7919 && exp_seg != undefined_section
7920 && !bfd_is_com_section (exp_seg))
7921 {
7922 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
7923 return 0;
7924 }
7925 #endif
7926 else if (!intel_syntax && exp->X_op == O_register)
7927 {
7928 if (imm_start)
7929 as_bad (_("illegal immediate register operand %s"), imm_start);
7930 return 0;
7931 }
7932 else
7933 {
7934 /* This is an address. The size of the address will be
7935 determined later, depending on destination register,
7936 suffix, or the default for the section. */
7937 i.types[this_operand].bitfield.imm8 = 1;
7938 i.types[this_operand].bitfield.imm16 = 1;
7939 i.types[this_operand].bitfield.imm32 = 1;
7940 i.types[this_operand].bitfield.imm32s = 1;
7941 i.types[this_operand].bitfield.imm64 = 1;
7942 i.types[this_operand] = operand_type_and (i.types[this_operand],
7943 types);
7944 }
7945
7946 return 1;
7947 }
7948
7949 static char *
7950 i386_scale (char *scale)
7951 {
7952 offsetT val;
7953 char *save = input_line_pointer;
7954
7955 input_line_pointer = scale;
7956 val = get_absolute_expression ();
7957
7958 switch (val)
7959 {
7960 case 1:
7961 i.log2_scale_factor = 0;
7962 break;
7963 case 2:
7964 i.log2_scale_factor = 1;
7965 break;
7966 case 4:
7967 i.log2_scale_factor = 2;
7968 break;
7969 case 8:
7970 i.log2_scale_factor = 3;
7971 break;
7972 default:
7973 {
7974 char sep = *input_line_pointer;
7975
7976 *input_line_pointer = '\0';
7977 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
7978 scale);
7979 *input_line_pointer = sep;
7980 input_line_pointer = save;
7981 return NULL;
7982 }
7983 }
7984 if (i.log2_scale_factor != 0 && i.index_reg == 0)
7985 {
7986 as_warn (_("scale factor of %d without an index register"),
7987 1 << i.log2_scale_factor);
7988 i.log2_scale_factor = 0;
7989 }
7990 scale = input_line_pointer;
7991 input_line_pointer = save;
7992 return scale;
7993 }
7994
7995 static int
7996 i386_displacement (char *disp_start, char *disp_end)
7997 {
7998 expressionS *exp;
7999 segT exp_seg = 0;
8000 char *save_input_line_pointer;
8001 char *gotfree_input_line;
8002 int override;
8003 i386_operand_type bigdisp, types = anydisp;
8004 int ret;
8005
8006 if (i.disp_operands == MAX_MEMORY_OPERANDS)
8007 {
8008 as_bad (_("at most %d displacement operands are allowed"),
8009 MAX_MEMORY_OPERANDS);
8010 return 0;
8011 }
8012
8013 operand_type_set (&bigdisp, 0);
8014 if ((i.types[this_operand].bitfield.jumpabsolute)
8015 || (!current_templates->start->opcode_modifier.jump
8016 && !current_templates->start->opcode_modifier.jumpdword))
8017 {
8018 bigdisp.bitfield.disp32 = 1;
8019 override = (i.prefix[ADDR_PREFIX] != 0);
8020 if (flag_code == CODE_64BIT)
8021 {
8022 if (!override)
8023 {
8024 bigdisp.bitfield.disp32s = 1;
8025 bigdisp.bitfield.disp64 = 1;
8026 }
8027 }
8028 else if ((flag_code == CODE_16BIT) ^ override)
8029 {
8030 bigdisp.bitfield.disp32 = 0;
8031 bigdisp.bitfield.disp16 = 1;
8032 }
8033 }
8034 else
8035 {
8036 /* For PC-relative branches, the width of the displacement
8037 is dependent upon data size, not address size. */
8038 override = (i.prefix[DATA_PREFIX] != 0);
8039 if (flag_code == CODE_64BIT)
8040 {
8041 if (override || i.suffix == WORD_MNEM_SUFFIX)
8042 bigdisp.bitfield.disp16 = 1;
8043 else
8044 {
8045 bigdisp.bitfield.disp32 = 1;
8046 bigdisp.bitfield.disp32s = 1;
8047 }
8048 }
8049 else
8050 {
8051 if (!override)
8052 override = (i.suffix == (flag_code != CODE_16BIT
8053 ? WORD_MNEM_SUFFIX
8054 : LONG_MNEM_SUFFIX));
8055 bigdisp.bitfield.disp32 = 1;
8056 if ((flag_code == CODE_16BIT) ^ override)
8057 {
8058 bigdisp.bitfield.disp32 = 0;
8059 bigdisp.bitfield.disp16 = 1;
8060 }
8061 }
8062 }
8063 i.types[this_operand] = operand_type_or (i.types[this_operand],
8064 bigdisp);
8065
8066 exp = &disp_expressions[i.disp_operands];
8067 i.op[this_operand].disps = exp;
8068 i.disp_operands++;
8069 save_input_line_pointer = input_line_pointer;
8070 input_line_pointer = disp_start;
8071 END_STRING_AND_SAVE (disp_end);
8072
8073 #ifndef GCC_ASM_O_HACK
8074 #define GCC_ASM_O_HACK 0
8075 #endif
8076 #if GCC_ASM_O_HACK
8077 END_STRING_AND_SAVE (disp_end + 1);
8078 if (i.types[this_operand].bitfield.baseIndex
8079 && displacement_string_end[-1] == '+')
8080 {
8081 /* This hack is to avoid a warning when using the "o"
8082 constraint within gcc asm statements.
8083 For instance:
8084
8085 #define _set_tssldt_desc(n,addr,limit,type) \
8086 __asm__ __volatile__ ( \
8087 "movw %w2,%0\n\t" \
8088 "movw %w1,2+%0\n\t" \
8089 "rorl $16,%1\n\t" \
8090 "movb %b1,4+%0\n\t" \
8091 "movb %4,5+%0\n\t" \
8092 "movb $0,6+%0\n\t" \
8093 "movb %h1,7+%0\n\t" \
8094 "rorl $16,%1" \
8095 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
8096
8097 This works great except that the output assembler ends
8098 up looking a bit weird if it turns out that there is
8099 no offset. You end up producing code that looks like:
8100
8101 #APP
8102 movw $235,(%eax)
8103 movw %dx,2+(%eax)
8104 rorl $16,%edx
8105 movb %dl,4+(%eax)
8106 movb $137,5+(%eax)
8107 movb $0,6+(%eax)
8108 movb %dh,7+(%eax)
8109 rorl $16,%edx
8110 #NO_APP
8111
8112 So here we provide the missing zero. */
8113
8114 *displacement_string_end = '0';
8115 }
8116 #endif
8117 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types,
8118 (i.bnd_prefix != NULL
8119 || add_bnd_prefix));
8120 if (gotfree_input_line)
8121 input_line_pointer = gotfree_input_line;
8122
8123 exp_seg = expression (exp);
8124
8125 SKIP_WHITESPACE ();
8126 if (*input_line_pointer)
8127 as_bad (_("junk `%s' after expression"), input_line_pointer);
8128 #if GCC_ASM_O_HACK
8129 RESTORE_END_STRING (disp_end + 1);
8130 #endif
8131 input_line_pointer = save_input_line_pointer;
8132 if (gotfree_input_line)
8133 {
8134 free (gotfree_input_line);
8135
8136 if (exp->X_op == O_constant || exp->X_op == O_register)
8137 exp->X_op = O_illegal;
8138 }
8139
8140 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
8141
8142 RESTORE_END_STRING (disp_end);
8143
8144 return ret;
8145 }
8146
8147 static int
8148 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8149 i386_operand_type types, const char *disp_start)
8150 {
8151 i386_operand_type bigdisp;
8152 int ret = 1;
8153
8154 /* We do this to make sure that the section symbol is in
8155 the symbol table. We will ultimately change the relocation
8156 to be relative to the beginning of the section. */
8157 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
8158 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
8159 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
8160 {
8161 if (exp->X_op != O_symbol)
8162 goto inv_disp;
8163
8164 if (S_IS_LOCAL (exp->X_add_symbol)
8165 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
8166 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
8167 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
8168 exp->X_op = O_subtract;
8169 exp->X_op_symbol = GOT_symbol;
8170 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
8171 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
8172 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
8173 i.reloc[this_operand] = BFD_RELOC_64;
8174 else
8175 i.reloc[this_operand] = BFD_RELOC_32;
8176 }
8177
8178 else if (exp->X_op == O_absent
8179 || exp->X_op == O_illegal
8180 || exp->X_op == O_big)
8181 {
8182 inv_disp:
8183 as_bad (_("missing or invalid displacement expression `%s'"),
8184 disp_start);
8185 ret = 0;
8186 }
8187
8188 else if (flag_code == CODE_64BIT
8189 && !i.prefix[ADDR_PREFIX]
8190 && exp->X_op == O_constant)
8191 {
8192 /* Since displacement is signed extended to 64bit, don't allow
8193 disp32 and turn off disp32s if they are out of range. */
8194 i.types[this_operand].bitfield.disp32 = 0;
8195 if (!fits_in_signed_long (exp->X_add_number))
8196 {
8197 i.types[this_operand].bitfield.disp32s = 0;
8198 if (i.types[this_operand].bitfield.baseindex)
8199 {
8200 as_bad (_("0x%lx out range of signed 32bit displacement"),
8201 (long) exp->X_add_number);
8202 ret = 0;
8203 }
8204 }
8205 }
8206
8207 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
8208 else if (exp->X_op != O_constant
8209 && OUTPUT_FLAVOR == bfd_target_aout_flavour
8210 && exp_seg != absolute_section
8211 && exp_seg != text_section
8212 && exp_seg != data_section
8213 && exp_seg != bss_section
8214 && exp_seg != undefined_section
8215 && !bfd_is_com_section (exp_seg))
8216 {
8217 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
8218 ret = 0;
8219 }
8220 #endif
8221
8222 /* Check if this is a displacement only operand. */
8223 bigdisp = i.types[this_operand];
8224 bigdisp.bitfield.disp8 = 0;
8225 bigdisp.bitfield.disp16 = 0;
8226 bigdisp.bitfield.disp32 = 0;
8227 bigdisp.bitfield.disp32s = 0;
8228 bigdisp.bitfield.disp64 = 0;
8229 if (operand_type_all_zero (&bigdisp))
8230 i.types[this_operand] = operand_type_and (i.types[this_operand],
8231 types);
8232
8233 return ret;
8234 }
8235
8236 /* Make sure the memory operand we've been dealt is valid.
8237 Return 1 on success, 0 on a failure. */
8238
8239 static int
8240 i386_index_check (const char *operand_string)
8241 {
8242 const char *kind = "base/index";
8243 enum flag_code addr_mode;
8244
8245 if (i.prefix[ADDR_PREFIX])
8246 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
8247 else
8248 {
8249 addr_mode = flag_code;
8250
8251 #if INFER_ADDR_PREFIX
8252 if (i.mem_operands == 0)
8253 {
8254 /* Infer address prefix from the first memory operand. */
8255 const reg_entry *addr_reg = i.base_reg;
8256
8257 if (addr_reg == NULL)
8258 addr_reg = i.index_reg;
8259
8260 if (addr_reg)
8261 {
8262 if (addr_reg->reg_num == RegEip
8263 || addr_reg->reg_num == RegEiz
8264 || addr_reg->reg_type.bitfield.reg32)
8265 addr_mode = CODE_32BIT;
8266 else if (flag_code != CODE_64BIT
8267 && addr_reg->reg_type.bitfield.reg16)
8268 addr_mode = CODE_16BIT;
8269
8270 if (addr_mode != flag_code)
8271 {
8272 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
8273 i.prefixes += 1;
8274 /* Change the size of any displacement too. At most one
8275 of Disp16 or Disp32 is set.
8276 FIXME. There doesn't seem to be any real need for
8277 separate Disp16 and Disp32 flags. The same goes for
8278 Imm16 and Imm32. Removing them would probably clean
8279 up the code quite a lot. */
8280 if (flag_code != CODE_64BIT
8281 && (i.types[this_operand].bitfield.disp16
8282 || i.types[this_operand].bitfield.disp32))
8283 i.types[this_operand]
8284 = operand_type_xor (i.types[this_operand], disp16_32);
8285 }
8286 }
8287 }
8288 #endif
8289 }
8290
8291 if (current_templates->start->opcode_modifier.isstring
8292 && !current_templates->start->opcode_modifier.immext
8293 && (current_templates->end[-1].opcode_modifier.isstring
8294 || i.mem_operands))
8295 {
8296 /* Memory operands of string insns are special in that they only allow
8297 a single register (rDI, rSI, or rBX) as their memory address. */
8298 const reg_entry *expected_reg;
8299 static const char *di_si[][2] =
8300 {
8301 { "esi", "edi" },
8302 { "si", "di" },
8303 { "rsi", "rdi" }
8304 };
8305 static const char *bx[] = { "ebx", "bx", "rbx" };
8306
8307 kind = "string address";
8308
8309 if (current_templates->start->opcode_modifier.w)
8310 {
8311 i386_operand_type type = current_templates->end[-1].operand_types[0];
8312
8313 if (!type.bitfield.baseindex
8314 || ((!i.mem_operands != !intel_syntax)
8315 && current_templates->end[-1].operand_types[1]
8316 .bitfield.baseindex))
8317 type = current_templates->end[-1].operand_types[1];
8318 expected_reg = hash_find (reg_hash,
8319 di_si[addr_mode][type.bitfield.esseg]);
8320
8321 }
8322 else
8323 expected_reg = hash_find (reg_hash, bx[addr_mode]);
8324
8325 if (i.base_reg != expected_reg
8326 || i.index_reg
8327 || operand_type_check (i.types[this_operand], disp))
8328 {
8329 /* The second memory operand must have the same size as
8330 the first one. */
8331 if (i.mem_operands
8332 && i.base_reg
8333 && !((addr_mode == CODE_64BIT
8334 && i.base_reg->reg_type.bitfield.reg64)
8335 || (addr_mode == CODE_32BIT
8336 ? i.base_reg->reg_type.bitfield.reg32
8337 : i.base_reg->reg_type.bitfield.reg16)))
8338 goto bad_address;
8339
8340 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
8341 operand_string,
8342 intel_syntax ? '[' : '(',
8343 register_prefix,
8344 expected_reg->reg_name,
8345 intel_syntax ? ']' : ')');
8346 return 1;
8347 }
8348 else
8349 return 1;
8350
8351 bad_address:
8352 as_bad (_("`%s' is not a valid %s expression"),
8353 operand_string, kind);
8354 return 0;
8355 }
8356 else
8357 {
8358 if (addr_mode != CODE_16BIT)
8359 {
8360 /* 32-bit/64-bit checks. */
8361 if ((i.base_reg
8362 && (addr_mode == CODE_64BIT
8363 ? !i.base_reg->reg_type.bitfield.reg64
8364 : !i.base_reg->reg_type.bitfield.reg32)
8365 && (i.index_reg
8366 || (i.base_reg->reg_num
8367 != (addr_mode == CODE_64BIT ? RegRip : RegEip))))
8368 || (i.index_reg
8369 && !i.index_reg->reg_type.bitfield.regxmm
8370 && !i.index_reg->reg_type.bitfield.regymm
8371 && !i.index_reg->reg_type.bitfield.regzmm
8372 && ((addr_mode == CODE_64BIT
8373 ? !(i.index_reg->reg_type.bitfield.reg64
8374 || i.index_reg->reg_num == RegRiz)
8375 : !(i.index_reg->reg_type.bitfield.reg32
8376 || i.index_reg->reg_num == RegEiz))
8377 || !i.index_reg->reg_type.bitfield.baseindex)))
8378 goto bad_address;
8379 }
8380 else
8381 {
8382 /* 16-bit checks. */
8383 if ((i.base_reg
8384 && (!i.base_reg->reg_type.bitfield.reg16
8385 || !i.base_reg->reg_type.bitfield.baseindex))
8386 || (i.index_reg
8387 && (!i.index_reg->reg_type.bitfield.reg16
8388 || !i.index_reg->reg_type.bitfield.baseindex
8389 || !(i.base_reg
8390 && i.base_reg->reg_num < 6
8391 && i.index_reg->reg_num >= 6
8392 && i.log2_scale_factor == 0))))
8393 goto bad_address;
8394 }
8395 }
8396 return 1;
8397 }
8398
8399 /* Handle vector immediates. */
8400
8401 static int
8402 RC_SAE_immediate (const char *imm_start)
8403 {
8404 unsigned int match_found, j;
8405 const char *pstr = imm_start;
8406 expressionS *exp;
8407
8408 if (*pstr != '{')
8409 return 0;
8410
8411 pstr++;
8412 match_found = 0;
8413 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
8414 {
8415 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
8416 {
8417 if (!i.rounding)
8418 {
8419 rc_op.type = RC_NamesTable[j].type;
8420 rc_op.operand = this_operand;
8421 i.rounding = &rc_op;
8422 }
8423 else
8424 {
8425 as_bad (_("duplicated `%s'"), imm_start);
8426 return 0;
8427 }
8428 pstr += RC_NamesTable[j].len;
8429 match_found = 1;
8430 break;
8431 }
8432 }
8433 if (!match_found)
8434 return 0;
8435
8436 if (*pstr++ != '}')
8437 {
8438 as_bad (_("Missing '}': '%s'"), imm_start);
8439 return 0;
8440 }
8441 /* RC/SAE immediate string should contain nothing more. */;
8442 if (*pstr != 0)
8443 {
8444 as_bad (_("Junk after '}': '%s'"), imm_start);
8445 return 0;
8446 }
8447
8448 exp = &im_expressions[i.imm_operands++];
8449 i.op[this_operand].imms = exp;
8450
8451 exp->X_op = O_constant;
8452 exp->X_add_number = 0;
8453 exp->X_add_symbol = (symbolS *) 0;
8454 exp->X_op_symbol = (symbolS *) 0;
8455
8456 i.types[this_operand].bitfield.imm8 = 1;
8457 return 1;
8458 }
8459
8460 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
8461 on error. */
8462
8463 static int
8464 i386_att_operand (char *operand_string)
8465 {
8466 const reg_entry *r;
8467 char *end_op;
8468 char *op_string = operand_string;
8469
8470 if (is_space_char (*op_string))
8471 ++op_string;
8472
8473 /* We check for an absolute prefix (differentiating,
8474 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
8475 if (*op_string == ABSOLUTE_PREFIX)
8476 {
8477 ++op_string;
8478 if (is_space_char (*op_string))
8479 ++op_string;
8480 i.types[this_operand].bitfield.jumpabsolute = 1;
8481 }
8482
8483 /* Check if operand is a register. */
8484 if ((r = parse_register (op_string, &end_op)) != NULL)
8485 {
8486 i386_operand_type temp;
8487
8488 /* Check for a segment override by searching for ':' after a
8489 segment register. */
8490 op_string = end_op;
8491 if (is_space_char (*op_string))
8492 ++op_string;
8493 if (*op_string == ':'
8494 && (r->reg_type.bitfield.sreg2
8495 || r->reg_type.bitfield.sreg3))
8496 {
8497 switch (r->reg_num)
8498 {
8499 case 0:
8500 i.seg[i.mem_operands] = &es;
8501 break;
8502 case 1:
8503 i.seg[i.mem_operands] = &cs;
8504 break;
8505 case 2:
8506 i.seg[i.mem_operands] = &ss;
8507 break;
8508 case 3:
8509 i.seg[i.mem_operands] = &ds;
8510 break;
8511 case 4:
8512 i.seg[i.mem_operands] = &fs;
8513 break;
8514 case 5:
8515 i.seg[i.mem_operands] = &gs;
8516 break;
8517 }
8518
8519 /* Skip the ':' and whitespace. */
8520 ++op_string;
8521 if (is_space_char (*op_string))
8522 ++op_string;
8523
8524 if (!is_digit_char (*op_string)
8525 && !is_identifier_char (*op_string)
8526 && *op_string != '('
8527 && *op_string != ABSOLUTE_PREFIX)
8528 {
8529 as_bad (_("bad memory operand `%s'"), op_string);
8530 return 0;
8531 }
8532 /* Handle case of %es:*foo. */
8533 if (*op_string == ABSOLUTE_PREFIX)
8534 {
8535 ++op_string;
8536 if (is_space_char (*op_string))
8537 ++op_string;
8538 i.types[this_operand].bitfield.jumpabsolute = 1;
8539 }
8540 goto do_memory_reference;
8541 }
8542
8543 /* Handle vector operations. */
8544 if (*op_string == '{')
8545 {
8546 op_string = check_VecOperations (op_string, NULL);
8547 if (op_string == NULL)
8548 return 0;
8549 }
8550
8551 if (*op_string)
8552 {
8553 as_bad (_("junk `%s' after register"), op_string);
8554 return 0;
8555 }
8556 temp = r->reg_type;
8557 temp.bitfield.baseindex = 0;
8558 i.types[this_operand] = operand_type_or (i.types[this_operand],
8559 temp);
8560 i.types[this_operand].bitfield.unspecified = 0;
8561 i.op[this_operand].regs = r;
8562 i.reg_operands++;
8563 }
8564 else if (*op_string == REGISTER_PREFIX)
8565 {
8566 as_bad (_("bad register name `%s'"), op_string);
8567 return 0;
8568 }
8569 else if (*op_string == IMMEDIATE_PREFIX)
8570 {
8571 ++op_string;
8572 if (i.types[this_operand].bitfield.jumpabsolute)
8573 {
8574 as_bad (_("immediate operand illegal with absolute jump"));
8575 return 0;
8576 }
8577 if (!i386_immediate (op_string))
8578 return 0;
8579 }
8580 else if (RC_SAE_immediate (operand_string))
8581 {
8582 /* If it is a RC or SAE immediate, do nothing. */
8583 ;
8584 }
8585 else if (is_digit_char (*op_string)
8586 || is_identifier_char (*op_string)
8587 || *op_string == '(')
8588 {
8589 /* This is a memory reference of some sort. */
8590 char *base_string;
8591
8592 /* Start and end of displacement string expression (if found). */
8593 char *displacement_string_start;
8594 char *displacement_string_end;
8595 char *vop_start;
8596
8597 do_memory_reference:
8598 if ((i.mem_operands == 1
8599 && !current_templates->start->opcode_modifier.isstring)
8600 || i.mem_operands == 2)
8601 {
8602 as_bad (_("too many memory references for `%s'"),
8603 current_templates->start->name);
8604 return 0;
8605 }
8606
8607 /* Check for base index form. We detect the base index form by
8608 looking for an ')' at the end of the operand, searching
8609 for the '(' matching it, and finding a REGISTER_PREFIX or ','
8610 after the '('. */
8611 base_string = op_string + strlen (op_string);
8612
8613 /* Handle vector operations. */
8614 vop_start = strchr (op_string, '{');
8615 if (vop_start && vop_start < base_string)
8616 {
8617 if (check_VecOperations (vop_start, base_string) == NULL)
8618 return 0;
8619 base_string = vop_start;
8620 }
8621
8622 --base_string;
8623 if (is_space_char (*base_string))
8624 --base_string;
8625
8626 /* If we only have a displacement, set-up for it to be parsed later. */
8627 displacement_string_start = op_string;
8628 displacement_string_end = base_string + 1;
8629
8630 if (*base_string == ')')
8631 {
8632 char *temp_string;
8633 unsigned int parens_balanced = 1;
8634 /* We've already checked that the number of left & right ()'s are
8635 equal, so this loop will not be infinite. */
8636 do
8637 {
8638 base_string--;
8639 if (*base_string == ')')
8640 parens_balanced++;
8641 if (*base_string == '(')
8642 parens_balanced--;
8643 }
8644 while (parens_balanced);
8645
8646 temp_string = base_string;
8647
8648 /* Skip past '(' and whitespace. */
8649 ++base_string;
8650 if (is_space_char (*base_string))
8651 ++base_string;
8652
8653 if (*base_string == ','
8654 || ((i.base_reg = parse_register (base_string, &end_op))
8655 != NULL))
8656 {
8657 displacement_string_end = temp_string;
8658
8659 i.types[this_operand].bitfield.baseindex = 1;
8660
8661 if (i.base_reg)
8662 {
8663 base_string = end_op;
8664 if (is_space_char (*base_string))
8665 ++base_string;
8666 }
8667
8668 /* There may be an index reg or scale factor here. */
8669 if (*base_string == ',')
8670 {
8671 ++base_string;
8672 if (is_space_char (*base_string))
8673 ++base_string;
8674
8675 if ((i.index_reg = parse_register (base_string, &end_op))
8676 != NULL)
8677 {
8678 base_string = end_op;
8679 if (is_space_char (*base_string))
8680 ++base_string;
8681 if (*base_string == ',')
8682 {
8683 ++base_string;
8684 if (is_space_char (*base_string))
8685 ++base_string;
8686 }
8687 else if (*base_string != ')')
8688 {
8689 as_bad (_("expecting `,' or `)' "
8690 "after index register in `%s'"),
8691 operand_string);
8692 return 0;
8693 }
8694 }
8695 else if (*base_string == REGISTER_PREFIX)
8696 {
8697 end_op = strchr (base_string, ',');
8698 if (end_op)
8699 *end_op = '\0';
8700 as_bad (_("bad register name `%s'"), base_string);
8701 return 0;
8702 }
8703
8704 /* Check for scale factor. */
8705 if (*base_string != ')')
8706 {
8707 char *end_scale = i386_scale (base_string);
8708
8709 if (!end_scale)
8710 return 0;
8711
8712 base_string = end_scale;
8713 if (is_space_char (*base_string))
8714 ++base_string;
8715 if (*base_string != ')')
8716 {
8717 as_bad (_("expecting `)' "
8718 "after scale factor in `%s'"),
8719 operand_string);
8720 return 0;
8721 }
8722 }
8723 else if (!i.index_reg)
8724 {
8725 as_bad (_("expecting index register or scale factor "
8726 "after `,'; got '%c'"),
8727 *base_string);
8728 return 0;
8729 }
8730 }
8731 else if (*base_string != ')')
8732 {
8733 as_bad (_("expecting `,' or `)' "
8734 "after base register in `%s'"),
8735 operand_string);
8736 return 0;
8737 }
8738 }
8739 else if (*base_string == REGISTER_PREFIX)
8740 {
8741 end_op = strchr (base_string, ',');
8742 if (end_op)
8743 *end_op = '\0';
8744 as_bad (_("bad register name `%s'"), base_string);
8745 return 0;
8746 }
8747 }
8748
8749 /* If there's an expression beginning the operand, parse it,
8750 assuming displacement_string_start and
8751 displacement_string_end are meaningful. */
8752 if (displacement_string_start != displacement_string_end)
8753 {
8754 if (!i386_displacement (displacement_string_start,
8755 displacement_string_end))
8756 return 0;
8757 }
8758
8759 /* Special case for (%dx) while doing input/output op. */
8760 if (i.base_reg
8761 && operand_type_equal (&i.base_reg->reg_type,
8762 &reg16_inoutportreg)
8763 && i.index_reg == 0
8764 && i.log2_scale_factor == 0
8765 && i.seg[i.mem_operands] == 0
8766 && !operand_type_check (i.types[this_operand], disp))
8767 {
8768 i.types[this_operand] = inoutportreg;
8769 return 1;
8770 }
8771
8772 if (i386_index_check (operand_string) == 0)
8773 return 0;
8774 i.types[this_operand].bitfield.mem = 1;
8775 i.mem_operands++;
8776 }
8777 else
8778 {
8779 /* It's not a memory operand; argh! */
8780 as_bad (_("invalid char %s beginning operand %d `%s'"),
8781 output_invalid (*op_string),
8782 this_operand + 1,
8783 op_string);
8784 return 0;
8785 }
8786 return 1; /* Normal return. */
8787 }
8788 \f
8789 /* Calculate the maximum variable size (i.e., excluding fr_fix)
8790 that an rs_machine_dependent frag may reach. */
8791
8792 unsigned int
8793 i386_frag_max_var (fragS *frag)
8794 {
8795 /* The only relaxable frags are for jumps.
8796 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
8797 gas_assert (frag->fr_type == rs_machine_dependent);
8798 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
8799 }
8800
8801 /* md_estimate_size_before_relax()
8802
8803 Called just before relax() for rs_machine_dependent frags. The x86
8804 assembler uses these frags to handle variable size jump
8805 instructions.
8806
8807 Any symbol that is now undefined will not become defined.
8808 Return the correct fr_subtype in the frag.
8809 Return the initial "guess for variable size of frag" to caller.
8810 The guess is actually the growth beyond the fixed part. Whatever
8811 we do to grow the fixed or variable part contributes to our
8812 returned value. */
8813
8814 int
8815 md_estimate_size_before_relax (fragS *fragP, segT segment)
8816 {
8817 /* We've already got fragP->fr_subtype right; all we have to do is
8818 check for un-relaxable symbols. On an ELF system, we can't relax
8819 an externally visible symbol, because it may be overridden by a
8820 shared library. */
8821 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
8822 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8823 || (IS_ELF
8824 && (S_IS_EXTERNAL (fragP->fr_symbol)
8825 || S_IS_WEAK (fragP->fr_symbol)
8826 || ((symbol_get_bfdsym (fragP->fr_symbol)->flags
8827 & BSF_GNU_INDIRECT_FUNCTION))))
8828 #endif
8829 #if defined (OBJ_COFF) && defined (TE_PE)
8830 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
8831 && S_IS_WEAK (fragP->fr_symbol))
8832 #endif
8833 )
8834 {
8835 /* Symbol is undefined in this segment, or we need to keep a
8836 reloc so that weak symbols can be overridden. */
8837 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
8838 enum bfd_reloc_code_real reloc_type;
8839 unsigned char *opcode;
8840 int old_fr_fix;
8841
8842 if (fragP->fr_var != NO_RELOC)
8843 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
8844 else if (size == 2)
8845 reloc_type = BFD_RELOC_16_PCREL;
8846 else
8847 reloc_type = BFD_RELOC_32_PCREL;
8848
8849 old_fr_fix = fragP->fr_fix;
8850 opcode = (unsigned char *) fragP->fr_opcode;
8851
8852 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
8853 {
8854 case UNCOND_JUMP:
8855 /* Make jmp (0xeb) a (d)word displacement jump. */
8856 opcode[0] = 0xe9;
8857 fragP->fr_fix += size;
8858 fix_new (fragP, old_fr_fix, size,
8859 fragP->fr_symbol,
8860 fragP->fr_offset, 1,
8861 reloc_type);
8862 break;
8863
8864 case COND_JUMP86:
8865 if (size == 2
8866 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
8867 {
8868 /* Negate the condition, and branch past an
8869 unconditional jump. */
8870 opcode[0] ^= 1;
8871 opcode[1] = 3;
8872 /* Insert an unconditional jump. */
8873 opcode[2] = 0xe9;
8874 /* We added two extra opcode bytes, and have a two byte
8875 offset. */
8876 fragP->fr_fix += 2 + 2;
8877 fix_new (fragP, old_fr_fix + 2, 2,
8878 fragP->fr_symbol,
8879 fragP->fr_offset, 1,
8880 reloc_type);
8881 break;
8882 }
8883 /* Fall through. */
8884
8885 case COND_JUMP:
8886 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
8887 {
8888 fixS *fixP;
8889
8890 fragP->fr_fix += 1;
8891 fixP = fix_new (fragP, old_fr_fix, 1,
8892 fragP->fr_symbol,
8893 fragP->fr_offset, 1,
8894 BFD_RELOC_8_PCREL);
8895 fixP->fx_signed = 1;
8896 break;
8897 }
8898
8899 /* This changes the byte-displacement jump 0x7N
8900 to the (d)word-displacement jump 0x0f,0x8N. */
8901 opcode[1] = opcode[0] + 0x10;
8902 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
8903 /* We've added an opcode byte. */
8904 fragP->fr_fix += 1 + size;
8905 fix_new (fragP, old_fr_fix + 1, size,
8906 fragP->fr_symbol,
8907 fragP->fr_offset, 1,
8908 reloc_type);
8909 break;
8910
8911 default:
8912 BAD_CASE (fragP->fr_subtype);
8913 break;
8914 }
8915 frag_wane (fragP);
8916 return fragP->fr_fix - old_fr_fix;
8917 }
8918
8919 /* Guess size depending on current relax state. Initially the relax
8920 state will correspond to a short jump and we return 1, because
8921 the variable part of the frag (the branch offset) is one byte
8922 long. However, we can relax a section more than once and in that
8923 case we must either set fr_subtype back to the unrelaxed state,
8924 or return the value for the appropriate branch. */
8925 return md_relax_table[fragP->fr_subtype].rlx_length;
8926 }
8927
8928 /* Called after relax() is finished.
8929
8930 In: Address of frag.
8931 fr_type == rs_machine_dependent.
8932 fr_subtype is what the address relaxed to.
8933
8934 Out: Any fixSs and constants are set up.
8935 Caller will turn frag into a ".space 0". */
8936
8937 void
8938 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
8939 fragS *fragP)
8940 {
8941 unsigned char *opcode;
8942 unsigned char *where_to_put_displacement = NULL;
8943 offsetT target_address;
8944 offsetT opcode_address;
8945 unsigned int extension = 0;
8946 offsetT displacement_from_opcode_start;
8947
8948 opcode = (unsigned char *) fragP->fr_opcode;
8949
8950 /* Address we want to reach in file space. */
8951 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
8952
8953 /* Address opcode resides at in file space. */
8954 opcode_address = fragP->fr_address + fragP->fr_fix;
8955
8956 /* Displacement from opcode start to fill into instruction. */
8957 displacement_from_opcode_start = target_address - opcode_address;
8958
8959 if ((fragP->fr_subtype & BIG) == 0)
8960 {
8961 /* Don't have to change opcode. */
8962 extension = 1; /* 1 opcode + 1 displacement */
8963 where_to_put_displacement = &opcode[1];
8964 }
8965 else
8966 {
8967 if (no_cond_jump_promotion
8968 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
8969 as_warn_where (fragP->fr_file, fragP->fr_line,
8970 _("long jump required"));
8971
8972 switch (fragP->fr_subtype)
8973 {
8974 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
8975 extension = 4; /* 1 opcode + 4 displacement */
8976 opcode[0] = 0xe9;
8977 where_to_put_displacement = &opcode[1];
8978 break;
8979
8980 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
8981 extension = 2; /* 1 opcode + 2 displacement */
8982 opcode[0] = 0xe9;
8983 where_to_put_displacement = &opcode[1];
8984 break;
8985
8986 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
8987 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
8988 extension = 5; /* 2 opcode + 4 displacement */
8989 opcode[1] = opcode[0] + 0x10;
8990 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
8991 where_to_put_displacement = &opcode[2];
8992 break;
8993
8994 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
8995 extension = 3; /* 2 opcode + 2 displacement */
8996 opcode[1] = opcode[0] + 0x10;
8997 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
8998 where_to_put_displacement = &opcode[2];
8999 break;
9000
9001 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
9002 extension = 4;
9003 opcode[0] ^= 1;
9004 opcode[1] = 3;
9005 opcode[2] = 0xe9;
9006 where_to_put_displacement = &opcode[3];
9007 break;
9008
9009 default:
9010 BAD_CASE (fragP->fr_subtype);
9011 break;
9012 }
9013 }
9014
9015 /* If size if less then four we are sure that the operand fits,
9016 but if it's 4, then it could be that the displacement is larger
9017 then -/+ 2GB. */
9018 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
9019 && object_64bit
9020 && ((addressT) (displacement_from_opcode_start - extension
9021 + ((addressT) 1 << 31))
9022 > (((addressT) 2 << 31) - 1)))
9023 {
9024 as_bad_where (fragP->fr_file, fragP->fr_line,
9025 _("jump target out of range"));
9026 /* Make us emit 0. */
9027 displacement_from_opcode_start = extension;
9028 }
9029 /* Now put displacement after opcode. */
9030 md_number_to_chars ((char *) where_to_put_displacement,
9031 (valueT) (displacement_from_opcode_start - extension),
9032 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
9033 fragP->fr_fix += extension;
9034 }
9035 \f
9036 /* Apply a fixup (fixP) to segment data, once it has been determined
9037 by our caller that we have all the info we need to fix it up.
9038
9039 Parameter valP is the pointer to the value of the bits.
9040
9041 On the 386, immediates, displacements, and data pointers are all in
9042 the same (little-endian) format, so we don't need to care about which
9043 we are handling. */
9044
9045 void
9046 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
9047 {
9048 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
9049 valueT value = *valP;
9050
9051 #if !defined (TE_Mach)
9052 if (fixP->fx_pcrel)
9053 {
9054 switch (fixP->fx_r_type)
9055 {
9056 default:
9057 break;
9058
9059 case BFD_RELOC_64:
9060 fixP->fx_r_type = BFD_RELOC_64_PCREL;
9061 break;
9062 case BFD_RELOC_32:
9063 case BFD_RELOC_X86_64_32S:
9064 fixP->fx_r_type = BFD_RELOC_32_PCREL;
9065 break;
9066 case BFD_RELOC_16:
9067 fixP->fx_r_type = BFD_RELOC_16_PCREL;
9068 break;
9069 case BFD_RELOC_8:
9070 fixP->fx_r_type = BFD_RELOC_8_PCREL;
9071 break;
9072 }
9073 }
9074
9075 if (fixP->fx_addsy != NULL
9076 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
9077 || fixP->fx_r_type == BFD_RELOC_64_PCREL
9078 || fixP->fx_r_type == BFD_RELOC_16_PCREL
9079 || fixP->fx_r_type == BFD_RELOC_8_PCREL
9080 || fixP->fx_r_type == BFD_RELOC_X86_64_PC32_BND)
9081 && !use_rela_relocations)
9082 {
9083 /* This is a hack. There should be a better way to handle this.
9084 This covers for the fact that bfd_install_relocation will
9085 subtract the current location (for partial_inplace, PC relative
9086 relocations); see more below. */
9087 #ifndef OBJ_AOUT
9088 if (IS_ELF
9089 #ifdef TE_PE
9090 || OUTPUT_FLAVOR == bfd_target_coff_flavour
9091 #endif
9092 )
9093 value += fixP->fx_where + fixP->fx_frag->fr_address;
9094 #endif
9095 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9096 if (IS_ELF)
9097 {
9098 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
9099
9100 if ((sym_seg == seg
9101 || (symbol_section_p (fixP->fx_addsy)
9102 && sym_seg != absolute_section))
9103 && !generic_force_reloc (fixP))
9104 {
9105 /* Yes, we add the values in twice. This is because
9106 bfd_install_relocation subtracts them out again. I think
9107 bfd_install_relocation is broken, but I don't dare change
9108 it. FIXME. */
9109 value += fixP->fx_where + fixP->fx_frag->fr_address;
9110 }
9111 }
9112 #endif
9113 #if defined (OBJ_COFF) && defined (TE_PE)
9114 /* For some reason, the PE format does not store a
9115 section address offset for a PC relative symbol. */
9116 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
9117 || S_IS_WEAK (fixP->fx_addsy))
9118 value += md_pcrel_from (fixP);
9119 #endif
9120 }
9121 #if defined (OBJ_COFF) && defined (TE_PE)
9122 if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
9123 {
9124 value -= S_GET_VALUE (fixP->fx_addsy);
9125 }
9126 #endif
9127
9128 /* Fix a few things - the dynamic linker expects certain values here,
9129 and we must not disappoint it. */
9130 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9131 if (IS_ELF && fixP->fx_addsy)
9132 switch (fixP->fx_r_type)
9133 {
9134 case BFD_RELOC_386_PLT32:
9135 case BFD_RELOC_X86_64_PLT32:
9136 case BFD_RELOC_X86_64_PLT32_BND:
9137 /* Make the jump instruction point to the address of the operand. At
9138 runtime we merely add the offset to the actual PLT entry. */
9139 value = -4;
9140 break;
9141
9142 case BFD_RELOC_386_TLS_GD:
9143 case BFD_RELOC_386_TLS_LDM:
9144 case BFD_RELOC_386_TLS_IE_32:
9145 case BFD_RELOC_386_TLS_IE:
9146 case BFD_RELOC_386_TLS_GOTIE:
9147 case BFD_RELOC_386_TLS_GOTDESC:
9148 case BFD_RELOC_X86_64_TLSGD:
9149 case BFD_RELOC_X86_64_TLSLD:
9150 case BFD_RELOC_X86_64_GOTTPOFF:
9151 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9152 value = 0; /* Fully resolved at runtime. No addend. */
9153 /* Fallthrough */
9154 case BFD_RELOC_386_TLS_LE:
9155 case BFD_RELOC_386_TLS_LDO_32:
9156 case BFD_RELOC_386_TLS_LE_32:
9157 case BFD_RELOC_X86_64_DTPOFF32:
9158 case BFD_RELOC_X86_64_DTPOFF64:
9159 case BFD_RELOC_X86_64_TPOFF32:
9160 case BFD_RELOC_X86_64_TPOFF64:
9161 S_SET_THREAD_LOCAL (fixP->fx_addsy);
9162 break;
9163
9164 case BFD_RELOC_386_TLS_DESC_CALL:
9165 case BFD_RELOC_X86_64_TLSDESC_CALL:
9166 value = 0; /* Fully resolved at runtime. No addend. */
9167 S_SET_THREAD_LOCAL (fixP->fx_addsy);
9168 fixP->fx_done = 0;
9169 return;
9170
9171 case BFD_RELOC_386_GOT32:
9172 case BFD_RELOC_X86_64_GOT32:
9173 value = 0; /* Fully resolved at runtime. No addend. */
9174 break;
9175
9176 case BFD_RELOC_VTABLE_INHERIT:
9177 case BFD_RELOC_VTABLE_ENTRY:
9178 fixP->fx_done = 0;
9179 return;
9180
9181 default:
9182 break;
9183 }
9184 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
9185 *valP = value;
9186 #endif /* !defined (TE_Mach) */
9187
9188 /* Are we finished with this relocation now? */
9189 if (fixP->fx_addsy == NULL)
9190 fixP->fx_done = 1;
9191 #if defined (OBJ_COFF) && defined (TE_PE)
9192 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
9193 {
9194 fixP->fx_done = 0;
9195 /* Remember value for tc_gen_reloc. */
9196 fixP->fx_addnumber = value;
9197 /* Clear out the frag for now. */
9198 value = 0;
9199 }
9200 #endif
9201 else if (use_rela_relocations)
9202 {
9203 fixP->fx_no_overflow = 1;
9204 /* Remember value for tc_gen_reloc. */
9205 fixP->fx_addnumber = value;
9206 value = 0;
9207 }
9208
9209 md_number_to_chars (p, value, fixP->fx_size);
9210 }
9211 \f
9212 char *
9213 md_atof (int type, char *litP, int *sizeP)
9214 {
9215 /* This outputs the LITTLENUMs in REVERSE order;
9216 in accord with the bigendian 386. */
9217 return ieee_md_atof (type, litP, sizeP, FALSE);
9218 }
9219 \f
9220 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
9221
9222 static char *
9223 output_invalid (int c)
9224 {
9225 if (ISPRINT (c))
9226 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
9227 "'%c'", c);
9228 else
9229 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
9230 "(0x%x)", (unsigned char) c);
9231 return output_invalid_buf;
9232 }
9233
9234 /* REG_STRING starts *before* REGISTER_PREFIX. */
9235
9236 static const reg_entry *
9237 parse_real_register (char *reg_string, char **end_op)
9238 {
9239 char *s = reg_string;
9240 char *p;
9241 char reg_name_given[MAX_REG_NAME_SIZE + 1];
9242 const reg_entry *r;
9243
9244 /* Skip possible REGISTER_PREFIX and possible whitespace. */
9245 if (*s == REGISTER_PREFIX)
9246 ++s;
9247
9248 if (is_space_char (*s))
9249 ++s;
9250
9251 p = reg_name_given;
9252 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
9253 {
9254 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
9255 return (const reg_entry *) NULL;
9256 s++;
9257 }
9258
9259 /* For naked regs, make sure that we are not dealing with an identifier.
9260 This prevents confusing an identifier like `eax_var' with register
9261 `eax'. */
9262 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
9263 return (const reg_entry *) NULL;
9264
9265 *end_op = s;
9266
9267 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
9268
9269 /* Handle floating point regs, allowing spaces in the (i) part. */
9270 if (r == i386_regtab /* %st is first entry of table */)
9271 {
9272 if (is_space_char (*s))
9273 ++s;
9274 if (*s == '(')
9275 {
9276 ++s;
9277 if (is_space_char (*s))
9278 ++s;
9279 if (*s >= '0' && *s <= '7')
9280 {
9281 int fpr = *s - '0';
9282 ++s;
9283 if (is_space_char (*s))
9284 ++s;
9285 if (*s == ')')
9286 {
9287 *end_op = s + 1;
9288 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
9289 know (r);
9290 return r + fpr;
9291 }
9292 }
9293 /* We have "%st(" then garbage. */
9294 return (const reg_entry *) NULL;
9295 }
9296 }
9297
9298 if (r == NULL || allow_pseudo_reg)
9299 return r;
9300
9301 if (operand_type_all_zero (&r->reg_type))
9302 return (const reg_entry *) NULL;
9303
9304 if ((r->reg_type.bitfield.reg32
9305 || r->reg_type.bitfield.sreg3
9306 || r->reg_type.bitfield.control
9307 || r->reg_type.bitfield.debug
9308 || r->reg_type.bitfield.test)
9309 && !cpu_arch_flags.bitfield.cpui386)
9310 return (const reg_entry *) NULL;
9311
9312 if (r->reg_type.bitfield.floatreg
9313 && !cpu_arch_flags.bitfield.cpu8087
9314 && !cpu_arch_flags.bitfield.cpu287
9315 && !cpu_arch_flags.bitfield.cpu387)
9316 return (const reg_entry *) NULL;
9317
9318 if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
9319 return (const reg_entry *) NULL;
9320
9321 if (r->reg_type.bitfield.regxmm && !cpu_arch_flags.bitfield.cpusse)
9322 return (const reg_entry *) NULL;
9323
9324 if (r->reg_type.bitfield.regymm && !cpu_arch_flags.bitfield.cpuavx)
9325 return (const reg_entry *) NULL;
9326
9327 if ((r->reg_type.bitfield.regzmm || r->reg_type.bitfield.regmask)
9328 && !cpu_arch_flags.bitfield.cpuavx512f)
9329 return (const reg_entry *) NULL;
9330
9331 /* Don't allow fake index register unless allow_index_reg isn't 0. */
9332 if (!allow_index_reg
9333 && (r->reg_num == RegEiz || r->reg_num == RegRiz))
9334 return (const reg_entry *) NULL;
9335
9336 /* Upper 16 vector register is only available with VREX in 64bit
9337 mode. */
9338 if ((r->reg_flags & RegVRex))
9339 {
9340 if (!cpu_arch_flags.bitfield.cpuvrex
9341 || flag_code != CODE_64BIT)
9342 return (const reg_entry *) NULL;
9343
9344 i.need_vrex = 1;
9345 }
9346
9347 if (((r->reg_flags & (RegRex64 | RegRex))
9348 || r->reg_type.bitfield.reg64)
9349 && (!cpu_arch_flags.bitfield.cpulm
9350 || !operand_type_equal (&r->reg_type, &control))
9351 && flag_code != CODE_64BIT)
9352 return (const reg_entry *) NULL;
9353
9354 if (r->reg_type.bitfield.sreg3 && r->reg_num == RegFlat && !intel_syntax)
9355 return (const reg_entry *) NULL;
9356
9357 return r;
9358 }
9359
9360 /* REG_STRING starts *before* REGISTER_PREFIX. */
9361
9362 static const reg_entry *
9363 parse_register (char *reg_string, char **end_op)
9364 {
9365 const reg_entry *r;
9366
9367 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
9368 r = parse_real_register (reg_string, end_op);
9369 else
9370 r = NULL;
9371 if (!r)
9372 {
9373 char *save = input_line_pointer;
9374 char c;
9375 symbolS *symbolP;
9376
9377 input_line_pointer = reg_string;
9378 c = get_symbol_end ();
9379 symbolP = symbol_find (reg_string);
9380 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
9381 {
9382 const expressionS *e = symbol_get_value_expression (symbolP);
9383
9384 know (e->X_op == O_register);
9385 know (e->X_add_number >= 0
9386 && (valueT) e->X_add_number < i386_regtab_size);
9387 r = i386_regtab + e->X_add_number;
9388 *end_op = input_line_pointer;
9389 }
9390 *input_line_pointer = c;
9391 input_line_pointer = save;
9392 }
9393 return r;
9394 }
9395
9396 int
9397 i386_parse_name (char *name, expressionS *e, char *nextcharP)
9398 {
9399 const reg_entry *r;
9400 char *end = input_line_pointer;
9401
9402 *end = *nextcharP;
9403 r = parse_register (name, &input_line_pointer);
9404 if (r && end <= input_line_pointer)
9405 {
9406 *nextcharP = *input_line_pointer;
9407 *input_line_pointer = 0;
9408 e->X_op = O_register;
9409 e->X_add_number = r - i386_regtab;
9410 return 1;
9411 }
9412 input_line_pointer = end;
9413 *end = 0;
9414 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
9415 }
9416
9417 void
9418 md_operand (expressionS *e)
9419 {
9420 char *end;
9421 const reg_entry *r;
9422
9423 switch (*input_line_pointer)
9424 {
9425 case REGISTER_PREFIX:
9426 r = parse_real_register (input_line_pointer, &end);
9427 if (r)
9428 {
9429 e->X_op = O_register;
9430 e->X_add_number = r - i386_regtab;
9431 input_line_pointer = end;
9432 }
9433 break;
9434
9435 case '[':
9436 gas_assert (intel_syntax);
9437 end = input_line_pointer++;
9438 expression (e);
9439 if (*input_line_pointer == ']')
9440 {
9441 ++input_line_pointer;
9442 e->X_op_symbol = make_expr_symbol (e);
9443 e->X_add_symbol = NULL;
9444 e->X_add_number = 0;
9445 e->X_op = O_index;
9446 }
9447 else
9448 {
9449 e->X_op = O_absent;
9450 input_line_pointer = end;
9451 }
9452 break;
9453 }
9454 }
9455
9456 \f
9457 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9458 const char *md_shortopts = "kVQ:sqn";
9459 #else
9460 const char *md_shortopts = "qn";
9461 #endif
9462
9463 #define OPTION_32 (OPTION_MD_BASE + 0)
9464 #define OPTION_64 (OPTION_MD_BASE + 1)
9465 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
9466 #define OPTION_MARCH (OPTION_MD_BASE + 3)
9467 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
9468 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
9469 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
9470 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
9471 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
9472 #define OPTION_MOLD_GCC (OPTION_MD_BASE + 9)
9473 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
9474 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
9475 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
9476 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
9477 #define OPTION_X32 (OPTION_MD_BASE + 14)
9478 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
9479 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
9480 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
9481
9482 struct option md_longopts[] =
9483 {
9484 {"32", no_argument, NULL, OPTION_32},
9485 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9486 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9487 {"64", no_argument, NULL, OPTION_64},
9488 #endif
9489 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9490 {"x32", no_argument, NULL, OPTION_X32},
9491 #endif
9492 {"divide", no_argument, NULL, OPTION_DIVIDE},
9493 {"march", required_argument, NULL, OPTION_MARCH},
9494 {"mtune", required_argument, NULL, OPTION_MTUNE},
9495 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
9496 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
9497 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
9498 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
9499 {"mold-gcc", no_argument, NULL, OPTION_MOLD_GCC},
9500 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
9501 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
9502 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
9503 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
9504 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
9505 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
9506 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
9507 {NULL, no_argument, NULL, 0}
9508 };
9509 size_t md_longopts_size = sizeof (md_longopts);
9510
9511 int
9512 md_parse_option (int c, char *arg)
9513 {
9514 unsigned int j;
9515 char *arch, *next;
9516
9517 switch (c)
9518 {
9519 case 'n':
9520 optimize_align_code = 0;
9521 break;
9522
9523 case 'q':
9524 quiet_warnings = 1;
9525 break;
9526
9527 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9528 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
9529 should be emitted or not. FIXME: Not implemented. */
9530 case 'Q':
9531 break;
9532
9533 /* -V: SVR4 argument to print version ID. */
9534 case 'V':
9535 print_version_id ();
9536 break;
9537
9538 /* -k: Ignore for FreeBSD compatibility. */
9539 case 'k':
9540 break;
9541
9542 case 's':
9543 /* -s: On i386 Solaris, this tells the native assembler to use
9544 .stab instead of .stab.excl. We always use .stab anyhow. */
9545 break;
9546 #endif
9547 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9548 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9549 case OPTION_64:
9550 {
9551 const char **list, **l;
9552
9553 list = bfd_target_list ();
9554 for (l = list; *l != NULL; l++)
9555 if (CONST_STRNEQ (*l, "elf64-x86-64")
9556 || strcmp (*l, "coff-x86-64") == 0
9557 || strcmp (*l, "pe-x86-64") == 0
9558 || strcmp (*l, "pei-x86-64") == 0
9559 || strcmp (*l, "mach-o-x86-64") == 0)
9560 {
9561 default_arch = "x86_64";
9562 break;
9563 }
9564 if (*l == NULL)
9565 as_fatal (_("no compiled in support for x86_64"));
9566 free (list);
9567 }
9568 break;
9569 #endif
9570
9571 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9572 case OPTION_X32:
9573 if (IS_ELF)
9574 {
9575 const char **list, **l;
9576
9577 list = bfd_target_list ();
9578 for (l = list; *l != NULL; l++)
9579 if (CONST_STRNEQ (*l, "elf32-x86-64"))
9580 {
9581 default_arch = "x86_64:32";
9582 break;
9583 }
9584 if (*l == NULL)
9585 as_fatal (_("no compiled in support for 32bit x86_64"));
9586 free (list);
9587 }
9588 else
9589 as_fatal (_("32bit x86_64 is only supported for ELF"));
9590 break;
9591 #endif
9592
9593 case OPTION_32:
9594 default_arch = "i386";
9595 break;
9596
9597 case OPTION_DIVIDE:
9598 #ifdef SVR4_COMMENT_CHARS
9599 {
9600 char *n, *t;
9601 const char *s;
9602
9603 n = (char *) xmalloc (strlen (i386_comment_chars) + 1);
9604 t = n;
9605 for (s = i386_comment_chars; *s != '\0'; s++)
9606 if (*s != '/')
9607 *t++ = *s;
9608 *t = '\0';
9609 i386_comment_chars = n;
9610 }
9611 #endif
9612 break;
9613
9614 case OPTION_MARCH:
9615 arch = xstrdup (arg);
9616 do
9617 {
9618 if (*arch == '.')
9619 as_fatal (_("invalid -march= option: `%s'"), arg);
9620 next = strchr (arch, '+');
9621 if (next)
9622 *next++ = '\0';
9623 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9624 {
9625 if (strcmp (arch, cpu_arch [j].name) == 0)
9626 {
9627 /* Processor. */
9628 if (! cpu_arch[j].flags.bitfield.cpui386)
9629 continue;
9630
9631 cpu_arch_name = cpu_arch[j].name;
9632 cpu_sub_arch_name = NULL;
9633 cpu_arch_flags = cpu_arch[j].flags;
9634 cpu_arch_isa = cpu_arch[j].type;
9635 cpu_arch_isa_flags = cpu_arch[j].flags;
9636 if (!cpu_arch_tune_set)
9637 {
9638 cpu_arch_tune = cpu_arch_isa;
9639 cpu_arch_tune_flags = cpu_arch_isa_flags;
9640 }
9641 break;
9642 }
9643 else if (*cpu_arch [j].name == '.'
9644 && strcmp (arch, cpu_arch [j].name + 1) == 0)
9645 {
9646 /* ISA entension. */
9647 i386_cpu_flags flags;
9648
9649 if (!cpu_arch[j].negated)
9650 flags = cpu_flags_or (cpu_arch_flags,
9651 cpu_arch[j].flags);
9652 else
9653 flags = cpu_flags_and_not (cpu_arch_flags,
9654 cpu_arch[j].flags);
9655 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
9656 {
9657 if (cpu_sub_arch_name)
9658 {
9659 char *name = cpu_sub_arch_name;
9660 cpu_sub_arch_name = concat (name,
9661 cpu_arch[j].name,
9662 (const char *) NULL);
9663 free (name);
9664 }
9665 else
9666 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
9667 cpu_arch_flags = flags;
9668 cpu_arch_isa_flags = flags;
9669 }
9670 break;
9671 }
9672 }
9673
9674 if (j >= ARRAY_SIZE (cpu_arch))
9675 as_fatal (_("invalid -march= option: `%s'"), arg);
9676
9677 arch = next;
9678 }
9679 while (next != NULL );
9680 break;
9681
9682 case OPTION_MTUNE:
9683 if (*arg == '.')
9684 as_fatal (_("invalid -mtune= option: `%s'"), arg);
9685 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9686 {
9687 if (strcmp (arg, cpu_arch [j].name) == 0)
9688 {
9689 cpu_arch_tune_set = 1;
9690 cpu_arch_tune = cpu_arch [j].type;
9691 cpu_arch_tune_flags = cpu_arch[j].flags;
9692 break;
9693 }
9694 }
9695 if (j >= ARRAY_SIZE (cpu_arch))
9696 as_fatal (_("invalid -mtune= option: `%s'"), arg);
9697 break;
9698
9699 case OPTION_MMNEMONIC:
9700 if (strcasecmp (arg, "att") == 0)
9701 intel_mnemonic = 0;
9702 else if (strcasecmp (arg, "intel") == 0)
9703 intel_mnemonic = 1;
9704 else
9705 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
9706 break;
9707
9708 case OPTION_MSYNTAX:
9709 if (strcasecmp (arg, "att") == 0)
9710 intel_syntax = 0;
9711 else if (strcasecmp (arg, "intel") == 0)
9712 intel_syntax = 1;
9713 else
9714 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
9715 break;
9716
9717 case OPTION_MINDEX_REG:
9718 allow_index_reg = 1;
9719 break;
9720
9721 case OPTION_MNAKED_REG:
9722 allow_naked_reg = 1;
9723 break;
9724
9725 case OPTION_MOLD_GCC:
9726 old_gcc = 1;
9727 break;
9728
9729 case OPTION_MSSE2AVX:
9730 sse2avx = 1;
9731 break;
9732
9733 case OPTION_MSSE_CHECK:
9734 if (strcasecmp (arg, "error") == 0)
9735 sse_check = check_error;
9736 else if (strcasecmp (arg, "warning") == 0)
9737 sse_check = check_warning;
9738 else if (strcasecmp (arg, "none") == 0)
9739 sse_check = check_none;
9740 else
9741 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
9742 break;
9743
9744 case OPTION_MOPERAND_CHECK:
9745 if (strcasecmp (arg, "error") == 0)
9746 operand_check = check_error;
9747 else if (strcasecmp (arg, "warning") == 0)
9748 operand_check = check_warning;
9749 else if (strcasecmp (arg, "none") == 0)
9750 operand_check = check_none;
9751 else
9752 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
9753 break;
9754
9755 case OPTION_MAVXSCALAR:
9756 if (strcasecmp (arg, "128") == 0)
9757 avxscalar = vex128;
9758 else if (strcasecmp (arg, "256") == 0)
9759 avxscalar = vex256;
9760 else
9761 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
9762 break;
9763
9764 case OPTION_MADD_BND_PREFIX:
9765 add_bnd_prefix = 1;
9766 break;
9767
9768 case OPTION_MEVEXLIG:
9769 if (strcmp (arg, "128") == 0)
9770 evexlig = evexl128;
9771 else if (strcmp (arg, "256") == 0)
9772 evexlig = evexl256;
9773 else if (strcmp (arg, "512") == 0)
9774 evexlig = evexl512;
9775 else
9776 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
9777 break;
9778
9779 case OPTION_MEVEXWIG:
9780 if (strcmp (arg, "0") == 0)
9781 evexwig = evexw0;
9782 else if (strcmp (arg, "1") == 0)
9783 evexwig = evexw1;
9784 else
9785 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
9786 break;
9787
9788 default:
9789 return 0;
9790 }
9791 return 1;
9792 }
9793
9794 #define MESSAGE_TEMPLATE \
9795 " "
9796
9797 static void
9798 show_arch (FILE *stream, int ext, int check)
9799 {
9800 static char message[] = MESSAGE_TEMPLATE;
9801 char *start = message + 27;
9802 char *p;
9803 int size = sizeof (MESSAGE_TEMPLATE);
9804 int left;
9805 const char *name;
9806 int len;
9807 unsigned int j;
9808
9809 p = start;
9810 left = size - (start - message);
9811 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9812 {
9813 /* Should it be skipped? */
9814 if (cpu_arch [j].skip)
9815 continue;
9816
9817 name = cpu_arch [j].name;
9818 len = cpu_arch [j].len;
9819 if (*name == '.')
9820 {
9821 /* It is an extension. Skip if we aren't asked to show it. */
9822 if (ext)
9823 {
9824 name++;
9825 len--;
9826 }
9827 else
9828 continue;
9829 }
9830 else if (ext)
9831 {
9832 /* It is an processor. Skip if we show only extension. */
9833 continue;
9834 }
9835 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
9836 {
9837 /* It is an impossible processor - skip. */
9838 continue;
9839 }
9840
9841 /* Reserve 2 spaces for ", " or ",\0" */
9842 left -= len + 2;
9843
9844 /* Check if there is any room. */
9845 if (left >= 0)
9846 {
9847 if (p != start)
9848 {
9849 *p++ = ',';
9850 *p++ = ' ';
9851 }
9852 p = mempcpy (p, name, len);
9853 }
9854 else
9855 {
9856 /* Output the current message now and start a new one. */
9857 *p++ = ',';
9858 *p = '\0';
9859 fprintf (stream, "%s\n", message);
9860 p = start;
9861 left = size - (start - message) - len - 2;
9862
9863 gas_assert (left >= 0);
9864
9865 p = mempcpy (p, name, len);
9866 }
9867 }
9868
9869 *p = '\0';
9870 fprintf (stream, "%s\n", message);
9871 }
9872
9873 void
9874 md_show_usage (FILE *stream)
9875 {
9876 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9877 fprintf (stream, _("\
9878 -Q ignored\n\
9879 -V print assembler version number\n\
9880 -k ignored\n"));
9881 #endif
9882 fprintf (stream, _("\
9883 -n Do not optimize code alignment\n\
9884 -q quieten some warnings\n"));
9885 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9886 fprintf (stream, _("\
9887 -s ignored\n"));
9888 #endif
9889 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9890 || defined (TE_PE) || defined (TE_PEP))
9891 fprintf (stream, _("\
9892 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
9893 #endif
9894 #ifdef SVR4_COMMENT_CHARS
9895 fprintf (stream, _("\
9896 --divide do not treat `/' as a comment character\n"));
9897 #else
9898 fprintf (stream, _("\
9899 --divide ignored\n"));
9900 #endif
9901 fprintf (stream, _("\
9902 -march=CPU[,+EXTENSION...]\n\
9903 generate code for CPU and EXTENSION, CPU is one of:\n"));
9904 show_arch (stream, 0, 1);
9905 fprintf (stream, _("\
9906 EXTENSION is combination of:\n"));
9907 show_arch (stream, 1, 0);
9908 fprintf (stream, _("\
9909 -mtune=CPU optimize for CPU, CPU is one of:\n"));
9910 show_arch (stream, 0, 0);
9911 fprintf (stream, _("\
9912 -msse2avx encode SSE instructions with VEX prefix\n"));
9913 fprintf (stream, _("\
9914 -msse-check=[none|error|warning]\n\
9915 check SSE instructions\n"));
9916 fprintf (stream, _("\
9917 -moperand-check=[none|error|warning]\n\
9918 check operand combinations for validity\n"));
9919 fprintf (stream, _("\
9920 -mavxscalar=[128|256] encode scalar AVX instructions with specific vector\n\
9921 length\n"));
9922 fprintf (stream, _("\
9923 -mevexlig=[128|256|512] encode scalar EVEX instructions with specific vector\n\
9924 length\n"));
9925 fprintf (stream, _("\
9926 -mevexwig=[0|1] encode EVEX instructions with specific EVEX.W value\n\
9927 for EVEX.W bit ignored instructions\n"));
9928 fprintf (stream, _("\
9929 -mmnemonic=[att|intel] use AT&T/Intel mnemonic\n"));
9930 fprintf (stream, _("\
9931 -msyntax=[att|intel] use AT&T/Intel syntax\n"));
9932 fprintf (stream, _("\
9933 -mindex-reg support pseudo index registers\n"));
9934 fprintf (stream, _("\
9935 -mnaked-reg don't require `%%' prefix for registers\n"));
9936 fprintf (stream, _("\
9937 -mold-gcc support old (<= 2.8.1) versions of gcc\n"));
9938 fprintf (stream, _("\
9939 -madd-bnd-prefix add BND prefix for all valid branches\n"));
9940 }
9941
9942 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
9943 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9944 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9945
9946 /* Pick the target format to use. */
9947
9948 const char *
9949 i386_target_format (void)
9950 {
9951 if (!strncmp (default_arch, "x86_64", 6))
9952 {
9953 update_code_flag (CODE_64BIT, 1);
9954 if (default_arch[6] == '\0')
9955 x86_elf_abi = X86_64_ABI;
9956 else
9957 x86_elf_abi = X86_64_X32_ABI;
9958 }
9959 else if (!strcmp (default_arch, "i386"))
9960 update_code_flag (CODE_32BIT, 1);
9961 else
9962 as_fatal (_("unknown architecture"));
9963
9964 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
9965 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
9966 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
9967 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
9968
9969 switch (OUTPUT_FLAVOR)
9970 {
9971 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
9972 case bfd_target_aout_flavour:
9973 return AOUT_TARGET_FORMAT;
9974 #endif
9975 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
9976 # if defined (TE_PE) || defined (TE_PEP)
9977 case bfd_target_coff_flavour:
9978 return flag_code == CODE_64BIT ? "pe-x86-64" : "pe-i386";
9979 # elif defined (TE_GO32)
9980 case bfd_target_coff_flavour:
9981 return "coff-go32";
9982 # else
9983 case bfd_target_coff_flavour:
9984 return "coff-i386";
9985 # endif
9986 #endif
9987 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9988 case bfd_target_elf_flavour:
9989 {
9990 const char *format;
9991
9992 switch (x86_elf_abi)
9993 {
9994 default:
9995 format = ELF_TARGET_FORMAT;
9996 break;
9997 case X86_64_ABI:
9998 use_rela_relocations = 1;
9999 object_64bit = 1;
10000 format = ELF_TARGET_FORMAT64;
10001 break;
10002 case X86_64_X32_ABI:
10003 use_rela_relocations = 1;
10004 object_64bit = 1;
10005 disallow_64bit_reloc = 1;
10006 format = ELF_TARGET_FORMAT32;
10007 break;
10008 }
10009 if (cpu_arch_isa == PROCESSOR_L1OM)
10010 {
10011 if (x86_elf_abi != X86_64_ABI)
10012 as_fatal (_("Intel L1OM is 64bit only"));
10013 return ELF_TARGET_L1OM_FORMAT;
10014 }
10015 if (cpu_arch_isa == PROCESSOR_K1OM)
10016 {
10017 if (x86_elf_abi != X86_64_ABI)
10018 as_fatal (_("Intel K1OM is 64bit only"));
10019 return ELF_TARGET_K1OM_FORMAT;
10020 }
10021 else
10022 return format;
10023 }
10024 #endif
10025 #if defined (OBJ_MACH_O)
10026 case bfd_target_mach_o_flavour:
10027 if (flag_code == CODE_64BIT)
10028 {
10029 use_rela_relocations = 1;
10030 object_64bit = 1;
10031 return "mach-o-x86-64";
10032 }
10033 else
10034 return "mach-o-i386";
10035 #endif
10036 default:
10037 abort ();
10038 return NULL;
10039 }
10040 }
10041
10042 #endif /* OBJ_MAYBE_ more than one */
10043
10044 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
10045 void
10046 i386_elf_emit_arch_note (void)
10047 {
10048 if (IS_ELF && cpu_arch_name != NULL)
10049 {
10050 char *p;
10051 asection *seg = now_seg;
10052 subsegT subseg = now_subseg;
10053 Elf_Internal_Note i_note;
10054 Elf_External_Note e_note;
10055 asection *note_secp;
10056 int len;
10057
10058 /* Create the .note section. */
10059 note_secp = subseg_new (".note", 0);
10060 bfd_set_section_flags (stdoutput,
10061 note_secp,
10062 SEC_HAS_CONTENTS | SEC_READONLY);
10063
10064 /* Process the arch string. */
10065 len = strlen (cpu_arch_name);
10066
10067 i_note.namesz = len + 1;
10068 i_note.descsz = 0;
10069 i_note.type = NT_ARCH;
10070 p = frag_more (sizeof (e_note.namesz));
10071 md_number_to_chars (p, (valueT) i_note.namesz, sizeof (e_note.namesz));
10072 p = frag_more (sizeof (e_note.descsz));
10073 md_number_to_chars (p, (valueT) i_note.descsz, sizeof (e_note.descsz));
10074 p = frag_more (sizeof (e_note.type));
10075 md_number_to_chars (p, (valueT) i_note.type, sizeof (e_note.type));
10076 p = frag_more (len + 1);
10077 strcpy (p, cpu_arch_name);
10078
10079 frag_align (2, 0, 0);
10080
10081 subseg_set (seg, subseg);
10082 }
10083 }
10084 #endif
10085 \f
10086 symbolS *
10087 md_undefined_symbol (char *name)
10088 {
10089 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
10090 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
10091 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
10092 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
10093 {
10094 if (!GOT_symbol)
10095 {
10096 if (symbol_find (name))
10097 as_bad (_("GOT already in symbol table"));
10098 GOT_symbol = symbol_new (name, undefined_section,
10099 (valueT) 0, &zero_address_frag);
10100 };
10101 return GOT_symbol;
10102 }
10103 return 0;
10104 }
10105
10106 /* Round up a section size to the appropriate boundary. */
10107
10108 valueT
10109 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
10110 {
10111 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10112 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
10113 {
10114 /* For a.out, force the section size to be aligned. If we don't do
10115 this, BFD will align it for us, but it will not write out the
10116 final bytes of the section. This may be a bug in BFD, but it is
10117 easier to fix it here since that is how the other a.out targets
10118 work. */
10119 int align;
10120
10121 align = bfd_get_section_alignment (stdoutput, segment);
10122 size = ((size + (1 << align) - 1) & ((valueT) -1 << align));
10123 }
10124 #endif
10125
10126 return size;
10127 }
10128
10129 /* On the i386, PC-relative offsets are relative to the start of the
10130 next instruction. That is, the address of the offset, plus its
10131 size, since the offset is always the last part of the insn. */
10132
10133 long
10134 md_pcrel_from (fixS *fixP)
10135 {
10136 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
10137 }
10138
10139 #ifndef I386COFF
10140
10141 static void
10142 s_bss (int ignore ATTRIBUTE_UNUSED)
10143 {
10144 int temp;
10145
10146 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10147 if (IS_ELF)
10148 obj_elf_section_change_hook ();
10149 #endif
10150 temp = get_absolute_expression ();
10151 subseg_set (bss_section, (subsegT) temp);
10152 demand_empty_rest_of_line ();
10153 }
10154
10155 #endif
10156
10157 void
10158 i386_validate_fix (fixS *fixp)
10159 {
10160 if (fixp->fx_subsy && fixp->fx_subsy == GOT_symbol)
10161 {
10162 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
10163 {
10164 if (!object_64bit)
10165 abort ();
10166 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
10167 }
10168 else
10169 {
10170 if (!object_64bit)
10171 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
10172 else
10173 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
10174 }
10175 fixp->fx_subsy = 0;
10176 }
10177 }
10178
10179 arelent *
10180 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
10181 {
10182 arelent *rel;
10183 bfd_reloc_code_real_type code;
10184
10185 switch (fixp->fx_r_type)
10186 {
10187 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10188 case BFD_RELOC_SIZE32:
10189 case BFD_RELOC_SIZE64:
10190 if (S_IS_DEFINED (fixp->fx_addsy)
10191 && !S_IS_EXTERNAL (fixp->fx_addsy))
10192 {
10193 /* Resolve size relocation against local symbol to size of
10194 the symbol plus addend. */
10195 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
10196 if (fixp->fx_r_type == BFD_RELOC_SIZE32
10197 && !fits_in_unsigned_long (value))
10198 as_bad_where (fixp->fx_file, fixp->fx_line,
10199 _("symbol size computation overflow"));
10200 fixp->fx_addsy = NULL;
10201 fixp->fx_subsy = NULL;
10202 md_apply_fix (fixp, (valueT *) &value, NULL);
10203 return NULL;
10204 }
10205 #endif
10206
10207 case BFD_RELOC_X86_64_PLT32:
10208 case BFD_RELOC_X86_64_PLT32_BND:
10209 case BFD_RELOC_X86_64_GOT32:
10210 case BFD_RELOC_X86_64_GOTPCREL:
10211 case BFD_RELOC_386_PLT32:
10212 case BFD_RELOC_386_GOT32:
10213 case BFD_RELOC_386_GOTOFF:
10214 case BFD_RELOC_386_GOTPC:
10215 case BFD_RELOC_386_TLS_GD:
10216 case BFD_RELOC_386_TLS_LDM:
10217 case BFD_RELOC_386_TLS_LDO_32:
10218 case BFD_RELOC_386_TLS_IE_32:
10219 case BFD_RELOC_386_TLS_IE:
10220 case BFD_RELOC_386_TLS_GOTIE:
10221 case BFD_RELOC_386_TLS_LE_32:
10222 case BFD_RELOC_386_TLS_LE:
10223 case BFD_RELOC_386_TLS_GOTDESC:
10224 case BFD_RELOC_386_TLS_DESC_CALL:
10225 case BFD_RELOC_X86_64_TLSGD:
10226 case BFD_RELOC_X86_64_TLSLD:
10227 case BFD_RELOC_X86_64_DTPOFF32:
10228 case BFD_RELOC_X86_64_DTPOFF64:
10229 case BFD_RELOC_X86_64_GOTTPOFF:
10230 case BFD_RELOC_X86_64_TPOFF32:
10231 case BFD_RELOC_X86_64_TPOFF64:
10232 case BFD_RELOC_X86_64_GOTOFF64:
10233 case BFD_RELOC_X86_64_GOTPC32:
10234 case BFD_RELOC_X86_64_GOT64:
10235 case BFD_RELOC_X86_64_GOTPCREL64:
10236 case BFD_RELOC_X86_64_GOTPC64:
10237 case BFD_RELOC_X86_64_GOTPLT64:
10238 case BFD_RELOC_X86_64_PLTOFF64:
10239 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10240 case BFD_RELOC_X86_64_TLSDESC_CALL:
10241 case BFD_RELOC_RVA:
10242 case BFD_RELOC_VTABLE_ENTRY:
10243 case BFD_RELOC_VTABLE_INHERIT:
10244 #ifdef TE_PE
10245 case BFD_RELOC_32_SECREL:
10246 #endif
10247 code = fixp->fx_r_type;
10248 break;
10249 case BFD_RELOC_X86_64_32S:
10250 if (!fixp->fx_pcrel)
10251 {
10252 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
10253 code = fixp->fx_r_type;
10254 break;
10255 }
10256 default:
10257 if (fixp->fx_pcrel)
10258 {
10259 switch (fixp->fx_size)
10260 {
10261 default:
10262 as_bad_where (fixp->fx_file, fixp->fx_line,
10263 _("can not do %d byte pc-relative relocation"),
10264 fixp->fx_size);
10265 code = BFD_RELOC_32_PCREL;
10266 break;
10267 case 1: code = BFD_RELOC_8_PCREL; break;
10268 case 2: code = BFD_RELOC_16_PCREL; break;
10269 case 4:
10270 code = (fixp->fx_r_type == BFD_RELOC_X86_64_PC32_BND
10271 ? fixp-> fx_r_type : BFD_RELOC_32_PCREL);
10272 break;
10273 #ifdef BFD64
10274 case 8: code = BFD_RELOC_64_PCREL; break;
10275 #endif
10276 }
10277 }
10278 else
10279 {
10280 switch (fixp->fx_size)
10281 {
10282 default:
10283 as_bad_where (fixp->fx_file, fixp->fx_line,
10284 _("can not do %d byte relocation"),
10285 fixp->fx_size);
10286 code = BFD_RELOC_32;
10287 break;
10288 case 1: code = BFD_RELOC_8; break;
10289 case 2: code = BFD_RELOC_16; break;
10290 case 4: code = BFD_RELOC_32; break;
10291 #ifdef BFD64
10292 case 8: code = BFD_RELOC_64; break;
10293 #endif
10294 }
10295 }
10296 break;
10297 }
10298
10299 if ((code == BFD_RELOC_32
10300 || code == BFD_RELOC_32_PCREL
10301 || code == BFD_RELOC_X86_64_32S)
10302 && GOT_symbol
10303 && fixp->fx_addsy == GOT_symbol)
10304 {
10305 if (!object_64bit)
10306 code = BFD_RELOC_386_GOTPC;
10307 else
10308 code = BFD_RELOC_X86_64_GOTPC32;
10309 }
10310 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
10311 && GOT_symbol
10312 && fixp->fx_addsy == GOT_symbol)
10313 {
10314 code = BFD_RELOC_X86_64_GOTPC64;
10315 }
10316
10317 rel = (arelent *) xmalloc (sizeof (arelent));
10318 rel->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
10319 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
10320
10321 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
10322
10323 if (!use_rela_relocations)
10324 {
10325 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
10326 vtable entry to be used in the relocation's section offset. */
10327 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
10328 rel->address = fixp->fx_offset;
10329 #if defined (OBJ_COFF) && defined (TE_PE)
10330 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
10331 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
10332 else
10333 #endif
10334 rel->addend = 0;
10335 }
10336 /* Use the rela in 64bit mode. */
10337 else
10338 {
10339 if (disallow_64bit_reloc)
10340 switch (code)
10341 {
10342 case BFD_RELOC_X86_64_DTPOFF64:
10343 case BFD_RELOC_X86_64_TPOFF64:
10344 case BFD_RELOC_64_PCREL:
10345 case BFD_RELOC_X86_64_GOTOFF64:
10346 case BFD_RELOC_X86_64_GOT64:
10347 case BFD_RELOC_X86_64_GOTPCREL64:
10348 case BFD_RELOC_X86_64_GOTPC64:
10349 case BFD_RELOC_X86_64_GOTPLT64:
10350 case BFD_RELOC_X86_64_PLTOFF64:
10351 as_bad_where (fixp->fx_file, fixp->fx_line,
10352 _("cannot represent relocation type %s in x32 mode"),
10353 bfd_get_reloc_code_name (code));
10354 break;
10355 default:
10356 break;
10357 }
10358
10359 if (!fixp->fx_pcrel)
10360 rel->addend = fixp->fx_offset;
10361 else
10362 switch (code)
10363 {
10364 case BFD_RELOC_X86_64_PLT32:
10365 case BFD_RELOC_X86_64_PLT32_BND:
10366 case BFD_RELOC_X86_64_GOT32:
10367 case BFD_RELOC_X86_64_GOTPCREL:
10368 case BFD_RELOC_X86_64_TLSGD:
10369 case BFD_RELOC_X86_64_TLSLD:
10370 case BFD_RELOC_X86_64_GOTTPOFF:
10371 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10372 case BFD_RELOC_X86_64_TLSDESC_CALL:
10373 rel->addend = fixp->fx_offset - fixp->fx_size;
10374 break;
10375 default:
10376 rel->addend = (section->vma
10377 - fixp->fx_size
10378 + fixp->fx_addnumber
10379 + md_pcrel_from (fixp));
10380 break;
10381 }
10382 }
10383
10384 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
10385 if (rel->howto == NULL)
10386 {
10387 as_bad_where (fixp->fx_file, fixp->fx_line,
10388 _("cannot represent relocation type %s"),
10389 bfd_get_reloc_code_name (code));
10390 /* Set howto to a garbage value so that we can keep going. */
10391 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
10392 gas_assert (rel->howto != NULL);
10393 }
10394
10395 return rel;
10396 }
10397
10398 #include "tc-i386-intel.c"
10399
10400 void
10401 tc_x86_parse_to_dw2regnum (expressionS *exp)
10402 {
10403 int saved_naked_reg;
10404 char saved_register_dot;
10405
10406 saved_naked_reg = allow_naked_reg;
10407 allow_naked_reg = 1;
10408 saved_register_dot = register_chars['.'];
10409 register_chars['.'] = '.';
10410 allow_pseudo_reg = 1;
10411 expression_and_evaluate (exp);
10412 allow_pseudo_reg = 0;
10413 register_chars['.'] = saved_register_dot;
10414 allow_naked_reg = saved_naked_reg;
10415
10416 if (exp->X_op == O_register && exp->X_add_number >= 0)
10417 {
10418 if ((addressT) exp->X_add_number < i386_regtab_size)
10419 {
10420 exp->X_op = O_constant;
10421 exp->X_add_number = i386_regtab[exp->X_add_number]
10422 .dw2_regnum[flag_code >> 1];
10423 }
10424 else
10425 exp->X_op = O_illegal;
10426 }
10427 }
10428
10429 void
10430 tc_x86_frame_initial_instructions (void)
10431 {
10432 static unsigned int sp_regno[2];
10433
10434 if (!sp_regno[flag_code >> 1])
10435 {
10436 char *saved_input = input_line_pointer;
10437 char sp[][4] = {"esp", "rsp"};
10438 expressionS exp;
10439
10440 input_line_pointer = sp[flag_code >> 1];
10441 tc_x86_parse_to_dw2regnum (&exp);
10442 gas_assert (exp.X_op == O_constant);
10443 sp_regno[flag_code >> 1] = exp.X_add_number;
10444 input_line_pointer = saved_input;
10445 }
10446
10447 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
10448 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
10449 }
10450
10451 int
10452 x86_dwarf2_addr_size (void)
10453 {
10454 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
10455 if (x86_elf_abi == X86_64_X32_ABI)
10456 return 4;
10457 #endif
10458 return bfd_arch_bits_per_address (stdoutput) / 8;
10459 }
10460
10461 int
10462 i386_elf_section_type (const char *str, size_t len)
10463 {
10464 if (flag_code == CODE_64BIT
10465 && len == sizeof ("unwind") - 1
10466 && strncmp (str, "unwind", 6) == 0)
10467 return SHT_X86_64_UNWIND;
10468
10469 return -1;
10470 }
10471
10472 #ifdef TE_SOLARIS
10473 void
10474 i386_solaris_fix_up_eh_frame (segT sec)
10475 {
10476 if (flag_code == CODE_64BIT)
10477 elf_section_type (sec) = SHT_X86_64_UNWIND;
10478 }
10479 #endif
10480
10481 #ifdef TE_PE
10482 void
10483 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
10484 {
10485 expressionS exp;
10486
10487 exp.X_op = O_secrel;
10488 exp.X_add_symbol = symbol;
10489 exp.X_add_number = 0;
10490 emit_expr (&exp, size);
10491 }
10492 #endif
10493
10494 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10495 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
10496
10497 bfd_vma
10498 x86_64_section_letter (int letter, char **ptr_msg)
10499 {
10500 if (flag_code == CODE_64BIT)
10501 {
10502 if (letter == 'l')
10503 return SHF_X86_64_LARGE;
10504
10505 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
10506 }
10507 else
10508 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
10509 return -1;
10510 }
10511
10512 bfd_vma
10513 x86_64_section_word (char *str, size_t len)
10514 {
10515 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
10516 return SHF_X86_64_LARGE;
10517
10518 return -1;
10519 }
10520
10521 static void
10522 handle_large_common (int small ATTRIBUTE_UNUSED)
10523 {
10524 if (flag_code != CODE_64BIT)
10525 {
10526 s_comm_internal (0, elf_common_parse);
10527 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
10528 }
10529 else
10530 {
10531 static segT lbss_section;
10532 asection *saved_com_section_ptr = elf_com_section_ptr;
10533 asection *saved_bss_section = bss_section;
10534
10535 if (lbss_section == NULL)
10536 {
10537 flagword applicable;
10538 segT seg = now_seg;
10539 subsegT subseg = now_subseg;
10540
10541 /* The .lbss section is for local .largecomm symbols. */
10542 lbss_section = subseg_new (".lbss", 0);
10543 applicable = bfd_applicable_section_flags (stdoutput);
10544 bfd_set_section_flags (stdoutput, lbss_section,
10545 applicable & SEC_ALLOC);
10546 seg_info (lbss_section)->bss = 1;
10547
10548 subseg_set (seg, subseg);
10549 }
10550
10551 elf_com_section_ptr = &_bfd_elf_large_com_section;
10552 bss_section = lbss_section;
10553
10554 s_comm_internal (0, elf_common_parse);
10555
10556 elf_com_section_ptr = saved_com_section_ptr;
10557 bss_section = saved_bss_section;
10558 }
10559 }
10560 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 0.267255 seconds and 4 git commands to generate.