gas/
[deliverable/binutils-gdb.git] / gas / config / tc-i386.c
1 /* i386.c -- Assemble code for the Intel 80386
2 Copyright 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
3 2000, 2001, 2002, 2003, 2004, 2005, 2006
4 Free Software Foundation, Inc.
5
6 This file is part of GAS, the GNU Assembler.
7
8 GAS is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2, or (at your option)
11 any later version.
12
13 GAS is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
17
18 You should have received a copy of the GNU General Public License
19 along with GAS; see the file COPYING. If not, write to the Free
20 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
21 02110-1301, USA. */
22
23 /* Intel 80386 machine specific gas.
24 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
25 x86_64 support by Jan Hubicka (jh@suse.cz)
26 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
27 Bugs & suggestions are completely welcome. This is free software.
28 Please help us make it better. */
29
30 #include "as.h"
31 #include "safe-ctype.h"
32 #include "subsegs.h"
33 #include "dwarf2dbg.h"
34 #include "dw2gencfi.h"
35 #include "opcode/i386.h"
36 #include "elf/x86-64.h"
37
38 #ifndef REGISTER_WARNINGS
39 #define REGISTER_WARNINGS 1
40 #endif
41
42 #ifndef INFER_ADDR_PREFIX
43 #define INFER_ADDR_PREFIX 1
44 #endif
45
46 #ifndef SCALE1_WHEN_NO_INDEX
47 /* Specifying a scale factor besides 1 when there is no index is
48 futile. eg. `mov (%ebx,2),%al' does exactly the same as
49 `mov (%ebx),%al'. To slavishly follow what the programmer
50 specified, set SCALE1_WHEN_NO_INDEX to 0. */
51 #define SCALE1_WHEN_NO_INDEX 1
52 #endif
53
54 #ifndef DEFAULT_ARCH
55 #define DEFAULT_ARCH "i386"
56 #endif
57
58 #ifndef INLINE
59 #if __GNUC__ >= 2
60 #define INLINE __inline__
61 #else
62 #define INLINE
63 #endif
64 #endif
65
66 static INLINE unsigned int mode_from_disp_size PARAMS ((unsigned int));
67 static INLINE int fits_in_signed_byte PARAMS ((offsetT));
68 static INLINE int fits_in_unsigned_byte PARAMS ((offsetT));
69 static INLINE int fits_in_unsigned_word PARAMS ((offsetT));
70 static INLINE int fits_in_signed_word PARAMS ((offsetT));
71 static INLINE int fits_in_unsigned_long PARAMS ((offsetT));
72 static INLINE int fits_in_signed_long PARAMS ((offsetT));
73 static int smallest_imm_type PARAMS ((offsetT));
74 static offsetT offset_in_range PARAMS ((offsetT, int));
75 static int add_prefix PARAMS ((unsigned int));
76 static void set_code_flag PARAMS ((int));
77 static void set_16bit_gcc_code_flag PARAMS ((int));
78 static void set_intel_syntax PARAMS ((int));
79 static void set_cpu_arch PARAMS ((int));
80 #ifdef TE_PE
81 static void pe_directive_secrel PARAMS ((int));
82 #endif
83 static void signed_cons PARAMS ((int));
84 static char *output_invalid PARAMS ((int c));
85 static int i386_operand PARAMS ((char *operand_string));
86 static int i386_intel_operand PARAMS ((char *operand_string, int got_a_float));
87 static const reg_entry *parse_register PARAMS ((char *reg_string,
88 char **end_op));
89 static char *parse_insn PARAMS ((char *, char *));
90 static char *parse_operands PARAMS ((char *, const char *));
91 static void swap_operands PARAMS ((void));
92 static void optimize_imm PARAMS ((void));
93 static void optimize_disp PARAMS ((void));
94 static int match_template PARAMS ((void));
95 static int check_string PARAMS ((void));
96 static int process_suffix PARAMS ((void));
97 static int check_byte_reg PARAMS ((void));
98 static int check_long_reg PARAMS ((void));
99 static int check_qword_reg PARAMS ((void));
100 static int check_word_reg PARAMS ((void));
101 static int finalize_imm PARAMS ((void));
102 static int process_operands PARAMS ((void));
103 static const seg_entry *build_modrm_byte PARAMS ((void));
104 static void output_insn PARAMS ((void));
105 static void output_branch PARAMS ((void));
106 static void output_jump PARAMS ((void));
107 static void output_interseg_jump PARAMS ((void));
108 static void output_imm PARAMS ((fragS *insn_start_frag,
109 offsetT insn_start_off));
110 static void output_disp PARAMS ((fragS *insn_start_frag,
111 offsetT insn_start_off));
112 #ifndef I386COFF
113 static void s_bss PARAMS ((int));
114 #endif
115 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
116 static void handle_large_common (int small ATTRIBUTE_UNUSED);
117 #endif
118
119 static const char *default_arch = DEFAULT_ARCH;
120
121 /* 'md_assemble ()' gathers together information and puts it into a
122 i386_insn. */
123
124 union i386_op
125 {
126 expressionS *disps;
127 expressionS *imms;
128 const reg_entry *regs;
129 };
130
131 struct _i386_insn
132 {
133 /* TM holds the template for the insn were currently assembling. */
134 template tm;
135
136 /* SUFFIX holds the instruction mnemonic suffix if given.
137 (e.g. 'l' for 'movl') */
138 char suffix;
139
140 /* OPERANDS gives the number of given operands. */
141 unsigned int operands;
142
143 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
144 of given register, displacement, memory operands and immediate
145 operands. */
146 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
147
148 /* TYPES [i] is the type (see above #defines) which tells us how to
149 use OP[i] for the corresponding operand. */
150 unsigned int types[MAX_OPERANDS];
151
152 /* Displacement expression, immediate expression, or register for each
153 operand. */
154 union i386_op op[MAX_OPERANDS];
155
156 /* Flags for operands. */
157 unsigned int flags[MAX_OPERANDS];
158 #define Operand_PCrel 1
159
160 /* Relocation type for operand */
161 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
162
163 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
164 the base index byte below. */
165 const reg_entry *base_reg;
166 const reg_entry *index_reg;
167 unsigned int log2_scale_factor;
168
169 /* SEG gives the seg_entries of this insn. They are zero unless
170 explicit segment overrides are given. */
171 const seg_entry *seg[2];
172
173 /* PREFIX holds all the given prefix opcodes (usually null).
174 PREFIXES is the number of prefix opcodes. */
175 unsigned int prefixes;
176 unsigned char prefix[MAX_PREFIXES];
177
178 /* RM and SIB are the modrm byte and the sib byte where the
179 addressing modes of this insn are encoded. */
180
181 modrm_byte rm;
182 rex_byte rex;
183 sib_byte sib;
184 };
185
186 typedef struct _i386_insn i386_insn;
187
188 /* List of chars besides those in app.c:symbol_chars that can start an
189 operand. Used to prevent the scrubber eating vital white-space. */
190 const char extra_symbol_chars[] = "*%-(["
191 #ifdef LEX_AT
192 "@"
193 #endif
194 #ifdef LEX_QM
195 "?"
196 #endif
197 ;
198
199 #if (defined (TE_I386AIX) \
200 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
201 && !defined (TE_GNU) \
202 && !defined (TE_LINUX) \
203 && !defined (TE_NETWARE) \
204 && !defined (TE_FreeBSD) \
205 && !defined (TE_NetBSD)))
206 /* This array holds the chars that always start a comment. If the
207 pre-processor is disabled, these aren't very useful. The option
208 --divide will remove '/' from this list. */
209 const char *i386_comment_chars = "#/";
210 #define SVR4_COMMENT_CHARS 1
211 #define PREFIX_SEPARATOR '\\'
212
213 #else
214 const char *i386_comment_chars = "#";
215 #define PREFIX_SEPARATOR '/'
216 #endif
217
218 /* This array holds the chars that only start a comment at the beginning of
219 a line. If the line seems to have the form '# 123 filename'
220 .line and .file directives will appear in the pre-processed output.
221 Note that input_file.c hand checks for '#' at the beginning of the
222 first line of the input file. This is because the compiler outputs
223 #NO_APP at the beginning of its output.
224 Also note that comments started like this one will always work if
225 '/' isn't otherwise defined. */
226 const char line_comment_chars[] = "#/";
227
228 const char line_separator_chars[] = ";";
229
230 /* Chars that can be used to separate mant from exp in floating point
231 nums. */
232 const char EXP_CHARS[] = "eE";
233
234 /* Chars that mean this number is a floating point constant
235 As in 0f12.456
236 or 0d1.2345e12. */
237 const char FLT_CHARS[] = "fFdDxX";
238
239 /* Tables for lexical analysis. */
240 static char mnemonic_chars[256];
241 static char register_chars[256];
242 static char operand_chars[256];
243 static char identifier_chars[256];
244 static char digit_chars[256];
245
246 /* Lexical macros. */
247 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
248 #define is_operand_char(x) (operand_chars[(unsigned char) x])
249 #define is_register_char(x) (register_chars[(unsigned char) x])
250 #define is_space_char(x) ((x) == ' ')
251 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
252 #define is_digit_char(x) (digit_chars[(unsigned char) x])
253
254 /* All non-digit non-letter characters that may occur in an operand. */
255 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
256
257 /* md_assemble() always leaves the strings it's passed unaltered. To
258 effect this we maintain a stack of saved characters that we've smashed
259 with '\0's (indicating end of strings for various sub-fields of the
260 assembler instruction). */
261 static char save_stack[32];
262 static char *save_stack_p;
263 #define END_STRING_AND_SAVE(s) \
264 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
265 #define RESTORE_END_STRING(s) \
266 do { *(s) = *--save_stack_p; } while (0)
267
268 /* The instruction we're assembling. */
269 static i386_insn i;
270
271 /* Possible templates for current insn. */
272 static const templates *current_templates;
273
274 /* Per instruction expressionS buffers: 2 displacements & 2 immediate max. */
275 static expressionS disp_expressions[2], im_expressions[2];
276
277 /* Current operand we are working on. */
278 static int this_operand;
279
280 /* We support four different modes. FLAG_CODE variable is used to distinguish
281 these. */
282
283 enum flag_code {
284 CODE_32BIT,
285 CODE_16BIT,
286 CODE_64BIT };
287 #define NUM_FLAG_CODE ((int) CODE_64BIT + 1)
288
289 static enum flag_code flag_code;
290 static unsigned int object_64bit;
291 static int use_rela_relocations = 0;
292
293 /* The names used to print error messages. */
294 static const char *flag_code_names[] =
295 {
296 "32",
297 "16",
298 "64"
299 };
300
301 /* 1 for intel syntax,
302 0 if att syntax. */
303 static int intel_syntax = 0;
304
305 /* 1 if register prefix % not required. */
306 static int allow_naked_reg = 0;
307
308 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
309 leave, push, and pop instructions so that gcc has the same stack
310 frame as in 32 bit mode. */
311 static char stackop_size = '\0';
312
313 /* Non-zero to optimize code alignment. */
314 int optimize_align_code = 1;
315
316 /* Non-zero to quieten some warnings. */
317 static int quiet_warnings = 0;
318
319 /* CPU name. */
320 static const char *cpu_arch_name = NULL;
321 static const char *cpu_sub_arch_name = NULL;
322
323 /* CPU feature flags. */
324 static unsigned int cpu_arch_flags = CpuUnknownFlags | CpuNo64;
325
326 /* If set, conditional jumps are not automatically promoted to handle
327 larger than a byte offset. */
328 static unsigned int no_cond_jump_promotion = 0;
329
330 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
331 static symbolS *GOT_symbol;
332
333 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
334 unsigned int x86_dwarf2_return_column;
335
336 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
337 int x86_cie_data_alignment;
338
339 /* Interface to relax_segment.
340 There are 3 major relax states for 386 jump insns because the
341 different types of jumps add different sizes to frags when we're
342 figuring out what sort of jump to choose to reach a given label. */
343
344 /* Types. */
345 #define UNCOND_JUMP 0
346 #define COND_JUMP 1
347 #define COND_JUMP86 2
348
349 /* Sizes. */
350 #define CODE16 1
351 #define SMALL 0
352 #define SMALL16 (SMALL | CODE16)
353 #define BIG 2
354 #define BIG16 (BIG | CODE16)
355
356 #ifndef INLINE
357 #ifdef __GNUC__
358 #define INLINE __inline__
359 #else
360 #define INLINE
361 #endif
362 #endif
363
364 #define ENCODE_RELAX_STATE(type, size) \
365 ((relax_substateT) (((type) << 2) | (size)))
366 #define TYPE_FROM_RELAX_STATE(s) \
367 ((s) >> 2)
368 #define DISP_SIZE_FROM_RELAX_STATE(s) \
369 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
370
371 /* This table is used by relax_frag to promote short jumps to long
372 ones where necessary. SMALL (short) jumps may be promoted to BIG
373 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
374 don't allow a short jump in a 32 bit code segment to be promoted to
375 a 16 bit offset jump because it's slower (requires data size
376 prefix), and doesn't work, unless the destination is in the bottom
377 64k of the code segment (The top 16 bits of eip are zeroed). */
378
379 const relax_typeS md_relax_table[] =
380 {
381 /* The fields are:
382 1) most positive reach of this state,
383 2) most negative reach of this state,
384 3) how many bytes this mode will have in the variable part of the frag
385 4) which index into the table to try if we can't fit into this one. */
386
387 /* UNCOND_JUMP states. */
388 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
389 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
390 /* dword jmp adds 4 bytes to frag:
391 0 extra opcode bytes, 4 displacement bytes. */
392 {0, 0, 4, 0},
393 /* word jmp adds 2 byte2 to frag:
394 0 extra opcode bytes, 2 displacement bytes. */
395 {0, 0, 2, 0},
396
397 /* COND_JUMP states. */
398 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
399 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
400 /* dword conditionals adds 5 bytes to frag:
401 1 extra opcode byte, 4 displacement bytes. */
402 {0, 0, 5, 0},
403 /* word conditionals add 3 bytes to frag:
404 1 extra opcode byte, 2 displacement bytes. */
405 {0, 0, 3, 0},
406
407 /* COND_JUMP86 states. */
408 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
409 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
410 /* dword conditionals adds 5 bytes to frag:
411 1 extra opcode byte, 4 displacement bytes. */
412 {0, 0, 5, 0},
413 /* word conditionals add 4 bytes to frag:
414 1 displacement byte and a 3 byte long branch insn. */
415 {0, 0, 4, 0}
416 };
417
418 static const arch_entry cpu_arch[] = {
419 {"i8086", Cpu086 },
420 {"i186", Cpu086|Cpu186 },
421 {"i286", Cpu086|Cpu186|Cpu286 },
422 {"i386", Cpu086|Cpu186|Cpu286|Cpu386 },
423 {"i486", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486 },
424 {"i586", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586 },
425 {"i686", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686 },
426 {"pentium", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586 },
427 {"pentiumpro",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686 },
428 {"pentiumii", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuMMX },
429 {"pentiumiii",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuMMX|CpuMMX2|CpuSSE },
430 {"pentium4", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuMMX|CpuMMX2|CpuSSE|CpuSSE2 },
431 {"prescott", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuMMX|CpuMMX2|CpuSSE|CpuSSE2|CpuPNI },
432 {"k6", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|CpuK6|CpuMMX },
433 {"k6_2", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|CpuK6|CpuMMX|Cpu3dnow },
434 {"athlon", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA },
435 {"sledgehammer",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuSledgehammer|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA|CpuSSE|CpuSSE2 },
436 {"opteron", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuSledgehammer|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA|CpuSSE|CpuSSE2 },
437 {".mmx", CpuMMX },
438 {".sse", CpuMMX|CpuMMX2|CpuSSE },
439 {".sse2", CpuMMX|CpuMMX2|CpuSSE|CpuSSE2 },
440 {".sse3", CpuMMX|CpuMMX2|CpuSSE|CpuSSE2|CpuSSE3 },
441 {".3dnow", CpuMMX|Cpu3dnow },
442 {".3dnowa", CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA },
443 {".padlock", CpuPadLock },
444 {".pacifica", CpuSVME },
445 {".svme", CpuSVME },
446 {NULL, 0 }
447 };
448
449 const pseudo_typeS md_pseudo_table[] =
450 {
451 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
452 {"align", s_align_bytes, 0},
453 #else
454 {"align", s_align_ptwo, 0},
455 #endif
456 {"arch", set_cpu_arch, 0},
457 #ifndef I386COFF
458 {"bss", s_bss, 0},
459 #endif
460 {"ffloat", float_cons, 'f'},
461 {"dfloat", float_cons, 'd'},
462 {"tfloat", float_cons, 'x'},
463 {"value", cons, 2},
464 {"slong", signed_cons, 4},
465 {"noopt", s_ignore, 0},
466 {"optim", s_ignore, 0},
467 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
468 {"code16", set_code_flag, CODE_16BIT},
469 {"code32", set_code_flag, CODE_32BIT},
470 {"code64", set_code_flag, CODE_64BIT},
471 {"intel_syntax", set_intel_syntax, 1},
472 {"att_syntax", set_intel_syntax, 0},
473 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
474 {"largecomm", handle_large_common, 0},
475 #else
476 {"file", (void (*) PARAMS ((int))) dwarf2_directive_file, 0},
477 {"loc", dwarf2_directive_loc, 0},
478 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
479 #endif
480 #ifdef TE_PE
481 {"secrel32", pe_directive_secrel, 0},
482 #endif
483 {0, 0, 0}
484 };
485
486 /* For interface with expression (). */
487 extern char *input_line_pointer;
488
489 /* Hash table for instruction mnemonic lookup. */
490 static struct hash_control *op_hash;
491
492 /* Hash table for register lookup. */
493 static struct hash_control *reg_hash;
494 \f
495 void
496 i386_align_code (fragP, count)
497 fragS *fragP;
498 int count;
499 {
500 /* Various efficient no-op patterns for aligning code labels.
501 Note: Don't try to assemble the instructions in the comments.
502 0L and 0w are not legal. */
503 static const char f32_1[] =
504 {0x90}; /* nop */
505 static const char f32_2[] =
506 {0x89,0xf6}; /* movl %esi,%esi */
507 static const char f32_3[] =
508 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
509 static const char f32_4[] =
510 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
511 static const char f32_5[] =
512 {0x90, /* nop */
513 0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
514 static const char f32_6[] =
515 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
516 static const char f32_7[] =
517 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
518 static const char f32_8[] =
519 {0x90, /* nop */
520 0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
521 static const char f32_9[] =
522 {0x89,0xf6, /* movl %esi,%esi */
523 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
524 static const char f32_10[] =
525 {0x8d,0x76,0x00, /* leal 0(%esi),%esi */
526 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
527 static const char f32_11[] =
528 {0x8d,0x74,0x26,0x00, /* leal 0(%esi,1),%esi */
529 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
530 static const char f32_12[] =
531 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
532 0x8d,0xbf,0x00,0x00,0x00,0x00}; /* leal 0L(%edi),%edi */
533 static const char f32_13[] =
534 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
535 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
536 static const char f32_14[] =
537 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00, /* leal 0L(%esi,1),%esi */
538 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
539 static const char f32_15[] =
540 {0xeb,0x0d,0x90,0x90,0x90,0x90,0x90, /* jmp .+15; lotsa nops */
541 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
542 static const char f16_3[] =
543 {0x8d,0x74,0x00}; /* lea 0(%esi),%esi */
544 static const char f16_4[] =
545 {0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
546 static const char f16_5[] =
547 {0x90, /* nop */
548 0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
549 static const char f16_6[] =
550 {0x89,0xf6, /* mov %si,%si */
551 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
552 static const char f16_7[] =
553 {0x8d,0x74,0x00, /* lea 0(%si),%si */
554 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
555 static const char f16_8[] =
556 {0x8d,0xb4,0x00,0x00, /* lea 0w(%si),%si */
557 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
558 static const char *const f32_patt[] = {
559 f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
560 f32_9, f32_10, f32_11, f32_12, f32_13, f32_14, f32_15
561 };
562 static const char *const f16_patt[] = {
563 f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8,
564 f32_15, f32_15, f32_15, f32_15, f32_15, f32_15, f32_15
565 };
566
567 if (count <= 0 || count > 15)
568 return;
569
570 /* The recommended way to pad 64bit code is to use NOPs preceded by
571 maximally four 0x66 prefixes. Balance the size of nops. */
572 if (flag_code == CODE_64BIT)
573 {
574 int i;
575 int nnops = (count + 3) / 4;
576 int len = count / nnops;
577 int remains = count - nnops * len;
578 int pos = 0;
579
580 for (i = 0; i < remains; i++)
581 {
582 memset (fragP->fr_literal + fragP->fr_fix + pos, 0x66, len);
583 fragP->fr_literal[fragP->fr_fix + pos + len] = 0x90;
584 pos += len + 1;
585 }
586 for (; i < nnops; i++)
587 {
588 memset (fragP->fr_literal + fragP->fr_fix + pos, 0x66, len - 1);
589 fragP->fr_literal[fragP->fr_fix + pos + len - 1] = 0x90;
590 pos += len;
591 }
592 }
593 else
594 if (flag_code == CODE_16BIT)
595 {
596 memcpy (fragP->fr_literal + fragP->fr_fix,
597 f16_patt[count - 1], count);
598 if (count > 8)
599 /* Adjust jump offset. */
600 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
601 }
602 else
603 memcpy (fragP->fr_literal + fragP->fr_fix,
604 f32_patt[count - 1], count);
605 fragP->fr_var = count;
606 }
607
608 static INLINE unsigned int
609 mode_from_disp_size (t)
610 unsigned int t;
611 {
612 return (t & Disp8) ? 1 : (t & (Disp16 | Disp32 | Disp32S)) ? 2 : 0;
613 }
614
615 static INLINE int
616 fits_in_signed_byte (num)
617 offsetT num;
618 {
619 return (num >= -128) && (num <= 127);
620 }
621
622 static INLINE int
623 fits_in_unsigned_byte (num)
624 offsetT num;
625 {
626 return (num & 0xff) == num;
627 }
628
629 static INLINE int
630 fits_in_unsigned_word (num)
631 offsetT num;
632 {
633 return (num & 0xffff) == num;
634 }
635
636 static INLINE int
637 fits_in_signed_word (num)
638 offsetT num;
639 {
640 return (-32768 <= num) && (num <= 32767);
641 }
642 static INLINE int
643 fits_in_signed_long (num)
644 offsetT num ATTRIBUTE_UNUSED;
645 {
646 #ifndef BFD64
647 return 1;
648 #else
649 return (!(((offsetT) -1 << 31) & num)
650 || (((offsetT) -1 << 31) & num) == ((offsetT) -1 << 31));
651 #endif
652 } /* fits_in_signed_long() */
653 static INLINE int
654 fits_in_unsigned_long (num)
655 offsetT num ATTRIBUTE_UNUSED;
656 {
657 #ifndef BFD64
658 return 1;
659 #else
660 return (num & (((offsetT) 2 << 31) - 1)) == num;
661 #endif
662 } /* fits_in_unsigned_long() */
663
664 static int
665 smallest_imm_type (num)
666 offsetT num;
667 {
668 if (cpu_arch_flags != (Cpu086 | Cpu186 | Cpu286 | Cpu386 | Cpu486 | CpuNo64))
669 {
670 /* This code is disabled on the 486 because all the Imm1 forms
671 in the opcode table are slower on the i486. They're the
672 versions with the implicitly specified single-position
673 displacement, which has another syntax if you really want to
674 use that form. */
675 if (num == 1)
676 return Imm1 | Imm8 | Imm8S | Imm16 | Imm32 | Imm32S | Imm64;
677 }
678 return (fits_in_signed_byte (num)
679 ? (Imm8S | Imm8 | Imm16 | Imm32 | Imm32S | Imm64)
680 : fits_in_unsigned_byte (num)
681 ? (Imm8 | Imm16 | Imm32 | Imm32S | Imm64)
682 : (fits_in_signed_word (num) || fits_in_unsigned_word (num))
683 ? (Imm16 | Imm32 | Imm32S | Imm64)
684 : fits_in_signed_long (num)
685 ? (Imm32 | Imm32S | Imm64)
686 : fits_in_unsigned_long (num)
687 ? (Imm32 | Imm64)
688 : Imm64);
689 }
690
691 static offsetT
692 offset_in_range (val, size)
693 offsetT val;
694 int size;
695 {
696 addressT mask;
697
698 switch (size)
699 {
700 case 1: mask = ((addressT) 1 << 8) - 1; break;
701 case 2: mask = ((addressT) 1 << 16) - 1; break;
702 case 4: mask = ((addressT) 2 << 31) - 1; break;
703 #ifdef BFD64
704 case 8: mask = ((addressT) 2 << 63) - 1; break;
705 #endif
706 default: abort ();
707 }
708
709 /* If BFD64, sign extend val. */
710 if (!use_rela_relocations)
711 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
712 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
713
714 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
715 {
716 char buf1[40], buf2[40];
717
718 sprint_value (buf1, val);
719 sprint_value (buf2, val & mask);
720 as_warn (_("%s shortened to %s"), buf1, buf2);
721 }
722 return val & mask;
723 }
724
725 /* Returns 0 if attempting to add a prefix where one from the same
726 class already exists, 1 if non rep/repne added, 2 if rep/repne
727 added. */
728 static int
729 add_prefix (prefix)
730 unsigned int prefix;
731 {
732 int ret = 1;
733 unsigned int q;
734
735 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
736 && flag_code == CODE_64BIT)
737 {
738 if ((i.prefix[REX_PREFIX] & prefix & REX_MODE64)
739 || ((i.prefix[REX_PREFIX] & (REX_EXTX | REX_EXTY | REX_EXTZ))
740 && (prefix & (REX_EXTX | REX_EXTY | REX_EXTZ))))
741 ret = 0;
742 q = REX_PREFIX;
743 }
744 else
745 {
746 switch (prefix)
747 {
748 default:
749 abort ();
750
751 case CS_PREFIX_OPCODE:
752 case DS_PREFIX_OPCODE:
753 case ES_PREFIX_OPCODE:
754 case FS_PREFIX_OPCODE:
755 case GS_PREFIX_OPCODE:
756 case SS_PREFIX_OPCODE:
757 q = SEG_PREFIX;
758 break;
759
760 case REPNE_PREFIX_OPCODE:
761 case REPE_PREFIX_OPCODE:
762 ret = 2;
763 /* fall thru */
764 case LOCK_PREFIX_OPCODE:
765 q = LOCKREP_PREFIX;
766 break;
767
768 case FWAIT_OPCODE:
769 q = WAIT_PREFIX;
770 break;
771
772 case ADDR_PREFIX_OPCODE:
773 q = ADDR_PREFIX;
774 break;
775
776 case DATA_PREFIX_OPCODE:
777 q = DATA_PREFIX;
778 break;
779 }
780 if (i.prefix[q] != 0)
781 ret = 0;
782 }
783
784 if (ret)
785 {
786 if (!i.prefix[q])
787 ++i.prefixes;
788 i.prefix[q] |= prefix;
789 }
790 else
791 as_bad (_("same type of prefix used twice"));
792
793 return ret;
794 }
795
796 static void
797 set_code_flag (value)
798 int value;
799 {
800 flag_code = value;
801 cpu_arch_flags &= ~(Cpu64 | CpuNo64);
802 cpu_arch_flags |= (flag_code == CODE_64BIT ? Cpu64 : CpuNo64);
803 if (value == CODE_64BIT && !(cpu_arch_flags & CpuSledgehammer))
804 {
805 as_bad (_("64bit mode not supported on this CPU."));
806 }
807 if (value == CODE_32BIT && !(cpu_arch_flags & Cpu386))
808 {
809 as_bad (_("32bit mode not supported on this CPU."));
810 }
811 stackop_size = '\0';
812 }
813
814 static void
815 set_16bit_gcc_code_flag (new_code_flag)
816 int new_code_flag;
817 {
818 flag_code = new_code_flag;
819 cpu_arch_flags &= ~(Cpu64 | CpuNo64);
820 cpu_arch_flags |= (flag_code == CODE_64BIT ? Cpu64 : CpuNo64);
821 stackop_size = LONG_MNEM_SUFFIX;
822 }
823
824 static void
825 set_intel_syntax (syntax_flag)
826 int syntax_flag;
827 {
828 /* Find out if register prefixing is specified. */
829 int ask_naked_reg = 0;
830
831 SKIP_WHITESPACE ();
832 if (!is_end_of_line[(unsigned char) *input_line_pointer])
833 {
834 char *string = input_line_pointer;
835 int e = get_symbol_end ();
836
837 if (strcmp (string, "prefix") == 0)
838 ask_naked_reg = 1;
839 else if (strcmp (string, "noprefix") == 0)
840 ask_naked_reg = -1;
841 else
842 as_bad (_("bad argument to syntax directive."));
843 *input_line_pointer = e;
844 }
845 demand_empty_rest_of_line ();
846
847 intel_syntax = syntax_flag;
848
849 if (ask_naked_reg == 0)
850 allow_naked_reg = (intel_syntax
851 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
852 else
853 allow_naked_reg = (ask_naked_reg < 0);
854
855 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
856 identifier_chars['$'] = intel_syntax ? '$' : 0;
857 }
858
859 static void
860 set_cpu_arch (dummy)
861 int dummy ATTRIBUTE_UNUSED;
862 {
863 SKIP_WHITESPACE ();
864
865 if (!is_end_of_line[(unsigned char) *input_line_pointer])
866 {
867 char *string = input_line_pointer;
868 int e = get_symbol_end ();
869 int i;
870
871 for (i = 0; cpu_arch[i].name; i++)
872 {
873 if (strcmp (string, cpu_arch[i].name) == 0)
874 {
875 if (*string != '.')
876 {
877 cpu_arch_name = cpu_arch[i].name;
878 cpu_sub_arch_name = NULL;
879 cpu_arch_flags = (cpu_arch[i].flags
880 | (flag_code == CODE_64BIT ? Cpu64 : CpuNo64));
881 break;
882 }
883 if ((cpu_arch_flags | cpu_arch[i].flags) != cpu_arch_flags)
884 {
885 cpu_sub_arch_name = cpu_arch[i].name;
886 cpu_arch_flags |= cpu_arch[i].flags;
887 }
888 *input_line_pointer = e;
889 demand_empty_rest_of_line ();
890 return;
891 }
892 }
893 if (!cpu_arch[i].name)
894 as_bad (_("no such architecture: `%s'"), string);
895
896 *input_line_pointer = e;
897 }
898 else
899 as_bad (_("missing cpu architecture"));
900
901 no_cond_jump_promotion = 0;
902 if (*input_line_pointer == ','
903 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
904 {
905 char *string = ++input_line_pointer;
906 int e = get_symbol_end ();
907
908 if (strcmp (string, "nojumps") == 0)
909 no_cond_jump_promotion = 1;
910 else if (strcmp (string, "jumps") == 0)
911 ;
912 else
913 as_bad (_("no such architecture modifier: `%s'"), string);
914
915 *input_line_pointer = e;
916 }
917
918 demand_empty_rest_of_line ();
919 }
920
921 unsigned long
922 i386_mach ()
923 {
924 if (!strcmp (default_arch, "x86_64"))
925 return bfd_mach_x86_64;
926 else if (!strcmp (default_arch, "i386"))
927 return bfd_mach_i386_i386;
928 else
929 as_fatal (_("Unknown architecture"));
930 }
931 \f
932 void
933 md_begin ()
934 {
935 const char *hash_err;
936
937 /* Initialize op_hash hash table. */
938 op_hash = hash_new ();
939
940 {
941 const template *optab;
942 templates *core_optab;
943
944 /* Setup for loop. */
945 optab = i386_optab;
946 core_optab = (templates *) xmalloc (sizeof (templates));
947 core_optab->start = optab;
948
949 while (1)
950 {
951 ++optab;
952 if (optab->name == NULL
953 || strcmp (optab->name, (optab - 1)->name) != 0)
954 {
955 /* different name --> ship out current template list;
956 add to hash table; & begin anew. */
957 core_optab->end = optab;
958 hash_err = hash_insert (op_hash,
959 (optab - 1)->name,
960 (PTR) core_optab);
961 if (hash_err)
962 {
963 as_fatal (_("Internal Error: Can't hash %s: %s"),
964 (optab - 1)->name,
965 hash_err);
966 }
967 if (optab->name == NULL)
968 break;
969 core_optab = (templates *) xmalloc (sizeof (templates));
970 core_optab->start = optab;
971 }
972 }
973 }
974
975 /* Initialize reg_hash hash table. */
976 reg_hash = hash_new ();
977 {
978 const reg_entry *regtab;
979
980 for (regtab = i386_regtab;
981 regtab < i386_regtab + sizeof (i386_regtab) / sizeof (i386_regtab[0]);
982 regtab++)
983 {
984 hash_err = hash_insert (reg_hash, regtab->reg_name, (PTR) regtab);
985 if (hash_err)
986 as_fatal (_("Internal Error: Can't hash %s: %s"),
987 regtab->reg_name,
988 hash_err);
989 }
990 }
991
992 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
993 {
994 int c;
995 char *p;
996
997 for (c = 0; c < 256; c++)
998 {
999 if (ISDIGIT (c))
1000 {
1001 digit_chars[c] = c;
1002 mnemonic_chars[c] = c;
1003 register_chars[c] = c;
1004 operand_chars[c] = c;
1005 }
1006 else if (ISLOWER (c))
1007 {
1008 mnemonic_chars[c] = c;
1009 register_chars[c] = c;
1010 operand_chars[c] = c;
1011 }
1012 else if (ISUPPER (c))
1013 {
1014 mnemonic_chars[c] = TOLOWER (c);
1015 register_chars[c] = mnemonic_chars[c];
1016 operand_chars[c] = c;
1017 }
1018
1019 if (ISALPHA (c) || ISDIGIT (c))
1020 identifier_chars[c] = c;
1021 else if (c >= 128)
1022 {
1023 identifier_chars[c] = c;
1024 operand_chars[c] = c;
1025 }
1026 }
1027
1028 #ifdef LEX_AT
1029 identifier_chars['@'] = '@';
1030 #endif
1031 #ifdef LEX_QM
1032 identifier_chars['?'] = '?';
1033 operand_chars['?'] = '?';
1034 #endif
1035 digit_chars['-'] = '-';
1036 mnemonic_chars['-'] = '-';
1037 identifier_chars['_'] = '_';
1038 identifier_chars['.'] = '.';
1039
1040 for (p = operand_special_chars; *p != '\0'; p++)
1041 operand_chars[(unsigned char) *p] = *p;
1042 }
1043
1044 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1045 if (IS_ELF)
1046 {
1047 record_alignment (text_section, 2);
1048 record_alignment (data_section, 2);
1049 record_alignment (bss_section, 2);
1050 }
1051 #endif
1052
1053 if (flag_code == CODE_64BIT)
1054 {
1055 x86_dwarf2_return_column = 16;
1056 x86_cie_data_alignment = -8;
1057 }
1058 else
1059 {
1060 x86_dwarf2_return_column = 8;
1061 x86_cie_data_alignment = -4;
1062 }
1063 }
1064
1065 void
1066 i386_print_statistics (file)
1067 FILE *file;
1068 {
1069 hash_print_statistics (file, "i386 opcode", op_hash);
1070 hash_print_statistics (file, "i386 register", reg_hash);
1071 }
1072 \f
1073 #ifdef DEBUG386
1074
1075 /* Debugging routines for md_assemble. */
1076 static void pi PARAMS ((char *, i386_insn *));
1077 static void pte PARAMS ((template *));
1078 static void pt PARAMS ((unsigned int));
1079 static void pe PARAMS ((expressionS *));
1080 static void ps PARAMS ((symbolS *));
1081
1082 static void
1083 pi (line, x)
1084 char *line;
1085 i386_insn *x;
1086 {
1087 unsigned int i;
1088
1089 fprintf (stdout, "%s: template ", line);
1090 pte (&x->tm);
1091 fprintf (stdout, " address: base %s index %s scale %x\n",
1092 x->base_reg ? x->base_reg->reg_name : "none",
1093 x->index_reg ? x->index_reg->reg_name : "none",
1094 x->log2_scale_factor);
1095 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
1096 x->rm.mode, x->rm.reg, x->rm.regmem);
1097 fprintf (stdout, " sib: base %x index %x scale %x\n",
1098 x->sib.base, x->sib.index, x->sib.scale);
1099 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
1100 (x->rex & REX_MODE64) != 0,
1101 (x->rex & REX_EXTX) != 0,
1102 (x->rex & REX_EXTY) != 0,
1103 (x->rex & REX_EXTZ) != 0);
1104 for (i = 0; i < x->operands; i++)
1105 {
1106 fprintf (stdout, " #%d: ", i + 1);
1107 pt (x->types[i]);
1108 fprintf (stdout, "\n");
1109 if (x->types[i]
1110 & (Reg | SReg2 | SReg3 | Control | Debug | Test | RegMMX | RegXMM))
1111 fprintf (stdout, "%s\n", x->op[i].regs->reg_name);
1112 if (x->types[i] & Imm)
1113 pe (x->op[i].imms);
1114 if (x->types[i] & Disp)
1115 pe (x->op[i].disps);
1116 }
1117 }
1118
1119 static void
1120 pte (t)
1121 template *t;
1122 {
1123 unsigned int i;
1124 fprintf (stdout, " %d operands ", t->operands);
1125 fprintf (stdout, "opcode %x ", t->base_opcode);
1126 if (t->extension_opcode != None)
1127 fprintf (stdout, "ext %x ", t->extension_opcode);
1128 if (t->opcode_modifier & D)
1129 fprintf (stdout, "D");
1130 if (t->opcode_modifier & W)
1131 fprintf (stdout, "W");
1132 fprintf (stdout, "\n");
1133 for (i = 0; i < t->operands; i++)
1134 {
1135 fprintf (stdout, " #%d type ", i + 1);
1136 pt (t->operand_types[i]);
1137 fprintf (stdout, "\n");
1138 }
1139 }
1140
1141 static void
1142 pe (e)
1143 expressionS *e;
1144 {
1145 fprintf (stdout, " operation %d\n", e->X_op);
1146 fprintf (stdout, " add_number %ld (%lx)\n",
1147 (long) e->X_add_number, (long) e->X_add_number);
1148 if (e->X_add_symbol)
1149 {
1150 fprintf (stdout, " add_symbol ");
1151 ps (e->X_add_symbol);
1152 fprintf (stdout, "\n");
1153 }
1154 if (e->X_op_symbol)
1155 {
1156 fprintf (stdout, " op_symbol ");
1157 ps (e->X_op_symbol);
1158 fprintf (stdout, "\n");
1159 }
1160 }
1161
1162 static void
1163 ps (s)
1164 symbolS *s;
1165 {
1166 fprintf (stdout, "%s type %s%s",
1167 S_GET_NAME (s),
1168 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
1169 segment_name (S_GET_SEGMENT (s)));
1170 }
1171
1172 struct type_name
1173 {
1174 unsigned int mask;
1175 char *tname;
1176 }
1177
1178 static const type_names[] =
1179 {
1180 { Reg8, "r8" },
1181 { Reg16, "r16" },
1182 { Reg32, "r32" },
1183 { Reg64, "r64" },
1184 { Imm8, "i8" },
1185 { Imm8S, "i8s" },
1186 { Imm16, "i16" },
1187 { Imm32, "i32" },
1188 { Imm32S, "i32s" },
1189 { Imm64, "i64" },
1190 { Imm1, "i1" },
1191 { BaseIndex, "BaseIndex" },
1192 { Disp8, "d8" },
1193 { Disp16, "d16" },
1194 { Disp32, "d32" },
1195 { Disp32S, "d32s" },
1196 { Disp64, "d64" },
1197 { InOutPortReg, "InOutPortReg" },
1198 { ShiftCount, "ShiftCount" },
1199 { Control, "control reg" },
1200 { Test, "test reg" },
1201 { Debug, "debug reg" },
1202 { FloatReg, "FReg" },
1203 { FloatAcc, "FAcc" },
1204 { SReg2, "SReg2" },
1205 { SReg3, "SReg3" },
1206 { Acc, "Acc" },
1207 { JumpAbsolute, "Jump Absolute" },
1208 { RegMMX, "rMMX" },
1209 { RegXMM, "rXMM" },
1210 { EsSeg, "es" },
1211 { 0, "" }
1212 };
1213
1214 static void
1215 pt (t)
1216 unsigned int t;
1217 {
1218 const struct type_name *ty;
1219
1220 for (ty = type_names; ty->mask; ty++)
1221 if (t & ty->mask)
1222 fprintf (stdout, "%s, ", ty->tname);
1223 fflush (stdout);
1224 }
1225
1226 #endif /* DEBUG386 */
1227 \f
1228 static bfd_reloc_code_real_type
1229 reloc (unsigned int size,
1230 int pcrel,
1231 int sign,
1232 bfd_reloc_code_real_type other)
1233 {
1234 if (other != NO_RELOC)
1235 {
1236 reloc_howto_type *reloc;
1237
1238 if (size == 8)
1239 switch (other)
1240 {
1241 case BFD_RELOC_X86_64_TPOFF32:
1242 other = BFD_RELOC_X86_64_TPOFF64;
1243 break;
1244 case BFD_RELOC_X86_64_DTPOFF32:
1245 other = BFD_RELOC_X86_64_DTPOFF64;
1246 break;
1247 default:
1248 break;
1249 }
1250
1251 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
1252 if (size == 4 && flag_code != CODE_64BIT)
1253 sign = -1;
1254
1255 reloc = bfd_reloc_type_lookup (stdoutput, other);
1256 if (!reloc)
1257 as_bad (_("unknown relocation (%u)"), other);
1258 else if (size != bfd_get_reloc_size (reloc))
1259 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
1260 bfd_get_reloc_size (reloc),
1261 size);
1262 else if (pcrel && !reloc->pc_relative)
1263 as_bad (_("non-pc-relative relocation for pc-relative field"));
1264 else if ((reloc->complain_on_overflow == complain_overflow_signed
1265 && !sign)
1266 || (reloc->complain_on_overflow == complain_overflow_unsigned
1267 && sign > 0))
1268 as_bad (_("relocated field and relocation type differ in signedness"));
1269 else
1270 return other;
1271 return NO_RELOC;
1272 }
1273
1274 if (pcrel)
1275 {
1276 if (!sign)
1277 as_bad (_("there are no unsigned pc-relative relocations"));
1278 switch (size)
1279 {
1280 case 1: return BFD_RELOC_8_PCREL;
1281 case 2: return BFD_RELOC_16_PCREL;
1282 case 4: return BFD_RELOC_32_PCREL;
1283 case 8: return BFD_RELOC_64_PCREL;
1284 }
1285 as_bad (_("cannot do %u byte pc-relative relocation"), size);
1286 }
1287 else
1288 {
1289 if (sign > 0)
1290 switch (size)
1291 {
1292 case 4: return BFD_RELOC_X86_64_32S;
1293 }
1294 else
1295 switch (size)
1296 {
1297 case 1: return BFD_RELOC_8;
1298 case 2: return BFD_RELOC_16;
1299 case 4: return BFD_RELOC_32;
1300 case 8: return BFD_RELOC_64;
1301 }
1302 as_bad (_("cannot do %s %u byte relocation"),
1303 sign > 0 ? "signed" : "unsigned", size);
1304 }
1305
1306 abort ();
1307 return BFD_RELOC_NONE;
1308 }
1309
1310 /* Here we decide which fixups can be adjusted to make them relative to
1311 the beginning of the section instead of the symbol. Basically we need
1312 to make sure that the dynamic relocations are done correctly, so in
1313 some cases we force the original symbol to be used. */
1314
1315 int
1316 tc_i386_fix_adjustable (fixP)
1317 fixS *fixP ATTRIBUTE_UNUSED;
1318 {
1319 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1320 if (!IS_ELF)
1321 return 1;
1322
1323 /* Don't adjust pc-relative references to merge sections in 64-bit
1324 mode. */
1325 if (use_rela_relocations
1326 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
1327 && fixP->fx_pcrel)
1328 return 0;
1329
1330 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
1331 and changed later by validate_fix. */
1332 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
1333 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
1334 return 0;
1335
1336 /* adjust_reloc_syms doesn't know about the GOT. */
1337 if (fixP->fx_r_type == BFD_RELOC_386_GOTOFF
1338 || fixP->fx_r_type == BFD_RELOC_386_PLT32
1339 || fixP->fx_r_type == BFD_RELOC_386_GOT32
1340 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
1341 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
1342 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
1343 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
1344 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
1345 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
1346 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
1347 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
1348 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
1349 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
1350 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
1351 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
1352 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
1353 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
1354 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
1355 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
1356 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
1357 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
1358 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
1359 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
1360 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
1361 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
1362 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
1363 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
1364 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
1365 return 0;
1366 #endif
1367 return 1;
1368 }
1369
1370 static int intel_float_operand PARAMS ((const char *mnemonic));
1371
1372 static int
1373 intel_float_operand (mnemonic)
1374 const char *mnemonic;
1375 {
1376 /* Note that the value returned is meaningful only for opcodes with (memory)
1377 operands, hence the code here is free to improperly handle opcodes that
1378 have no operands (for better performance and smaller code). */
1379
1380 if (mnemonic[0] != 'f')
1381 return 0; /* non-math */
1382
1383 switch (mnemonic[1])
1384 {
1385 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
1386 the fs segment override prefix not currently handled because no
1387 call path can make opcodes without operands get here */
1388 case 'i':
1389 return 2 /* integer op */;
1390 case 'l':
1391 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
1392 return 3; /* fldcw/fldenv */
1393 break;
1394 case 'n':
1395 if (mnemonic[2] != 'o' /* fnop */)
1396 return 3; /* non-waiting control op */
1397 break;
1398 case 'r':
1399 if (mnemonic[2] == 's')
1400 return 3; /* frstor/frstpm */
1401 break;
1402 case 's':
1403 if (mnemonic[2] == 'a')
1404 return 3; /* fsave */
1405 if (mnemonic[2] == 't')
1406 {
1407 switch (mnemonic[3])
1408 {
1409 case 'c': /* fstcw */
1410 case 'd': /* fstdw */
1411 case 'e': /* fstenv */
1412 case 's': /* fsts[gw] */
1413 return 3;
1414 }
1415 }
1416 break;
1417 case 'x':
1418 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
1419 return 0; /* fxsave/fxrstor are not really math ops */
1420 break;
1421 }
1422
1423 return 1;
1424 }
1425
1426 /* This is the guts of the machine-dependent assembler. LINE points to a
1427 machine dependent instruction. This function is supposed to emit
1428 the frags/bytes it assembles to. */
1429
1430 void
1431 md_assemble (line)
1432 char *line;
1433 {
1434 int j;
1435 char mnemonic[MAX_MNEM_SIZE];
1436
1437 /* Initialize globals. */
1438 memset (&i, '\0', sizeof (i));
1439 for (j = 0; j < MAX_OPERANDS; j++)
1440 i.reloc[j] = NO_RELOC;
1441 memset (disp_expressions, '\0', sizeof (disp_expressions));
1442 memset (im_expressions, '\0', sizeof (im_expressions));
1443 save_stack_p = save_stack;
1444
1445 /* First parse an instruction mnemonic & call i386_operand for the operands.
1446 We assume that the scrubber has arranged it so that line[0] is the valid
1447 start of a (possibly prefixed) mnemonic. */
1448
1449 line = parse_insn (line, mnemonic);
1450 if (line == NULL)
1451 return;
1452
1453 line = parse_operands (line, mnemonic);
1454 if (line == NULL)
1455 return;
1456
1457 /* Now we've parsed the mnemonic into a set of templates, and have the
1458 operands at hand. */
1459
1460 /* All intel opcodes have reversed operands except for "bound" and
1461 "enter". We also don't reverse intersegment "jmp" and "call"
1462 instructions with 2 immediate operands so that the immediate segment
1463 precedes the offset, as it does when in AT&T mode. "enter" and the
1464 intersegment "jmp" and "call" instructions are the only ones that
1465 have two immediate operands. */
1466 if (intel_syntax && i.operands > 1
1467 && (strcmp (mnemonic, "bound") != 0)
1468 && (strcmp (mnemonic, "invlpga") != 0)
1469 && !((i.types[0] & Imm) && (i.types[1] & Imm)))
1470 swap_operands ();
1471
1472 if (i.imm_operands)
1473 optimize_imm ();
1474
1475 /* Don't optimize displacement for movabs since it only takes 64bit
1476 displacement. */
1477 if (i.disp_operands
1478 && (flag_code != CODE_64BIT
1479 || strcmp (mnemonic, "movabs") != 0))
1480 optimize_disp ();
1481
1482 /* Next, we find a template that matches the given insn,
1483 making sure the overlap of the given operands types is consistent
1484 with the template operand types. */
1485
1486 if (!match_template ())
1487 return;
1488
1489 if (intel_syntax)
1490 {
1491 /* Undo SYSV386_COMPAT brokenness when in Intel mode. See i386.h */
1492 if (SYSV386_COMPAT
1493 && (i.tm.base_opcode & 0xfffffde0) == 0xdce0)
1494 i.tm.base_opcode ^= FloatR;
1495
1496 /* Zap movzx and movsx suffix. The suffix may have been set from
1497 "word ptr" or "byte ptr" on the source operand, but we'll use
1498 the suffix later to choose the destination register. */
1499 if ((i.tm.base_opcode & ~9) == 0x0fb6)
1500 {
1501 if (i.reg_operands < 2
1502 && !i.suffix
1503 && (~i.tm.opcode_modifier
1504 & (No_bSuf
1505 | No_wSuf
1506 | No_lSuf
1507 | No_sSuf
1508 | No_xSuf
1509 | No_qSuf)))
1510 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
1511
1512 i.suffix = 0;
1513 }
1514 }
1515
1516 if (i.tm.opcode_modifier & FWait)
1517 if (!add_prefix (FWAIT_OPCODE))
1518 return;
1519
1520 /* Check string instruction segment overrides. */
1521 if ((i.tm.opcode_modifier & IsString) != 0 && i.mem_operands != 0)
1522 {
1523 if (!check_string ())
1524 return;
1525 }
1526
1527 if (!process_suffix ())
1528 return;
1529
1530 /* Make still unresolved immediate matches conform to size of immediate
1531 given in i.suffix. */
1532 if (!finalize_imm ())
1533 return;
1534
1535 if (i.types[0] & Imm1)
1536 i.imm_operands = 0; /* kludge for shift insns. */
1537 if (i.types[0] & ImplicitRegister)
1538 i.reg_operands--;
1539 if (i.types[1] & ImplicitRegister)
1540 i.reg_operands--;
1541 if (i.types[2] & ImplicitRegister)
1542 i.reg_operands--;
1543
1544 if (i.tm.opcode_modifier & ImmExt)
1545 {
1546 expressionS *exp;
1547
1548 if ((i.tm.cpu_flags & CpuPNI) && i.operands > 0)
1549 {
1550 /* These Intel Prescott New Instructions have the fixed
1551 operands with an opcode suffix which is coded in the same
1552 place as an 8-bit immediate field would be. Here we check
1553 those operands and remove them afterwards. */
1554 unsigned int x;
1555
1556 for (x = 0; x < i.operands; x++)
1557 if (i.op[x].regs->reg_num != x)
1558 as_bad (_("can't use register '%%%s' as operand %d in '%s'."),
1559 i.op[x].regs->reg_name, x + 1, i.tm.name);
1560 i.operands = 0;
1561 }
1562
1563 /* These AMD 3DNow! and Intel Katmai New Instructions have an
1564 opcode suffix which is coded in the same place as an 8-bit
1565 immediate field would be. Here we fake an 8-bit immediate
1566 operand from the opcode suffix stored in tm.extension_opcode. */
1567
1568 assert (i.imm_operands == 0 && i.operands <= 2 && 2 < MAX_OPERANDS);
1569
1570 exp = &im_expressions[i.imm_operands++];
1571 i.op[i.operands].imms = exp;
1572 i.types[i.operands++] = Imm8;
1573 exp->X_op = O_constant;
1574 exp->X_add_number = i.tm.extension_opcode;
1575 i.tm.extension_opcode = None;
1576 }
1577
1578 /* For insns with operands there are more diddles to do to the opcode. */
1579 if (i.operands)
1580 {
1581 if (!process_operands ())
1582 return;
1583 }
1584 else if (!quiet_warnings && (i.tm.opcode_modifier & Ugh) != 0)
1585 {
1586 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
1587 as_warn (_("translating to `%sp'"), i.tm.name);
1588 }
1589
1590 /* Handle conversion of 'int $3' --> special int3 insn. */
1591 if (i.tm.base_opcode == INT_OPCODE && i.op[0].imms->X_add_number == 3)
1592 {
1593 i.tm.base_opcode = INT3_OPCODE;
1594 i.imm_operands = 0;
1595 }
1596
1597 if ((i.tm.opcode_modifier & (Jump | JumpByte | JumpDword))
1598 && i.op[0].disps->X_op == O_constant)
1599 {
1600 /* Convert "jmp constant" (and "call constant") to a jump (call) to
1601 the absolute address given by the constant. Since ix86 jumps and
1602 calls are pc relative, we need to generate a reloc. */
1603 i.op[0].disps->X_add_symbol = &abs_symbol;
1604 i.op[0].disps->X_op = O_symbol;
1605 }
1606
1607 if ((i.tm.opcode_modifier & Rex64) != 0)
1608 i.rex |= REX_MODE64;
1609
1610 /* For 8 bit registers we need an empty rex prefix. Also if the
1611 instruction already has a prefix, we need to convert old
1612 registers to new ones. */
1613
1614 if (((i.types[0] & Reg8) != 0
1615 && (i.op[0].regs->reg_flags & RegRex64) != 0)
1616 || ((i.types[1] & Reg8) != 0
1617 && (i.op[1].regs->reg_flags & RegRex64) != 0)
1618 || (((i.types[0] & Reg8) != 0 || (i.types[1] & Reg8) != 0)
1619 && i.rex != 0))
1620 {
1621 int x;
1622
1623 i.rex |= REX_OPCODE;
1624 for (x = 0; x < 2; x++)
1625 {
1626 /* Look for 8 bit operand that uses old registers. */
1627 if ((i.types[x] & Reg8) != 0
1628 && (i.op[x].regs->reg_flags & RegRex64) == 0)
1629 {
1630 /* In case it is "hi" register, give up. */
1631 if (i.op[x].regs->reg_num > 3)
1632 as_bad (_("can't encode register '%%%s' in an instruction requiring REX prefix."),
1633 i.op[x].regs->reg_name);
1634
1635 /* Otherwise it is equivalent to the extended register.
1636 Since the encoding doesn't change this is merely
1637 cosmetic cleanup for debug output. */
1638
1639 i.op[x].regs = i.op[x].regs + 8;
1640 }
1641 }
1642 }
1643
1644 if (i.rex != 0)
1645 add_prefix (REX_OPCODE | i.rex);
1646
1647 /* We are ready to output the insn. */
1648 output_insn ();
1649 }
1650
1651 static char *
1652 parse_insn (line, mnemonic)
1653 char *line;
1654 char *mnemonic;
1655 {
1656 char *l = line;
1657 char *token_start = l;
1658 char *mnem_p;
1659 int supported;
1660 const template *t;
1661
1662 /* Non-zero if we found a prefix only acceptable with string insns. */
1663 const char *expecting_string_instruction = NULL;
1664
1665 while (1)
1666 {
1667 mnem_p = mnemonic;
1668 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
1669 {
1670 mnem_p++;
1671 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
1672 {
1673 as_bad (_("no such instruction: `%s'"), token_start);
1674 return NULL;
1675 }
1676 l++;
1677 }
1678 if (!is_space_char (*l)
1679 && *l != END_OF_INSN
1680 && (intel_syntax
1681 || (*l != PREFIX_SEPARATOR
1682 && *l != ',')))
1683 {
1684 as_bad (_("invalid character %s in mnemonic"),
1685 output_invalid (*l));
1686 return NULL;
1687 }
1688 if (token_start == l)
1689 {
1690 if (!intel_syntax && *l == PREFIX_SEPARATOR)
1691 as_bad (_("expecting prefix; got nothing"));
1692 else
1693 as_bad (_("expecting mnemonic; got nothing"));
1694 return NULL;
1695 }
1696
1697 /* Look up instruction (or prefix) via hash table. */
1698 current_templates = hash_find (op_hash, mnemonic);
1699
1700 if (*l != END_OF_INSN
1701 && (!is_space_char (*l) || l[1] != END_OF_INSN)
1702 && current_templates
1703 && (current_templates->start->opcode_modifier & IsPrefix))
1704 {
1705 if (current_templates->start->cpu_flags
1706 & (flag_code != CODE_64BIT ? Cpu64 : CpuNo64))
1707 {
1708 as_bad ((flag_code != CODE_64BIT
1709 ? _("`%s' is only supported in 64-bit mode")
1710 : _("`%s' is not supported in 64-bit mode")),
1711 current_templates->start->name);
1712 return NULL;
1713 }
1714 /* If we are in 16-bit mode, do not allow addr16 or data16.
1715 Similarly, in 32-bit mode, do not allow addr32 or data32. */
1716 if ((current_templates->start->opcode_modifier & (Size16 | Size32))
1717 && flag_code != CODE_64BIT
1718 && (((current_templates->start->opcode_modifier & Size32) != 0)
1719 ^ (flag_code == CODE_16BIT)))
1720 {
1721 as_bad (_("redundant %s prefix"),
1722 current_templates->start->name);
1723 return NULL;
1724 }
1725 /* Add prefix, checking for repeated prefixes. */
1726 switch (add_prefix (current_templates->start->base_opcode))
1727 {
1728 case 0:
1729 return NULL;
1730 case 2:
1731 expecting_string_instruction = current_templates->start->name;
1732 break;
1733 }
1734 /* Skip past PREFIX_SEPARATOR and reset token_start. */
1735 token_start = ++l;
1736 }
1737 else
1738 break;
1739 }
1740
1741 if (!current_templates)
1742 {
1743 /* See if we can get a match by trimming off a suffix. */
1744 switch (mnem_p[-1])
1745 {
1746 case WORD_MNEM_SUFFIX:
1747 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
1748 i.suffix = SHORT_MNEM_SUFFIX;
1749 else
1750 case BYTE_MNEM_SUFFIX:
1751 case QWORD_MNEM_SUFFIX:
1752 i.suffix = mnem_p[-1];
1753 mnem_p[-1] = '\0';
1754 current_templates = hash_find (op_hash, mnemonic);
1755 break;
1756 case SHORT_MNEM_SUFFIX:
1757 case LONG_MNEM_SUFFIX:
1758 if (!intel_syntax)
1759 {
1760 i.suffix = mnem_p[-1];
1761 mnem_p[-1] = '\0';
1762 current_templates = hash_find (op_hash, mnemonic);
1763 }
1764 break;
1765
1766 /* Intel Syntax. */
1767 case 'd':
1768 if (intel_syntax)
1769 {
1770 if (intel_float_operand (mnemonic) == 1)
1771 i.suffix = SHORT_MNEM_SUFFIX;
1772 else
1773 i.suffix = LONG_MNEM_SUFFIX;
1774 mnem_p[-1] = '\0';
1775 current_templates = hash_find (op_hash, mnemonic);
1776 }
1777 break;
1778 }
1779 if (!current_templates)
1780 {
1781 as_bad (_("no such instruction: `%s'"), token_start);
1782 return NULL;
1783 }
1784 }
1785
1786 if (current_templates->start->opcode_modifier & (Jump | JumpByte))
1787 {
1788 /* Check for a branch hint. We allow ",pt" and ",pn" for
1789 predict taken and predict not taken respectively.
1790 I'm not sure that branch hints actually do anything on loop
1791 and jcxz insns (JumpByte) for current Pentium4 chips. They
1792 may work in the future and it doesn't hurt to accept them
1793 now. */
1794 if (l[0] == ',' && l[1] == 'p')
1795 {
1796 if (l[2] == 't')
1797 {
1798 if (!add_prefix (DS_PREFIX_OPCODE))
1799 return NULL;
1800 l += 3;
1801 }
1802 else if (l[2] == 'n')
1803 {
1804 if (!add_prefix (CS_PREFIX_OPCODE))
1805 return NULL;
1806 l += 3;
1807 }
1808 }
1809 }
1810 /* Any other comma loses. */
1811 if (*l == ',')
1812 {
1813 as_bad (_("invalid character %s in mnemonic"),
1814 output_invalid (*l));
1815 return NULL;
1816 }
1817
1818 /* Check if instruction is supported on specified architecture. */
1819 supported = 0;
1820 for (t = current_templates->start; t < current_templates->end; ++t)
1821 {
1822 if (!((t->cpu_flags & ~(Cpu64 | CpuNo64))
1823 & ~(cpu_arch_flags & ~(Cpu64 | CpuNo64))))
1824 supported |= 1;
1825 if (!(t->cpu_flags & (flag_code == CODE_64BIT ? CpuNo64 : Cpu64)))
1826 supported |= 2;
1827 }
1828 if (!(supported & 2))
1829 {
1830 as_bad (flag_code == CODE_64BIT
1831 ? _("`%s' is not supported in 64-bit mode")
1832 : _("`%s' is only supported in 64-bit mode"),
1833 current_templates->start->name);
1834 return NULL;
1835 }
1836 if (!(supported & 1))
1837 {
1838 as_warn (_("`%s' is not supported on `%s%s'"),
1839 current_templates->start->name,
1840 cpu_arch_name,
1841 cpu_sub_arch_name ? cpu_sub_arch_name : "");
1842 }
1843 else if ((Cpu386 & ~cpu_arch_flags) && (flag_code != CODE_16BIT))
1844 {
1845 as_warn (_("use .code16 to ensure correct addressing mode"));
1846 }
1847
1848 /* Check for rep/repne without a string instruction. */
1849 if (expecting_string_instruction)
1850 {
1851 static templates override;
1852
1853 for (t = current_templates->start; t < current_templates->end; ++t)
1854 if (t->opcode_modifier & IsString)
1855 break;
1856 if (t >= current_templates->end)
1857 {
1858 as_bad (_("expecting string instruction after `%s'"),
1859 expecting_string_instruction);
1860 return NULL;
1861 }
1862 for (override.start = t; t < current_templates->end; ++t)
1863 if (!(t->opcode_modifier & IsString))
1864 break;
1865 override.end = t;
1866 current_templates = &override;
1867 }
1868
1869 return l;
1870 }
1871
1872 static char *
1873 parse_operands (l, mnemonic)
1874 char *l;
1875 const char *mnemonic;
1876 {
1877 char *token_start;
1878
1879 /* 1 if operand is pending after ','. */
1880 unsigned int expecting_operand = 0;
1881
1882 /* Non-zero if operand parens not balanced. */
1883 unsigned int paren_not_balanced;
1884
1885 while (*l != END_OF_INSN)
1886 {
1887 /* Skip optional white space before operand. */
1888 if (is_space_char (*l))
1889 ++l;
1890 if (!is_operand_char (*l) && *l != END_OF_INSN)
1891 {
1892 as_bad (_("invalid character %s before operand %d"),
1893 output_invalid (*l),
1894 i.operands + 1);
1895 return NULL;
1896 }
1897 token_start = l; /* after white space */
1898 paren_not_balanced = 0;
1899 while (paren_not_balanced || *l != ',')
1900 {
1901 if (*l == END_OF_INSN)
1902 {
1903 if (paren_not_balanced)
1904 {
1905 if (!intel_syntax)
1906 as_bad (_("unbalanced parenthesis in operand %d."),
1907 i.operands + 1);
1908 else
1909 as_bad (_("unbalanced brackets in operand %d."),
1910 i.operands + 1);
1911 return NULL;
1912 }
1913 else
1914 break; /* we are done */
1915 }
1916 else if (!is_operand_char (*l) && !is_space_char (*l))
1917 {
1918 as_bad (_("invalid character %s in operand %d"),
1919 output_invalid (*l),
1920 i.operands + 1);
1921 return NULL;
1922 }
1923 if (!intel_syntax)
1924 {
1925 if (*l == '(')
1926 ++paren_not_balanced;
1927 if (*l == ')')
1928 --paren_not_balanced;
1929 }
1930 else
1931 {
1932 if (*l == '[')
1933 ++paren_not_balanced;
1934 if (*l == ']')
1935 --paren_not_balanced;
1936 }
1937 l++;
1938 }
1939 if (l != token_start)
1940 { /* Yes, we've read in another operand. */
1941 unsigned int operand_ok;
1942 this_operand = i.operands++;
1943 if (i.operands > MAX_OPERANDS)
1944 {
1945 as_bad (_("spurious operands; (%d operands/instruction max)"),
1946 MAX_OPERANDS);
1947 return NULL;
1948 }
1949 /* Now parse operand adding info to 'i' as we go along. */
1950 END_STRING_AND_SAVE (l);
1951
1952 if (intel_syntax)
1953 operand_ok =
1954 i386_intel_operand (token_start,
1955 intel_float_operand (mnemonic));
1956 else
1957 operand_ok = i386_operand (token_start);
1958
1959 RESTORE_END_STRING (l);
1960 if (!operand_ok)
1961 return NULL;
1962 }
1963 else
1964 {
1965 if (expecting_operand)
1966 {
1967 expecting_operand_after_comma:
1968 as_bad (_("expecting operand after ','; got nothing"));
1969 return NULL;
1970 }
1971 if (*l == ',')
1972 {
1973 as_bad (_("expecting operand before ','; got nothing"));
1974 return NULL;
1975 }
1976 }
1977
1978 /* Now *l must be either ',' or END_OF_INSN. */
1979 if (*l == ',')
1980 {
1981 if (*++l == END_OF_INSN)
1982 {
1983 /* Just skip it, if it's \n complain. */
1984 goto expecting_operand_after_comma;
1985 }
1986 expecting_operand = 1;
1987 }
1988 }
1989 return l;
1990 }
1991
1992 static void
1993 swap_operands ()
1994 {
1995 union i386_op temp_op;
1996 unsigned int temp_type;
1997 enum bfd_reloc_code_real temp_reloc;
1998 int xchg1 = 0;
1999 int xchg2 = 0;
2000
2001 if (i.operands == 2)
2002 {
2003 xchg1 = 0;
2004 xchg2 = 1;
2005 }
2006 else if (i.operands == 3)
2007 {
2008 xchg1 = 0;
2009 xchg2 = 2;
2010 }
2011 temp_type = i.types[xchg2];
2012 i.types[xchg2] = i.types[xchg1];
2013 i.types[xchg1] = temp_type;
2014 temp_op = i.op[xchg2];
2015 i.op[xchg2] = i.op[xchg1];
2016 i.op[xchg1] = temp_op;
2017 temp_reloc = i.reloc[xchg2];
2018 i.reloc[xchg2] = i.reloc[xchg1];
2019 i.reloc[xchg1] = temp_reloc;
2020
2021 if (i.mem_operands == 2)
2022 {
2023 const seg_entry *temp_seg;
2024 temp_seg = i.seg[0];
2025 i.seg[0] = i.seg[1];
2026 i.seg[1] = temp_seg;
2027 }
2028 }
2029
2030 /* Try to ensure constant immediates are represented in the smallest
2031 opcode possible. */
2032 static void
2033 optimize_imm ()
2034 {
2035 char guess_suffix = 0;
2036 int op;
2037
2038 if (i.suffix)
2039 guess_suffix = i.suffix;
2040 else if (i.reg_operands)
2041 {
2042 /* Figure out a suffix from the last register operand specified.
2043 We can't do this properly yet, ie. excluding InOutPortReg,
2044 but the following works for instructions with immediates.
2045 In any case, we can't set i.suffix yet. */
2046 for (op = i.operands; --op >= 0;)
2047 if (i.types[op] & Reg)
2048 {
2049 if (i.types[op] & Reg8)
2050 guess_suffix = BYTE_MNEM_SUFFIX;
2051 else if (i.types[op] & Reg16)
2052 guess_suffix = WORD_MNEM_SUFFIX;
2053 else if (i.types[op] & Reg32)
2054 guess_suffix = LONG_MNEM_SUFFIX;
2055 else if (i.types[op] & Reg64)
2056 guess_suffix = QWORD_MNEM_SUFFIX;
2057 break;
2058 }
2059 }
2060 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
2061 guess_suffix = WORD_MNEM_SUFFIX;
2062
2063 for (op = i.operands; --op >= 0;)
2064 if (i.types[op] & Imm)
2065 {
2066 switch (i.op[op].imms->X_op)
2067 {
2068 case O_constant:
2069 /* If a suffix is given, this operand may be shortened. */
2070 switch (guess_suffix)
2071 {
2072 case LONG_MNEM_SUFFIX:
2073 i.types[op] |= Imm32 | Imm64;
2074 break;
2075 case WORD_MNEM_SUFFIX:
2076 i.types[op] |= Imm16 | Imm32S | Imm32 | Imm64;
2077 break;
2078 case BYTE_MNEM_SUFFIX:
2079 i.types[op] |= Imm16 | Imm8 | Imm8S | Imm32S | Imm32 | Imm64;
2080 break;
2081 }
2082
2083 /* If this operand is at most 16 bits, convert it
2084 to a signed 16 bit number before trying to see
2085 whether it will fit in an even smaller size.
2086 This allows a 16-bit operand such as $0xffe0 to
2087 be recognised as within Imm8S range. */
2088 if ((i.types[op] & Imm16)
2089 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
2090 {
2091 i.op[op].imms->X_add_number =
2092 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
2093 }
2094 if ((i.types[op] & Imm32)
2095 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
2096 == 0))
2097 {
2098 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
2099 ^ ((offsetT) 1 << 31))
2100 - ((offsetT) 1 << 31));
2101 }
2102 i.types[op] |= smallest_imm_type (i.op[op].imms->X_add_number);
2103
2104 /* We must avoid matching of Imm32 templates when 64bit
2105 only immediate is available. */
2106 if (guess_suffix == QWORD_MNEM_SUFFIX)
2107 i.types[op] &= ~Imm32;
2108 break;
2109
2110 case O_absent:
2111 case O_register:
2112 abort ();
2113
2114 /* Symbols and expressions. */
2115 default:
2116 /* Convert symbolic operand to proper sizes for matching, but don't
2117 prevent matching a set of insns that only supports sizes other
2118 than those matching the insn suffix. */
2119 {
2120 unsigned int mask, allowed = 0;
2121 const template *t;
2122
2123 for (t = current_templates->start; t < current_templates->end; ++t)
2124 allowed |= t->operand_types[op];
2125 switch (guess_suffix)
2126 {
2127 case QWORD_MNEM_SUFFIX:
2128 mask = Imm64 | Imm32S;
2129 break;
2130 case LONG_MNEM_SUFFIX:
2131 mask = Imm32;
2132 break;
2133 case WORD_MNEM_SUFFIX:
2134 mask = Imm16;
2135 break;
2136 case BYTE_MNEM_SUFFIX:
2137 mask = Imm8;
2138 break;
2139 default:
2140 mask = 0;
2141 break;
2142 }
2143 if (mask & allowed)
2144 i.types[op] &= mask;
2145 }
2146 break;
2147 }
2148 }
2149 }
2150
2151 /* Try to use the smallest displacement type too. */
2152 static void
2153 optimize_disp ()
2154 {
2155 int op;
2156
2157 for (op = i.operands; --op >= 0;)
2158 if (i.types[op] & Disp)
2159 {
2160 if (i.op[op].disps->X_op == O_constant)
2161 {
2162 offsetT disp = i.op[op].disps->X_add_number;
2163
2164 if ((i.types[op] & Disp16)
2165 && (disp & ~(offsetT) 0xffff) == 0)
2166 {
2167 /* If this operand is at most 16 bits, convert
2168 to a signed 16 bit number and don't use 64bit
2169 displacement. */
2170 disp = (((disp & 0xffff) ^ 0x8000) - 0x8000);
2171 i.types[op] &= ~Disp64;
2172 }
2173 if ((i.types[op] & Disp32)
2174 && (disp & ~(((offsetT) 2 << 31) - 1)) == 0)
2175 {
2176 /* If this operand is at most 32 bits, convert
2177 to a signed 32 bit number and don't use 64bit
2178 displacement. */
2179 disp &= (((offsetT) 2 << 31) - 1);
2180 disp = (disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
2181 i.types[op] &= ~Disp64;
2182 }
2183 if (!disp && (i.types[op] & BaseIndex))
2184 {
2185 i.types[op] &= ~Disp;
2186 i.op[op].disps = 0;
2187 i.disp_operands--;
2188 }
2189 else if (flag_code == CODE_64BIT)
2190 {
2191 if (fits_in_signed_long (disp))
2192 {
2193 i.types[op] &= ~Disp64;
2194 i.types[op] |= Disp32S;
2195 }
2196 if (fits_in_unsigned_long (disp))
2197 i.types[op] |= Disp32;
2198 }
2199 if ((i.types[op] & (Disp32 | Disp32S | Disp16))
2200 && fits_in_signed_byte (disp))
2201 i.types[op] |= Disp8;
2202 }
2203 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
2204 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
2205 {
2206 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
2207 i.op[op].disps, 0, i.reloc[op]);
2208 i.types[op] &= ~Disp;
2209 }
2210 else
2211 /* We only support 64bit displacement on constants. */
2212 i.types[op] &= ~Disp64;
2213 }
2214 }
2215
2216 static int
2217 match_template ()
2218 {
2219 /* Points to template once we've found it. */
2220 const template *t;
2221 unsigned int overlap0, overlap1, overlap2;
2222 unsigned int found_reverse_match;
2223 int suffix_check;
2224
2225 #define MATCH(overlap, given, template) \
2226 ((overlap & ~JumpAbsolute) \
2227 && (((given) & (BaseIndex | JumpAbsolute)) \
2228 == ((overlap) & (BaseIndex | JumpAbsolute))))
2229
2230 /* If given types r0 and r1 are registers they must be of the same type
2231 unless the expected operand type register overlap is null.
2232 Note that Acc in a template matches every size of reg. */
2233 #define CONSISTENT_REGISTER_MATCH(m0, g0, t0, m1, g1, t1) \
2234 (((g0) & Reg) == 0 || ((g1) & Reg) == 0 \
2235 || ((g0) & Reg) == ((g1) & Reg) \
2236 || ((((m0) & Acc) ? Reg : (t0)) & (((m1) & Acc) ? Reg : (t1)) & Reg) == 0 )
2237
2238 overlap0 = 0;
2239 overlap1 = 0;
2240 overlap2 = 0;
2241 found_reverse_match = 0;
2242 suffix_check = (i.suffix == BYTE_MNEM_SUFFIX
2243 ? No_bSuf
2244 : (i.suffix == WORD_MNEM_SUFFIX
2245 ? No_wSuf
2246 : (i.suffix == SHORT_MNEM_SUFFIX
2247 ? No_sSuf
2248 : (i.suffix == LONG_MNEM_SUFFIX
2249 ? No_lSuf
2250 : (i.suffix == QWORD_MNEM_SUFFIX
2251 ? No_qSuf
2252 : (i.suffix == LONG_DOUBLE_MNEM_SUFFIX
2253 ? No_xSuf : 0))))));
2254
2255 t = current_templates->start;
2256 if (i.suffix == QWORD_MNEM_SUFFIX
2257 && flag_code != CODE_64BIT
2258 && (intel_syntax
2259 ? !(t->opcode_modifier & IgnoreSize)
2260 && !intel_float_operand (t->name)
2261 : intel_float_operand (t->name) != 2)
2262 && (!(t->operand_types[0] & (RegMMX | RegXMM))
2263 || !(t->operand_types[t->operands > 1] & (RegMMX | RegXMM)))
2264 && (t->base_opcode != 0x0fc7
2265 || t->extension_opcode != 1 /* cmpxchg8b */))
2266 t = current_templates->end;
2267 for (; t < current_templates->end; t++)
2268 {
2269 /* Must have right number of operands. */
2270 if (i.operands != t->operands)
2271 continue;
2272
2273 /* Check the suffix, except for some instructions in intel mode. */
2274 if ((t->opcode_modifier & suffix_check)
2275 && !(intel_syntax
2276 && (t->opcode_modifier & IgnoreSize)))
2277 continue;
2278
2279 /* Do not verify operands when there are none. */
2280 else if (!t->operands)
2281 {
2282 if (t->cpu_flags & ~cpu_arch_flags)
2283 continue;
2284 /* We've found a match; break out of loop. */
2285 break;
2286 }
2287
2288 overlap0 = i.types[0] & t->operand_types[0];
2289 switch (t->operands)
2290 {
2291 case 1:
2292 if (!MATCH (overlap0, i.types[0], t->operand_types[0]))
2293 continue;
2294 break;
2295 case 2:
2296 case 3:
2297 overlap1 = i.types[1] & t->operand_types[1];
2298 if (!MATCH (overlap0, i.types[0], t->operand_types[0])
2299 || !MATCH (overlap1, i.types[1], t->operand_types[1])
2300 /* monitor in SSE3 is a very special case. The first
2301 register and the second register may have differnet
2302 sizes. */
2303 || !((t->base_opcode == 0x0f01
2304 && t->extension_opcode == 0xc8)
2305 || CONSISTENT_REGISTER_MATCH (overlap0, i.types[0],
2306 t->operand_types[0],
2307 overlap1, i.types[1],
2308 t->operand_types[1])))
2309 {
2310 /* Check if other direction is valid ... */
2311 if ((t->opcode_modifier & (D | FloatD)) == 0)
2312 continue;
2313
2314 /* Try reversing direction of operands. */
2315 overlap0 = i.types[0] & t->operand_types[1];
2316 overlap1 = i.types[1] & t->operand_types[0];
2317 if (!MATCH (overlap0, i.types[0], t->operand_types[1])
2318 || !MATCH (overlap1, i.types[1], t->operand_types[0])
2319 || !CONSISTENT_REGISTER_MATCH (overlap0, i.types[0],
2320 t->operand_types[1],
2321 overlap1, i.types[1],
2322 t->operand_types[0]))
2323 {
2324 /* Does not match either direction. */
2325 continue;
2326 }
2327 /* found_reverse_match holds which of D or FloatDR
2328 we've found. */
2329 found_reverse_match = t->opcode_modifier & (D | FloatDR);
2330 }
2331 /* Found a forward 2 operand match here. */
2332 else if (t->operands == 3)
2333 {
2334 /* Here we make use of the fact that there are no
2335 reverse match 3 operand instructions, and all 3
2336 operand instructions only need to be checked for
2337 register consistency between operands 2 and 3. */
2338 overlap2 = i.types[2] & t->operand_types[2];
2339 if (!MATCH (overlap2, i.types[2], t->operand_types[2])
2340 || !CONSISTENT_REGISTER_MATCH (overlap1, i.types[1],
2341 t->operand_types[1],
2342 overlap2, i.types[2],
2343 t->operand_types[2]))
2344
2345 continue;
2346 }
2347 /* Found either forward/reverse 2 or 3 operand match here:
2348 slip through to break. */
2349 }
2350 if (t->cpu_flags & ~cpu_arch_flags)
2351 {
2352 found_reverse_match = 0;
2353 continue;
2354 }
2355 /* We've found a match; break out of loop. */
2356 break;
2357 }
2358
2359 if (t == current_templates->end)
2360 {
2361 /* We found no match. */
2362 as_bad (_("suffix or operands invalid for `%s'"),
2363 current_templates->start->name);
2364 return 0;
2365 }
2366
2367 if (!quiet_warnings)
2368 {
2369 if (!intel_syntax
2370 && ((i.types[0] & JumpAbsolute)
2371 != (t->operand_types[0] & JumpAbsolute)))
2372 {
2373 as_warn (_("indirect %s without `*'"), t->name);
2374 }
2375
2376 if ((t->opcode_modifier & (IsPrefix | IgnoreSize))
2377 == (IsPrefix | IgnoreSize))
2378 {
2379 /* Warn them that a data or address size prefix doesn't
2380 affect assembly of the next line of code. */
2381 as_warn (_("stand-alone `%s' prefix"), t->name);
2382 }
2383 }
2384
2385 /* Copy the template we found. */
2386 i.tm = *t;
2387 if (found_reverse_match)
2388 {
2389 /* If we found a reverse match we must alter the opcode
2390 direction bit. found_reverse_match holds bits to change
2391 (different for int & float insns). */
2392
2393 i.tm.base_opcode ^= found_reverse_match;
2394
2395 i.tm.operand_types[0] = t->operand_types[1];
2396 i.tm.operand_types[1] = t->operand_types[0];
2397 }
2398
2399 return 1;
2400 }
2401
2402 static int
2403 check_string ()
2404 {
2405 int mem_op = (i.types[0] & AnyMem) ? 0 : 1;
2406 if ((i.tm.operand_types[mem_op] & EsSeg) != 0)
2407 {
2408 if (i.seg[0] != NULL && i.seg[0] != &es)
2409 {
2410 as_bad (_("`%s' operand %d must use `%%es' segment"),
2411 i.tm.name,
2412 mem_op + 1);
2413 return 0;
2414 }
2415 /* There's only ever one segment override allowed per instruction.
2416 This instruction possibly has a legal segment override on the
2417 second operand, so copy the segment to where non-string
2418 instructions store it, allowing common code. */
2419 i.seg[0] = i.seg[1];
2420 }
2421 else if ((i.tm.operand_types[mem_op + 1] & EsSeg) != 0)
2422 {
2423 if (i.seg[1] != NULL && i.seg[1] != &es)
2424 {
2425 as_bad (_("`%s' operand %d must use `%%es' segment"),
2426 i.tm.name,
2427 mem_op + 2);
2428 return 0;
2429 }
2430 }
2431 return 1;
2432 }
2433
2434 static int
2435 process_suffix (void)
2436 {
2437 /* If matched instruction specifies an explicit instruction mnemonic
2438 suffix, use it. */
2439 if (i.tm.opcode_modifier & (Size16 | Size32 | Size64))
2440 {
2441 if (i.tm.opcode_modifier & Size16)
2442 i.suffix = WORD_MNEM_SUFFIX;
2443 else if (i.tm.opcode_modifier & Size64)
2444 i.suffix = QWORD_MNEM_SUFFIX;
2445 else
2446 i.suffix = LONG_MNEM_SUFFIX;
2447 }
2448 else if (i.reg_operands)
2449 {
2450 /* If there's no instruction mnemonic suffix we try to invent one
2451 based on register operands. */
2452 if (!i.suffix)
2453 {
2454 /* We take i.suffix from the last register operand specified,
2455 Destination register type is more significant than source
2456 register type. */
2457 int op;
2458
2459 for (op = i.operands; --op >= 0;)
2460 if ((i.types[op] & Reg)
2461 && !(i.tm.operand_types[op] & InOutPortReg))
2462 {
2463 i.suffix = ((i.types[op] & Reg8) ? BYTE_MNEM_SUFFIX :
2464 (i.types[op] & Reg16) ? WORD_MNEM_SUFFIX :
2465 (i.types[op] & Reg64) ? QWORD_MNEM_SUFFIX :
2466 LONG_MNEM_SUFFIX);
2467 break;
2468 }
2469 }
2470 else if (i.suffix == BYTE_MNEM_SUFFIX)
2471 {
2472 if (!check_byte_reg ())
2473 return 0;
2474 }
2475 else if (i.suffix == LONG_MNEM_SUFFIX)
2476 {
2477 if (!check_long_reg ())
2478 return 0;
2479 }
2480 else if (i.suffix == QWORD_MNEM_SUFFIX)
2481 {
2482 if (!check_qword_reg ())
2483 return 0;
2484 }
2485 else if (i.suffix == WORD_MNEM_SUFFIX)
2486 {
2487 if (!check_word_reg ())
2488 return 0;
2489 }
2490 else if (intel_syntax && (i.tm.opcode_modifier & IgnoreSize))
2491 /* Do nothing if the instruction is going to ignore the prefix. */
2492 ;
2493 else
2494 abort ();
2495 }
2496 else if ((i.tm.opcode_modifier & DefaultSize)
2497 && !i.suffix
2498 /* exclude fldenv/frstor/fsave/fstenv */
2499 && (i.tm.opcode_modifier & No_sSuf))
2500 {
2501 i.suffix = stackop_size;
2502 }
2503 else if (intel_syntax
2504 && !i.suffix
2505 && ((i.tm.operand_types[0] & JumpAbsolute)
2506 || (i.tm.opcode_modifier & (JumpByte|JumpInterSegment))
2507 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
2508 && i.tm.extension_opcode <= 3)))
2509 {
2510 switch (flag_code)
2511 {
2512 case CODE_64BIT:
2513 if (!(i.tm.opcode_modifier & No_qSuf))
2514 {
2515 i.suffix = QWORD_MNEM_SUFFIX;
2516 break;
2517 }
2518 case CODE_32BIT:
2519 if (!(i.tm.opcode_modifier & No_lSuf))
2520 i.suffix = LONG_MNEM_SUFFIX;
2521 break;
2522 case CODE_16BIT:
2523 if (!(i.tm.opcode_modifier & No_wSuf))
2524 i.suffix = WORD_MNEM_SUFFIX;
2525 break;
2526 }
2527 }
2528
2529 if (!i.suffix)
2530 {
2531 if (!intel_syntax)
2532 {
2533 if (i.tm.opcode_modifier & W)
2534 {
2535 as_bad (_("no instruction mnemonic suffix given and no register operands; can't size instruction"));
2536 return 0;
2537 }
2538 }
2539 else
2540 {
2541 unsigned int suffixes = ~i.tm.opcode_modifier
2542 & (No_bSuf
2543 | No_wSuf
2544 | No_lSuf
2545 | No_sSuf
2546 | No_xSuf
2547 | No_qSuf);
2548
2549 if ((i.tm.opcode_modifier & W)
2550 || ((suffixes & (suffixes - 1))
2551 && !(i.tm.opcode_modifier & (DefaultSize | IgnoreSize))))
2552 {
2553 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
2554 return 0;
2555 }
2556 }
2557 }
2558
2559 /* Change the opcode based on the operand size given by i.suffix;
2560 We don't need to change things for byte insns. */
2561
2562 if (i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
2563 {
2564 /* It's not a byte, select word/dword operation. */
2565 if (i.tm.opcode_modifier & W)
2566 {
2567 if (i.tm.opcode_modifier & ShortForm)
2568 i.tm.base_opcode |= 8;
2569 else
2570 i.tm.base_opcode |= 1;
2571 }
2572
2573 /* Now select between word & dword operations via the operand
2574 size prefix, except for instructions that will ignore this
2575 prefix anyway. */
2576 if (i.tm.base_opcode == 0x0f01 && i.tm.extension_opcode == 0xc8)
2577 {
2578 /* monitor in SSE3 is a very special case. The default size
2579 of AX is the size of mode. The address size override
2580 prefix will change the size of AX. */
2581 if (i.op->regs[0].reg_type &
2582 (flag_code == CODE_32BIT ? Reg16 : Reg32))
2583 if (!add_prefix (ADDR_PREFIX_OPCODE))
2584 return 0;
2585 }
2586 else if (i.suffix != QWORD_MNEM_SUFFIX
2587 && i.suffix != LONG_DOUBLE_MNEM_SUFFIX
2588 && !(i.tm.opcode_modifier & (IgnoreSize | FloatMF))
2589 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
2590 || (flag_code == CODE_64BIT
2591 && (i.tm.opcode_modifier & JumpByte))))
2592 {
2593 unsigned int prefix = DATA_PREFIX_OPCODE;
2594
2595 if (i.tm.opcode_modifier & JumpByte) /* jcxz, loop */
2596 prefix = ADDR_PREFIX_OPCODE;
2597
2598 if (!add_prefix (prefix))
2599 return 0;
2600 }
2601
2602 /* Set mode64 for an operand. */
2603 if (i.suffix == QWORD_MNEM_SUFFIX
2604 && flag_code == CODE_64BIT
2605 && (i.tm.opcode_modifier & NoRex64) == 0)
2606 i.rex |= REX_MODE64;
2607
2608 /* Size floating point instruction. */
2609 if (i.suffix == LONG_MNEM_SUFFIX)
2610 if (i.tm.opcode_modifier & FloatMF)
2611 i.tm.base_opcode ^= 4;
2612 }
2613
2614 return 1;
2615 }
2616
2617 static int
2618 check_byte_reg (void)
2619 {
2620 int op;
2621
2622 for (op = i.operands; --op >= 0;)
2623 {
2624 /* If this is an eight bit register, it's OK. If it's the 16 or
2625 32 bit version of an eight bit register, we will just use the
2626 low portion, and that's OK too. */
2627 if (i.types[op] & Reg8)
2628 continue;
2629
2630 /* movzx and movsx should not generate this warning. */
2631 if (intel_syntax
2632 && (i.tm.base_opcode == 0xfb7
2633 || i.tm.base_opcode == 0xfb6
2634 || i.tm.base_opcode == 0x63
2635 || i.tm.base_opcode == 0xfbe
2636 || i.tm.base_opcode == 0xfbf))
2637 continue;
2638
2639 if ((i.types[op] & WordReg) && i.op[op].regs->reg_num < 4)
2640 {
2641 /* Prohibit these changes in the 64bit mode, since the
2642 lowering is more complicated. */
2643 if (flag_code == CODE_64BIT
2644 && (i.tm.operand_types[op] & InOutPortReg) == 0)
2645 {
2646 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2647 i.op[op].regs->reg_name,
2648 i.suffix);
2649 return 0;
2650 }
2651 #if REGISTER_WARNINGS
2652 if (!quiet_warnings
2653 && (i.tm.operand_types[op] & InOutPortReg) == 0)
2654 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2655 (i.op[op].regs + (i.types[op] & Reg16
2656 ? REGNAM_AL - REGNAM_AX
2657 : REGNAM_AL - REGNAM_EAX))->reg_name,
2658 i.op[op].regs->reg_name,
2659 i.suffix);
2660 #endif
2661 continue;
2662 }
2663 /* Any other register is bad. */
2664 if (i.types[op] & (Reg | RegMMX | RegXMM
2665 | SReg2 | SReg3
2666 | Control | Debug | Test
2667 | FloatReg | FloatAcc))
2668 {
2669 as_bad (_("`%%%s' not allowed with `%s%c'"),
2670 i.op[op].regs->reg_name,
2671 i.tm.name,
2672 i.suffix);
2673 return 0;
2674 }
2675 }
2676 return 1;
2677 }
2678
2679 static int
2680 check_long_reg ()
2681 {
2682 int op;
2683
2684 for (op = i.operands; --op >= 0;)
2685 /* Reject eight bit registers, except where the template requires
2686 them. (eg. movzb) */
2687 if ((i.types[op] & Reg8) != 0
2688 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2689 {
2690 as_bad (_("`%%%s' not allowed with `%s%c'"),
2691 i.op[op].regs->reg_name,
2692 i.tm.name,
2693 i.suffix);
2694 return 0;
2695 }
2696 /* Warn if the e prefix on a general reg is missing. */
2697 else if ((!quiet_warnings || flag_code == CODE_64BIT)
2698 && (i.types[op] & Reg16) != 0
2699 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2700 {
2701 /* Prohibit these changes in the 64bit mode, since the
2702 lowering is more complicated. */
2703 if (flag_code == CODE_64BIT)
2704 {
2705 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2706 i.op[op].regs->reg_name,
2707 i.suffix);
2708 return 0;
2709 }
2710 #if REGISTER_WARNINGS
2711 else
2712 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2713 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
2714 i.op[op].regs->reg_name,
2715 i.suffix);
2716 #endif
2717 }
2718 /* Warn if the r prefix on a general reg is missing. */
2719 else if ((i.types[op] & Reg64) != 0
2720 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2721 {
2722 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2723 i.op[op].regs->reg_name,
2724 i.suffix);
2725 return 0;
2726 }
2727 return 1;
2728 }
2729
2730 static int
2731 check_qword_reg ()
2732 {
2733 int op;
2734
2735 for (op = i.operands; --op >= 0; )
2736 /* Reject eight bit registers, except where the template requires
2737 them. (eg. movzb) */
2738 if ((i.types[op] & Reg8) != 0
2739 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2740 {
2741 as_bad (_("`%%%s' not allowed with `%s%c'"),
2742 i.op[op].regs->reg_name,
2743 i.tm.name,
2744 i.suffix);
2745 return 0;
2746 }
2747 /* Warn if the e prefix on a general reg is missing. */
2748 else if (((i.types[op] & Reg16) != 0
2749 || (i.types[op] & Reg32) != 0)
2750 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2751 {
2752 /* Prohibit these changes in the 64bit mode, since the
2753 lowering is more complicated. */
2754 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2755 i.op[op].regs->reg_name,
2756 i.suffix);
2757 return 0;
2758 }
2759 return 1;
2760 }
2761
2762 static int
2763 check_word_reg ()
2764 {
2765 int op;
2766 for (op = i.operands; --op >= 0;)
2767 /* Reject eight bit registers, except where the template requires
2768 them. (eg. movzb) */
2769 if ((i.types[op] & Reg8) != 0
2770 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2771 {
2772 as_bad (_("`%%%s' not allowed with `%s%c'"),
2773 i.op[op].regs->reg_name,
2774 i.tm.name,
2775 i.suffix);
2776 return 0;
2777 }
2778 /* Warn if the e prefix on a general reg is present. */
2779 else if ((!quiet_warnings || flag_code == CODE_64BIT)
2780 && (i.types[op] & Reg32) != 0
2781 && (i.tm.operand_types[op] & (Reg16 | Acc)) != 0)
2782 {
2783 /* Prohibit these changes in the 64bit mode, since the
2784 lowering is more complicated. */
2785 if (flag_code == CODE_64BIT)
2786 {
2787 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2788 i.op[op].regs->reg_name,
2789 i.suffix);
2790 return 0;
2791 }
2792 else
2793 #if REGISTER_WARNINGS
2794 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2795 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
2796 i.op[op].regs->reg_name,
2797 i.suffix);
2798 #endif
2799 }
2800 return 1;
2801 }
2802
2803 static int
2804 finalize_imm ()
2805 {
2806 unsigned int overlap0, overlap1, overlap2;
2807
2808 overlap0 = i.types[0] & i.tm.operand_types[0];
2809 if ((overlap0 & (Imm8 | Imm8S | Imm16 | Imm32 | Imm32S | Imm64))
2810 && overlap0 != Imm8 && overlap0 != Imm8S
2811 && overlap0 != Imm16 && overlap0 != Imm32S
2812 && overlap0 != Imm32 && overlap0 != Imm64)
2813 {
2814 if (i.suffix)
2815 {
2816 overlap0 &= (i.suffix == BYTE_MNEM_SUFFIX
2817 ? Imm8 | Imm8S
2818 : (i.suffix == WORD_MNEM_SUFFIX
2819 ? Imm16
2820 : (i.suffix == QWORD_MNEM_SUFFIX
2821 ? Imm64 | Imm32S
2822 : Imm32)));
2823 }
2824 else if (overlap0 == (Imm16 | Imm32S | Imm32)
2825 || overlap0 == (Imm16 | Imm32)
2826 || overlap0 == (Imm16 | Imm32S))
2827 {
2828 overlap0 = ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0)
2829 ? Imm16 : Imm32S);
2830 }
2831 if (overlap0 != Imm8 && overlap0 != Imm8S
2832 && overlap0 != Imm16 && overlap0 != Imm32S
2833 && overlap0 != Imm32 && overlap0 != Imm64)
2834 {
2835 as_bad (_("no instruction mnemonic suffix given; can't determine immediate size"));
2836 return 0;
2837 }
2838 }
2839 i.types[0] = overlap0;
2840
2841 overlap1 = i.types[1] & i.tm.operand_types[1];
2842 if ((overlap1 & (Imm8 | Imm8S | Imm16 | Imm32S | Imm32 | Imm64))
2843 && overlap1 != Imm8 && overlap1 != Imm8S
2844 && overlap1 != Imm16 && overlap1 != Imm32S
2845 && overlap1 != Imm32 && overlap1 != Imm64)
2846 {
2847 if (i.suffix)
2848 {
2849 overlap1 &= (i.suffix == BYTE_MNEM_SUFFIX
2850 ? Imm8 | Imm8S
2851 : (i.suffix == WORD_MNEM_SUFFIX
2852 ? Imm16
2853 : (i.suffix == QWORD_MNEM_SUFFIX
2854 ? Imm64 | Imm32S
2855 : Imm32)));
2856 }
2857 else if (overlap1 == (Imm16 | Imm32 | Imm32S)
2858 || overlap1 == (Imm16 | Imm32)
2859 || overlap1 == (Imm16 | Imm32S))
2860 {
2861 overlap1 = ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0)
2862 ? Imm16 : Imm32S);
2863 }
2864 if (overlap1 != Imm8 && overlap1 != Imm8S
2865 && overlap1 != Imm16 && overlap1 != Imm32S
2866 && overlap1 != Imm32 && overlap1 != Imm64)
2867 {
2868 as_bad (_("no instruction mnemonic suffix given; can't determine immediate size %x %c"),overlap1, i.suffix);
2869 return 0;
2870 }
2871 }
2872 i.types[1] = overlap1;
2873
2874 overlap2 = i.types[2] & i.tm.operand_types[2];
2875 assert ((overlap2 & Imm) == 0);
2876 i.types[2] = overlap2;
2877
2878 return 1;
2879 }
2880
2881 static int
2882 process_operands ()
2883 {
2884 /* Default segment register this instruction will use for memory
2885 accesses. 0 means unknown. This is only for optimizing out
2886 unnecessary segment overrides. */
2887 const seg_entry *default_seg = 0;
2888
2889 /* The imul $imm, %reg instruction is converted into
2890 imul $imm, %reg, %reg, and the clr %reg instruction
2891 is converted into xor %reg, %reg. */
2892 if (i.tm.opcode_modifier & regKludge)
2893 {
2894 unsigned int first_reg_op = (i.types[0] & Reg) ? 0 : 1;
2895 /* Pretend we saw the extra register operand. */
2896 assert (i.op[first_reg_op + 1].regs == 0);
2897 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
2898 i.types[first_reg_op + 1] = i.types[first_reg_op];
2899 i.reg_operands = 2;
2900 }
2901
2902 if (i.tm.opcode_modifier & ShortForm)
2903 {
2904 /* The register or float register operand is in operand 0 or 1. */
2905 unsigned int op = (i.types[0] & (Reg | FloatReg)) ? 0 : 1;
2906 /* Register goes in low 3 bits of opcode. */
2907 i.tm.base_opcode |= i.op[op].regs->reg_num;
2908 if ((i.op[op].regs->reg_flags & RegRex) != 0)
2909 i.rex |= REX_EXTZ;
2910 if (!quiet_warnings && (i.tm.opcode_modifier & Ugh) != 0)
2911 {
2912 /* Warn about some common errors, but press on regardless.
2913 The first case can be generated by gcc (<= 2.8.1). */
2914 if (i.operands == 2)
2915 {
2916 /* Reversed arguments on faddp, fsubp, etc. */
2917 as_warn (_("translating to `%s %%%s,%%%s'"), i.tm.name,
2918 i.op[1].regs->reg_name,
2919 i.op[0].regs->reg_name);
2920 }
2921 else
2922 {
2923 /* Extraneous `l' suffix on fp insn. */
2924 as_warn (_("translating to `%s %%%s'"), i.tm.name,
2925 i.op[0].regs->reg_name);
2926 }
2927 }
2928 }
2929 else if (i.tm.opcode_modifier & Modrm)
2930 {
2931 /* The opcode is completed (modulo i.tm.extension_opcode which
2932 must be put into the modrm byte). Now, we make the modrm and
2933 index base bytes based on all the info we've collected. */
2934
2935 default_seg = build_modrm_byte ();
2936 }
2937 else if (i.tm.opcode_modifier & (Seg2ShortForm | Seg3ShortForm))
2938 {
2939 if (i.tm.base_opcode == POP_SEG_SHORT
2940 && i.op[0].regs->reg_num == 1)
2941 {
2942 as_bad (_("you can't `pop %%cs'"));
2943 return 0;
2944 }
2945 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
2946 if ((i.op[0].regs->reg_flags & RegRex) != 0)
2947 i.rex |= REX_EXTZ;
2948 }
2949 else if ((i.tm.base_opcode & ~(D | W)) == MOV_AX_DISP32)
2950 {
2951 default_seg = &ds;
2952 }
2953 else if ((i.tm.opcode_modifier & IsString) != 0)
2954 {
2955 /* For the string instructions that allow a segment override
2956 on one of their operands, the default segment is ds. */
2957 default_seg = &ds;
2958 }
2959
2960 if ((i.tm.base_opcode == 0x8d /* lea */
2961 || (i.tm.cpu_flags & CpuSVME))
2962 && i.seg[0] && !quiet_warnings)
2963 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
2964
2965 /* If a segment was explicitly specified, and the specified segment
2966 is not the default, use an opcode prefix to select it. If we
2967 never figured out what the default segment is, then default_seg
2968 will be zero at this point, and the specified segment prefix will
2969 always be used. */
2970 if ((i.seg[0]) && (i.seg[0] != default_seg))
2971 {
2972 if (!add_prefix (i.seg[0]->seg_prefix))
2973 return 0;
2974 }
2975 return 1;
2976 }
2977
2978 static const seg_entry *
2979 build_modrm_byte ()
2980 {
2981 const seg_entry *default_seg = 0;
2982
2983 /* i.reg_operands MUST be the number of real register operands;
2984 implicit registers do not count. */
2985 if (i.reg_operands == 2)
2986 {
2987 unsigned int source, dest;
2988 source = ((i.types[0]
2989 & (Reg | RegMMX | RegXMM
2990 | SReg2 | SReg3
2991 | Control | Debug | Test))
2992 ? 0 : 1);
2993 dest = source + 1;
2994
2995 i.rm.mode = 3;
2996 /* One of the register operands will be encoded in the i.tm.reg
2997 field, the other in the combined i.tm.mode and i.tm.regmem
2998 fields. If no form of this instruction supports a memory
2999 destination operand, then we assume the source operand may
3000 sometimes be a memory operand and so we need to store the
3001 destination in the i.rm.reg field. */
3002 if ((i.tm.operand_types[dest] & AnyMem) == 0)
3003 {
3004 i.rm.reg = i.op[dest].regs->reg_num;
3005 i.rm.regmem = i.op[source].regs->reg_num;
3006 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
3007 i.rex |= REX_EXTX;
3008 if ((i.op[source].regs->reg_flags & RegRex) != 0)
3009 i.rex |= REX_EXTZ;
3010 }
3011 else
3012 {
3013 i.rm.reg = i.op[source].regs->reg_num;
3014 i.rm.regmem = i.op[dest].regs->reg_num;
3015 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
3016 i.rex |= REX_EXTZ;
3017 if ((i.op[source].regs->reg_flags & RegRex) != 0)
3018 i.rex |= REX_EXTX;
3019 }
3020 if (flag_code != CODE_64BIT && (i.rex & (REX_EXTX | REX_EXTZ)))
3021 {
3022 if (!((i.types[0] | i.types[1]) & Control))
3023 abort ();
3024 i.rex &= ~(REX_EXTX | REX_EXTZ);
3025 add_prefix (LOCK_PREFIX_OPCODE);
3026 }
3027 }
3028 else
3029 { /* If it's not 2 reg operands... */
3030 if (i.mem_operands)
3031 {
3032 unsigned int fake_zero_displacement = 0;
3033 unsigned int op = ((i.types[0] & AnyMem)
3034 ? 0
3035 : (i.types[1] & AnyMem) ? 1 : 2);
3036
3037 default_seg = &ds;
3038
3039 if (i.base_reg == 0)
3040 {
3041 i.rm.mode = 0;
3042 if (!i.disp_operands)
3043 fake_zero_displacement = 1;
3044 if (i.index_reg == 0)
3045 {
3046 /* Operand is just <disp> */
3047 if (flag_code == CODE_64BIT)
3048 {
3049 /* 64bit mode overwrites the 32bit absolute
3050 addressing by RIP relative addressing and
3051 absolute addressing is encoded by one of the
3052 redundant SIB forms. */
3053 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3054 i.sib.base = NO_BASE_REGISTER;
3055 i.sib.index = NO_INDEX_REGISTER;
3056 i.types[op] = ((i.prefix[ADDR_PREFIX] == 0) ? Disp32S : Disp32);
3057 }
3058 else if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
3059 {
3060 i.rm.regmem = NO_BASE_REGISTER_16;
3061 i.types[op] = Disp16;
3062 }
3063 else
3064 {
3065 i.rm.regmem = NO_BASE_REGISTER;
3066 i.types[op] = Disp32;
3067 }
3068 }
3069 else /* !i.base_reg && i.index_reg */
3070 {
3071 i.sib.index = i.index_reg->reg_num;
3072 i.sib.base = NO_BASE_REGISTER;
3073 i.sib.scale = i.log2_scale_factor;
3074 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3075 i.types[op] &= ~Disp;
3076 if (flag_code != CODE_64BIT)
3077 i.types[op] |= Disp32; /* Must be 32 bit */
3078 else
3079 i.types[op] |= Disp32S;
3080 if ((i.index_reg->reg_flags & RegRex) != 0)
3081 i.rex |= REX_EXTY;
3082 }
3083 }
3084 /* RIP addressing for 64bit mode. */
3085 else if (i.base_reg->reg_type == BaseIndex)
3086 {
3087 i.rm.regmem = NO_BASE_REGISTER;
3088 i.types[op] &= ~ Disp;
3089 i.types[op] |= Disp32S;
3090 i.flags[op] = Operand_PCrel;
3091 if (! i.disp_operands)
3092 fake_zero_displacement = 1;
3093 }
3094 else if (i.base_reg->reg_type & Reg16)
3095 {
3096 switch (i.base_reg->reg_num)
3097 {
3098 case 3: /* (%bx) */
3099 if (i.index_reg == 0)
3100 i.rm.regmem = 7;
3101 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
3102 i.rm.regmem = i.index_reg->reg_num - 6;
3103 break;
3104 case 5: /* (%bp) */
3105 default_seg = &ss;
3106 if (i.index_reg == 0)
3107 {
3108 i.rm.regmem = 6;
3109 if ((i.types[op] & Disp) == 0)
3110 {
3111 /* fake (%bp) into 0(%bp) */
3112 i.types[op] |= Disp8;
3113 fake_zero_displacement = 1;
3114 }
3115 }
3116 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
3117 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
3118 break;
3119 default: /* (%si) -> 4 or (%di) -> 5 */
3120 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
3121 }
3122 i.rm.mode = mode_from_disp_size (i.types[op]);
3123 }
3124 else /* i.base_reg and 32/64 bit mode */
3125 {
3126 if (flag_code == CODE_64BIT
3127 && (i.types[op] & Disp))
3128 i.types[op] = (i.types[op] & Disp8) | (i.prefix[ADDR_PREFIX] == 0 ? Disp32S : Disp32);
3129
3130 i.rm.regmem = i.base_reg->reg_num;
3131 if ((i.base_reg->reg_flags & RegRex) != 0)
3132 i.rex |= REX_EXTZ;
3133 i.sib.base = i.base_reg->reg_num;
3134 /* x86-64 ignores REX prefix bit here to avoid decoder
3135 complications. */
3136 if ((i.base_reg->reg_num & 7) == EBP_REG_NUM)
3137 {
3138 default_seg = &ss;
3139 if (i.disp_operands == 0)
3140 {
3141 fake_zero_displacement = 1;
3142 i.types[op] |= Disp8;
3143 }
3144 }
3145 else if (i.base_reg->reg_num == ESP_REG_NUM)
3146 {
3147 default_seg = &ss;
3148 }
3149 i.sib.scale = i.log2_scale_factor;
3150 if (i.index_reg == 0)
3151 {
3152 /* <disp>(%esp) becomes two byte modrm with no index
3153 register. We've already stored the code for esp
3154 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
3155 Any base register besides %esp will not use the
3156 extra modrm byte. */
3157 i.sib.index = NO_INDEX_REGISTER;
3158 #if !SCALE1_WHEN_NO_INDEX
3159 /* Another case where we force the second modrm byte. */
3160 if (i.log2_scale_factor)
3161 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3162 #endif
3163 }
3164 else
3165 {
3166 i.sib.index = i.index_reg->reg_num;
3167 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3168 if ((i.index_reg->reg_flags & RegRex) != 0)
3169 i.rex |= REX_EXTY;
3170 }
3171
3172 if (i.disp_operands
3173 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
3174 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
3175 i.rm.mode = 0;
3176 else
3177 i.rm.mode = mode_from_disp_size (i.types[op]);
3178 }
3179
3180 if (fake_zero_displacement)
3181 {
3182 /* Fakes a zero displacement assuming that i.types[op]
3183 holds the correct displacement size. */
3184 expressionS *exp;
3185
3186 assert (i.op[op].disps == 0);
3187 exp = &disp_expressions[i.disp_operands++];
3188 i.op[op].disps = exp;
3189 exp->X_op = O_constant;
3190 exp->X_add_number = 0;
3191 exp->X_add_symbol = (symbolS *) 0;
3192 exp->X_op_symbol = (symbolS *) 0;
3193 }
3194 }
3195
3196 /* Fill in i.rm.reg or i.rm.regmem field with register operand
3197 (if any) based on i.tm.extension_opcode. Again, we must be
3198 careful to make sure that segment/control/debug/test/MMX
3199 registers are coded into the i.rm.reg field. */
3200 if (i.reg_operands)
3201 {
3202 unsigned int op =
3203 ((i.types[0]
3204 & (Reg | RegMMX | RegXMM
3205 | SReg2 | SReg3
3206 | Control | Debug | Test))
3207 ? 0
3208 : ((i.types[1]
3209 & (Reg | RegMMX | RegXMM
3210 | SReg2 | SReg3
3211 | Control | Debug | Test))
3212 ? 1
3213 : 2));
3214 /* If there is an extension opcode to put here, the register
3215 number must be put into the regmem field. */
3216 if (i.tm.extension_opcode != None)
3217 {
3218 i.rm.regmem = i.op[op].regs->reg_num;
3219 if ((i.op[op].regs->reg_flags & RegRex) != 0)
3220 i.rex |= REX_EXTZ;
3221 }
3222 else
3223 {
3224 i.rm.reg = i.op[op].regs->reg_num;
3225 if ((i.op[op].regs->reg_flags & RegRex) != 0)
3226 i.rex |= REX_EXTX;
3227 }
3228
3229 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
3230 must set it to 3 to indicate this is a register operand
3231 in the regmem field. */
3232 if (!i.mem_operands)
3233 i.rm.mode = 3;
3234 }
3235
3236 /* Fill in i.rm.reg field with extension opcode (if any). */
3237 if (i.tm.extension_opcode != None)
3238 i.rm.reg = i.tm.extension_opcode;
3239 }
3240 return default_seg;
3241 }
3242
3243 static void
3244 output_branch ()
3245 {
3246 char *p;
3247 int code16;
3248 int prefix;
3249 relax_substateT subtype;
3250 symbolS *sym;
3251 offsetT off;
3252
3253 code16 = 0;
3254 if (flag_code == CODE_16BIT)
3255 code16 = CODE16;
3256
3257 prefix = 0;
3258 if (i.prefix[DATA_PREFIX] != 0)
3259 {
3260 prefix = 1;
3261 i.prefixes -= 1;
3262 code16 ^= CODE16;
3263 }
3264 /* Pentium4 branch hints. */
3265 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
3266 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
3267 {
3268 prefix++;
3269 i.prefixes--;
3270 }
3271 if (i.prefix[REX_PREFIX] != 0)
3272 {
3273 prefix++;
3274 i.prefixes--;
3275 }
3276
3277 if (i.prefixes != 0 && !intel_syntax)
3278 as_warn (_("skipping prefixes on this instruction"));
3279
3280 /* It's always a symbol; End frag & setup for relax.
3281 Make sure there is enough room in this frag for the largest
3282 instruction we may generate in md_convert_frag. This is 2
3283 bytes for the opcode and room for the prefix and largest
3284 displacement. */
3285 frag_grow (prefix + 2 + 4);
3286 /* Prefix and 1 opcode byte go in fr_fix. */
3287 p = frag_more (prefix + 1);
3288 if (i.prefix[DATA_PREFIX] != 0)
3289 *p++ = DATA_PREFIX_OPCODE;
3290 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
3291 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
3292 *p++ = i.prefix[SEG_PREFIX];
3293 if (i.prefix[REX_PREFIX] != 0)
3294 *p++ = i.prefix[REX_PREFIX];
3295 *p = i.tm.base_opcode;
3296
3297 if ((unsigned char) *p == JUMP_PC_RELATIVE)
3298 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, SMALL);
3299 else if ((cpu_arch_flags & Cpu386) != 0)
3300 subtype = ENCODE_RELAX_STATE (COND_JUMP, SMALL);
3301 else
3302 subtype = ENCODE_RELAX_STATE (COND_JUMP86, SMALL);
3303 subtype |= code16;
3304
3305 sym = i.op[0].disps->X_add_symbol;
3306 off = i.op[0].disps->X_add_number;
3307
3308 if (i.op[0].disps->X_op != O_constant
3309 && i.op[0].disps->X_op != O_symbol)
3310 {
3311 /* Handle complex expressions. */
3312 sym = make_expr_symbol (i.op[0].disps);
3313 off = 0;
3314 }
3315
3316 /* 1 possible extra opcode + 4 byte displacement go in var part.
3317 Pass reloc in fr_var. */
3318 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
3319 }
3320
3321 static void
3322 output_jump ()
3323 {
3324 char *p;
3325 int size;
3326 fixS *fixP;
3327
3328 if (i.tm.opcode_modifier & JumpByte)
3329 {
3330 /* This is a loop or jecxz type instruction. */
3331 size = 1;
3332 if (i.prefix[ADDR_PREFIX] != 0)
3333 {
3334 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
3335 i.prefixes -= 1;
3336 }
3337 /* Pentium4 branch hints. */
3338 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
3339 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
3340 {
3341 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
3342 i.prefixes--;
3343 }
3344 }
3345 else
3346 {
3347 int code16;
3348
3349 code16 = 0;
3350 if (flag_code == CODE_16BIT)
3351 code16 = CODE16;
3352
3353 if (i.prefix[DATA_PREFIX] != 0)
3354 {
3355 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
3356 i.prefixes -= 1;
3357 code16 ^= CODE16;
3358 }
3359
3360 size = 4;
3361 if (code16)
3362 size = 2;
3363 }
3364
3365 if (i.prefix[REX_PREFIX] != 0)
3366 {
3367 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
3368 i.prefixes -= 1;
3369 }
3370
3371 if (i.prefixes != 0 && !intel_syntax)
3372 as_warn (_("skipping prefixes on this instruction"));
3373
3374 p = frag_more (1 + size);
3375 *p++ = i.tm.base_opcode;
3376
3377 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3378 i.op[0].disps, 1, reloc (size, 1, 1, i.reloc[0]));
3379
3380 /* All jumps handled here are signed, but don't use a signed limit
3381 check for 32 and 16 bit jumps as we want to allow wrap around at
3382 4G and 64k respectively. */
3383 if (size == 1)
3384 fixP->fx_signed = 1;
3385 }
3386
3387 static void
3388 output_interseg_jump ()
3389 {
3390 char *p;
3391 int size;
3392 int prefix;
3393 int code16;
3394
3395 code16 = 0;
3396 if (flag_code == CODE_16BIT)
3397 code16 = CODE16;
3398
3399 prefix = 0;
3400 if (i.prefix[DATA_PREFIX] != 0)
3401 {
3402 prefix = 1;
3403 i.prefixes -= 1;
3404 code16 ^= CODE16;
3405 }
3406 if (i.prefix[REX_PREFIX] != 0)
3407 {
3408 prefix++;
3409 i.prefixes -= 1;
3410 }
3411
3412 size = 4;
3413 if (code16)
3414 size = 2;
3415
3416 if (i.prefixes != 0 && !intel_syntax)
3417 as_warn (_("skipping prefixes on this instruction"));
3418
3419 /* 1 opcode; 2 segment; offset */
3420 p = frag_more (prefix + 1 + 2 + size);
3421
3422 if (i.prefix[DATA_PREFIX] != 0)
3423 *p++ = DATA_PREFIX_OPCODE;
3424
3425 if (i.prefix[REX_PREFIX] != 0)
3426 *p++ = i.prefix[REX_PREFIX];
3427
3428 *p++ = i.tm.base_opcode;
3429 if (i.op[1].imms->X_op == O_constant)
3430 {
3431 offsetT n = i.op[1].imms->X_add_number;
3432
3433 if (size == 2
3434 && !fits_in_unsigned_word (n)
3435 && !fits_in_signed_word (n))
3436 {
3437 as_bad (_("16-bit jump out of range"));
3438 return;
3439 }
3440 md_number_to_chars (p, n, size);
3441 }
3442 else
3443 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3444 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
3445 if (i.op[0].imms->X_op != O_constant)
3446 as_bad (_("can't handle non absolute segment in `%s'"),
3447 i.tm.name);
3448 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
3449 }
3450
3451 static void
3452 output_insn ()
3453 {
3454 fragS *insn_start_frag;
3455 offsetT insn_start_off;
3456
3457 /* Tie dwarf2 debug info to the address at the start of the insn.
3458 We can't do this after the insn has been output as the current
3459 frag may have been closed off. eg. by frag_var. */
3460 dwarf2_emit_insn (0);
3461
3462 insn_start_frag = frag_now;
3463 insn_start_off = frag_now_fix ();
3464
3465 /* Output jumps. */
3466 if (i.tm.opcode_modifier & Jump)
3467 output_branch ();
3468 else if (i.tm.opcode_modifier & (JumpByte | JumpDword))
3469 output_jump ();
3470 else if (i.tm.opcode_modifier & JumpInterSegment)
3471 output_interseg_jump ();
3472 else
3473 {
3474 /* Output normal instructions here. */
3475 char *p;
3476 unsigned char *q;
3477 unsigned int prefix;
3478
3479 /* All opcodes on i386 have either 1 or 2 bytes. Merom New
3480 Instructions have 3 bytes. We may use one more higher byte
3481 to specify a prefix the instruction requires. */
3482 if ((i.tm.cpu_flags & CpuMNI) != 0)
3483 {
3484 if (i.tm.base_opcode & 0xff000000)
3485 {
3486 prefix = (i.tm.base_opcode >> 24) & 0xff;
3487 goto check_prefix;
3488 }
3489 }
3490 else if ((i.tm.base_opcode & 0xff0000) != 0)
3491 {
3492 prefix = (i.tm.base_opcode >> 16) & 0xff;
3493 if ((i.tm.cpu_flags & CpuPadLock) != 0)
3494 {
3495 check_prefix:
3496 if (prefix != REPE_PREFIX_OPCODE
3497 || i.prefix[LOCKREP_PREFIX] != REPE_PREFIX_OPCODE)
3498 add_prefix (prefix);
3499 }
3500 else
3501 add_prefix (prefix);
3502 }
3503
3504 /* The prefix bytes. */
3505 for (q = i.prefix;
3506 q < i.prefix + sizeof (i.prefix) / sizeof (i.prefix[0]);
3507 q++)
3508 {
3509 if (*q)
3510 {
3511 p = frag_more (1);
3512 md_number_to_chars (p, (valueT) *q, 1);
3513 }
3514 }
3515
3516 /* Now the opcode; be careful about word order here! */
3517 if (fits_in_unsigned_byte (i.tm.base_opcode))
3518 {
3519 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
3520 }
3521 else
3522 {
3523 if ((i.tm.cpu_flags & CpuMNI) != 0)
3524 {
3525 p = frag_more (3);
3526 *p++ = (i.tm.base_opcode >> 16) & 0xff;
3527 }
3528 else
3529 p = frag_more (2);
3530
3531 /* Put out high byte first: can't use md_number_to_chars! */
3532 *p++ = (i.tm.base_opcode >> 8) & 0xff;
3533 *p = i.tm.base_opcode & 0xff;
3534 }
3535
3536 /* Now the modrm byte and sib byte (if present). */
3537 if (i.tm.opcode_modifier & Modrm)
3538 {
3539 p = frag_more (1);
3540 md_number_to_chars (p,
3541 (valueT) (i.rm.regmem << 0
3542 | i.rm.reg << 3
3543 | i.rm.mode << 6),
3544 1);
3545 /* If i.rm.regmem == ESP (4)
3546 && i.rm.mode != (Register mode)
3547 && not 16 bit
3548 ==> need second modrm byte. */
3549 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
3550 && i.rm.mode != 3
3551 && !(i.base_reg && (i.base_reg->reg_type & Reg16) != 0))
3552 {
3553 p = frag_more (1);
3554 md_number_to_chars (p,
3555 (valueT) (i.sib.base << 0
3556 | i.sib.index << 3
3557 | i.sib.scale << 6),
3558 1);
3559 }
3560 }
3561
3562 if (i.disp_operands)
3563 output_disp (insn_start_frag, insn_start_off);
3564
3565 if (i.imm_operands)
3566 output_imm (insn_start_frag, insn_start_off);
3567 }
3568
3569 #ifdef DEBUG386
3570 if (flag_debug)
3571 {
3572 pi (line, &i);
3573 }
3574 #endif /* DEBUG386 */
3575 }
3576
3577 static void
3578 output_disp (insn_start_frag, insn_start_off)
3579 fragS *insn_start_frag;
3580 offsetT insn_start_off;
3581 {
3582 char *p;
3583 unsigned int n;
3584
3585 for (n = 0; n < i.operands; n++)
3586 {
3587 if (i.types[n] & Disp)
3588 {
3589 if (i.op[n].disps->X_op == O_constant)
3590 {
3591 int size;
3592 offsetT val;
3593
3594 size = 4;
3595 if (i.types[n] & (Disp8 | Disp16 | Disp64))
3596 {
3597 size = 2;
3598 if (i.types[n] & Disp8)
3599 size = 1;
3600 if (i.types[n] & Disp64)
3601 size = 8;
3602 }
3603 val = offset_in_range (i.op[n].disps->X_add_number,
3604 size);
3605 p = frag_more (size);
3606 md_number_to_chars (p, val, size);
3607 }
3608 else
3609 {
3610 enum bfd_reloc_code_real reloc_type;
3611 int size = 4;
3612 int sign = 0;
3613 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
3614
3615 /* The PC relative address is computed relative
3616 to the instruction boundary, so in case immediate
3617 fields follows, we need to adjust the value. */
3618 if (pcrel && i.imm_operands)
3619 {
3620 int imm_size = 4;
3621 unsigned int n1;
3622
3623 for (n1 = 0; n1 < i.operands; n1++)
3624 if (i.types[n1] & Imm)
3625 {
3626 if (i.types[n1] & (Imm8 | Imm8S | Imm16 | Imm64))
3627 {
3628 imm_size = 2;
3629 if (i.types[n1] & (Imm8 | Imm8S))
3630 imm_size = 1;
3631 if (i.types[n1] & Imm64)
3632 imm_size = 8;
3633 }
3634 break;
3635 }
3636 /* We should find the immediate. */
3637 if (n1 == i.operands)
3638 abort ();
3639 i.op[n].disps->X_add_number -= imm_size;
3640 }
3641
3642 if (i.types[n] & Disp32S)
3643 sign = 1;
3644
3645 if (i.types[n] & (Disp16 | Disp64))
3646 {
3647 size = 2;
3648 if (i.types[n] & Disp64)
3649 size = 8;
3650 }
3651
3652 p = frag_more (size);
3653 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
3654 if (GOT_symbol
3655 && GOT_symbol == i.op[n].disps->X_add_symbol
3656 && (((reloc_type == BFD_RELOC_32
3657 || reloc_type == BFD_RELOC_X86_64_32S)
3658 && (i.op[n].disps->X_op == O_symbol
3659 || (i.op[n].disps->X_op == O_add
3660 && ((symbol_get_value_expression
3661 (i.op[n].disps->X_op_symbol)->X_op)
3662 == O_subtract))))
3663 || reloc_type == BFD_RELOC_32_PCREL))
3664 {
3665 offsetT add;
3666
3667 if (insn_start_frag == frag_now)
3668 add = (p - frag_now->fr_literal) - insn_start_off;
3669 else
3670 {
3671 fragS *fr;
3672
3673 add = insn_start_frag->fr_fix - insn_start_off;
3674 for (fr = insn_start_frag->fr_next;
3675 fr && fr != frag_now; fr = fr->fr_next)
3676 add += fr->fr_fix;
3677 add += p - frag_now->fr_literal;
3678 }
3679
3680 if (!object_64bit)
3681 reloc_type = BFD_RELOC_386_GOTPC;
3682 else
3683 reloc_type = BFD_RELOC_X86_64_GOTPC32;
3684 i.op[n].disps->X_add_number += add;
3685 }
3686 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3687 i.op[n].disps, pcrel, reloc_type);
3688 }
3689 }
3690 }
3691 }
3692
3693 static void
3694 output_imm (insn_start_frag, insn_start_off)
3695 fragS *insn_start_frag;
3696 offsetT insn_start_off;
3697 {
3698 char *p;
3699 unsigned int n;
3700
3701 for (n = 0; n < i.operands; n++)
3702 {
3703 if (i.types[n] & Imm)
3704 {
3705 if (i.op[n].imms->X_op == O_constant)
3706 {
3707 int size;
3708 offsetT val;
3709
3710 size = 4;
3711 if (i.types[n] & (Imm8 | Imm8S | Imm16 | Imm64))
3712 {
3713 size = 2;
3714 if (i.types[n] & (Imm8 | Imm8S))
3715 size = 1;
3716 else if (i.types[n] & Imm64)
3717 size = 8;
3718 }
3719 val = offset_in_range (i.op[n].imms->X_add_number,
3720 size);
3721 p = frag_more (size);
3722 md_number_to_chars (p, val, size);
3723 }
3724 else
3725 {
3726 /* Not absolute_section.
3727 Need a 32-bit fixup (don't support 8bit
3728 non-absolute imms). Try to support other
3729 sizes ... */
3730 enum bfd_reloc_code_real reloc_type;
3731 int size = 4;
3732 int sign = 0;
3733
3734 if ((i.types[n] & (Imm32S))
3735 && (i.suffix == QWORD_MNEM_SUFFIX
3736 || (!i.suffix && (i.tm.opcode_modifier & No_lSuf))))
3737 sign = 1;
3738 if (i.types[n] & (Imm8 | Imm8S | Imm16 | Imm64))
3739 {
3740 size = 2;
3741 if (i.types[n] & (Imm8 | Imm8S))
3742 size = 1;
3743 if (i.types[n] & Imm64)
3744 size = 8;
3745 }
3746
3747 p = frag_more (size);
3748 reloc_type = reloc (size, 0, sign, i.reloc[n]);
3749
3750 /* This is tough to explain. We end up with this one if we
3751 * have operands that look like
3752 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
3753 * obtain the absolute address of the GOT, and it is strongly
3754 * preferable from a performance point of view to avoid using
3755 * a runtime relocation for this. The actual sequence of
3756 * instructions often look something like:
3757 *
3758 * call .L66
3759 * .L66:
3760 * popl %ebx
3761 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
3762 *
3763 * The call and pop essentially return the absolute address
3764 * of the label .L66 and store it in %ebx. The linker itself
3765 * will ultimately change the first operand of the addl so
3766 * that %ebx points to the GOT, but to keep things simple, the
3767 * .o file must have this operand set so that it generates not
3768 * the absolute address of .L66, but the absolute address of
3769 * itself. This allows the linker itself simply treat a GOTPC
3770 * relocation as asking for a pcrel offset to the GOT to be
3771 * added in, and the addend of the relocation is stored in the
3772 * operand field for the instruction itself.
3773 *
3774 * Our job here is to fix the operand so that it would add
3775 * the correct offset so that %ebx would point to itself. The
3776 * thing that is tricky is that .-.L66 will point to the
3777 * beginning of the instruction, so we need to further modify
3778 * the operand so that it will point to itself. There are
3779 * other cases where you have something like:
3780 *
3781 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
3782 *
3783 * and here no correction would be required. Internally in
3784 * the assembler we treat operands of this form as not being
3785 * pcrel since the '.' is explicitly mentioned, and I wonder
3786 * whether it would simplify matters to do it this way. Who
3787 * knows. In earlier versions of the PIC patches, the
3788 * pcrel_adjust field was used to store the correction, but
3789 * since the expression is not pcrel, I felt it would be
3790 * confusing to do it this way. */
3791
3792 if ((reloc_type == BFD_RELOC_32
3793 || reloc_type == BFD_RELOC_X86_64_32S)
3794 && GOT_symbol
3795 && GOT_symbol == i.op[n].imms->X_add_symbol
3796 && (i.op[n].imms->X_op == O_symbol
3797 || (i.op[n].imms->X_op == O_add
3798 && ((symbol_get_value_expression
3799 (i.op[n].imms->X_op_symbol)->X_op)
3800 == O_subtract))))
3801 {
3802 offsetT add;
3803
3804 if (insn_start_frag == frag_now)
3805 add = (p - frag_now->fr_literal) - insn_start_off;
3806 else
3807 {
3808 fragS *fr;
3809
3810 add = insn_start_frag->fr_fix - insn_start_off;
3811 for (fr = insn_start_frag->fr_next;
3812 fr && fr != frag_now; fr = fr->fr_next)
3813 add += fr->fr_fix;
3814 add += p - frag_now->fr_literal;
3815 }
3816
3817 if (!object_64bit)
3818 reloc_type = BFD_RELOC_386_GOTPC;
3819 else
3820 reloc_type = BFD_RELOC_X86_64_GOTPC32;
3821 i.op[n].imms->X_add_number += add;
3822 }
3823 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3824 i.op[n].imms, 0, reloc_type);
3825 }
3826 }
3827 }
3828 }
3829 \f
3830 /* x86_cons_fix_new is called via the expression parsing code when a
3831 reloc is needed. We use this hook to get the correct .got reloc. */
3832 static enum bfd_reloc_code_real got_reloc = NO_RELOC;
3833 static int cons_sign = -1;
3834
3835 void
3836 x86_cons_fix_new (fragS *frag,
3837 unsigned int off,
3838 unsigned int len,
3839 expressionS *exp)
3840 {
3841 enum bfd_reloc_code_real r = reloc (len, 0, cons_sign, got_reloc);
3842
3843 got_reloc = NO_RELOC;
3844
3845 #ifdef TE_PE
3846 if (exp->X_op == O_secrel)
3847 {
3848 exp->X_op = O_symbol;
3849 r = BFD_RELOC_32_SECREL;
3850 }
3851 #endif
3852
3853 fix_new_exp (frag, off, len, exp, 0, r);
3854 }
3855
3856 #if (!defined (OBJ_ELF) && !defined (OBJ_MAYBE_ELF)) || defined (LEX_AT)
3857 # define lex_got(reloc, adjust, types) NULL
3858 #else
3859 /* Parse operands of the form
3860 <symbol>@GOTOFF+<nnn>
3861 and similar .plt or .got references.
3862
3863 If we find one, set up the correct relocation in RELOC and copy the
3864 input string, minus the `@GOTOFF' into a malloc'd buffer for
3865 parsing by the calling routine. Return this buffer, and if ADJUST
3866 is non-null set it to the length of the string we removed from the
3867 input line. Otherwise return NULL. */
3868 static char *
3869 lex_got (enum bfd_reloc_code_real *reloc,
3870 int *adjust,
3871 unsigned int *types)
3872 {
3873 static const struct {
3874 const char *str;
3875 const enum bfd_reloc_code_real rel[2];
3876 const unsigned int types64;
3877 } gotrel[] = {
3878 { "PLT", { BFD_RELOC_386_PLT32, BFD_RELOC_X86_64_PLT32 }, Imm32|Imm32S|Disp32 },
3879 { "GOTOFF", { BFD_RELOC_386_GOTOFF, BFD_RELOC_X86_64_GOTOFF64 }, Imm64|Disp64 },
3880 { "GOTPCREL", { 0, BFD_RELOC_X86_64_GOTPCREL }, Imm32|Imm32S|Disp32 },
3881 { "TLSGD", { BFD_RELOC_386_TLS_GD, BFD_RELOC_X86_64_TLSGD }, Imm32|Imm32S|Disp32 },
3882 { "TLSLDM", { BFD_RELOC_386_TLS_LDM, 0 }, 0 },
3883 { "TLSLD", { 0, BFD_RELOC_X86_64_TLSLD }, Imm32|Imm32S|Disp32 },
3884 { "GOTTPOFF", { BFD_RELOC_386_TLS_IE_32, BFD_RELOC_X86_64_GOTTPOFF }, Imm32|Imm32S|Disp32 },
3885 { "TPOFF", { BFD_RELOC_386_TLS_LE_32, BFD_RELOC_X86_64_TPOFF32 }, Imm32|Imm32S|Imm64|Disp32|Disp64 },
3886 { "NTPOFF", { BFD_RELOC_386_TLS_LE, 0 }, 0 },
3887 { "DTPOFF", { BFD_RELOC_386_TLS_LDO_32, BFD_RELOC_X86_64_DTPOFF32 }, Imm32|Imm32S|Imm64|Disp32|Disp64 },
3888 { "GOTNTPOFF",{ BFD_RELOC_386_TLS_GOTIE, 0 }, 0 },
3889 { "INDNTPOFF",{ BFD_RELOC_386_TLS_IE, 0 }, 0 },
3890 { "GOT", { BFD_RELOC_386_GOT32, BFD_RELOC_X86_64_GOT32 }, Imm32|Imm32S|Disp32 },
3891 { "TLSDESC", { BFD_RELOC_386_TLS_GOTDESC, BFD_RELOC_X86_64_GOTPC32_TLSDESC }, Imm32|Imm32S|Disp32 },
3892 { "TLSCALL", { BFD_RELOC_386_TLS_DESC_CALL, BFD_RELOC_X86_64_TLSDESC_CALL }, Imm32|Imm32S|Disp32 }
3893 };
3894 char *cp;
3895 unsigned int j;
3896
3897 if (!IS_ELF)
3898 return NULL;
3899
3900 for (cp = input_line_pointer; *cp != '@'; cp++)
3901 if (is_end_of_line[(unsigned char) *cp])
3902 return NULL;
3903
3904 for (j = 0; j < sizeof (gotrel) / sizeof (gotrel[0]); j++)
3905 {
3906 int len;
3907
3908 len = strlen (gotrel[j].str);
3909 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
3910 {
3911 if (gotrel[j].rel[object_64bit] != 0)
3912 {
3913 int first, second;
3914 char *tmpbuf, *past_reloc;
3915
3916 *reloc = gotrel[j].rel[object_64bit];
3917 if (adjust)
3918 *adjust = len;
3919
3920 if (types)
3921 {
3922 if (flag_code != CODE_64BIT)
3923 *types = Imm32|Disp32;
3924 else
3925 *types = gotrel[j].types64;
3926 }
3927
3928 if (GOT_symbol == NULL)
3929 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
3930
3931 /* Replace the relocation token with ' ', so that
3932 errors like foo@GOTOFF1 will be detected. */
3933
3934 /* The length of the first part of our input line. */
3935 first = cp - input_line_pointer;
3936
3937 /* The second part goes from after the reloc token until
3938 (and including) an end_of_line char. Don't use strlen
3939 here as the end_of_line char may not be a NUL. */
3940 past_reloc = cp + 1 + len;
3941 for (cp = past_reloc; !is_end_of_line[(unsigned char) *cp++]; )
3942 ;
3943 second = cp - past_reloc;
3944
3945 /* Allocate and copy string. The trailing NUL shouldn't
3946 be necessary, but be safe. */
3947 tmpbuf = xmalloc (first + second + 2);
3948 memcpy (tmpbuf, input_line_pointer, first);
3949 tmpbuf[first] = ' ';
3950 memcpy (tmpbuf + first + 1, past_reloc, second);
3951 tmpbuf[first + second + 1] = '\0';
3952 return tmpbuf;
3953 }
3954
3955 as_bad (_("@%s reloc is not supported with %d-bit output format"),
3956 gotrel[j].str, 1 << (5 + object_64bit));
3957 return NULL;
3958 }
3959 }
3960
3961 /* Might be a symbol version string. Don't as_bad here. */
3962 return NULL;
3963 }
3964
3965 void
3966 x86_cons (exp, size)
3967 expressionS *exp;
3968 int size;
3969 {
3970 if (size == 4 || (object_64bit && size == 8))
3971 {
3972 /* Handle @GOTOFF and the like in an expression. */
3973 char *save;
3974 char *gotfree_input_line;
3975 int adjust;
3976
3977 save = input_line_pointer;
3978 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
3979 if (gotfree_input_line)
3980 input_line_pointer = gotfree_input_line;
3981
3982 expression (exp);
3983
3984 if (gotfree_input_line)
3985 {
3986 /* expression () has merrily parsed up to the end of line,
3987 or a comma - in the wrong buffer. Transfer how far
3988 input_line_pointer has moved to the right buffer. */
3989 input_line_pointer = (save
3990 + (input_line_pointer - gotfree_input_line)
3991 + adjust);
3992 free (gotfree_input_line);
3993 }
3994 }
3995 else
3996 expression (exp);
3997 }
3998 #endif
3999
4000 static void signed_cons (int size)
4001 {
4002 if (flag_code == CODE_64BIT)
4003 cons_sign = 1;
4004 cons (size);
4005 cons_sign = -1;
4006 }
4007
4008 #ifdef TE_PE
4009 static void
4010 pe_directive_secrel (dummy)
4011 int dummy ATTRIBUTE_UNUSED;
4012 {
4013 expressionS exp;
4014
4015 do
4016 {
4017 expression (&exp);
4018 if (exp.X_op == O_symbol)
4019 exp.X_op = O_secrel;
4020
4021 emit_expr (&exp, 4);
4022 }
4023 while (*input_line_pointer++ == ',');
4024
4025 input_line_pointer--;
4026 demand_empty_rest_of_line ();
4027 }
4028 #endif
4029
4030 static int i386_immediate PARAMS ((char *));
4031
4032 static int
4033 i386_immediate (imm_start)
4034 char *imm_start;
4035 {
4036 char *save_input_line_pointer;
4037 char *gotfree_input_line;
4038 segT exp_seg = 0;
4039 expressionS *exp;
4040 unsigned int types = ~0U;
4041
4042 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
4043 {
4044 as_bad (_("only 1 or 2 immediate operands are allowed"));
4045 return 0;
4046 }
4047
4048 exp = &im_expressions[i.imm_operands++];
4049 i.op[this_operand].imms = exp;
4050
4051 if (is_space_char (*imm_start))
4052 ++imm_start;
4053
4054 save_input_line_pointer = input_line_pointer;
4055 input_line_pointer = imm_start;
4056
4057 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
4058 if (gotfree_input_line)
4059 input_line_pointer = gotfree_input_line;
4060
4061 exp_seg = expression (exp);
4062
4063 SKIP_WHITESPACE ();
4064 if (*input_line_pointer)
4065 as_bad (_("junk `%s' after expression"), input_line_pointer);
4066
4067 input_line_pointer = save_input_line_pointer;
4068 if (gotfree_input_line)
4069 free (gotfree_input_line);
4070
4071 if (exp->X_op == O_absent || exp->X_op == O_big)
4072 {
4073 /* Missing or bad expr becomes absolute 0. */
4074 as_bad (_("missing or invalid immediate expression `%s' taken as 0"),
4075 imm_start);
4076 exp->X_op = O_constant;
4077 exp->X_add_number = 0;
4078 exp->X_add_symbol = (symbolS *) 0;
4079 exp->X_op_symbol = (symbolS *) 0;
4080 }
4081 else if (exp->X_op == O_constant)
4082 {
4083 /* Size it properly later. */
4084 i.types[this_operand] |= Imm64;
4085 /* If BFD64, sign extend val. */
4086 if (!use_rela_relocations)
4087 if ((exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
4088 exp->X_add_number = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
4089 }
4090 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
4091 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
4092 && exp_seg != absolute_section
4093 && exp_seg != text_section
4094 && exp_seg != data_section
4095 && exp_seg != bss_section
4096 && exp_seg != undefined_section
4097 && !bfd_is_com_section (exp_seg))
4098 {
4099 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
4100 return 0;
4101 }
4102 #endif
4103 else
4104 {
4105 /* This is an address. The size of the address will be
4106 determined later, depending on destination register,
4107 suffix, or the default for the section. */
4108 i.types[this_operand] |= Imm8 | Imm16 | Imm32 | Imm32S | Imm64;
4109 i.types[this_operand] &= types;
4110 }
4111
4112 return 1;
4113 }
4114
4115 static char *i386_scale PARAMS ((char *));
4116
4117 static char *
4118 i386_scale (scale)
4119 char *scale;
4120 {
4121 offsetT val;
4122 char *save = input_line_pointer;
4123
4124 input_line_pointer = scale;
4125 val = get_absolute_expression ();
4126
4127 switch (val)
4128 {
4129 case 1:
4130 i.log2_scale_factor = 0;
4131 break;
4132 case 2:
4133 i.log2_scale_factor = 1;
4134 break;
4135 case 4:
4136 i.log2_scale_factor = 2;
4137 break;
4138 case 8:
4139 i.log2_scale_factor = 3;
4140 break;
4141 default:
4142 {
4143 char sep = *input_line_pointer;
4144
4145 *input_line_pointer = '\0';
4146 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
4147 scale);
4148 *input_line_pointer = sep;
4149 input_line_pointer = save;
4150 return NULL;
4151 }
4152 }
4153 if (i.log2_scale_factor != 0 && i.index_reg == 0)
4154 {
4155 as_warn (_("scale factor of %d without an index register"),
4156 1 << i.log2_scale_factor);
4157 #if SCALE1_WHEN_NO_INDEX
4158 i.log2_scale_factor = 0;
4159 #endif
4160 }
4161 scale = input_line_pointer;
4162 input_line_pointer = save;
4163 return scale;
4164 }
4165
4166 static int i386_displacement PARAMS ((char *, char *));
4167
4168 static int
4169 i386_displacement (disp_start, disp_end)
4170 char *disp_start;
4171 char *disp_end;
4172 {
4173 expressionS *exp;
4174 segT exp_seg = 0;
4175 char *save_input_line_pointer;
4176 char *gotfree_input_line;
4177 int bigdisp, override;
4178 unsigned int types = Disp;
4179
4180 if ((i.types[this_operand] & JumpAbsolute)
4181 || !(current_templates->start->opcode_modifier & (Jump | JumpDword)))
4182 {
4183 bigdisp = Disp32;
4184 override = (i.prefix[ADDR_PREFIX] != 0);
4185 }
4186 else
4187 {
4188 /* For PC-relative branches, the width of the displacement
4189 is dependent upon data size, not address size. */
4190 bigdisp = 0;
4191 override = (i.prefix[DATA_PREFIX] != 0);
4192 }
4193 if (flag_code == CODE_64BIT)
4194 {
4195 if (!bigdisp)
4196 bigdisp = (override || i.suffix == WORD_MNEM_SUFFIX)
4197 ? Disp16
4198 : Disp32S | Disp32;
4199 else if (!override)
4200 bigdisp = Disp64 | Disp32S | Disp32;
4201 }
4202 else
4203 {
4204 if (!bigdisp)
4205 {
4206 if (!override)
4207 override = (i.suffix == (flag_code != CODE_16BIT
4208 ? WORD_MNEM_SUFFIX
4209 : LONG_MNEM_SUFFIX));
4210 bigdisp = Disp32;
4211 }
4212 if ((flag_code == CODE_16BIT) ^ override)
4213 bigdisp = Disp16;
4214 }
4215 i.types[this_operand] |= bigdisp;
4216
4217 exp = &disp_expressions[i.disp_operands];
4218 i.op[this_operand].disps = exp;
4219 i.disp_operands++;
4220 save_input_line_pointer = input_line_pointer;
4221 input_line_pointer = disp_start;
4222 END_STRING_AND_SAVE (disp_end);
4223
4224 #ifndef GCC_ASM_O_HACK
4225 #define GCC_ASM_O_HACK 0
4226 #endif
4227 #if GCC_ASM_O_HACK
4228 END_STRING_AND_SAVE (disp_end + 1);
4229 if ((i.types[this_operand] & BaseIndex) != 0
4230 && displacement_string_end[-1] == '+')
4231 {
4232 /* This hack is to avoid a warning when using the "o"
4233 constraint within gcc asm statements.
4234 For instance:
4235
4236 #define _set_tssldt_desc(n,addr,limit,type) \
4237 __asm__ __volatile__ ( \
4238 "movw %w2,%0\n\t" \
4239 "movw %w1,2+%0\n\t" \
4240 "rorl $16,%1\n\t" \
4241 "movb %b1,4+%0\n\t" \
4242 "movb %4,5+%0\n\t" \
4243 "movb $0,6+%0\n\t" \
4244 "movb %h1,7+%0\n\t" \
4245 "rorl $16,%1" \
4246 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
4247
4248 This works great except that the output assembler ends
4249 up looking a bit weird if it turns out that there is
4250 no offset. You end up producing code that looks like:
4251
4252 #APP
4253 movw $235,(%eax)
4254 movw %dx,2+(%eax)
4255 rorl $16,%edx
4256 movb %dl,4+(%eax)
4257 movb $137,5+(%eax)
4258 movb $0,6+(%eax)
4259 movb %dh,7+(%eax)
4260 rorl $16,%edx
4261 #NO_APP
4262
4263 So here we provide the missing zero. */
4264
4265 *displacement_string_end = '0';
4266 }
4267 #endif
4268 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
4269 if (gotfree_input_line)
4270 input_line_pointer = gotfree_input_line;
4271
4272 exp_seg = expression (exp);
4273
4274 SKIP_WHITESPACE ();
4275 if (*input_line_pointer)
4276 as_bad (_("junk `%s' after expression"), input_line_pointer);
4277 #if GCC_ASM_O_HACK
4278 RESTORE_END_STRING (disp_end + 1);
4279 #endif
4280 RESTORE_END_STRING (disp_end);
4281 input_line_pointer = save_input_line_pointer;
4282 if (gotfree_input_line)
4283 free (gotfree_input_line);
4284
4285 /* We do this to make sure that the section symbol is in
4286 the symbol table. We will ultimately change the relocation
4287 to be relative to the beginning of the section. */
4288 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
4289 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
4290 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
4291 {
4292 if (exp->X_op != O_symbol)
4293 {
4294 as_bad (_("bad expression used with @%s"),
4295 (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
4296 ? "GOTPCREL"
4297 : "GOTOFF"));
4298 return 0;
4299 }
4300
4301 if (S_IS_LOCAL (exp->X_add_symbol)
4302 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section)
4303 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
4304 exp->X_op = O_subtract;
4305 exp->X_op_symbol = GOT_symbol;
4306 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
4307 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
4308 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
4309 i.reloc[this_operand] = BFD_RELOC_64;
4310 else
4311 i.reloc[this_operand] = BFD_RELOC_32;
4312 }
4313
4314 if (exp->X_op == O_absent || exp->X_op == O_big)
4315 {
4316 /* Missing or bad expr becomes absolute 0. */
4317 as_bad (_("missing or invalid displacement expression `%s' taken as 0"),
4318 disp_start);
4319 exp->X_op = O_constant;
4320 exp->X_add_number = 0;
4321 exp->X_add_symbol = (symbolS *) 0;
4322 exp->X_op_symbol = (symbolS *) 0;
4323 }
4324
4325 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
4326 if (exp->X_op != O_constant
4327 && OUTPUT_FLAVOR == bfd_target_aout_flavour
4328 && exp_seg != absolute_section
4329 && exp_seg != text_section
4330 && exp_seg != data_section
4331 && exp_seg != bss_section
4332 && exp_seg != undefined_section
4333 && !bfd_is_com_section (exp_seg))
4334 {
4335 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
4336 return 0;
4337 }
4338 #endif
4339
4340 if (!(i.types[this_operand] & ~Disp))
4341 i.types[this_operand] &= types;
4342
4343 return 1;
4344 }
4345
4346 static int i386_index_check PARAMS ((const char *));
4347
4348 /* Make sure the memory operand we've been dealt is valid.
4349 Return 1 on success, 0 on a failure. */
4350
4351 static int
4352 i386_index_check (operand_string)
4353 const char *operand_string;
4354 {
4355 int ok;
4356 #if INFER_ADDR_PREFIX
4357 int fudged = 0;
4358
4359 tryprefix:
4360 #endif
4361 ok = 1;
4362 if ((current_templates->start->cpu_flags & CpuSVME)
4363 && current_templates->end[-1].operand_types[0] == AnyMem)
4364 {
4365 /* Memory operands of SVME insns are special in that they only allow
4366 rAX as their memory address and ignore any segment override. */
4367 unsigned RegXX;
4368
4369 /* SKINIT is even more restrictive: it always requires EAX. */
4370 if (strcmp (current_templates->start->name, "skinit") == 0)
4371 RegXX = Reg32;
4372 else if (flag_code == CODE_64BIT)
4373 RegXX = i.prefix[ADDR_PREFIX] == 0 ? Reg64 : Reg32;
4374 else
4375 RegXX = (flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0)
4376 ? Reg16
4377 : Reg32;
4378 if (!i.base_reg
4379 || !(i.base_reg->reg_type & Acc)
4380 || !(i.base_reg->reg_type & RegXX)
4381 || i.index_reg
4382 || (i.types[0] & Disp))
4383 ok = 0;
4384 }
4385 else if (flag_code == CODE_64BIT)
4386 {
4387 unsigned RegXX = (i.prefix[ADDR_PREFIX] == 0 ? Reg64 : Reg32);
4388
4389 if ((i.base_reg
4390 && ((i.base_reg->reg_type & RegXX) == 0)
4391 && (i.base_reg->reg_type != BaseIndex
4392 || i.index_reg))
4393 || (i.index_reg
4394 && ((i.index_reg->reg_type & (RegXX | BaseIndex))
4395 != (RegXX | BaseIndex))))
4396 ok = 0;
4397 }
4398 else
4399 {
4400 if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
4401 {
4402 /* 16bit checks. */
4403 if ((i.base_reg
4404 && ((i.base_reg->reg_type & (Reg16 | BaseIndex | RegRex))
4405 != (Reg16 | BaseIndex)))
4406 || (i.index_reg
4407 && (((i.index_reg->reg_type & (Reg16 | BaseIndex))
4408 != (Reg16 | BaseIndex))
4409 || !(i.base_reg
4410 && i.base_reg->reg_num < 6
4411 && i.index_reg->reg_num >= 6
4412 && i.log2_scale_factor == 0))))
4413 ok = 0;
4414 }
4415 else
4416 {
4417 /* 32bit checks. */
4418 if ((i.base_reg
4419 && (i.base_reg->reg_type & (Reg32 | RegRex)) != Reg32)
4420 || (i.index_reg
4421 && ((i.index_reg->reg_type & (Reg32 | BaseIndex | RegRex))
4422 != (Reg32 | BaseIndex))))
4423 ok = 0;
4424 }
4425 }
4426 if (!ok)
4427 {
4428 #if INFER_ADDR_PREFIX
4429 if (i.prefix[ADDR_PREFIX] == 0)
4430 {
4431 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
4432 i.prefixes += 1;
4433 /* Change the size of any displacement too. At most one of
4434 Disp16 or Disp32 is set.
4435 FIXME. There doesn't seem to be any real need for separate
4436 Disp16 and Disp32 flags. The same goes for Imm16 and Imm32.
4437 Removing them would probably clean up the code quite a lot. */
4438 if (flag_code != CODE_64BIT && (i.types[this_operand] & (Disp16 | Disp32)))
4439 i.types[this_operand] ^= (Disp16 | Disp32);
4440 fudged = 1;
4441 goto tryprefix;
4442 }
4443 if (fudged)
4444 as_bad (_("`%s' is not a valid base/index expression"),
4445 operand_string);
4446 else
4447 #endif
4448 as_bad (_("`%s' is not a valid %s bit base/index expression"),
4449 operand_string,
4450 flag_code_names[flag_code]);
4451 }
4452 return ok;
4453 }
4454
4455 /* Parse OPERAND_STRING into the i386_insn structure I. Returns non-zero
4456 on error. */
4457
4458 static int
4459 i386_operand (operand_string)
4460 char *operand_string;
4461 {
4462 const reg_entry *r;
4463 char *end_op;
4464 char *op_string = operand_string;
4465
4466 if (is_space_char (*op_string))
4467 ++op_string;
4468
4469 /* We check for an absolute prefix (differentiating,
4470 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
4471 if (*op_string == ABSOLUTE_PREFIX)
4472 {
4473 ++op_string;
4474 if (is_space_char (*op_string))
4475 ++op_string;
4476 i.types[this_operand] |= JumpAbsolute;
4477 }
4478
4479 /* Check if operand is a register. */
4480 if ((r = parse_register (op_string, &end_op)) != NULL)
4481 {
4482 /* Check for a segment override by searching for ':' after a
4483 segment register. */
4484 op_string = end_op;
4485 if (is_space_char (*op_string))
4486 ++op_string;
4487 if (*op_string == ':' && (r->reg_type & (SReg2 | SReg3)))
4488 {
4489 switch (r->reg_num)
4490 {
4491 case 0:
4492 i.seg[i.mem_operands] = &es;
4493 break;
4494 case 1:
4495 i.seg[i.mem_operands] = &cs;
4496 break;
4497 case 2:
4498 i.seg[i.mem_operands] = &ss;
4499 break;
4500 case 3:
4501 i.seg[i.mem_operands] = &ds;
4502 break;
4503 case 4:
4504 i.seg[i.mem_operands] = &fs;
4505 break;
4506 case 5:
4507 i.seg[i.mem_operands] = &gs;
4508 break;
4509 }
4510
4511 /* Skip the ':' and whitespace. */
4512 ++op_string;
4513 if (is_space_char (*op_string))
4514 ++op_string;
4515
4516 if (!is_digit_char (*op_string)
4517 && !is_identifier_char (*op_string)
4518 && *op_string != '('
4519 && *op_string != ABSOLUTE_PREFIX)
4520 {
4521 as_bad (_("bad memory operand `%s'"), op_string);
4522 return 0;
4523 }
4524 /* Handle case of %es:*foo. */
4525 if (*op_string == ABSOLUTE_PREFIX)
4526 {
4527 ++op_string;
4528 if (is_space_char (*op_string))
4529 ++op_string;
4530 i.types[this_operand] |= JumpAbsolute;
4531 }
4532 goto do_memory_reference;
4533 }
4534 if (*op_string)
4535 {
4536 as_bad (_("junk `%s' after register"), op_string);
4537 return 0;
4538 }
4539 i.types[this_operand] |= r->reg_type & ~BaseIndex;
4540 i.op[this_operand].regs = r;
4541 i.reg_operands++;
4542 }
4543 else if (*op_string == REGISTER_PREFIX)
4544 {
4545 as_bad (_("bad register name `%s'"), op_string);
4546 return 0;
4547 }
4548 else if (*op_string == IMMEDIATE_PREFIX)
4549 {
4550 ++op_string;
4551 if (i.types[this_operand] & JumpAbsolute)
4552 {
4553 as_bad (_("immediate operand illegal with absolute jump"));
4554 return 0;
4555 }
4556 if (!i386_immediate (op_string))
4557 return 0;
4558 }
4559 else if (is_digit_char (*op_string)
4560 || is_identifier_char (*op_string)
4561 || *op_string == '(')
4562 {
4563 /* This is a memory reference of some sort. */
4564 char *base_string;
4565
4566 /* Start and end of displacement string expression (if found). */
4567 char *displacement_string_start;
4568 char *displacement_string_end;
4569
4570 do_memory_reference:
4571 if ((i.mem_operands == 1
4572 && (current_templates->start->opcode_modifier & IsString) == 0)
4573 || i.mem_operands == 2)
4574 {
4575 as_bad (_("too many memory references for `%s'"),
4576 current_templates->start->name);
4577 return 0;
4578 }
4579
4580 /* Check for base index form. We detect the base index form by
4581 looking for an ')' at the end of the operand, searching
4582 for the '(' matching it, and finding a REGISTER_PREFIX or ','
4583 after the '('. */
4584 base_string = op_string + strlen (op_string);
4585
4586 --base_string;
4587 if (is_space_char (*base_string))
4588 --base_string;
4589
4590 /* If we only have a displacement, set-up for it to be parsed later. */
4591 displacement_string_start = op_string;
4592 displacement_string_end = base_string + 1;
4593
4594 if (*base_string == ')')
4595 {
4596 char *temp_string;
4597 unsigned int parens_balanced = 1;
4598 /* We've already checked that the number of left & right ()'s are
4599 equal, so this loop will not be infinite. */
4600 do
4601 {
4602 base_string--;
4603 if (*base_string == ')')
4604 parens_balanced++;
4605 if (*base_string == '(')
4606 parens_balanced--;
4607 }
4608 while (parens_balanced);
4609
4610 temp_string = base_string;
4611
4612 /* Skip past '(' and whitespace. */
4613 ++base_string;
4614 if (is_space_char (*base_string))
4615 ++base_string;
4616
4617 if (*base_string == ','
4618 || ((i.base_reg = parse_register (base_string, &end_op)) != NULL))
4619 {
4620 displacement_string_end = temp_string;
4621
4622 i.types[this_operand] |= BaseIndex;
4623
4624 if (i.base_reg)
4625 {
4626 base_string = end_op;
4627 if (is_space_char (*base_string))
4628 ++base_string;
4629 }
4630
4631 /* There may be an index reg or scale factor here. */
4632 if (*base_string == ',')
4633 {
4634 ++base_string;
4635 if (is_space_char (*base_string))
4636 ++base_string;
4637
4638 if ((i.index_reg = parse_register (base_string, &end_op)) != NULL)
4639 {
4640 base_string = end_op;
4641 if (is_space_char (*base_string))
4642 ++base_string;
4643 if (*base_string == ',')
4644 {
4645 ++base_string;
4646 if (is_space_char (*base_string))
4647 ++base_string;
4648 }
4649 else if (*base_string != ')')
4650 {
4651 as_bad (_("expecting `,' or `)' after index register in `%s'"),
4652 operand_string);
4653 return 0;
4654 }
4655 }
4656 else if (*base_string == REGISTER_PREFIX)
4657 {
4658 as_bad (_("bad register name `%s'"), base_string);
4659 return 0;
4660 }
4661
4662 /* Check for scale factor. */
4663 if (*base_string != ')')
4664 {
4665 char *end_scale = i386_scale (base_string);
4666
4667 if (!end_scale)
4668 return 0;
4669
4670 base_string = end_scale;
4671 if (is_space_char (*base_string))
4672 ++base_string;
4673 if (*base_string != ')')
4674 {
4675 as_bad (_("expecting `)' after scale factor in `%s'"),
4676 operand_string);
4677 return 0;
4678 }
4679 }
4680 else if (!i.index_reg)
4681 {
4682 as_bad (_("expecting index register or scale factor after `,'; got '%c'"),
4683 *base_string);
4684 return 0;
4685 }
4686 }
4687 else if (*base_string != ')')
4688 {
4689 as_bad (_("expecting `,' or `)' after base register in `%s'"),
4690 operand_string);
4691 return 0;
4692 }
4693 }
4694 else if (*base_string == REGISTER_PREFIX)
4695 {
4696 as_bad (_("bad register name `%s'"), base_string);
4697 return 0;
4698 }
4699 }
4700
4701 /* If there's an expression beginning the operand, parse it,
4702 assuming displacement_string_start and
4703 displacement_string_end are meaningful. */
4704 if (displacement_string_start != displacement_string_end)
4705 {
4706 if (!i386_displacement (displacement_string_start,
4707 displacement_string_end))
4708 return 0;
4709 }
4710
4711 /* Special case for (%dx) while doing input/output op. */
4712 if (i.base_reg
4713 && i.base_reg->reg_type == (Reg16 | InOutPortReg)
4714 && i.index_reg == 0
4715 && i.log2_scale_factor == 0
4716 && i.seg[i.mem_operands] == 0
4717 && (i.types[this_operand] & Disp) == 0)
4718 {
4719 i.types[this_operand] = InOutPortReg;
4720 return 1;
4721 }
4722
4723 if (i386_index_check (operand_string) == 0)
4724 return 0;
4725 i.mem_operands++;
4726 }
4727 else
4728 {
4729 /* It's not a memory operand; argh! */
4730 as_bad (_("invalid char %s beginning operand %d `%s'"),
4731 output_invalid (*op_string),
4732 this_operand + 1,
4733 op_string);
4734 return 0;
4735 }
4736 return 1; /* Normal return. */
4737 }
4738 \f
4739 /* md_estimate_size_before_relax()
4740
4741 Called just before relax() for rs_machine_dependent frags. The x86
4742 assembler uses these frags to handle variable size jump
4743 instructions.
4744
4745 Any symbol that is now undefined will not become defined.
4746 Return the correct fr_subtype in the frag.
4747 Return the initial "guess for variable size of frag" to caller.
4748 The guess is actually the growth beyond the fixed part. Whatever
4749 we do to grow the fixed or variable part contributes to our
4750 returned value. */
4751
4752 int
4753 md_estimate_size_before_relax (fragP, segment)
4754 fragS *fragP;
4755 segT segment;
4756 {
4757 /* We've already got fragP->fr_subtype right; all we have to do is
4758 check for un-relaxable symbols. On an ELF system, we can't relax
4759 an externally visible symbol, because it may be overridden by a
4760 shared library. */
4761 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
4762 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
4763 || (IS_ELF
4764 && (S_IS_EXTERNAL (fragP->fr_symbol)
4765 || S_IS_WEAK (fragP->fr_symbol)))
4766 #endif
4767 )
4768 {
4769 /* Symbol is undefined in this segment, or we need to keep a
4770 reloc so that weak symbols can be overridden. */
4771 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
4772 enum bfd_reloc_code_real reloc_type;
4773 unsigned char *opcode;
4774 int old_fr_fix;
4775
4776 if (fragP->fr_var != NO_RELOC)
4777 reloc_type = fragP->fr_var;
4778 else if (size == 2)
4779 reloc_type = BFD_RELOC_16_PCREL;
4780 else
4781 reloc_type = BFD_RELOC_32_PCREL;
4782
4783 old_fr_fix = fragP->fr_fix;
4784 opcode = (unsigned char *) fragP->fr_opcode;
4785
4786 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
4787 {
4788 case UNCOND_JUMP:
4789 /* Make jmp (0xeb) a (d)word displacement jump. */
4790 opcode[0] = 0xe9;
4791 fragP->fr_fix += size;
4792 fix_new (fragP, old_fr_fix, size,
4793 fragP->fr_symbol,
4794 fragP->fr_offset, 1,
4795 reloc_type);
4796 break;
4797
4798 case COND_JUMP86:
4799 if (size == 2
4800 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
4801 {
4802 /* Negate the condition, and branch past an
4803 unconditional jump. */
4804 opcode[0] ^= 1;
4805 opcode[1] = 3;
4806 /* Insert an unconditional jump. */
4807 opcode[2] = 0xe9;
4808 /* We added two extra opcode bytes, and have a two byte
4809 offset. */
4810 fragP->fr_fix += 2 + 2;
4811 fix_new (fragP, old_fr_fix + 2, 2,
4812 fragP->fr_symbol,
4813 fragP->fr_offset, 1,
4814 reloc_type);
4815 break;
4816 }
4817 /* Fall through. */
4818
4819 case COND_JUMP:
4820 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
4821 {
4822 fixS *fixP;
4823
4824 fragP->fr_fix += 1;
4825 fixP = fix_new (fragP, old_fr_fix, 1,
4826 fragP->fr_symbol,
4827 fragP->fr_offset, 1,
4828 BFD_RELOC_8_PCREL);
4829 fixP->fx_signed = 1;
4830 break;
4831 }
4832
4833 /* This changes the byte-displacement jump 0x7N
4834 to the (d)word-displacement jump 0x0f,0x8N. */
4835 opcode[1] = opcode[0] + 0x10;
4836 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4837 /* We've added an opcode byte. */
4838 fragP->fr_fix += 1 + size;
4839 fix_new (fragP, old_fr_fix + 1, size,
4840 fragP->fr_symbol,
4841 fragP->fr_offset, 1,
4842 reloc_type);
4843 break;
4844
4845 default:
4846 BAD_CASE (fragP->fr_subtype);
4847 break;
4848 }
4849 frag_wane (fragP);
4850 return fragP->fr_fix - old_fr_fix;
4851 }
4852
4853 /* Guess size depending on current relax state. Initially the relax
4854 state will correspond to a short jump and we return 1, because
4855 the variable part of the frag (the branch offset) is one byte
4856 long. However, we can relax a section more than once and in that
4857 case we must either set fr_subtype back to the unrelaxed state,
4858 or return the value for the appropriate branch. */
4859 return md_relax_table[fragP->fr_subtype].rlx_length;
4860 }
4861
4862 /* Called after relax() is finished.
4863
4864 In: Address of frag.
4865 fr_type == rs_machine_dependent.
4866 fr_subtype is what the address relaxed to.
4867
4868 Out: Any fixSs and constants are set up.
4869 Caller will turn frag into a ".space 0". */
4870
4871 void
4872 md_convert_frag (abfd, sec, fragP)
4873 bfd *abfd ATTRIBUTE_UNUSED;
4874 segT sec ATTRIBUTE_UNUSED;
4875 fragS *fragP;
4876 {
4877 unsigned char *opcode;
4878 unsigned char *where_to_put_displacement = NULL;
4879 offsetT target_address;
4880 offsetT opcode_address;
4881 unsigned int extension = 0;
4882 offsetT displacement_from_opcode_start;
4883
4884 opcode = (unsigned char *) fragP->fr_opcode;
4885
4886 /* Address we want to reach in file space. */
4887 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
4888
4889 /* Address opcode resides at in file space. */
4890 opcode_address = fragP->fr_address + fragP->fr_fix;
4891
4892 /* Displacement from opcode start to fill into instruction. */
4893 displacement_from_opcode_start = target_address - opcode_address;
4894
4895 if ((fragP->fr_subtype & BIG) == 0)
4896 {
4897 /* Don't have to change opcode. */
4898 extension = 1; /* 1 opcode + 1 displacement */
4899 where_to_put_displacement = &opcode[1];
4900 }
4901 else
4902 {
4903 if (no_cond_jump_promotion
4904 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
4905 as_warn_where (fragP->fr_file, fragP->fr_line, _("long jump required"));
4906
4907 switch (fragP->fr_subtype)
4908 {
4909 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
4910 extension = 4; /* 1 opcode + 4 displacement */
4911 opcode[0] = 0xe9;
4912 where_to_put_displacement = &opcode[1];
4913 break;
4914
4915 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
4916 extension = 2; /* 1 opcode + 2 displacement */
4917 opcode[0] = 0xe9;
4918 where_to_put_displacement = &opcode[1];
4919 break;
4920
4921 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
4922 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
4923 extension = 5; /* 2 opcode + 4 displacement */
4924 opcode[1] = opcode[0] + 0x10;
4925 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4926 where_to_put_displacement = &opcode[2];
4927 break;
4928
4929 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
4930 extension = 3; /* 2 opcode + 2 displacement */
4931 opcode[1] = opcode[0] + 0x10;
4932 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4933 where_to_put_displacement = &opcode[2];
4934 break;
4935
4936 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
4937 extension = 4;
4938 opcode[0] ^= 1;
4939 opcode[1] = 3;
4940 opcode[2] = 0xe9;
4941 where_to_put_displacement = &opcode[3];
4942 break;
4943
4944 default:
4945 BAD_CASE (fragP->fr_subtype);
4946 break;
4947 }
4948 }
4949
4950 /* Now put displacement after opcode. */
4951 md_number_to_chars ((char *) where_to_put_displacement,
4952 (valueT) (displacement_from_opcode_start - extension),
4953 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
4954 fragP->fr_fix += extension;
4955 }
4956 \f
4957 /* Size of byte displacement jmp. */
4958 int md_short_jump_size = 2;
4959
4960 /* Size of dword displacement jmp. */
4961 int md_long_jump_size = 5;
4962
4963 void
4964 md_create_short_jump (ptr, from_addr, to_addr, frag, to_symbol)
4965 char *ptr;
4966 addressT from_addr, to_addr;
4967 fragS *frag ATTRIBUTE_UNUSED;
4968 symbolS *to_symbol ATTRIBUTE_UNUSED;
4969 {
4970 offsetT offset;
4971
4972 offset = to_addr - (from_addr + 2);
4973 /* Opcode for byte-disp jump. */
4974 md_number_to_chars (ptr, (valueT) 0xeb, 1);
4975 md_number_to_chars (ptr + 1, (valueT) offset, 1);
4976 }
4977
4978 void
4979 md_create_long_jump (ptr, from_addr, to_addr, frag, to_symbol)
4980 char *ptr;
4981 addressT from_addr, to_addr;
4982 fragS *frag ATTRIBUTE_UNUSED;
4983 symbolS *to_symbol ATTRIBUTE_UNUSED;
4984 {
4985 offsetT offset;
4986
4987 offset = to_addr - (from_addr + 5);
4988 md_number_to_chars (ptr, (valueT) 0xe9, 1);
4989 md_number_to_chars (ptr + 1, (valueT) offset, 4);
4990 }
4991 \f
4992 /* Apply a fixup (fixS) to segment data, once it has been determined
4993 by our caller that we have all the info we need to fix it up.
4994
4995 On the 386, immediates, displacements, and data pointers are all in
4996 the same (little-endian) format, so we don't need to care about which
4997 we are handling. */
4998
4999 void
5000 md_apply_fix (fixP, valP, seg)
5001 /* The fix we're to put in. */
5002 fixS *fixP;
5003 /* Pointer to the value of the bits. */
5004 valueT *valP;
5005 /* Segment fix is from. */
5006 segT seg ATTRIBUTE_UNUSED;
5007 {
5008 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
5009 valueT value = *valP;
5010
5011 #if !defined (TE_Mach)
5012 if (fixP->fx_pcrel)
5013 {
5014 switch (fixP->fx_r_type)
5015 {
5016 default:
5017 break;
5018
5019 case BFD_RELOC_64:
5020 fixP->fx_r_type = BFD_RELOC_64_PCREL;
5021 break;
5022 case BFD_RELOC_32:
5023 case BFD_RELOC_X86_64_32S:
5024 fixP->fx_r_type = BFD_RELOC_32_PCREL;
5025 break;
5026 case BFD_RELOC_16:
5027 fixP->fx_r_type = BFD_RELOC_16_PCREL;
5028 break;
5029 case BFD_RELOC_8:
5030 fixP->fx_r_type = BFD_RELOC_8_PCREL;
5031 break;
5032 }
5033 }
5034
5035 if (fixP->fx_addsy != NULL
5036 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
5037 || fixP->fx_r_type == BFD_RELOC_64_PCREL
5038 || fixP->fx_r_type == BFD_RELOC_16_PCREL
5039 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
5040 && !use_rela_relocations)
5041 {
5042 /* This is a hack. There should be a better way to handle this.
5043 This covers for the fact that bfd_install_relocation will
5044 subtract the current location (for partial_inplace, PC relative
5045 relocations); see more below. */
5046 #ifndef OBJ_AOUT
5047 if (IS_ELF
5048 #ifdef TE_PE
5049 || OUTPUT_FLAVOR == bfd_target_coff_flavour
5050 #endif
5051 )
5052 value += fixP->fx_where + fixP->fx_frag->fr_address;
5053 #endif
5054 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5055 if (IS_ELF)
5056 {
5057 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
5058
5059 if ((sym_seg == seg
5060 || (symbol_section_p (fixP->fx_addsy)
5061 && sym_seg != absolute_section))
5062 && !generic_force_reloc (fixP))
5063 {
5064 /* Yes, we add the values in twice. This is because
5065 bfd_install_relocation subtracts them out again. I think
5066 bfd_install_relocation is broken, but I don't dare change
5067 it. FIXME. */
5068 value += fixP->fx_where + fixP->fx_frag->fr_address;
5069 }
5070 }
5071 #endif
5072 #if defined (OBJ_COFF) && defined (TE_PE)
5073 /* For some reason, the PE format does not store a
5074 section address offset for a PC relative symbol. */
5075 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
5076 || S_IS_WEAK (fixP->fx_addsy))
5077 value += md_pcrel_from (fixP);
5078 #endif
5079 }
5080
5081 /* Fix a few things - the dynamic linker expects certain values here,
5082 and we must not disappoint it. */
5083 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5084 if (IS_ELF && fixP->fx_addsy)
5085 switch (fixP->fx_r_type)
5086 {
5087 case BFD_RELOC_386_PLT32:
5088 case BFD_RELOC_X86_64_PLT32:
5089 /* Make the jump instruction point to the address of the operand. At
5090 runtime we merely add the offset to the actual PLT entry. */
5091 value = -4;
5092 break;
5093
5094 case BFD_RELOC_386_TLS_GD:
5095 case BFD_RELOC_386_TLS_LDM:
5096 case BFD_RELOC_386_TLS_IE_32:
5097 case BFD_RELOC_386_TLS_IE:
5098 case BFD_RELOC_386_TLS_GOTIE:
5099 case BFD_RELOC_386_TLS_GOTDESC:
5100 case BFD_RELOC_X86_64_TLSGD:
5101 case BFD_RELOC_X86_64_TLSLD:
5102 case BFD_RELOC_X86_64_GOTTPOFF:
5103 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5104 value = 0; /* Fully resolved at runtime. No addend. */
5105 /* Fallthrough */
5106 case BFD_RELOC_386_TLS_LE:
5107 case BFD_RELOC_386_TLS_LDO_32:
5108 case BFD_RELOC_386_TLS_LE_32:
5109 case BFD_RELOC_X86_64_DTPOFF32:
5110 case BFD_RELOC_X86_64_DTPOFF64:
5111 case BFD_RELOC_X86_64_TPOFF32:
5112 case BFD_RELOC_X86_64_TPOFF64:
5113 S_SET_THREAD_LOCAL (fixP->fx_addsy);
5114 break;
5115
5116 case BFD_RELOC_386_TLS_DESC_CALL:
5117 case BFD_RELOC_X86_64_TLSDESC_CALL:
5118 value = 0; /* Fully resolved at runtime. No addend. */
5119 S_SET_THREAD_LOCAL (fixP->fx_addsy);
5120 fixP->fx_done = 0;
5121 return;
5122
5123 case BFD_RELOC_386_GOT32:
5124 case BFD_RELOC_X86_64_GOT32:
5125 value = 0; /* Fully resolved at runtime. No addend. */
5126 break;
5127
5128 case BFD_RELOC_VTABLE_INHERIT:
5129 case BFD_RELOC_VTABLE_ENTRY:
5130 fixP->fx_done = 0;
5131 return;
5132
5133 default:
5134 break;
5135 }
5136 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
5137 *valP = value;
5138 #endif /* !defined (TE_Mach) */
5139
5140 /* Are we finished with this relocation now? */
5141 if (fixP->fx_addsy == NULL)
5142 fixP->fx_done = 1;
5143 else if (use_rela_relocations)
5144 {
5145 fixP->fx_no_overflow = 1;
5146 /* Remember value for tc_gen_reloc. */
5147 fixP->fx_addnumber = value;
5148 value = 0;
5149 }
5150
5151 md_number_to_chars (p, value, fixP->fx_size);
5152 }
5153 \f
5154 #define MAX_LITTLENUMS 6
5155
5156 /* Turn the string pointed to by litP into a floating point constant
5157 of type TYPE, and emit the appropriate bytes. The number of
5158 LITTLENUMS emitted is stored in *SIZEP. An error message is
5159 returned, or NULL on OK. */
5160
5161 char *
5162 md_atof (type, litP, sizeP)
5163 int type;
5164 char *litP;
5165 int *sizeP;
5166 {
5167 int prec;
5168 LITTLENUM_TYPE words[MAX_LITTLENUMS];
5169 LITTLENUM_TYPE *wordP;
5170 char *t;
5171
5172 switch (type)
5173 {
5174 case 'f':
5175 case 'F':
5176 prec = 2;
5177 break;
5178
5179 case 'd':
5180 case 'D':
5181 prec = 4;
5182 break;
5183
5184 case 'x':
5185 case 'X':
5186 prec = 5;
5187 break;
5188
5189 default:
5190 *sizeP = 0;
5191 return _("Bad call to md_atof ()");
5192 }
5193 t = atof_ieee (input_line_pointer, type, words);
5194 if (t)
5195 input_line_pointer = t;
5196
5197 *sizeP = prec * sizeof (LITTLENUM_TYPE);
5198 /* This loops outputs the LITTLENUMs in REVERSE order; in accord with
5199 the bigendian 386. */
5200 for (wordP = words + prec - 1; prec--;)
5201 {
5202 md_number_to_chars (litP, (valueT) (*wordP--), sizeof (LITTLENUM_TYPE));
5203 litP += sizeof (LITTLENUM_TYPE);
5204 }
5205 return 0;
5206 }
5207 \f
5208 static char output_invalid_buf[8];
5209
5210 static char *
5211 output_invalid (c)
5212 int c;
5213 {
5214 if (ISPRINT (c))
5215 sprintf (output_invalid_buf, "'%c'", c);
5216 else
5217 sprintf (output_invalid_buf, "(0x%x)", (unsigned) c);
5218 return output_invalid_buf;
5219 }
5220
5221 /* REG_STRING starts *before* REGISTER_PREFIX. */
5222
5223 static const reg_entry *
5224 parse_real_register (char *reg_string, char **end_op)
5225 {
5226 char *s = reg_string;
5227 char *p;
5228 char reg_name_given[MAX_REG_NAME_SIZE + 1];
5229 const reg_entry *r;
5230
5231 /* Skip possible REGISTER_PREFIX and possible whitespace. */
5232 if (*s == REGISTER_PREFIX)
5233 ++s;
5234
5235 if (is_space_char (*s))
5236 ++s;
5237
5238 p = reg_name_given;
5239 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
5240 {
5241 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
5242 return (const reg_entry *) NULL;
5243 s++;
5244 }
5245
5246 /* For naked regs, make sure that we are not dealing with an identifier.
5247 This prevents confusing an identifier like `eax_var' with register
5248 `eax'. */
5249 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
5250 return (const reg_entry *) NULL;
5251
5252 *end_op = s;
5253
5254 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
5255
5256 /* Handle floating point regs, allowing spaces in the (i) part. */
5257 if (r == i386_regtab /* %st is first entry of table */)
5258 {
5259 if (is_space_char (*s))
5260 ++s;
5261 if (*s == '(')
5262 {
5263 ++s;
5264 if (is_space_char (*s))
5265 ++s;
5266 if (*s >= '0' && *s <= '7')
5267 {
5268 r = &i386_float_regtab[*s - '0'];
5269 ++s;
5270 if (is_space_char (*s))
5271 ++s;
5272 if (*s == ')')
5273 {
5274 *end_op = s + 1;
5275 return r;
5276 }
5277 }
5278 /* We have "%st(" then garbage. */
5279 return (const reg_entry *) NULL;
5280 }
5281 }
5282
5283 if (r != NULL
5284 && ((r->reg_flags & (RegRex64 | RegRex)) | (r->reg_type & Reg64)) != 0
5285 && (r->reg_type != Control || !(cpu_arch_flags & CpuSledgehammer))
5286 && flag_code != CODE_64BIT)
5287 return (const reg_entry *) NULL;
5288
5289 return r;
5290 }
5291
5292 /* REG_STRING starts *before* REGISTER_PREFIX. */
5293
5294 static const reg_entry *
5295 parse_register (char *reg_string, char **end_op)
5296 {
5297 const reg_entry *r;
5298
5299 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
5300 r = parse_real_register (reg_string, end_op);
5301 else
5302 r = NULL;
5303 if (!r)
5304 {
5305 char *save = input_line_pointer;
5306 char c;
5307 symbolS *symbolP;
5308
5309 input_line_pointer = reg_string;
5310 c = get_symbol_end ();
5311 symbolP = symbol_find (reg_string);
5312 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
5313 {
5314 const expressionS *e = symbol_get_value_expression (symbolP);
5315
5316 know (e->X_op == O_register);
5317 know (e->X_add_number >= 0 && (valueT) e->X_add_number < ARRAY_SIZE (i386_regtab));
5318 r = i386_regtab + e->X_add_number;
5319 *end_op = input_line_pointer;
5320 }
5321 *input_line_pointer = c;
5322 input_line_pointer = save;
5323 }
5324 return r;
5325 }
5326
5327 int
5328 i386_parse_name (char *name, expressionS *e, char *nextcharP)
5329 {
5330 const reg_entry *r;
5331 char *end = input_line_pointer;
5332
5333 *end = *nextcharP;
5334 r = parse_register (name, &input_line_pointer);
5335 if (r && end <= input_line_pointer)
5336 {
5337 *nextcharP = *input_line_pointer;
5338 *input_line_pointer = 0;
5339 e->X_op = O_register;
5340 e->X_add_number = r - i386_regtab;
5341 return 1;
5342 }
5343 input_line_pointer = end;
5344 *end = 0;
5345 return 0;
5346 }
5347
5348 void
5349 md_operand (expressionS *e)
5350 {
5351 if (*input_line_pointer == REGISTER_PREFIX)
5352 {
5353 char *end;
5354 const reg_entry *r = parse_real_register (input_line_pointer, &end);
5355
5356 if (r)
5357 {
5358 e->X_op = O_register;
5359 e->X_add_number = r - i386_regtab;
5360 input_line_pointer = end;
5361 }
5362 }
5363 }
5364
5365 \f
5366 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5367 const char *md_shortopts = "kVQ:sqn";
5368 #else
5369 const char *md_shortopts = "qn";
5370 #endif
5371
5372 #define OPTION_32 (OPTION_MD_BASE + 0)
5373 #define OPTION_64 (OPTION_MD_BASE + 1)
5374 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
5375
5376 struct option md_longopts[] = {
5377 {"32", no_argument, NULL, OPTION_32},
5378 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5379 {"64", no_argument, NULL, OPTION_64},
5380 #endif
5381 {"divide", no_argument, NULL, OPTION_DIVIDE},
5382 {NULL, no_argument, NULL, 0}
5383 };
5384 size_t md_longopts_size = sizeof (md_longopts);
5385
5386 int
5387 md_parse_option (c, arg)
5388 int c;
5389 char *arg ATTRIBUTE_UNUSED;
5390 {
5391 switch (c)
5392 {
5393 case 'n':
5394 optimize_align_code = 0;
5395 break;
5396
5397 case 'q':
5398 quiet_warnings = 1;
5399 break;
5400
5401 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5402 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
5403 should be emitted or not. FIXME: Not implemented. */
5404 case 'Q':
5405 break;
5406
5407 /* -V: SVR4 argument to print version ID. */
5408 case 'V':
5409 print_version_id ();
5410 break;
5411
5412 /* -k: Ignore for FreeBSD compatibility. */
5413 case 'k':
5414 break;
5415
5416 case 's':
5417 /* -s: On i386 Solaris, this tells the native assembler to use
5418 .stab instead of .stab.excl. We always use .stab anyhow. */
5419 break;
5420
5421 case OPTION_64:
5422 {
5423 const char **list, **l;
5424
5425 list = bfd_target_list ();
5426 for (l = list; *l != NULL; l++)
5427 if (strcmp (*l, "elf64-x86-64") == 0)
5428 {
5429 default_arch = "x86_64";
5430 break;
5431 }
5432 if (*l == NULL)
5433 as_fatal (_("No compiled in support for x86_64"));
5434 free (list);
5435 }
5436 break;
5437 #endif
5438
5439 case OPTION_32:
5440 default_arch = "i386";
5441 break;
5442
5443 case OPTION_DIVIDE:
5444 #ifdef SVR4_COMMENT_CHARS
5445 {
5446 char *n, *t;
5447 const char *s;
5448
5449 n = (char *) xmalloc (strlen (i386_comment_chars) + 1);
5450 t = n;
5451 for (s = i386_comment_chars; *s != '\0'; s++)
5452 if (*s != '/')
5453 *t++ = *s;
5454 *t = '\0';
5455 i386_comment_chars = n;
5456 }
5457 #endif
5458 break;
5459
5460 default:
5461 return 0;
5462 }
5463 return 1;
5464 }
5465
5466 void
5467 md_show_usage (stream)
5468 FILE *stream;
5469 {
5470 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5471 fprintf (stream, _("\
5472 -Q ignored\n\
5473 -V print assembler version number\n\
5474 -k ignored\n"));
5475 #endif
5476 fprintf (stream, _("\
5477 -n Do not optimize code alignment\n\
5478 -q quieten some warnings\n"));
5479 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5480 fprintf (stream, _("\
5481 -s ignored\n"));
5482 #endif
5483 #ifdef SVR4_COMMENT_CHARS
5484 fprintf (stream, _("\
5485 --divide do not treat `/' as a comment character\n"));
5486 #else
5487 fprintf (stream, _("\
5488 --divide ignored\n"));
5489 #endif
5490 }
5491
5492 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
5493 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
5494
5495 /* Pick the target format to use. */
5496
5497 const char *
5498 i386_target_format ()
5499 {
5500 if (!strcmp (default_arch, "x86_64"))
5501 set_code_flag (CODE_64BIT);
5502 else if (!strcmp (default_arch, "i386"))
5503 set_code_flag (CODE_32BIT);
5504 else
5505 as_fatal (_("Unknown architecture"));
5506 switch (OUTPUT_FLAVOR)
5507 {
5508 #ifdef OBJ_MAYBE_AOUT
5509 case bfd_target_aout_flavour:
5510 return AOUT_TARGET_FORMAT;
5511 #endif
5512 #ifdef OBJ_MAYBE_COFF
5513 case bfd_target_coff_flavour:
5514 return "coff-i386";
5515 #endif
5516 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
5517 case bfd_target_elf_flavour:
5518 {
5519 if (flag_code == CODE_64BIT)
5520 {
5521 object_64bit = 1;
5522 use_rela_relocations = 1;
5523 }
5524 return flag_code == CODE_64BIT ? "elf64-x86-64" : ELF_TARGET_FORMAT;
5525 }
5526 #endif
5527 default:
5528 abort ();
5529 return NULL;
5530 }
5531 }
5532
5533 #endif /* OBJ_MAYBE_ more than one */
5534
5535 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
5536 void i386_elf_emit_arch_note ()
5537 {
5538 if (IS_ELF && cpu_arch_name != NULL)
5539 {
5540 char *p;
5541 asection *seg = now_seg;
5542 subsegT subseg = now_subseg;
5543 Elf_Internal_Note i_note;
5544 Elf_External_Note e_note;
5545 asection *note_secp;
5546 int len;
5547
5548 /* Create the .note section. */
5549 note_secp = subseg_new (".note", 0);
5550 bfd_set_section_flags (stdoutput,
5551 note_secp,
5552 SEC_HAS_CONTENTS | SEC_READONLY);
5553
5554 /* Process the arch string. */
5555 len = strlen (cpu_arch_name);
5556
5557 i_note.namesz = len + 1;
5558 i_note.descsz = 0;
5559 i_note.type = NT_ARCH;
5560 p = frag_more (sizeof (e_note.namesz));
5561 md_number_to_chars (p, (valueT) i_note.namesz, sizeof (e_note.namesz));
5562 p = frag_more (sizeof (e_note.descsz));
5563 md_number_to_chars (p, (valueT) i_note.descsz, sizeof (e_note.descsz));
5564 p = frag_more (sizeof (e_note.type));
5565 md_number_to_chars (p, (valueT) i_note.type, sizeof (e_note.type));
5566 p = frag_more (len + 1);
5567 strcpy (p, cpu_arch_name);
5568
5569 frag_align (2, 0, 0);
5570
5571 subseg_set (seg, subseg);
5572 }
5573 }
5574 #endif
5575 \f
5576 symbolS *
5577 md_undefined_symbol (name)
5578 char *name;
5579 {
5580 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
5581 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
5582 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
5583 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
5584 {
5585 if (!GOT_symbol)
5586 {
5587 if (symbol_find (name))
5588 as_bad (_("GOT already in symbol table"));
5589 GOT_symbol = symbol_new (name, undefined_section,
5590 (valueT) 0, &zero_address_frag);
5591 };
5592 return GOT_symbol;
5593 }
5594 return 0;
5595 }
5596
5597 /* Round up a section size to the appropriate boundary. */
5598
5599 valueT
5600 md_section_align (segment, size)
5601 segT segment ATTRIBUTE_UNUSED;
5602 valueT size;
5603 {
5604 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
5605 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
5606 {
5607 /* For a.out, force the section size to be aligned. If we don't do
5608 this, BFD will align it for us, but it will not write out the
5609 final bytes of the section. This may be a bug in BFD, but it is
5610 easier to fix it here since that is how the other a.out targets
5611 work. */
5612 int align;
5613
5614 align = bfd_get_section_alignment (stdoutput, segment);
5615 size = ((size + (1 << align) - 1) & ((valueT) -1 << align));
5616 }
5617 #endif
5618
5619 return size;
5620 }
5621
5622 /* On the i386, PC-relative offsets are relative to the start of the
5623 next instruction. That is, the address of the offset, plus its
5624 size, since the offset is always the last part of the insn. */
5625
5626 long
5627 md_pcrel_from (fixP)
5628 fixS *fixP;
5629 {
5630 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
5631 }
5632
5633 #ifndef I386COFF
5634
5635 static void
5636 s_bss (ignore)
5637 int ignore ATTRIBUTE_UNUSED;
5638 {
5639 int temp;
5640
5641 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5642 if (IS_ELF)
5643 obj_elf_section_change_hook ();
5644 #endif
5645 temp = get_absolute_expression ();
5646 subseg_set (bss_section, (subsegT) temp);
5647 demand_empty_rest_of_line ();
5648 }
5649
5650 #endif
5651
5652 void
5653 i386_validate_fix (fixp)
5654 fixS *fixp;
5655 {
5656 if (fixp->fx_subsy && fixp->fx_subsy == GOT_symbol)
5657 {
5658 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
5659 {
5660 if (!object_64bit)
5661 abort ();
5662 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
5663 }
5664 else
5665 {
5666 if (!object_64bit)
5667 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
5668 else
5669 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
5670 }
5671 fixp->fx_subsy = 0;
5672 }
5673 }
5674
5675 arelent *
5676 tc_gen_reloc (section, fixp)
5677 asection *section ATTRIBUTE_UNUSED;
5678 fixS *fixp;
5679 {
5680 arelent *rel;
5681 bfd_reloc_code_real_type code;
5682
5683 switch (fixp->fx_r_type)
5684 {
5685 case BFD_RELOC_X86_64_PLT32:
5686 case BFD_RELOC_X86_64_GOT32:
5687 case BFD_RELOC_X86_64_GOTPCREL:
5688 case BFD_RELOC_386_PLT32:
5689 case BFD_RELOC_386_GOT32:
5690 case BFD_RELOC_386_GOTOFF:
5691 case BFD_RELOC_386_GOTPC:
5692 case BFD_RELOC_386_TLS_GD:
5693 case BFD_RELOC_386_TLS_LDM:
5694 case BFD_RELOC_386_TLS_LDO_32:
5695 case BFD_RELOC_386_TLS_IE_32:
5696 case BFD_RELOC_386_TLS_IE:
5697 case BFD_RELOC_386_TLS_GOTIE:
5698 case BFD_RELOC_386_TLS_LE_32:
5699 case BFD_RELOC_386_TLS_LE:
5700 case BFD_RELOC_386_TLS_GOTDESC:
5701 case BFD_RELOC_386_TLS_DESC_CALL:
5702 case BFD_RELOC_X86_64_TLSGD:
5703 case BFD_RELOC_X86_64_TLSLD:
5704 case BFD_RELOC_X86_64_DTPOFF32:
5705 case BFD_RELOC_X86_64_DTPOFF64:
5706 case BFD_RELOC_X86_64_GOTTPOFF:
5707 case BFD_RELOC_X86_64_TPOFF32:
5708 case BFD_RELOC_X86_64_TPOFF64:
5709 case BFD_RELOC_X86_64_GOTOFF64:
5710 case BFD_RELOC_X86_64_GOTPC32:
5711 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5712 case BFD_RELOC_X86_64_TLSDESC_CALL:
5713 case BFD_RELOC_RVA:
5714 case BFD_RELOC_VTABLE_ENTRY:
5715 case BFD_RELOC_VTABLE_INHERIT:
5716 #ifdef TE_PE
5717 case BFD_RELOC_32_SECREL:
5718 #endif
5719 code = fixp->fx_r_type;
5720 break;
5721 case BFD_RELOC_X86_64_32S:
5722 if (!fixp->fx_pcrel)
5723 {
5724 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
5725 code = fixp->fx_r_type;
5726 break;
5727 }
5728 default:
5729 if (fixp->fx_pcrel)
5730 {
5731 switch (fixp->fx_size)
5732 {
5733 default:
5734 as_bad_where (fixp->fx_file, fixp->fx_line,
5735 _("can not do %d byte pc-relative relocation"),
5736 fixp->fx_size);
5737 code = BFD_RELOC_32_PCREL;
5738 break;
5739 case 1: code = BFD_RELOC_8_PCREL; break;
5740 case 2: code = BFD_RELOC_16_PCREL; break;
5741 case 4: code = BFD_RELOC_32_PCREL; break;
5742 #ifdef BFD64
5743 case 8: code = BFD_RELOC_64_PCREL; break;
5744 #endif
5745 }
5746 }
5747 else
5748 {
5749 switch (fixp->fx_size)
5750 {
5751 default:
5752 as_bad_where (fixp->fx_file, fixp->fx_line,
5753 _("can not do %d byte relocation"),
5754 fixp->fx_size);
5755 code = BFD_RELOC_32;
5756 break;
5757 case 1: code = BFD_RELOC_8; break;
5758 case 2: code = BFD_RELOC_16; break;
5759 case 4: code = BFD_RELOC_32; break;
5760 #ifdef BFD64
5761 case 8: code = BFD_RELOC_64; break;
5762 #endif
5763 }
5764 }
5765 break;
5766 }
5767
5768 if ((code == BFD_RELOC_32
5769 || code == BFD_RELOC_32_PCREL
5770 || code == BFD_RELOC_X86_64_32S)
5771 && GOT_symbol
5772 && fixp->fx_addsy == GOT_symbol)
5773 {
5774 if (!object_64bit)
5775 code = BFD_RELOC_386_GOTPC;
5776 else
5777 code = BFD_RELOC_X86_64_GOTPC32;
5778 }
5779
5780 rel = (arelent *) xmalloc (sizeof (arelent));
5781 rel->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
5782 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
5783
5784 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
5785
5786 if (!use_rela_relocations)
5787 {
5788 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
5789 vtable entry to be used in the relocation's section offset. */
5790 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
5791 rel->address = fixp->fx_offset;
5792
5793 rel->addend = 0;
5794 }
5795 /* Use the rela in 64bit mode. */
5796 else
5797 {
5798 if (!fixp->fx_pcrel)
5799 rel->addend = fixp->fx_offset;
5800 else
5801 switch (code)
5802 {
5803 case BFD_RELOC_X86_64_PLT32:
5804 case BFD_RELOC_X86_64_GOT32:
5805 case BFD_RELOC_X86_64_GOTPCREL:
5806 case BFD_RELOC_X86_64_TLSGD:
5807 case BFD_RELOC_X86_64_TLSLD:
5808 case BFD_RELOC_X86_64_GOTTPOFF:
5809 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5810 case BFD_RELOC_X86_64_TLSDESC_CALL:
5811 rel->addend = fixp->fx_offset - fixp->fx_size;
5812 break;
5813 default:
5814 rel->addend = (section->vma
5815 - fixp->fx_size
5816 + fixp->fx_addnumber
5817 + md_pcrel_from (fixp));
5818 break;
5819 }
5820 }
5821
5822 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
5823 if (rel->howto == NULL)
5824 {
5825 as_bad_where (fixp->fx_file, fixp->fx_line,
5826 _("cannot represent relocation type %s"),
5827 bfd_get_reloc_code_name (code));
5828 /* Set howto to a garbage value so that we can keep going. */
5829 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
5830 assert (rel->howto != NULL);
5831 }
5832
5833 return rel;
5834 }
5835
5836 \f
5837 /* Parse operands using Intel syntax. This implements a recursive descent
5838 parser based on the BNF grammar published in Appendix B of the MASM 6.1
5839 Programmer's Guide.
5840
5841 FIXME: We do not recognize the full operand grammar defined in the MASM
5842 documentation. In particular, all the structure/union and
5843 high-level macro operands are missing.
5844
5845 Uppercase words are terminals, lower case words are non-terminals.
5846 Objects surrounded by double brackets '[[' ']]' are optional. Vertical
5847 bars '|' denote choices. Most grammar productions are implemented in
5848 functions called 'intel_<production>'.
5849
5850 Initial production is 'expr'.
5851
5852 addOp + | -
5853
5854 alpha [a-zA-Z]
5855
5856 binOp & | AND | \| | OR | ^ | XOR
5857
5858 byteRegister AL | AH | BL | BH | CL | CH | DL | DH
5859
5860 constant digits [[ radixOverride ]]
5861
5862 dataType BYTE | WORD | DWORD | FWORD | QWORD | TBYTE | OWORD | XMMWORD
5863
5864 digits decdigit
5865 | digits decdigit
5866 | digits hexdigit
5867
5868 decdigit [0-9]
5869
5870 e04 e04 addOp e05
5871 | e05
5872
5873 e05 e05 binOp e06
5874 | e06
5875
5876 e06 e06 mulOp e09
5877 | e09
5878
5879 e09 OFFSET e10
5880 | SHORT e10
5881 | + e10
5882 | - e10
5883 | ~ e10
5884 | NOT e10
5885 | e09 PTR e10
5886 | e09 : e10
5887 | e10
5888
5889 e10 e10 [ expr ]
5890 | e11
5891
5892 e11 ( expr )
5893 | [ expr ]
5894 | constant
5895 | dataType
5896 | id
5897 | $
5898 | register
5899
5900 => expr expr cmpOp e04
5901 | e04
5902
5903 gpRegister AX | EAX | BX | EBX | CX | ECX | DX | EDX
5904 | BP | EBP | SP | ESP | DI | EDI | SI | ESI
5905
5906 hexdigit a | b | c | d | e | f
5907 | A | B | C | D | E | F
5908
5909 id alpha
5910 | id alpha
5911 | id decdigit
5912
5913 mulOp * | / | % | MOD | << | SHL | >> | SHR
5914
5915 quote " | '
5916
5917 register specialRegister
5918 | gpRegister
5919 | byteRegister
5920
5921 segmentRegister CS | DS | ES | FS | GS | SS
5922
5923 specialRegister CR0 | CR2 | CR3 | CR4
5924 | DR0 | DR1 | DR2 | DR3 | DR6 | DR7
5925 | TR3 | TR4 | TR5 | TR6 | TR7
5926
5927 We simplify the grammar in obvious places (e.g., register parsing is
5928 done by calling parse_register) and eliminate immediate left recursion
5929 to implement a recursive-descent parser.
5930
5931 expr e04 expr'
5932
5933 expr' cmpOp e04 expr'
5934 | Empty
5935
5936 e04 e05 e04'
5937
5938 e04' addOp e05 e04'
5939 | Empty
5940
5941 e05 e06 e05'
5942
5943 e05' binOp e06 e05'
5944 | Empty
5945
5946 e06 e09 e06'
5947
5948 e06' mulOp e09 e06'
5949 | Empty
5950
5951 e09 OFFSET e10 e09'
5952 | SHORT e10'
5953 | + e10'
5954 | - e10'
5955 | ~ e10'
5956 | NOT e10'
5957 | e10 e09'
5958
5959 e09' PTR e10 e09'
5960 | : e10 e09'
5961 | Empty
5962
5963 e10 e11 e10'
5964
5965 e10' [ expr ] e10'
5966 | Empty
5967
5968 e11 ( expr )
5969 | [ expr ]
5970 | BYTE
5971 | WORD
5972 | DWORD
5973 | FWORD
5974 | QWORD
5975 | TBYTE
5976 | OWORD
5977 | XMMWORD
5978 | .
5979 | $
5980 | register
5981 | id
5982 | constant */
5983
5984 /* Parsing structure for the intel syntax parser. Used to implement the
5985 semantic actions for the operand grammar. */
5986 struct intel_parser_s
5987 {
5988 char *op_string; /* The string being parsed. */
5989 int got_a_float; /* Whether the operand is a float. */
5990 int op_modifier; /* Operand modifier. */
5991 int is_mem; /* 1 if operand is memory reference. */
5992 int in_offset; /* >=1 if parsing operand of offset. */
5993 int in_bracket; /* >=1 if parsing operand in brackets. */
5994 const reg_entry *reg; /* Last register reference found. */
5995 char *disp; /* Displacement string being built. */
5996 char *next_operand; /* Resume point when splitting operands. */
5997 };
5998
5999 static struct intel_parser_s intel_parser;
6000
6001 /* Token structure for parsing intel syntax. */
6002 struct intel_token
6003 {
6004 int code; /* Token code. */
6005 const reg_entry *reg; /* Register entry for register tokens. */
6006 char *str; /* String representation. */
6007 };
6008
6009 static struct intel_token cur_token, prev_token;
6010
6011 /* Token codes for the intel parser. Since T_SHORT is already used
6012 by COFF, undefine it first to prevent a warning. */
6013 #define T_NIL -1
6014 #define T_CONST 1
6015 #define T_REG 2
6016 #define T_BYTE 3
6017 #define T_WORD 4
6018 #define T_DWORD 5
6019 #define T_FWORD 6
6020 #define T_QWORD 7
6021 #define T_TBYTE 8
6022 #define T_XMMWORD 9
6023 #undef T_SHORT
6024 #define T_SHORT 10
6025 #define T_OFFSET 11
6026 #define T_PTR 12
6027 #define T_ID 13
6028 #define T_SHL 14
6029 #define T_SHR 15
6030
6031 /* Prototypes for intel parser functions. */
6032 static int intel_match_token PARAMS ((int code));
6033 static void intel_get_token PARAMS ((void));
6034 static void intel_putback_token PARAMS ((void));
6035 static int intel_expr PARAMS ((void));
6036 static int intel_e04 PARAMS ((void));
6037 static int intel_e05 PARAMS ((void));
6038 static int intel_e06 PARAMS ((void));
6039 static int intel_e09 PARAMS ((void));
6040 static int intel_bracket_expr PARAMS ((void));
6041 static int intel_e10 PARAMS ((void));
6042 static int intel_e11 PARAMS ((void));
6043
6044 static int
6045 i386_intel_operand (operand_string, got_a_float)
6046 char *operand_string;
6047 int got_a_float;
6048 {
6049 int ret;
6050 char *p;
6051
6052 p = intel_parser.op_string = xstrdup (operand_string);
6053 intel_parser.disp = (char *) xmalloc (strlen (operand_string) + 1);
6054
6055 for (;;)
6056 {
6057 /* Initialize token holders. */
6058 cur_token.code = prev_token.code = T_NIL;
6059 cur_token.reg = prev_token.reg = NULL;
6060 cur_token.str = prev_token.str = NULL;
6061
6062 /* Initialize parser structure. */
6063 intel_parser.got_a_float = got_a_float;
6064 intel_parser.op_modifier = 0;
6065 intel_parser.is_mem = 0;
6066 intel_parser.in_offset = 0;
6067 intel_parser.in_bracket = 0;
6068 intel_parser.reg = NULL;
6069 intel_parser.disp[0] = '\0';
6070 intel_parser.next_operand = NULL;
6071
6072 /* Read the first token and start the parser. */
6073 intel_get_token ();
6074 ret = intel_expr ();
6075
6076 if (!ret)
6077 break;
6078
6079 if (cur_token.code != T_NIL)
6080 {
6081 as_bad (_("invalid operand for '%s' ('%s' unexpected)"),
6082 current_templates->start->name, cur_token.str);
6083 ret = 0;
6084 }
6085 /* If we found a memory reference, hand it over to i386_displacement
6086 to fill in the rest of the operand fields. */
6087 else if (intel_parser.is_mem)
6088 {
6089 if ((i.mem_operands == 1
6090 && (current_templates->start->opcode_modifier & IsString) == 0)
6091 || i.mem_operands == 2)
6092 {
6093 as_bad (_("too many memory references for '%s'"),
6094 current_templates->start->name);
6095 ret = 0;
6096 }
6097 else
6098 {
6099 char *s = intel_parser.disp;
6100 i.mem_operands++;
6101
6102 if (!quiet_warnings && intel_parser.is_mem < 0)
6103 /* See the comments in intel_bracket_expr. */
6104 as_warn (_("Treating `%s' as memory reference"), operand_string);
6105
6106 /* Add the displacement expression. */
6107 if (*s != '\0')
6108 ret = i386_displacement (s, s + strlen (s));
6109 if (ret)
6110 {
6111 /* Swap base and index in 16-bit memory operands like
6112 [si+bx]. Since i386_index_check is also used in AT&T
6113 mode we have to do that here. */
6114 if (i.base_reg
6115 && i.index_reg
6116 && (i.base_reg->reg_type & Reg16)
6117 && (i.index_reg->reg_type & Reg16)
6118 && i.base_reg->reg_num >= 6
6119 && i.index_reg->reg_num < 6)
6120 {
6121 const reg_entry *base = i.index_reg;
6122
6123 i.index_reg = i.base_reg;
6124 i.base_reg = base;
6125 }
6126 ret = i386_index_check (operand_string);
6127 }
6128 }
6129 }
6130
6131 /* Constant and OFFSET expressions are handled by i386_immediate. */
6132 else if ((intel_parser.op_modifier & (1 << T_OFFSET))
6133 || intel_parser.reg == NULL)
6134 ret = i386_immediate (intel_parser.disp);
6135
6136 if (intel_parser.next_operand && this_operand >= MAX_OPERANDS - 1)
6137 ret = 0;
6138 if (!ret || !intel_parser.next_operand)
6139 break;
6140 intel_parser.op_string = intel_parser.next_operand;
6141 this_operand = i.operands++;
6142 }
6143
6144 free (p);
6145 free (intel_parser.disp);
6146
6147 return ret;
6148 }
6149
6150 #define NUM_ADDRESS_REGS (!!i.base_reg + !!i.index_reg)
6151
6152 /* expr e04 expr'
6153
6154 expr' cmpOp e04 expr'
6155 | Empty */
6156 static int
6157 intel_expr ()
6158 {
6159 /* XXX Implement the comparison operators. */
6160 return intel_e04 ();
6161 }
6162
6163 /* e04 e05 e04'
6164
6165 e04' addOp e05 e04'
6166 | Empty */
6167 static int
6168 intel_e04 ()
6169 {
6170 int nregs = -1;
6171
6172 for (;;)
6173 {
6174 if (!intel_e05())
6175 return 0;
6176
6177 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6178 i.base_reg = i386_regtab + REGNAM_AL; /* al is invalid as base */
6179
6180 if (cur_token.code == '+')
6181 nregs = -1;
6182 else if (cur_token.code == '-')
6183 nregs = NUM_ADDRESS_REGS;
6184 else
6185 return 1;
6186
6187 strcat (intel_parser.disp, cur_token.str);
6188 intel_match_token (cur_token.code);
6189 }
6190 }
6191
6192 /* e05 e06 e05'
6193
6194 e05' binOp e06 e05'
6195 | Empty */
6196 static int
6197 intel_e05 ()
6198 {
6199 int nregs = ~NUM_ADDRESS_REGS;
6200
6201 for (;;)
6202 {
6203 if (!intel_e06())
6204 return 0;
6205
6206 if (cur_token.code == '&' || cur_token.code == '|' || cur_token.code == '^')
6207 {
6208 char str[2];
6209
6210 str[0] = cur_token.code;
6211 str[1] = 0;
6212 strcat (intel_parser.disp, str);
6213 }
6214 else
6215 break;
6216
6217 intel_match_token (cur_token.code);
6218
6219 if (nregs < 0)
6220 nregs = ~nregs;
6221 }
6222 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6223 i.base_reg = i386_regtab + REGNAM_AL + 1; /* cl is invalid as base */
6224 return 1;
6225 }
6226
6227 /* e06 e09 e06'
6228
6229 e06' mulOp e09 e06'
6230 | Empty */
6231 static int
6232 intel_e06 ()
6233 {
6234 int nregs = ~NUM_ADDRESS_REGS;
6235
6236 for (;;)
6237 {
6238 if (!intel_e09())
6239 return 0;
6240
6241 if (cur_token.code == '*' || cur_token.code == '/' || cur_token.code == '%')
6242 {
6243 char str[2];
6244
6245 str[0] = cur_token.code;
6246 str[1] = 0;
6247 strcat (intel_parser.disp, str);
6248 }
6249 else if (cur_token.code == T_SHL)
6250 strcat (intel_parser.disp, "<<");
6251 else if (cur_token.code == T_SHR)
6252 strcat (intel_parser.disp, ">>");
6253 else
6254 break;
6255
6256 intel_match_token (cur_token.code);
6257
6258 if (nregs < 0)
6259 nregs = ~nregs;
6260 }
6261 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6262 i.base_reg = i386_regtab + REGNAM_AL + 2; /* dl is invalid as base */
6263 return 1;
6264 }
6265
6266 /* e09 OFFSET e09
6267 | SHORT e09
6268 | + e09
6269 | - e09
6270 | ~ e09
6271 | NOT e09
6272 | e10 e09'
6273
6274 e09' PTR e10 e09'
6275 | : e10 e09'
6276 | Empty */
6277 static int
6278 intel_e09 ()
6279 {
6280 int nregs = ~NUM_ADDRESS_REGS;
6281 int in_offset = 0;
6282
6283 for (;;)
6284 {
6285 /* Don't consume constants here. */
6286 if (cur_token.code == '+' || cur_token.code == '-')
6287 {
6288 /* Need to look one token ahead - if the next token
6289 is a constant, the current token is its sign. */
6290 int next_code;
6291
6292 intel_match_token (cur_token.code);
6293 next_code = cur_token.code;
6294 intel_putback_token ();
6295 if (next_code == T_CONST)
6296 break;
6297 }
6298
6299 /* e09 OFFSET e09 */
6300 if (cur_token.code == T_OFFSET)
6301 {
6302 if (!in_offset++)
6303 ++intel_parser.in_offset;
6304 }
6305
6306 /* e09 SHORT e09 */
6307 else if (cur_token.code == T_SHORT)
6308 intel_parser.op_modifier |= 1 << T_SHORT;
6309
6310 /* e09 + e09 */
6311 else if (cur_token.code == '+')
6312 strcat (intel_parser.disp, "+");
6313
6314 /* e09 - e09
6315 | ~ e09
6316 | NOT e09 */
6317 else if (cur_token.code == '-' || cur_token.code == '~')
6318 {
6319 char str[2];
6320
6321 if (nregs < 0)
6322 nregs = ~nregs;
6323 str[0] = cur_token.code;
6324 str[1] = 0;
6325 strcat (intel_parser.disp, str);
6326 }
6327
6328 /* e09 e10 e09' */
6329 else
6330 break;
6331
6332 intel_match_token (cur_token.code);
6333 }
6334
6335 for (;;)
6336 {
6337 if (!intel_e10 ())
6338 return 0;
6339
6340 /* e09' PTR e10 e09' */
6341 if (cur_token.code == T_PTR)
6342 {
6343 char suffix;
6344
6345 if (prev_token.code == T_BYTE)
6346 suffix = BYTE_MNEM_SUFFIX;
6347
6348 else if (prev_token.code == T_WORD)
6349 {
6350 if (current_templates->start->name[0] == 'l'
6351 && current_templates->start->name[2] == 's'
6352 && current_templates->start->name[3] == 0)
6353 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6354 else if (intel_parser.got_a_float == 2) /* "fi..." */
6355 suffix = SHORT_MNEM_SUFFIX;
6356 else
6357 suffix = WORD_MNEM_SUFFIX;
6358 }
6359
6360 else if (prev_token.code == T_DWORD)
6361 {
6362 if (current_templates->start->name[0] == 'l'
6363 && current_templates->start->name[2] == 's'
6364 && current_templates->start->name[3] == 0)
6365 suffix = WORD_MNEM_SUFFIX;
6366 else if (flag_code == CODE_16BIT
6367 && (current_templates->start->opcode_modifier
6368 & (Jump | JumpDword)))
6369 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6370 else if (intel_parser.got_a_float == 1) /* "f..." */
6371 suffix = SHORT_MNEM_SUFFIX;
6372 else
6373 suffix = LONG_MNEM_SUFFIX;
6374 }
6375
6376 else if (prev_token.code == T_FWORD)
6377 {
6378 if (current_templates->start->name[0] == 'l'
6379 && current_templates->start->name[2] == 's'
6380 && current_templates->start->name[3] == 0)
6381 suffix = LONG_MNEM_SUFFIX;
6382 else if (!intel_parser.got_a_float)
6383 {
6384 if (flag_code == CODE_16BIT)
6385 add_prefix (DATA_PREFIX_OPCODE);
6386 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6387 }
6388 else
6389 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6390 }
6391
6392 else if (prev_token.code == T_QWORD)
6393 {
6394 if (intel_parser.got_a_float == 1) /* "f..." */
6395 suffix = LONG_MNEM_SUFFIX;
6396 else
6397 suffix = QWORD_MNEM_SUFFIX;
6398 }
6399
6400 else if (prev_token.code == T_TBYTE)
6401 {
6402 if (intel_parser.got_a_float == 1)
6403 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6404 else
6405 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6406 }
6407
6408 else if (prev_token.code == T_XMMWORD)
6409 {
6410 /* XXX ignored for now, but accepted since gcc uses it */
6411 suffix = 0;
6412 }
6413
6414 else
6415 {
6416 as_bad (_("Unknown operand modifier `%s'"), prev_token.str);
6417 return 0;
6418 }
6419
6420 /* Operands for jump/call using 'ptr' notation denote absolute
6421 addresses. */
6422 if (current_templates->start->opcode_modifier & (Jump | JumpDword))
6423 i.types[this_operand] |= JumpAbsolute;
6424
6425 if (current_templates->start->base_opcode == 0x8d /* lea */)
6426 ;
6427 else if (!i.suffix)
6428 i.suffix = suffix;
6429 else if (i.suffix != suffix)
6430 {
6431 as_bad (_("Conflicting operand modifiers"));
6432 return 0;
6433 }
6434
6435 }
6436
6437 /* e09' : e10 e09' */
6438 else if (cur_token.code == ':')
6439 {
6440 if (prev_token.code != T_REG)
6441 {
6442 /* While {call,jmp} SSSS:OOOO is MASM syntax only when SSSS is a
6443 segment/group identifier (which we don't have), using comma
6444 as the operand separator there is even less consistent, since
6445 there all branches only have a single operand. */
6446 if (this_operand != 0
6447 || intel_parser.in_offset
6448 || intel_parser.in_bracket
6449 || (!(current_templates->start->opcode_modifier
6450 & (Jump|JumpDword|JumpInterSegment))
6451 && !(current_templates->start->operand_types[0]
6452 & JumpAbsolute)))
6453 return intel_match_token (T_NIL);
6454 /* Remember the start of the 2nd operand and terminate 1st
6455 operand here.
6456 XXX This isn't right, yet (when SSSS:OOOO is right operand of
6457 another expression), but it gets at least the simplest case
6458 (a plain number or symbol on the left side) right. */
6459 intel_parser.next_operand = intel_parser.op_string;
6460 *--intel_parser.op_string = '\0';
6461 return intel_match_token (':');
6462 }
6463 }
6464
6465 /* e09' Empty */
6466 else
6467 break;
6468
6469 intel_match_token (cur_token.code);
6470
6471 }
6472
6473 if (in_offset)
6474 {
6475 --intel_parser.in_offset;
6476 if (nregs < 0)
6477 nregs = ~nregs;
6478 if (NUM_ADDRESS_REGS > nregs)
6479 {
6480 as_bad (_("Invalid operand to `OFFSET'"));
6481 return 0;
6482 }
6483 intel_parser.op_modifier |= 1 << T_OFFSET;
6484 }
6485
6486 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6487 i.base_reg = i386_regtab + REGNAM_AL + 3; /* bl is invalid as base */
6488 return 1;
6489 }
6490
6491 static int
6492 intel_bracket_expr ()
6493 {
6494 int was_offset = intel_parser.op_modifier & (1 << T_OFFSET);
6495 const char *start = intel_parser.op_string;
6496 int len;
6497
6498 if (i.op[this_operand].regs)
6499 return intel_match_token (T_NIL);
6500
6501 intel_match_token ('[');
6502
6503 /* Mark as a memory operand only if it's not already known to be an
6504 offset expression. If it's an offset expression, we need to keep
6505 the brace in. */
6506 if (!intel_parser.in_offset)
6507 {
6508 ++intel_parser.in_bracket;
6509
6510 /* Operands for jump/call inside brackets denote absolute addresses. */
6511 if (current_templates->start->opcode_modifier & (Jump | JumpDword))
6512 i.types[this_operand] |= JumpAbsolute;
6513
6514 /* Unfortunately gas always diverged from MASM in a respect that can't
6515 be easily fixed without risking to break code sequences likely to be
6516 encountered (the testsuite even check for this): MASM doesn't consider
6517 an expression inside brackets unconditionally as a memory reference.
6518 When that is e.g. a constant, an offset expression, or the sum of the
6519 two, this is still taken as a constant load. gas, however, always
6520 treated these as memory references. As a compromise, we'll try to make
6521 offset expressions inside brackets work the MASM way (since that's
6522 less likely to be found in real world code), but make constants alone
6523 continue to work the traditional gas way. In either case, issue a
6524 warning. */
6525 intel_parser.op_modifier &= ~was_offset;
6526 }
6527 else
6528 strcat (intel_parser.disp, "[");
6529
6530 /* Add a '+' to the displacement string if necessary. */
6531 if (*intel_parser.disp != '\0'
6532 && *(intel_parser.disp + strlen (intel_parser.disp) - 1) != '+')
6533 strcat (intel_parser.disp, "+");
6534
6535 if (intel_expr ()
6536 && (len = intel_parser.op_string - start - 1,
6537 intel_match_token (']')))
6538 {
6539 /* Preserve brackets when the operand is an offset expression. */
6540 if (intel_parser.in_offset)
6541 strcat (intel_parser.disp, "]");
6542 else
6543 {
6544 --intel_parser.in_bracket;
6545 if (i.base_reg || i.index_reg)
6546 intel_parser.is_mem = 1;
6547 if (!intel_parser.is_mem)
6548 {
6549 if (!(intel_parser.op_modifier & (1 << T_OFFSET)))
6550 /* Defer the warning until all of the operand was parsed. */
6551 intel_parser.is_mem = -1;
6552 else if (!quiet_warnings)
6553 as_warn (_("`[%.*s]' taken to mean just `%.*s'"), len, start, len, start);
6554 }
6555 }
6556 intel_parser.op_modifier |= was_offset;
6557
6558 return 1;
6559 }
6560 return 0;
6561 }
6562
6563 /* e10 e11 e10'
6564
6565 e10' [ expr ] e10'
6566 | Empty */
6567 static int
6568 intel_e10 ()
6569 {
6570 if (!intel_e11 ())
6571 return 0;
6572
6573 while (cur_token.code == '[')
6574 {
6575 if (!intel_bracket_expr ())
6576 return 0;
6577 }
6578
6579 return 1;
6580 }
6581
6582 /* e11 ( expr )
6583 | [ expr ]
6584 | BYTE
6585 | WORD
6586 | DWORD
6587 | FWORD
6588 | QWORD
6589 | TBYTE
6590 | OWORD
6591 | XMMWORD
6592 | $
6593 | .
6594 | register
6595 | id
6596 | constant */
6597 static int
6598 intel_e11 ()
6599 {
6600 switch (cur_token.code)
6601 {
6602 /* e11 ( expr ) */
6603 case '(':
6604 intel_match_token ('(');
6605 strcat (intel_parser.disp, "(");
6606
6607 if (intel_expr () && intel_match_token (')'))
6608 {
6609 strcat (intel_parser.disp, ")");
6610 return 1;
6611 }
6612 return 0;
6613
6614 /* e11 [ expr ] */
6615 case '[':
6616 return intel_bracket_expr ();
6617
6618 /* e11 $
6619 | . */
6620 case '.':
6621 strcat (intel_parser.disp, cur_token.str);
6622 intel_match_token (cur_token.code);
6623
6624 /* Mark as a memory operand only if it's not already known to be an
6625 offset expression. */
6626 if (!intel_parser.in_offset)
6627 intel_parser.is_mem = 1;
6628
6629 return 1;
6630
6631 /* e11 register */
6632 case T_REG:
6633 {
6634 const reg_entry *reg = intel_parser.reg = cur_token.reg;
6635
6636 intel_match_token (T_REG);
6637
6638 /* Check for segment change. */
6639 if (cur_token.code == ':')
6640 {
6641 if (!(reg->reg_type & (SReg2 | SReg3)))
6642 {
6643 as_bad (_("`%s' is not a valid segment register"), reg->reg_name);
6644 return 0;
6645 }
6646 else if (i.seg[i.mem_operands])
6647 as_warn (_("Extra segment override ignored"));
6648 else
6649 {
6650 if (!intel_parser.in_offset)
6651 intel_parser.is_mem = 1;
6652 switch (reg->reg_num)
6653 {
6654 case 0:
6655 i.seg[i.mem_operands] = &es;
6656 break;
6657 case 1:
6658 i.seg[i.mem_operands] = &cs;
6659 break;
6660 case 2:
6661 i.seg[i.mem_operands] = &ss;
6662 break;
6663 case 3:
6664 i.seg[i.mem_operands] = &ds;
6665 break;
6666 case 4:
6667 i.seg[i.mem_operands] = &fs;
6668 break;
6669 case 5:
6670 i.seg[i.mem_operands] = &gs;
6671 break;
6672 }
6673 }
6674 }
6675
6676 /* Not a segment register. Check for register scaling. */
6677 else if (cur_token.code == '*')
6678 {
6679 if (!intel_parser.in_bracket)
6680 {
6681 as_bad (_("Register scaling only allowed in memory operands"));
6682 return 0;
6683 }
6684
6685 if (reg->reg_type & Reg16) /* Disallow things like [si*1]. */
6686 reg = i386_regtab + REGNAM_AX + 4; /* sp is invalid as index */
6687 else if (i.index_reg)
6688 reg = i386_regtab + REGNAM_EAX + 4; /* esp is invalid as index */
6689
6690 /* What follows must be a valid scale. */
6691 intel_match_token ('*');
6692 i.index_reg = reg;
6693 i.types[this_operand] |= BaseIndex;
6694
6695 /* Set the scale after setting the register (otherwise,
6696 i386_scale will complain) */
6697 if (cur_token.code == '+' || cur_token.code == '-')
6698 {
6699 char *str, sign = cur_token.code;
6700 intel_match_token (cur_token.code);
6701 if (cur_token.code != T_CONST)
6702 {
6703 as_bad (_("Syntax error: Expecting a constant, got `%s'"),
6704 cur_token.str);
6705 return 0;
6706 }
6707 str = (char *) xmalloc (strlen (cur_token.str) + 2);
6708 strcpy (str + 1, cur_token.str);
6709 *str = sign;
6710 if (!i386_scale (str))
6711 return 0;
6712 free (str);
6713 }
6714 else if (!i386_scale (cur_token.str))
6715 return 0;
6716 intel_match_token (cur_token.code);
6717 }
6718
6719 /* No scaling. If this is a memory operand, the register is either a
6720 base register (first occurrence) or an index register (second
6721 occurrence). */
6722 else if (intel_parser.in_bracket)
6723 {
6724
6725 if (!i.base_reg)
6726 i.base_reg = reg;
6727 else if (!i.index_reg)
6728 i.index_reg = reg;
6729 else
6730 {
6731 as_bad (_("Too many register references in memory operand"));
6732 return 0;
6733 }
6734
6735 i.types[this_operand] |= BaseIndex;
6736 }
6737
6738 /* It's neither base nor index. */
6739 else if (!intel_parser.in_offset && !intel_parser.is_mem)
6740 {
6741 i.types[this_operand] |= reg->reg_type & ~BaseIndex;
6742 i.op[this_operand].regs = reg;
6743 i.reg_operands++;
6744 }
6745 else
6746 {
6747 as_bad (_("Invalid use of register"));
6748 return 0;
6749 }
6750
6751 /* Since registers are not part of the displacement string (except
6752 when we're parsing offset operands), we may need to remove any
6753 preceding '+' from the displacement string. */
6754 if (*intel_parser.disp != '\0'
6755 && !intel_parser.in_offset)
6756 {
6757 char *s = intel_parser.disp;
6758 s += strlen (s) - 1;
6759 if (*s == '+')
6760 *s = '\0';
6761 }
6762
6763 return 1;
6764 }
6765
6766 /* e11 BYTE
6767 | WORD
6768 | DWORD
6769 | FWORD
6770 | QWORD
6771 | TBYTE
6772 | OWORD
6773 | XMMWORD */
6774 case T_BYTE:
6775 case T_WORD:
6776 case T_DWORD:
6777 case T_FWORD:
6778 case T_QWORD:
6779 case T_TBYTE:
6780 case T_XMMWORD:
6781 intel_match_token (cur_token.code);
6782
6783 if (cur_token.code == T_PTR)
6784 return 1;
6785
6786 /* It must have been an identifier. */
6787 intel_putback_token ();
6788 cur_token.code = T_ID;
6789 /* FALLTHRU */
6790
6791 /* e11 id
6792 | constant */
6793 case T_ID:
6794 if (!intel_parser.in_offset && intel_parser.is_mem <= 0)
6795 {
6796 symbolS *symbolP;
6797
6798 /* The identifier represents a memory reference only if it's not
6799 preceded by an offset modifier and if it's not an equate. */
6800 symbolP = symbol_find(cur_token.str);
6801 if (!symbolP || S_GET_SEGMENT(symbolP) != absolute_section)
6802 intel_parser.is_mem = 1;
6803 }
6804 /* FALLTHRU */
6805
6806 case T_CONST:
6807 case '-':
6808 case '+':
6809 {
6810 char *save_str, sign = 0;
6811
6812 /* Allow constants that start with `+' or `-'. */
6813 if (cur_token.code == '-' || cur_token.code == '+')
6814 {
6815 sign = cur_token.code;
6816 intel_match_token (cur_token.code);
6817 if (cur_token.code != T_CONST)
6818 {
6819 as_bad (_("Syntax error: Expecting a constant, got `%s'"),
6820 cur_token.str);
6821 return 0;
6822 }
6823 }
6824
6825 save_str = (char *) xmalloc (strlen (cur_token.str) + 2);
6826 strcpy (save_str + !!sign, cur_token.str);
6827 if (sign)
6828 *save_str = sign;
6829
6830 /* Get the next token to check for register scaling. */
6831 intel_match_token (cur_token.code);
6832
6833 /* Check if this constant is a scaling factor for an index register. */
6834 if (cur_token.code == '*')
6835 {
6836 if (intel_match_token ('*') && cur_token.code == T_REG)
6837 {
6838 const reg_entry *reg = cur_token.reg;
6839
6840 if (!intel_parser.in_bracket)
6841 {
6842 as_bad (_("Register scaling only allowed in memory operands"));
6843 return 0;
6844 }
6845
6846 if (reg->reg_type & Reg16) /* Disallow things like [1*si]. */
6847 reg = i386_regtab + REGNAM_AX + 4; /* sp is invalid as index */
6848 else if (i.index_reg)
6849 reg = i386_regtab + REGNAM_EAX + 4; /* esp is invalid as index */
6850
6851 /* The constant is followed by `* reg', so it must be
6852 a valid scale. */
6853 i.index_reg = reg;
6854 i.types[this_operand] |= BaseIndex;
6855
6856 /* Set the scale after setting the register (otherwise,
6857 i386_scale will complain) */
6858 if (!i386_scale (save_str))
6859 return 0;
6860 intel_match_token (T_REG);
6861
6862 /* Since registers are not part of the displacement
6863 string, we may need to remove any preceding '+' from
6864 the displacement string. */
6865 if (*intel_parser.disp != '\0')
6866 {
6867 char *s = intel_parser.disp;
6868 s += strlen (s) - 1;
6869 if (*s == '+')
6870 *s = '\0';
6871 }
6872
6873 free (save_str);
6874
6875 return 1;
6876 }
6877
6878 /* The constant was not used for register scaling. Since we have
6879 already consumed the token following `*' we now need to put it
6880 back in the stream. */
6881 intel_putback_token ();
6882 }
6883
6884 /* Add the constant to the displacement string. */
6885 strcat (intel_parser.disp, save_str);
6886 free (save_str);
6887
6888 return 1;
6889 }
6890 }
6891
6892 as_bad (_("Unrecognized token '%s'"), cur_token.str);
6893 return 0;
6894 }
6895
6896 /* Match the given token against cur_token. If they match, read the next
6897 token from the operand string. */
6898 static int
6899 intel_match_token (code)
6900 int code;
6901 {
6902 if (cur_token.code == code)
6903 {
6904 intel_get_token ();
6905 return 1;
6906 }
6907 else
6908 {
6909 as_bad (_("Unexpected token `%s'"), cur_token.str);
6910 return 0;
6911 }
6912 }
6913
6914 /* Read a new token from intel_parser.op_string and store it in cur_token. */
6915 static void
6916 intel_get_token ()
6917 {
6918 char *end_op;
6919 const reg_entry *reg;
6920 struct intel_token new_token;
6921
6922 new_token.code = T_NIL;
6923 new_token.reg = NULL;
6924 new_token.str = NULL;
6925
6926 /* Free the memory allocated to the previous token and move
6927 cur_token to prev_token. */
6928 if (prev_token.str)
6929 free (prev_token.str);
6930
6931 prev_token = cur_token;
6932
6933 /* Skip whitespace. */
6934 while (is_space_char (*intel_parser.op_string))
6935 intel_parser.op_string++;
6936
6937 /* Return an empty token if we find nothing else on the line. */
6938 if (*intel_parser.op_string == '\0')
6939 {
6940 cur_token = new_token;
6941 return;
6942 }
6943
6944 /* The new token cannot be larger than the remainder of the operand
6945 string. */
6946 new_token.str = (char *) xmalloc (strlen (intel_parser.op_string) + 1);
6947 new_token.str[0] = '\0';
6948
6949 if (strchr ("0123456789", *intel_parser.op_string))
6950 {
6951 char *p = new_token.str;
6952 char *q = intel_parser.op_string;
6953 new_token.code = T_CONST;
6954
6955 /* Allow any kind of identifier char to encompass floating point and
6956 hexadecimal numbers. */
6957 while (is_identifier_char (*q))
6958 *p++ = *q++;
6959 *p = '\0';
6960
6961 /* Recognize special symbol names [0-9][bf]. */
6962 if (strlen (intel_parser.op_string) == 2
6963 && (intel_parser.op_string[1] == 'b'
6964 || intel_parser.op_string[1] == 'f'))
6965 new_token.code = T_ID;
6966 }
6967
6968 else if ((reg = parse_register (intel_parser.op_string, &end_op)) != NULL)
6969 {
6970 size_t len = end_op - intel_parser.op_string;
6971
6972 new_token.code = T_REG;
6973 new_token.reg = reg;
6974
6975 memcpy (new_token.str, intel_parser.op_string, len);
6976 new_token.str[len] = '\0';
6977 }
6978
6979 else if (is_identifier_char (*intel_parser.op_string))
6980 {
6981 char *p = new_token.str;
6982 char *q = intel_parser.op_string;
6983
6984 /* A '.' or '$' followed by an identifier char is an identifier.
6985 Otherwise, it's operator '.' followed by an expression. */
6986 if ((*q == '.' || *q == '$') && !is_identifier_char (*(q + 1)))
6987 {
6988 new_token.code = '.';
6989 new_token.str[0] = '.';
6990 new_token.str[1] = '\0';
6991 }
6992 else
6993 {
6994 while (is_identifier_char (*q) || *q == '@')
6995 *p++ = *q++;
6996 *p = '\0';
6997
6998 if (strcasecmp (new_token.str, "NOT") == 0)
6999 new_token.code = '~';
7000
7001 else if (strcasecmp (new_token.str, "MOD") == 0)
7002 new_token.code = '%';
7003
7004 else if (strcasecmp (new_token.str, "AND") == 0)
7005 new_token.code = '&';
7006
7007 else if (strcasecmp (new_token.str, "OR") == 0)
7008 new_token.code = '|';
7009
7010 else if (strcasecmp (new_token.str, "XOR") == 0)
7011 new_token.code = '^';
7012
7013 else if (strcasecmp (new_token.str, "SHL") == 0)
7014 new_token.code = T_SHL;
7015
7016 else if (strcasecmp (new_token.str, "SHR") == 0)
7017 new_token.code = T_SHR;
7018
7019 else if (strcasecmp (new_token.str, "BYTE") == 0)
7020 new_token.code = T_BYTE;
7021
7022 else if (strcasecmp (new_token.str, "WORD") == 0)
7023 new_token.code = T_WORD;
7024
7025 else if (strcasecmp (new_token.str, "DWORD") == 0)
7026 new_token.code = T_DWORD;
7027
7028 else if (strcasecmp (new_token.str, "FWORD") == 0)
7029 new_token.code = T_FWORD;
7030
7031 else if (strcasecmp (new_token.str, "QWORD") == 0)
7032 new_token.code = T_QWORD;
7033
7034 else if (strcasecmp (new_token.str, "TBYTE") == 0
7035 /* XXX remove (gcc still uses it) */
7036 || strcasecmp (new_token.str, "XWORD") == 0)
7037 new_token.code = T_TBYTE;
7038
7039 else if (strcasecmp (new_token.str, "XMMWORD") == 0
7040 || strcasecmp (new_token.str, "OWORD") == 0)
7041 new_token.code = T_XMMWORD;
7042
7043 else if (strcasecmp (new_token.str, "PTR") == 0)
7044 new_token.code = T_PTR;
7045
7046 else if (strcasecmp (new_token.str, "SHORT") == 0)
7047 new_token.code = T_SHORT;
7048
7049 else if (strcasecmp (new_token.str, "OFFSET") == 0)
7050 {
7051 new_token.code = T_OFFSET;
7052
7053 /* ??? This is not mentioned in the MASM grammar but gcc
7054 makes use of it with -mintel-syntax. OFFSET may be
7055 followed by FLAT: */
7056 if (strncasecmp (q, " FLAT:", 6) == 0)
7057 strcat (new_token.str, " FLAT:");
7058 }
7059
7060 /* ??? This is not mentioned in the MASM grammar. */
7061 else if (strcasecmp (new_token.str, "FLAT") == 0)
7062 {
7063 new_token.code = T_OFFSET;
7064 if (*q == ':')
7065 strcat (new_token.str, ":");
7066 else
7067 as_bad (_("`:' expected"));
7068 }
7069
7070 else
7071 new_token.code = T_ID;
7072 }
7073 }
7074
7075 else if (strchr ("+-/*%|&^:[]()~", *intel_parser.op_string))
7076 {
7077 new_token.code = *intel_parser.op_string;
7078 new_token.str[0] = *intel_parser.op_string;
7079 new_token.str[1] = '\0';
7080 }
7081
7082 else if (strchr ("<>", *intel_parser.op_string)
7083 && *intel_parser.op_string == *(intel_parser.op_string + 1))
7084 {
7085 new_token.code = *intel_parser.op_string == '<' ? T_SHL : T_SHR;
7086 new_token.str[0] = *intel_parser.op_string;
7087 new_token.str[1] = *intel_parser.op_string;
7088 new_token.str[2] = '\0';
7089 }
7090
7091 else
7092 as_bad (_("Unrecognized token `%s'"), intel_parser.op_string);
7093
7094 intel_parser.op_string += strlen (new_token.str);
7095 cur_token = new_token;
7096 }
7097
7098 /* Put cur_token back into the token stream and make cur_token point to
7099 prev_token. */
7100 static void
7101 intel_putback_token ()
7102 {
7103 if (cur_token.code != T_NIL)
7104 {
7105 intel_parser.op_string -= strlen (cur_token.str);
7106 free (cur_token.str);
7107 }
7108 cur_token = prev_token;
7109
7110 /* Forget prev_token. */
7111 prev_token.code = T_NIL;
7112 prev_token.reg = NULL;
7113 prev_token.str = NULL;
7114 }
7115
7116 int
7117 tc_x86_regname_to_dw2regnum (const char *regname)
7118 {
7119 unsigned int regnum;
7120 unsigned int regnames_count;
7121 static const char *const regnames_32[] =
7122 {
7123 "eax", "ecx", "edx", "ebx",
7124 "esp", "ebp", "esi", "edi",
7125 "eip", "eflags", NULL,
7126 "st0", "st1", "st2", "st3",
7127 "st4", "st5", "st6", "st7",
7128 NULL, NULL,
7129 "xmm0", "xmm1", "xmm2", "xmm3",
7130 "xmm4", "xmm5", "xmm6", "xmm7",
7131 "mm0", "mm1", "mm2", "mm3",
7132 "mm4", "mm5", "mm6", "mm7",
7133 "fcw", "fsw", "mxcsr",
7134 "es", "cs", "ss", "ds", "fs", "gs", NULL, NULL,
7135 "tr", "ldtr"
7136 };
7137 static const char *const regnames_64[] =
7138 {
7139 "rax", "rdx", "rcx", "rbx",
7140 "rsi", "rdi", "rbp", "rsp",
7141 "r8", "r9", "r10", "r11",
7142 "r12", "r13", "r14", "r15",
7143 "rip",
7144 "xmm0", "xmm1", "xmm2", "xmm3",
7145 "xmm4", "xmm5", "xmm6", "xmm7",
7146 "xmm8", "xmm9", "xmm10", "xmm11",
7147 "xmm12", "xmm13", "xmm14", "xmm15",
7148 "st0", "st1", "st2", "st3",
7149 "st4", "st5", "st6", "st7",
7150 "mm0", "mm1", "mm2", "mm3",
7151 "mm4", "mm5", "mm6", "mm7",
7152 "rflags",
7153 "es", "cs", "ss", "ds", "fs", "gs", NULL, NULL,
7154 "fs.base", "gs.base", NULL, NULL,
7155 "tr", "ldtr",
7156 "mxcsr", "fcw", "fsw"
7157 };
7158 const char *const *regnames;
7159
7160 if (flag_code == CODE_64BIT)
7161 {
7162 regnames = regnames_64;
7163 regnames_count = ARRAY_SIZE (regnames_64);
7164 }
7165 else
7166 {
7167 regnames = regnames_32;
7168 regnames_count = ARRAY_SIZE (regnames_32);
7169 }
7170
7171 for (regnum = 0; regnum < regnames_count; regnum++)
7172 if (regnames[regnum] != NULL
7173 && strcmp (regname, regnames[regnum]) == 0)
7174 return regnum;
7175
7176 return -1;
7177 }
7178
7179 void
7180 tc_x86_frame_initial_instructions (void)
7181 {
7182 static unsigned int sp_regno;
7183
7184 if (!sp_regno)
7185 sp_regno = tc_x86_regname_to_dw2regnum (flag_code == CODE_64BIT
7186 ? "rsp" : "esp");
7187
7188 cfi_add_CFA_def_cfa (sp_regno, -x86_cie_data_alignment);
7189 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
7190 }
7191
7192 int
7193 i386_elf_section_type (const char *str, size_t len)
7194 {
7195 if (flag_code == CODE_64BIT
7196 && len == sizeof ("unwind") - 1
7197 && strncmp (str, "unwind", 6) == 0)
7198 return SHT_X86_64_UNWIND;
7199
7200 return -1;
7201 }
7202
7203 #ifdef TE_PE
7204 void
7205 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
7206 {
7207 expressionS expr;
7208
7209 expr.X_op = O_secrel;
7210 expr.X_add_symbol = symbol;
7211 expr.X_add_number = 0;
7212 emit_expr (&expr, size);
7213 }
7214 #endif
7215
7216 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7217 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
7218
7219 int
7220 x86_64_section_letter (int letter, char **ptr_msg)
7221 {
7222 if (flag_code == CODE_64BIT)
7223 {
7224 if (letter == 'l')
7225 return SHF_X86_64_LARGE;
7226
7227 *ptr_msg = _("Bad .section directive: want a,l,w,x,M,S,G,T in string");
7228 }
7229 else
7230 *ptr_msg = _("Bad .section directive: want a,w,x,M,S,G,T in string");
7231 return -1;
7232 }
7233
7234 int
7235 x86_64_section_word (char *str, size_t len)
7236 {
7237 if (len == 5 && flag_code == CODE_64BIT && strncmp (str, "large", 5) == 0)
7238 return SHF_X86_64_LARGE;
7239
7240 return -1;
7241 }
7242
7243 static void
7244 handle_large_common (int small ATTRIBUTE_UNUSED)
7245 {
7246 if (flag_code != CODE_64BIT)
7247 {
7248 s_comm_internal (0, elf_common_parse);
7249 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
7250 }
7251 else
7252 {
7253 static segT lbss_section;
7254 asection *saved_com_section_ptr = elf_com_section_ptr;
7255 asection *saved_bss_section = bss_section;
7256
7257 if (lbss_section == NULL)
7258 {
7259 flagword applicable;
7260 segT seg = now_seg;
7261 subsegT subseg = now_subseg;
7262
7263 /* The .lbss section is for local .largecomm symbols. */
7264 lbss_section = subseg_new (".lbss", 0);
7265 applicable = bfd_applicable_section_flags (stdoutput);
7266 bfd_set_section_flags (stdoutput, lbss_section,
7267 applicable & SEC_ALLOC);
7268 seg_info (lbss_section)->bss = 1;
7269
7270 subseg_set (seg, subseg);
7271 }
7272
7273 elf_com_section_ptr = &_bfd_elf_large_com_section;
7274 bss_section = lbss_section;
7275
7276 s_comm_internal (0, elf_common_parse);
7277
7278 elf_com_section_ptr = saved_com_section_ptr;
7279 bss_section = saved_bss_section;
7280 }
7281 }
7282 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */
This page took 0.31533 seconds and 4 git commands to generate.