1 /* tc-i386.h -- Header file for tc-i386.c
2    Copyright 1989, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999, 2000,
3    2001, 2002, 2003, 2004
4    Free Software Foundation, Inc.
5 
6    This file is part of GAS, the GNU Assembler.
7 
8    GAS is free software; you can redistribute it and/or modify
9    it under the terms of the GNU General Public License as published by
10    the Free Software Foundation; either version 2, or (at your option)
11    any later version.
12 
13    GAS is distributed in the hope that it will be useful,
14    but WITHOUT ANY WARRANTY; without even the implied warranty of
15    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16    GNU General Public License for more details.
17 
18    You should have received a copy of the GNU General Public License
19    along with GAS; see the file COPYING.  If not, write to the Free
20    Software Foundation, 59 Temple Place - Suite 330, Boston, MA
21    02111-1307, USA.  */
22 
23 #ifndef TC_I386
24 #define TC_I386 1
25 
26 #ifndef BFD_ASSEMBLER
27 #error So, do you know what you are doing?
28 #endif
29 
30 #ifdef ANSI_PROTOTYPES
31 struct fix;
32 #endif
33 
34 #define TARGET_BYTES_BIG_ENDIAN	0
35 
36 #ifdef TE_LYNX
37 #define TARGET_FORMAT		"coff-i386-lynx"
38 #endif
39 
40 #define TARGET_ARCH		bfd_arch_i386
41 #define TARGET_MACH		(i386_mach ())
42 extern unsigned long i386_mach PARAMS ((void));
43 
44 #ifdef TE_FreeBSD
45 #define AOUT_TARGET_FORMAT	"a.out-i386-freebsd"
46 #endif
47 #if defined(TE_NetBSD) || defined(TE_OpenBSD)
48 #define AOUT_TARGET_FORMAT	"a.out-i386-netbsd"
49 #endif
50 #ifdef TE_386BSD
51 #define AOUT_TARGET_FORMAT	"a.out-i386-bsd"
52 #endif
53 #ifdef TE_LINUX
54 #define AOUT_TARGET_FORMAT	"a.out-i386-linux"
55 #endif
56 #ifdef TE_Mach
57 #define AOUT_TARGET_FORMAT	"a.out-mach3"
58 #endif
59 #ifdef TE_DYNIX
60 #define AOUT_TARGET_FORMAT	"a.out-i386-dynix"
61 #endif
62 #ifndef AOUT_TARGET_FORMAT
63 #define AOUT_TARGET_FORMAT	"a.out-i386"
64 #endif
65 
66 #ifdef TE_FreeBSD
67 #define ELF_TARGET_FORMAT	"elf32-i386-freebsd"
68 #endif
69 #ifndef ELF_TARGET_FORMAT
70 #define ELF_TARGET_FORMAT	"elf32-i386"
71 #endif
72 
73 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
74      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
75 extern const char *i386_target_format PARAMS ((void));
76 #define TARGET_FORMAT i386_target_format ()
77 #else
78 #ifdef OBJ_ELF
79 #define TARGET_FORMAT		ELF_TARGET_FORMAT
80 #endif
81 #ifdef OBJ_AOUT
82 #define TARGET_FORMAT		AOUT_TARGET_FORMAT
83 #endif
84 #endif
85 
86 #if (defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF))
87 #define md_end i386_elf_emit_arch_note
88 extern void i386_elf_emit_arch_note PARAMS ((void));
89 #endif
90 
91 #define SUB_SEGMENT_ALIGN(SEG, FRCHAIN) 0
92 
93 #define LOCAL_LABELS_FB 1
94 
95 extern const char extra_symbol_chars[];
96 #define tc_symbol_chars extra_symbol_chars
97 
98 #define MAX_OPERANDS 3		/* max operands per insn */
99 #define MAX_IMMEDIATE_OPERANDS 2/* max immediates per insn (lcall, ljmp) */
100 #define MAX_MEMORY_OPERANDS 2	/* max memory refs per insn (string ops) */
101 
102 /* Prefixes will be emitted in the order defined below.
103    WAIT_PREFIX must be the first prefix since FWAIT is really is an
104    instruction, and so must come before any prefixes.  */
105 #define WAIT_PREFIX	0
106 #define LOCKREP_PREFIX	1
107 #define ADDR_PREFIX	2
108 #define DATA_PREFIX	3
109 #define SEG_PREFIX	4
110 #define REX_PREFIX	5       /* must come last.  */
111 #define MAX_PREFIXES	6	/* max prefixes per opcode */
112 
113 /* we define the syntax here (modulo base,index,scale syntax) */
114 #define REGISTER_PREFIX '%'
115 #define IMMEDIATE_PREFIX '$'
116 #define ABSOLUTE_PREFIX '*'
117 
118 #define TWO_BYTE_OPCODE_ESCAPE 0x0f
119 #define NOP_OPCODE (char) 0x90
120 
121 /* register numbers */
122 #define EBP_REG_NUM 5
123 #define ESP_REG_NUM 4
124 
125 /* modrm_byte.regmem for twobyte escape */
126 #define ESCAPE_TO_TWO_BYTE_ADDRESSING ESP_REG_NUM
127 /* index_base_byte.index for no index register addressing */
128 #define NO_INDEX_REGISTER ESP_REG_NUM
129 /* index_base_byte.base for no base register addressing */
130 #define NO_BASE_REGISTER EBP_REG_NUM
131 #define NO_BASE_REGISTER_16 6
132 
133 /* these are the instruction mnemonic suffixes.  */
134 #define WORD_MNEM_SUFFIX  'w'
135 #define BYTE_MNEM_SUFFIX  'b'
136 #define SHORT_MNEM_SUFFIX 's'
137 #define LONG_MNEM_SUFFIX  'l'
138 #define QWORD_MNEM_SUFFIX  'q'
139 /* Intel Syntax */
140 #define LONG_DOUBLE_MNEM_SUFFIX 'x'
141 
142 /* modrm.mode = REGMEM_FIELD_HAS_REG when a register is in there */
143 #define REGMEM_FIELD_HAS_REG 0x3/* always = 0x3 */
144 #define REGMEM_FIELD_HAS_MEM (~REGMEM_FIELD_HAS_REG)
145 
146 #define END_OF_INSN '\0'
147 
148 /* Intel Syntax */
149 /* Values 0-4 map onto scale factor */
150 #define BYTE_PTR     0
151 #define WORD_PTR     1
152 #define DWORD_PTR    2
153 #define QWORD_PTR    3
154 #define XWORD_PTR    4
155 #define SHORT        5
156 #define OFFSET_FLAT  6
157 #define FLAT         7
158 #define NONE_FOUND   8
159 
160 typedef struct
161 {
162   /* instruction name sans width suffix ("mov" for movl insns) */
163   char *name;
164 
165   /* how many operands */
166   unsigned int operands;
167 
168   /* base_opcode is the fundamental opcode byte without optional
169      prefix(es).  */
170   unsigned int base_opcode;
171 
172   /* extension_opcode is the 3 bit extension for group <n> insns.
173      This field is also used to store the 8-bit opcode suffix for the
174      AMD 3DNow! instructions.
175      If this template has no extension opcode (the usual case) use None */
176   unsigned int extension_opcode;
177 #define None 0xffff		/* If no extension_opcode is possible.  */
178 
179   /* cpu feature flags */
180   unsigned int cpu_flags;
181 #define Cpu086		  0x1	/* Any old cpu will do, 0 does the same */
182 #define Cpu186		  0x2	/* i186 or better required */
183 #define Cpu286		  0x4	/* i286 or better required */
184 #define Cpu386		  0x8	/* i386 or better required */
185 #define Cpu486		 0x10	/* i486 or better required */
186 #define Cpu586		 0x20	/* i585 or better required */
187 #define Cpu686		 0x40	/* i686 or better required */
188 #define CpuP4		 0x80	/* Pentium4 or better required */
189 #define CpuK6		0x100	/* AMD K6 or better required*/
190 #define CpuAthlon	0x200	/* AMD Athlon or better required*/
191 #define CpuSledgehammer 0x400	/* Sledgehammer or better required */
192 #define CpuMMX		0x800	/* MMX support required */
193 #define CpuSSE	       0x1000	/* Streaming SIMD extensions required */
194 #define CpuSSE2	       0x2000	/* Streaming SIMD extensions 2 required */
195 #define Cpu3dnow       0x4000	/* 3dnow! support required */
196 #define CpuPNI	       0x8000	/* Prescott New Instructions required */
197 #define CpuPadLock    0x10000	/* VIA PadLock required */
198 #define CpuSSSE3      0x20000	/* Supplementary SSE3 required */
199 #define CpuXSAVE      0x40000	/* XSAVE extensions required */
200 #define CpuAES        0x80000	/* Intel AES extensions required */
201 #define CpuPCLMUL    0x100000	/* Intel Carry-less Multiplication extensions */
202 #define CpuRdRnd     0x200000	/* Intel Random Number Generator extensions */
203 #define CpuSMAP      0x400000	/* Intel Supervisor Mode Access Prevention */
204 #define CpuVMX       0x800000	/* VMX Virtualization instructions required */
205 #define CpuSVME	    0x1000000	/* SVM Virtualization instructions required */
206 
207   /* These flags are set by gas depending on the flag_code.  */
208 #define Cpu64	     0x4000000   /* 64bit support required  */
209 #define CpuNo64      0x8000000   /* Not supported in the 64bit mode  */
210 
211   /* The default value for unknown CPUs - enable all features to avoid problems.  */
212 #define CpuUnknownFlags (Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuSledgehammer|CpuMMX|CpuSSE|CpuSSE2|CpuPNI|Cpu3dnow|CpuK6|CpuAthlon|CpuPadLock|CpuSSSE3|CpuXSAVE|CpuAES|CpuPCLMUL|CpuRdRnd|CpuSMAP|CpuVMX|CpuSVME)
213 
214   /* the bits in opcode_modifier are used to generate the final opcode from
215      the base_opcode.  These bits also are used to detect alternate forms of
216      the same instruction */
217   unsigned int opcode_modifier;
218 
219   /* opcode_modifier bits: */
220 #define W		   0x1	/* set if operands can be words or dwords
221 				   encoded the canonical way */
222 #define D		   0x2	/* D = 0 if Reg --> Regmem;
223 				   D = 1 if Regmem --> Reg:    MUST BE 0x2 */
224 #define Modrm		   0x4
225 #define FloatR		   0x8	/* src/dest swap for floats:   MUST BE 0x8 */
226 #define ShortForm	  0x10	/* register is in low 3 bits of opcode */
227 #define FloatMF		  0x20	/* FP insn memory format bit, sized by 0x4 */
228 #define Jump		  0x40	/* special case for jump insns.  */
229 #define JumpDword	  0x80  /* call and jump */
230 #define JumpByte	 0x100  /* loop and jecxz */
231 #define JumpInterSegment 0x200	/* special case for intersegment leaps/calls */
232 #define FloatD		 0x400	/* direction for float insns:  MUST BE 0x400 */
233 #define Seg2ShortForm	 0x800	/* encoding of load segment reg insns */
234 #define Seg3ShortForm	0x1000	/* fs/gs segment register insns.  */
235 #define Size16		0x2000	/* needs size prefix if in 32-bit mode */
236 #define Size32		0x4000	/* needs size prefix if in 16-bit mode */
237 #define Size64		0x8000	/* needs size prefix if in 16-bit mode */
238 #define IgnoreSize     0x10000  /* instruction ignores operand size prefix */
239 #define DefaultSize    0x20000  /* default insn size depends on mode */
240 #define No_bSuf	       0x40000	/* b suffix on instruction illegal */
241 #define No_wSuf	       0x80000	/* w suffix on instruction illegal */
242 #define No_lSuf	      0x100000 	/* l suffix on instruction illegal */
243 #define No_sSuf	      0x200000	/* s suffix on instruction illegal */
244 #define No_qSuf       0x400000  /* q suffix on instruction illegal */
245 #define No_xSuf       0x800000  /* x suffix on instruction illegal */
246 #define FWait	     0x1000000	/* instruction needs FWAIT */
247 #define IsString     0x2000000	/* quick test for string instructions */
248 #define regKludge    0x4000000	/* fake an extra reg operand for clr, imul */
249 #define IsPrefix     0x8000000	/* opcode is a prefix */
250 #define ImmExt	    0x10000000	/* instruction has extension in 8 bit imm */
251 #define NoRex64	    0x20000000  /* instruction don't need Rex64 prefix.  */
252 #define Rex64	    0x40000000  /* instruction require Rex64 prefix.  */
253 #define Ugh	    0x80000000	/* deprecated fp insn, gets a warning */
254 
255   /* operand_types[i] describes the type of operand i.  This is made
256      by OR'ing together all of the possible type masks.  (e.g.
257      'operand_types[i] = Reg|Imm' specifies that operand i can be
258      either a register or an immediate operand.  */
259   unsigned int operand_types[3];
260 
261   /* operand_types[i] bits */
262   /* register */
263 #define Reg8		   0x1	/* 8 bit reg */
264 #define Reg16		   0x2	/* 16 bit reg */
265 #define Reg32		   0x4	/* 32 bit reg */
266 #define Reg64		   0x8	/* 64 bit reg */
267   /* immediate */
268 #define Imm8		  0x10	/* 8 bit immediate */
269 #define Imm8S		  0x20	/* 8 bit immediate sign extended */
270 #define Imm16		  0x40	/* 16 bit immediate */
271 #define Imm32		  0x80	/* 32 bit immediate */
272 #define Imm32S		 0x100	/* 32 bit immediate sign extended */
273 #define Imm64		 0x200	/* 64 bit immediate */
274 #define Imm1		 0x400	/* 1 bit immediate */
275   /* memory */
276 #define BaseIndex	 0x800
277   /* Disp8,16,32 are used in different ways, depending on the
278      instruction.  For jumps, they specify the size of the PC relative
279      displacement, for baseindex type instructions, they specify the
280      size of the offset relative to the base register, and for memory
281      offset instructions such as `mov 1234,%al' they specify the size of
282      the offset relative to the segment base.  */
283 #define Disp8		0x1000	/* 8 bit displacement */
284 #define Disp16		0x2000	/* 16 bit displacement */
285 #define Disp32		0x4000	/* 32 bit displacement */
286 #define Disp32S	        0x8000	/* 32 bit signed displacement */
287 #define Disp64	       0x10000	/* 64 bit displacement */
288   /* specials */
289 #define InOutPortReg   0x20000	/* register to hold in/out port addr = dx */
290 #define ShiftCount     0x40000	/* register to hold shift cound = cl */
291 #define Control	       0x80000	/* Control register */
292 #define Debug	      0x100000	/* Debug register */
293 #define Test	      0x200000	/* Test register */
294 #define FloatReg      0x400000	/* Float register */
295 #define FloatAcc      0x800000	/* Float stack top %st(0) */
296 #define SReg2	     0x1000000	/* 2 bit segment register */
297 #define SReg3	     0x2000000	/* 3 bit segment register */
298 #define Acc	     0x4000000	/* Accumulator %al or %ax or %eax */
299 #define JumpAbsolute 0x8000000
300 #define RegMMX	    0x10000000	/* MMX register */
301 #define RegXMM	    0x20000000	/* XMM registers in PIII */
302 #define EsSeg	    0x40000000	/* String insn operand with fixed es segment */
303 
304   /* InvMem is for instructions with a modrm byte that only allow a
305      general register encoding in the i.tm.mode and i.tm.regmem fields,
306      eg. control reg moves.  They really ought to support a memory form,
307      but don't, so we add an InvMem flag to the register operand to
308      indicate that it should be encoded in the i.tm.regmem field.  */
309 #define InvMem	    0x80000000
310 
311 #define Reg	(Reg8|Reg16|Reg32|Reg64) /* gen'l register */
312 #define WordReg (Reg16|Reg32|Reg64)
313 #define ImplicitRegister (InOutPortReg|ShiftCount|Acc|FloatAcc)
314 #define Imm	(Imm8|Imm8S|Imm16|Imm32S|Imm32|Imm64) /* gen'l immediate */
315 #define EncImm	(Imm8|Imm16|Imm32|Imm32S) /* Encodable gen'l immediate */
316 #define Disp	(Disp8|Disp16|Disp32|Disp32S|Disp64) /* General displacement */
317 #define AnyMem	(Disp8|Disp16|Disp32|Disp32S|BaseIndex|InvMem)	/* General memory */
318   /* The following aliases are defined because the opcode table
319      carefully specifies the allowed memory types for each instruction.
320      At the moment we can only tell a memory reference size by the
321      instruction suffix, so there's not much point in defining Mem8,
322      Mem16, Mem32 and Mem64 opcode modifiers - We might as well just use
323      the suffix directly to check memory operands.  */
324 #define LLongMem AnyMem		/* 64 bits (or more) */
325 #define LongMem AnyMem		/* 32 bit memory ref */
326 #define ShortMem AnyMem		/* 16 bit memory ref */
327 #define WordMem AnyMem		/* 16 or 32 bit memory ref */
328 #define ByteMem AnyMem		/* 8 bit memory ref */
329 }
330 template;
331 
332 /*
333   'templates' is for grouping together 'template' structures for opcodes
334   of the same name.  This is only used for storing the insns in the grand
335   ole hash table of insns.
336   The templates themselves start at START and range up to (but not including)
337   END.
338   */
339 typedef struct
340 {
341   const template *start;
342   const template *end;
343 }
344 templates;
345 
346 /* these are for register name --> number & type hash lookup */
347 typedef struct
348 {
349   char *reg_name;
350   unsigned int reg_type;
351   unsigned int reg_flags;
352 #define RegRex	    0x1  /* Extended register.  */
353 #define RegRex64    0x2  /* Extended 8 bit register.  */
354   unsigned int reg_num;
355 }
356 reg_entry;
357 
358 typedef struct
359 {
360   char *seg_name;
361   unsigned int seg_prefix;
362 }
363 seg_entry;
364 
365 /* 386 operand encoding bytes:  see 386 book for details of this.  */
366 typedef struct
367 {
368   unsigned int regmem;	/* codes register or memory operand */
369   unsigned int reg;	/* codes register operand (or extended opcode) */
370   unsigned int mode;	/* how to interpret regmem & reg */
371 }
372 modrm_byte;
373 
374 /* x86-64 extension prefix.  */
375 typedef int rex_byte;
376 #define REX_OPCODE	0x40
377 
378 /* Indicates 64 bit operand size.  */
379 #define REX_MODE64	8
380 /* High extension to reg field of modrm byte.  */
381 #define REX_EXTX	4
382 /* High extension to SIB index field.  */
383 #define REX_EXTY	2
384 /* High extension to base field of modrm or SIB, or reg field of opcode.  */
385 #define REX_EXTZ	1
386 
387 /* 386 opcode byte to code indirect addressing.  */
388 typedef struct
389 {
390   unsigned base;
391   unsigned index;
392   unsigned scale;
393 }
394 sib_byte;
395 
396 /* x86 arch names and features */
397 typedef struct
398 {
399   const char *name;	/* arch name */
400   unsigned int flags;	/* cpu feature flags */
401 }
402 arch_entry;
403 
404 /* The name of the global offset table generated by the compiler. Allow
405    this to be overridden if need be.  */
406 #ifndef GLOBAL_OFFSET_TABLE_NAME
407 #ifdef OBJ_ELF
408 #define GLOBAL_OFFSET_TABLE_NAME "_GLOBAL_OFFSET_TABLE_"
409 #else
410 #define GLOBAL_OFFSET_TABLE_NAME "__GLOBAL_OFFSET_TABLE_"
411 #endif
412 #endif
413 
414 #ifndef LEX_AT
415 #define TC_PARSE_CONS_EXPRESSION(EXP, NBYTES) x86_cons (EXP, NBYTES)
416 extern void x86_cons PARAMS ((expressionS *, int));
417 
418 #define TC_CONS_FIX_NEW(FRAG,OFF,LEN,EXP) x86_cons_fix_new(FRAG, OFF, LEN, EXP)
419 extern void x86_cons_fix_new
420   PARAMS ((fragS *, unsigned int, unsigned int, expressionS *));
421 #endif
422 
423 #define DIFF_EXPR_OK    /* foo-. gets turned into PC relative relocs */
424 
425 #define NO_RELOC BFD_RELOC_NONE
426 
427 void i386_validate_fix PARAMS ((struct fix *));
428 #define TC_VALIDATE_FIX(FIX,SEGTYPE,SKIP) i386_validate_fix(FIX)
429 
430 #define tc_fix_adjustable(X)  tc_i386_fix_adjustable(X)
431 extern int tc_i386_fix_adjustable PARAMS ((struct fix *));
432 
433 /* Values passed to md_apply_fix3 don't include the symbol value.  */
434 #define MD_APPLY_SYM_VALUE(FIX) 0
435 
436 /* ELF wants external syms kept, as does PE COFF.  */
437 #if defined (TE_PE) && defined (STRICT_PE_FORMAT)
438 #define EXTERN_FORCE_RELOC				\
439   (OUTPUT_FLAVOR == bfd_target_elf_flavour		\
440    || OUTPUT_FLAVOR == bfd_target_coff_flavour)
441 #else
442 #define EXTERN_FORCE_RELOC				\
443   (OUTPUT_FLAVOR == bfd_target_elf_flavour)
444 #endif
445 
446 /* This expression evaluates to true if the relocation is for a local
447    object for which we still want to do the relocation at runtime.
448    False if we are willing to perform this relocation while building
449    the .o file.  GOTOFF does not need to be checked here because it is
450    not pcrel.  I am not sure if some of the others are ever used with
451    pcrel, but it is easier to be safe than sorry.  */
452 
453 #define TC_FORCE_RELOCATION_LOCAL(FIX)			\
454   (!(FIX)->fx_pcrel					\
455    || (FIX)->fx_plt					\
456    || (FIX)->fx_r_type == BFD_RELOC_386_PLT32		\
457    || (FIX)->fx_r_type == BFD_RELOC_386_GOT32		\
458    || (FIX)->fx_r_type == BFD_RELOC_386_GOTPC		\
459    || (FIX)->fx_r_type == BFD_RELOC_X86_64_GOTPCREL	\
460    || TC_FORCE_RELOCATION (FIX))
461 
462 #define md_operand(x)
463 
464 extern const struct relax_type md_relax_table[];
465 #define TC_GENERIC_RELAX_TABLE md_relax_table
466 
467 extern int optimize_align_code;
468 
469 #define md_do_align(n, fill, len, max, around)				\
470 if ((n)									\
471     && !need_pass_2							\
472     && optimize_align_code						\
473     && (!(fill)								\
474 	|| ((char)*(fill) == (char)0x90 && (len) == 1))			\
475     && subseg_text_p (now_seg))						\
476   {									\
477     frag_align_code ((n), (max));					\
478     goto around;							\
479   }
480 
481 #define MAX_MEM_FOR_RS_ALIGN_CODE  15
482 
483 extern void i386_align_code PARAMS ((fragS *, int));
484 
485 #define HANDLE_ALIGN(fragP)						\
486 if (fragP->fr_type == rs_align_code) 					\
487   i386_align_code (fragP, (fragP->fr_next->fr_address			\
488 			   - fragP->fr_address				\
489 			   - fragP->fr_fix));
490 
491 void i386_print_statistics PARAMS ((FILE *));
492 #define tc_print_statistics i386_print_statistics
493 
494 #define md_number_to_chars number_to_chars_littleendian
495 
496 #ifdef SCO_ELF
497 #define tc_init_after_args() sco_id ()
498 extern void sco_id PARAMS ((void));
499 #endif
500 
501 /* We want .cfi_* pseudo-ops for generating unwind info.  */
502 #define TARGET_USE_CFIPOP 1
503 
504 extern unsigned int x86_dwarf2_return_column;
505 #define DWARF2_DEFAULT_RETURN_COLUMN x86_dwarf2_return_column
506 
507 extern int x86_cie_data_alignment;
508 #define DWARF2_CIE_DATA_ALIGNMENT x86_cie_data_alignment
509 
510 #define tc_regname_to_dw2regnum tc_x86_regname_to_dw2regnum
511 extern int tc_x86_regname_to_dw2regnum PARAMS ((const char *regname));
512 
513 #define tc_cfi_frame_initial_instructions tc_x86_frame_initial_instructions
514 extern void tc_x86_frame_initial_instructions PARAMS ((void));
515 
516 #endif /* TC_I386 */
517