1
2#ifndef _X86SSE_H_
3#define _X86SSE_H_
4
5#if defined(__i386__) || defined(__386__)
6
7/* It is up to the caller to ensure that instructions issued are
8 * suitable for the host cpu.  There are no checks made in this module
9 * for mmx/sse/sse2 support on the cpu.
10 */
11struct x86_reg {
12   unsigned file:3;
13   unsigned idx:3;
14   unsigned mod:2;		/* mod_REG if this is just a register */
15   int      disp:24;		/* only +/- 23bits of offset - should be enough... */
16};
17
18struct x86_function {
19   unsigned size;
20   unsigned char *store;
21   unsigned char *csr;
22   unsigned stack_offset;
23   int need_emms;
24   const char *fn;
25};
26
27enum x86_reg_file {
28   file_REG32,
29   file_MMX,
30   file_XMM,
31   file_x87
32};
33
34/* Values for mod field of modr/m byte
35 */
36enum x86_reg_mod {
37   mod_INDIRECT,
38   mod_DISP8,
39   mod_DISP32,
40   mod_REG
41};
42
43enum x86_reg_name {
44   reg_AX,
45   reg_CX,
46   reg_DX,
47   reg_BX,
48   reg_SP,
49   reg_BP,
50   reg_SI,
51   reg_DI
52};
53
54
55enum x86_cc {
56   cc_O,			/* overflow */
57   cc_NO,			/* not overflow */
58   cc_NAE,			/* not above or equal / carry */
59   cc_AE,			/* above or equal / not carry */
60   cc_E,			/* equal / zero */
61   cc_NE			/* not equal / not zero */
62};
63
64enum sse_cc {
65   cc_Equal,
66   cc_LessThan,
67   cc_LessThanEqual,
68   cc_Unordered,
69   cc_NotEqual,
70   cc_NotLessThan,
71   cc_NotLessThanEqual,
72   cc_Ordered
73};
74
75#define cc_Z  cc_E
76#define cc_NZ cc_NE
77
78/* Begin/end/retreive function creation:
79 */
80
81
82void x86_init_func( struct x86_function *p );
83int x86_init_func_size( struct x86_function *p, unsigned code_size );
84void x86_release_func( struct x86_function *p );
85void (*x86_get_func( struct x86_function *p ))( void );
86
87
88
89/* Create and manipulate registers and regmem values:
90 */
91struct x86_reg x86_make_reg( enum x86_reg_file file,
92			     enum x86_reg_name idx );
93
94struct x86_reg x86_make_disp( struct x86_reg reg,
95			      int disp );
96
97struct x86_reg x86_deref( struct x86_reg reg );
98
99struct x86_reg x86_get_base_reg( struct x86_reg reg );
100
101
102/* Labels, jumps and fixup:
103 */
104unsigned char *x86_get_label( struct x86_function *p );
105
106void x86_jcc( struct x86_function *p,
107	      enum x86_cc cc,
108	      unsigned char *label );
109
110unsigned char *x86_jcc_forward( struct x86_function *p,
111			  enum x86_cc cc );
112
113unsigned char *x86_jmp_forward( struct x86_function *p);
114
115unsigned char *x86_call_forward( struct x86_function *p);
116
117void x86_fixup_fwd_jump( struct x86_function *p,
118			 unsigned char *fixup );
119
120void x86_jmp( struct x86_function *p, unsigned char *label );
121
122/* void x86_call( struct x86_function *p, void (*label)() ); */
123void x86_call( struct x86_function *p, struct x86_reg reg);
124
125/* michal:
126 * Temporary. As I need immediate operands, and dont want to mess with the codegen,
127 * I load the immediate into general purpose register and use it.
128 */
129void x86_mov_reg_imm( struct x86_function *p, struct x86_reg dst, int imm );
130
131
132/* Macro for sse_shufps() and sse2_pshufd():
133 */
134#define SHUF(_x,_y,_z,_w)       (((_x)<<0) | ((_y)<<2) | ((_z)<<4) | ((_w)<<6))
135#define SHUF_NOOP               RSW(0,1,2,3)
136#define GET_SHUF(swz, idx)      (((swz) >> ((idx)*2)) & 0x3)
137
138void mmx_emms( struct x86_function *p );
139void mmx_movd( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
140void mmx_movq( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
141void mmx_packssdw( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
142void mmx_packuswb( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
143
144void sse2_cvtps2dq( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
145void sse2_cvttps2dq( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
146void sse2_movd( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
147void sse2_packssdw( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
148void sse2_packsswb( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
149void sse2_packuswb( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
150void sse2_pshufd( struct x86_function *p, struct x86_reg dest, struct x86_reg arg0,
151                  unsigned char shuf );
152void sse2_rcpps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
153void sse2_rcpss( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
154
155void sse_addps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
156void sse_addss( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
157void sse_cvtps2pi( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
158void sse_divss( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
159void sse_andnps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
160void sse_andps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
161void sse_cmpps( struct x86_function *p, struct x86_reg dst, struct x86_reg src,
162                unsigned char cc );
163void sse_maxps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
164void sse_maxss( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
165void sse_minps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
166void sse_movaps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
167void sse_movhlps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
168void sse_movhps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
169void sse_movlhps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
170void sse_movlps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
171void sse_movss( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
172void sse_movups( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
173void sse_mulps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
174void sse_mulss( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
175void sse_orps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
176void sse_xorps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
177void sse_subps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
178void sse_rsqrtps( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
179void sse_rsqrtss( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
180void sse_shufps( struct x86_function *p, struct x86_reg dest, struct x86_reg arg0,
181                 unsigned char shuf );
182void sse_pmovmskb( struct x86_function *p, struct x86_reg dest, struct x86_reg src );
183
184void x86_add( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
185void x86_and( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
186void x86_cmp( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
187void x86_dec( struct x86_function *p, struct x86_reg reg );
188void x86_inc( struct x86_function *p, struct x86_reg reg );
189void x86_lea( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
190void x86_mov( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
191void x86_mul( struct x86_function *p, struct x86_reg src );
192void x86_or( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
193void x86_pop( struct x86_function *p, struct x86_reg reg );
194void x86_push( struct x86_function *p, struct x86_reg reg );
195void x86_ret( struct x86_function *p );
196void x86_sub( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
197void x86_test( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
198void x86_xor( struct x86_function *p, struct x86_reg dst, struct x86_reg src );
199void x86_sahf( struct x86_function *p );
200
201void x87_f2xm1( struct x86_function *p );
202void x87_fabs( struct x86_function *p );
203void x87_fadd( struct x86_function *p, struct x86_reg dst, struct x86_reg arg );
204void x87_faddp( struct x86_function *p, struct x86_reg dst );
205void x87_fchs( struct x86_function *p );
206void x87_fclex( struct x86_function *p );
207void x87_fcom( struct x86_function *p, struct x86_reg dst );
208void x87_fcomp( struct x86_function *p, struct x86_reg dst );
209void x87_fcos( struct x86_function *p );
210void x87_fdiv( struct x86_function *p, struct x86_reg dst, struct x86_reg arg );
211void x87_fdivp( struct x86_function *p, struct x86_reg dst );
212void x87_fdivr( struct x86_function *p, struct x86_reg dst, struct x86_reg arg );
213void x87_fdivrp( struct x86_function *p, struct x86_reg dst );
214void x87_fild( struct x86_function *p, struct x86_reg arg );
215void x87_fist( struct x86_function *p, struct x86_reg dst );
216void x87_fistp( struct x86_function *p, struct x86_reg dst );
217void x87_fld( struct x86_function *p, struct x86_reg arg );
218void x87_fld1( struct x86_function *p );
219void x87_fldcw( struct x86_function *p, struct x86_reg arg );
220void x87_fldl2e( struct x86_function *p );
221void x87_fldln2( struct x86_function *p );
222void x87_fldz( struct x86_function *p );
223void x87_fmul( struct x86_function *p, struct x86_reg dst, struct x86_reg arg );
224void x87_fmulp( struct x86_function *p, struct x86_reg dst );
225void x87_fnclex( struct x86_function *p );
226void x87_fprndint( struct x86_function *p );
227void x87_fscale( struct x86_function *p );
228void x87_fsin( struct x86_function *p );
229void x87_fsincos( struct x86_function *p );
230void x87_fsqrt( struct x86_function *p );
231void x87_fst( struct x86_function *p, struct x86_reg dst );
232void x87_fstp( struct x86_function *p, struct x86_reg dst );
233void x87_fsub( struct x86_function *p, struct x86_reg dst, struct x86_reg arg );
234void x87_fsubp( struct x86_function *p, struct x86_reg dst );
235void x87_fsubr( struct x86_function *p, struct x86_reg dst, struct x86_reg arg );
236void x87_fsubrp( struct x86_function *p, struct x86_reg dst );
237void x87_fxch( struct x86_function *p, struct x86_reg dst );
238void x87_fxtract( struct x86_function *p );
239void x87_fyl2x( struct x86_function *p );
240void x87_fyl2xp1( struct x86_function *p );
241void x87_fwait( struct x86_function *p );
242void x87_fnstsw( struct x86_function *p, struct x86_reg dst );
243void x87_fucompp( struct x86_function *p );
244void x87_fucomp( struct x86_function *p, struct x86_reg arg );
245void x87_fucom( struct x86_function *p, struct x86_reg arg );
246
247
248
249/* Retreive a reference to one of the function arguments, taking into
250 * account any push/pop activity.  Note - doesn't track explict
251 * manipulation of ESP by other instructions.
252 */
253struct x86_reg x86_fn_arg( struct x86_function *p, unsigned arg );
254
255#endif
256#endif
257