 * Copyright (c) 2003 Fabrice Bellard
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */
#include "qemu/host-utils.h"
#include "disas/disas.h"
#define PREFIX_REPZ   0x01
#define PREFIX_REPNZ  0x02
#define PREFIX_LOCK   0x04
#define PREFIX_DATA   0x08
#define PREFIX_ADR    0x10
#define PREFIX_VEX    0x20

#define CODE64(s) ((s)->code64)
#define REX_X(s) ((s)->rex_x)
#define REX_B(s) ((s)->rex_b)

//#define MACRO_TEST   1
/* global register indexes */
static TCGv_ptr cpu_env;
static TCGv cpu_cc_dst, cpu_cc_src, cpu_cc_src2, cpu_cc_srcT;
static TCGv_i32 cpu_cc_op;
static TCGv cpu_regs[CPU_NB_REGS];

/* local register indexes (only used inside old micro ops) */
static TCGv cpu_tmp0, cpu_tmp4;
static TCGv_ptr cpu_ptr0, cpu_ptr1;
static TCGv_i32 cpu_tmp2_i32, cpu_tmp3_i32;
static TCGv_i64 cpu_tmp1_i64;

static uint8_t gen_opc_cc_op[OPC_BUF_SIZE];

#include "exec/gen-icount.h"

static int x86_64_hregs;
typedef struct DisasContext {
    /* current insn context */
    int override; /* -1 if no override */
    target_ulong pc; /* pc = eip + cs_base */
    int is_jmp; /* 1 means jump (stop translation), 2 means CPU
                   static state change (stop translation) */
    /* current block context */
    target_ulong cs_base; /* base of CS segment */
    int pe;     /* protected mode */
    int code32; /* 32 bit code segment */
    int lma;    /* long mode active */
    int code64; /* 64 bit code segment */
    int vex_l;  /* vex vector length */
    int vex_v;  /* vex vvvv register, without 1's complement. */
    int ss32;   /* 32 bit stack segment */
    CCOp cc_op; /* current CC operation */
    int addseg; /* non zero if either DS/ES/SS have a non zero base */
    int f_st;   /* currently unused */
    int vm86;   /* vm86 mode */
    int tf;     /* TF cpu flag */
    int singlestep_enabled; /* "hardware" single step enabled */
    int jmp_opt; /* use direct block chaining for direct jumps */
    int mem_index; /* select memory access functions */
    uint64_t flags; /* all execution flags */
    struct TranslationBlock *tb;
    int popl_esp_hack; /* for correct popl with esp base handling */
    int rip_offset; /* only used in x86_64, but left for simplicity */
    int cpuid_ext_features;
    int cpuid_ext2_features;
    int cpuid_ext3_features;
    int cpuid_7_0_ebx_features;
} DisasContext;
static void gen_eob(DisasContext *s);
static void gen_jmp(DisasContext *s, target_ulong eip);
static void gen_jmp_tb(DisasContext *s, target_ulong eip, int tb_num);
static void gen_op(DisasContext *s1, int op, TCGMemOp ot, int d);
/* i386 arith/logic operations */
enum {
    OP_ADDL,
    OP_ORL,
    OP_ADCL,
    OP_SBBL,
    OP_ANDL,
    OP_SUBL,
    OP_XORL,
    OP_CMPL,
};

/* i386 shift ops */
enum {
    OP_ROL,
    OP_ROR,
    OP_RCL,
    OP_RCR,
    OP_SHL,
    OP_SHR,
    OP_SHL1, /* undocumented */
    OP_SAR = 7,
};

/* I386 int registers */
enum {
    OR_EAX,   /* MUST be even numbered */
    OR_ECX,
    OR_EDX,
    OR_EBX,
    OR_ESP,
    OR_EBP,
    OR_ESI,
    OR_EDI,

    OR_TMP0 = 16,    /* temporary operand register */
    OR_TMP1,
    OR_A0, /* temporary register used when doing address evaluation */
};
enum {
    USES_CC_DST  = 1,
    USES_CC_SRC  = 2,
    USES_CC_SRC2 = 4,
    USES_CC_SRCT = 8,
};

/* Bit set if the global variable is live after setting CC_OP to X.  */
static const uint8_t cc_op_live[CC_OP_NB] = {
    [CC_OP_DYNAMIC] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
    [CC_OP_EFLAGS] = USES_CC_SRC,
    [CC_OP_MULB ... CC_OP_MULQ] = USES_CC_DST | USES_CC_SRC,
    [CC_OP_ADDB ... CC_OP_ADDQ] = USES_CC_DST | USES_CC_SRC,
    [CC_OP_ADCB ... CC_OP_ADCQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
    [CC_OP_SUBB ... CC_OP_SUBQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRCT,
    [CC_OP_SBBB ... CC_OP_SBBQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
    [CC_OP_LOGICB ... CC_OP_LOGICQ] = USES_CC_DST,
    [CC_OP_INCB ... CC_OP_INCQ] = USES_CC_DST | USES_CC_SRC,
    [CC_OP_DECB ... CC_OP_DECQ] = USES_CC_DST | USES_CC_SRC,
    [CC_OP_SHLB ... CC_OP_SHLQ] = USES_CC_DST | USES_CC_SRC,
    [CC_OP_SARB ... CC_OP_SARQ] = USES_CC_DST | USES_CC_SRC,
    [CC_OP_BMILGB ... CC_OP_BMILGQ] = USES_CC_DST | USES_CC_SRC,
    [CC_OP_ADCX] = USES_CC_DST | USES_CC_SRC,
    [CC_OP_ADOX] = USES_CC_SRC | USES_CC_SRC2,
    [CC_OP_ADCOX] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
};
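
/* The condition-code state is evaluated lazily: rather than materializing
   EFLAGS after every instruction, the translator records the last
   flag-setting operation in cc_op and its operands in the cc_dst/cc_src/
   cc_src2/cc_srcT globals, and computes individual flags only on demand.
   When set_cc_op() switches operations, it discards whichever operand
   globals the new operation no longer uses (per cc_op_live above), so
   TCG can dead-code-eliminate the stores that fed them. */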
static void set_cc_op(DisasContext *s, CCOp op)
{
    int dead;

    if (s->cc_op == op) {
        return;
    }

    /* Discard CC computation that will no longer be used.  */
    dead = cc_op_live[s->cc_op] & ~cc_op_live[op];
    if (dead & USES_CC_DST) {
        tcg_gen_discard_tl(cpu_cc_dst);
    }
    if (dead & USES_CC_SRC) {
        tcg_gen_discard_tl(cpu_cc_src);
    }
    if (dead & USES_CC_SRC2) {
        tcg_gen_discard_tl(cpu_cc_src2);
    }
    if (dead & USES_CC_SRCT) {
        tcg_gen_discard_tl(cpu_cc_srcT);
    }

    if (op == CC_OP_DYNAMIC) {
        /* The DYNAMIC setting is translator only, and should never be
           stored.  Thus we always consider it clean.  */
        s->cc_op_dirty = false;
    } else {
        /* Discard any computed CC_OP value (see shifts).  */
        if (s->cc_op == CC_OP_DYNAMIC) {
            tcg_gen_discard_i32(cpu_cc_op);
        }
        s->cc_op_dirty = true;
    }
    s->cc_op = op;
}
static void gen_update_cc_op(DisasContext *s)
{
    if (s->cc_op_dirty) {
        tcg_gen_movi_i32(cpu_cc_op, s->cc_op);
        s->cc_op_dirty = false;
    }
}
#ifdef TARGET_X86_64

#define NB_OP_SIZES 4

#else /* !TARGET_X86_64 */

#define NB_OP_SIZES 3

#endif /* !TARGET_X86_64 */

#if defined(HOST_WORDS_BIGENDIAN)
#define REG_B_OFFSET (sizeof(target_ulong) - 1)
#define REG_H_OFFSET (sizeof(target_ulong) - 2)
#define REG_W_OFFSET (sizeof(target_ulong) - 2)
#define REG_L_OFFSET (sizeof(target_ulong) - 4)
#define REG_LH_OFFSET (sizeof(target_ulong) - 8)
#else
#define REG_B_OFFSET 0
#define REG_H_OFFSET 1
#define REG_W_OFFSET 0
#define REG_L_OFFSET 0
#define REG_LH_OFFSET 4
#endif
/* In instruction encodings for byte register accesses the
 * register number usually indicates "low 8 bits of register N";
 * however there are some special cases where N 4..7 indicates
 * [AH, CH, DH, BH], ie "bits 15..8 of register N-4". Return
 * true for this special case, false otherwise.
 */
static inline bool byte_reg_is_xH(int reg)
{
    if (reg < 4) {
        return false;
    }
#ifdef TARGET_X86_64
    if (reg >= 8 || x86_64_hregs) {
        return false;
    }
#endif
    return true;
}
/* Select the size of a push/pop operation.  */
static inline TCGMemOp mo_pushpop(DisasContext *s, TCGMemOp ot)
{
    if (CODE64(s)) {
        return ot == MO_16 ? MO_16 : MO_64;
    } else {
        return ot;
    }
}
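
/* Note: in 64-bit mode PUSH/POP default to a 64-bit operand; a 0x66
   prefix selects 16 bits and a 32-bit stack operand is not encodable,
   which is why the selection above never yields MO_32 under CODE64. */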
/* Select only size 64 else 32.  Used for SSE operand sizes.  */
static inline TCGMemOp mo_64_32(TCGMemOp ot)
{
#ifdef TARGET_X86_64
    return ot == MO_64 ? MO_64 : MO_32;
#else
    return MO_32;
#endif
}

/* Select size 8 if lsb of B is clear, else OT.  Used for decoding
   byte vs word opcodes.  */
static inline TCGMemOp mo_b_d(int b, TCGMemOp ot)
{
    return b & 1 ? ot : MO_8;
}

/* Select size 8 if lsb of B is clear, else OT capped at 32.
   Used for decoding operand size of port opcodes.  */
static inline TCGMemOp mo_b_d32(int b, TCGMemOp ot)
{
    return b & 1 ? (ot == MO_16 ? MO_16 : MO_32) : MO_8;
}
static void gen_op_mov_reg_v(TCGMemOp ot, int reg, TCGv t0)
{
    switch(ot) {
    case MO_8:
        if (!byte_reg_is_xH(reg)) {
            tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], t0, 0, 8);
        } else {
            tcg_gen_deposit_tl(cpu_regs[reg - 4], cpu_regs[reg - 4], t0, 8, 8);
        }
        break;
    case MO_16:
        tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], t0, 0, 16);
        break;
    case MO_32:
        /* For x86_64, this sets the higher half of register to zero.
           For i386, this is equivalent to a mov. */
        tcg_gen_ext32u_tl(cpu_regs[reg], t0);
        break;
#ifdef TARGET_X86_64
    case MO_64:
        tcg_gen_mov_tl(cpu_regs[reg], t0);
        break;
#endif
    default:
        tcg_abort();
    }
}
static inline void gen_op_mov_v_reg(TCGMemOp ot, TCGv t0, int reg)
{
    if (ot == MO_8 && byte_reg_is_xH(reg)) {
        tcg_gen_shri_tl(t0, cpu_regs[reg - 4], 8);
        tcg_gen_ext8u_tl(t0, t0);
    } else {
        tcg_gen_mov_tl(t0, cpu_regs[reg]);
    }
}
static inline void gen_op_movl_A0_reg(int reg)
{
    tcg_gen_mov_tl(cpu_A0, cpu_regs[reg]);
}

static inline void gen_op_addl_A0_im(int32_t val)
{
    tcg_gen_addi_tl(cpu_A0, cpu_A0, val);
#ifdef TARGET_X86_64
    tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
#endif
}

#ifdef TARGET_X86_64
static inline void gen_op_addq_A0_im(int64_t val)
{
    tcg_gen_addi_tl(cpu_A0, cpu_A0, val);
}
#endif

static void gen_add_A0_im(DisasContext *s, int val)
{
#ifdef TARGET_X86_64
    if (CODE64(s))
        gen_op_addq_A0_im(val);
    else
#endif
        gen_op_addl_A0_im(val);
}
static inline void gen_op_jmp_v(TCGv dest)
{
    tcg_gen_st_tl(dest, cpu_env, offsetof(CPUX86State, eip));
}

static inline void gen_op_add_reg_im(TCGMemOp size, int reg, int32_t val)
{
    tcg_gen_addi_tl(cpu_tmp0, cpu_regs[reg], val);
    gen_op_mov_reg_v(size, reg, cpu_tmp0);
}

static inline void gen_op_add_reg_T0(TCGMemOp size, int reg)
{
    tcg_gen_add_tl(cpu_tmp0, cpu_regs[reg], cpu_T[0]);
    gen_op_mov_reg_v(size, reg, cpu_tmp0);
}
static inline void gen_op_addl_A0_reg_sN(int shift, int reg)
{
    tcg_gen_mov_tl(cpu_tmp0, cpu_regs[reg]);
    if (shift != 0)
        tcg_gen_shli_tl(cpu_tmp0, cpu_tmp0, shift);
    tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
    /* For x86_64, this sets the higher half of register to zero.
       For i386, this is equivalent to a nop. */
    tcg_gen_ext32u_tl(cpu_A0, cpu_A0);
}
static inline void gen_op_movl_A0_seg(int reg)
{
    tcg_gen_ld32u_tl(cpu_A0, cpu_env,
                     offsetof(CPUX86State, segs[reg].base) + REG_L_OFFSET);
}

static inline void gen_op_addl_A0_seg(DisasContext *s, int reg)
{
    tcg_gen_ld_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State, segs[reg].base));
#ifdef TARGET_X86_64
    if (CODE64(s)) {
        tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
        tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
    } else {
        tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
        tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
    }
#else
    tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
#endif
}

#ifdef TARGET_X86_64
static inline void gen_op_movq_A0_seg(int reg)
{
    tcg_gen_ld_tl(cpu_A0, cpu_env, offsetof(CPUX86State, segs[reg].base));
}

static inline void gen_op_addq_A0_seg(int reg)
{
    tcg_gen_ld_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State, segs[reg].base));
    tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
}

static inline void gen_op_movq_A0_reg(int reg)
{
    tcg_gen_mov_tl(cpu_A0, cpu_regs[reg]);
}

static inline void gen_op_addq_A0_reg_sN(int shift, int reg)
{
    tcg_gen_mov_tl(cpu_tmp0, cpu_regs[reg]);
    if (shift != 0)
        tcg_gen_shli_tl(cpu_tmp0, cpu_tmp0, shift);
    tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
}
#endif
static inline void gen_op_ld_v(DisasContext *s, int idx, TCGv t0, TCGv a0)
{
    tcg_gen_qemu_ld_tl(t0, a0, s->mem_index, idx | MO_LE);
}

static inline void gen_op_st_v(DisasContext *s, int idx, TCGv t0, TCGv a0)
{
    tcg_gen_qemu_st_tl(t0, a0, s->mem_index, idx | MO_LE);
}

static inline void gen_op_st_rm_T0_A0(DisasContext *s, int idx, int d)
{
    if (d == OR_TMP0) {
        gen_op_st_v(s, idx, cpu_T[0], cpu_A0);
    } else {
        gen_op_mov_reg_v(idx, d, cpu_T[0]);
    }
}
static inline void gen_jmp_im(target_ulong pc)
{
    tcg_gen_movi_tl(cpu_tmp0, pc);
    gen_op_jmp_v(cpu_tmp0);
}
static inline void gen_string_movl_A0_ESI(DisasContext *s)
{
    int override;

    override = s->override;
    switch (s->aflag) {
#ifdef TARGET_X86_64
    case MO_64:
        if (override >= 0) {
            gen_op_movq_A0_seg(override);
            gen_op_addq_A0_reg_sN(0, R_ESI);
        } else {
            gen_op_movq_A0_reg(R_ESI);
        }
        break;
#endif
    case MO_32:
        /* 32 bit address */
        if (s->addseg && override < 0)
            override = R_DS;
        if (override >= 0) {
            gen_op_movl_A0_seg(override);
            gen_op_addl_A0_reg_sN(0, R_ESI);
        } else {
            gen_op_movl_A0_reg(R_ESI);
        }
        break;
    case MO_16:
        /* 16 address, always override */
        if (override < 0)
            override = R_DS;
        tcg_gen_ext16u_tl(cpu_A0, cpu_regs[R_ESI]);
        gen_op_addl_A0_seg(s, override);
        break;
    default:
        tcg_abort();
    }
}
static inline void gen_string_movl_A0_EDI(DisasContext *s)
{
    switch (s->aflag) {
#ifdef TARGET_X86_64
    case MO_64:
        gen_op_movq_A0_reg(R_EDI);
        break;
#endif
    case MO_32:
        if (s->addseg) {
            gen_op_movl_A0_seg(R_ES);
            gen_op_addl_A0_reg_sN(0, R_EDI);
        } else {
            gen_op_movl_A0_reg(R_EDI);
        }
        break;
    case MO_16:
        tcg_gen_ext16u_tl(cpu_A0, cpu_regs[R_EDI]);
        gen_op_addl_A0_seg(s, R_ES);
        break;
    default:
        tcg_abort();
    }
}
static inline void gen_op_movl_T0_Dshift(TCGMemOp ot)
{
    tcg_gen_ld32s_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, df));
    tcg_gen_shli_tl(cpu_T[0], cpu_T[0], ot);
}
static TCGv gen_ext_tl(TCGv dst, TCGv src, TCGMemOp size, bool sign)
{
    switch (size) {
    case MO_8:
        if (sign) {
            tcg_gen_ext8s_tl(dst, src);
        } else {
            tcg_gen_ext8u_tl(dst, src);
        }
        return dst;
    case MO_16:
        if (sign) {
            tcg_gen_ext16s_tl(dst, src);
        } else {
            tcg_gen_ext16u_tl(dst, src);
        }
        return dst;
#ifdef TARGET_X86_64
    case MO_32:
        if (sign) {
            tcg_gen_ext32s_tl(dst, src);
        } else {
            tcg_gen_ext32u_tl(dst, src);
        }
        return dst;
#endif
    default:
        return src;
    }
}
static void gen_extu(TCGMemOp ot, TCGv reg)
{
    gen_ext_tl(reg, reg, ot, false);
}

static void gen_exts(TCGMemOp ot, TCGv reg)
{
    gen_ext_tl(reg, reg, ot, true);
}
static inline void gen_op_jnz_ecx(TCGMemOp size, int label1)
{
    tcg_gen_mov_tl(cpu_tmp0, cpu_regs[R_ECX]);
    gen_extu(size, cpu_tmp0);
    tcg_gen_brcondi_tl(TCG_COND_NE, cpu_tmp0, 0, label1);
}

static inline void gen_op_jz_ecx(TCGMemOp size, int label1)
{
    tcg_gen_mov_tl(cpu_tmp0, cpu_regs[R_ECX]);
    gen_extu(size, cpu_tmp0);
    tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_tmp0, 0, label1);
}
static void gen_helper_in_func(TCGMemOp ot, TCGv v, TCGv_i32 n)
{
    switch (ot) {
    case MO_8:
        gen_helper_inb(v, n);
        break;
    case MO_16:
        gen_helper_inw(v, n);
        break;
    case MO_32:
        gen_helper_inl(v, n);
        break;
    default:
        tcg_abort();
    }
}

static void gen_helper_out_func(TCGMemOp ot, TCGv_i32 v, TCGv_i32 n)
{
    switch (ot) {
    case MO_8:
        gen_helper_outb(v, n);
        break;
    case MO_16:
        gen_helper_outw(v, n);
        break;
    case MO_32:
        gen_helper_outl(v, n);
        break;
    default:
        tcg_abort();
    }
}
static void gen_check_io(DisasContext *s, TCGMemOp ot, target_ulong cur_eip,
                         uint32_t svm_flags)
{
    int state_saved;
    target_ulong next_eip;

    state_saved = 0;
    if (s->pe && (s->cpl > s->iopl || s->vm86)) {
        gen_update_cc_op(s);
        gen_jmp_im(cur_eip);
        state_saved = 1;
        tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
        switch (ot) {
        case MO_8:
            gen_helper_check_iob(cpu_env, cpu_tmp2_i32);
            break;
        case MO_16:
            gen_helper_check_iow(cpu_env, cpu_tmp2_i32);
            break;
        case MO_32:
            gen_helper_check_iol(cpu_env, cpu_tmp2_i32);
            break;
        default:
            tcg_abort();
        }
    }
    if (s->flags & HF_SVMI_MASK) {
        if (!state_saved) {
            gen_update_cc_op(s);
            gen_jmp_im(cur_eip);
        }
        svm_flags |= (1 << (4 + ot));
        next_eip = s->pc - s->cs_base;
        tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
        gen_helper_svm_check_io(cpu_env, cpu_tmp2_i32,
                                tcg_const_i32(svm_flags),
                                tcg_const_i32(next_eip - cur_eip));
    }
}
static inline void gen_movs(DisasContext *s, TCGMemOp ot)
{
    gen_string_movl_A0_ESI(s);
    gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
    gen_string_movl_A0_EDI(s);
    gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
    gen_op_movl_T0_Dshift(ot);
    gen_op_add_reg_T0(s->aflag, R_ESI);
    gen_op_add_reg_T0(s->aflag, R_EDI);
}
static void gen_op_update1_cc(void)
{
    tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
}

static void gen_op_update2_cc(void)
{
    tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
    tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
}

static void gen_op_update3_cc(TCGv reg)
{
    tcg_gen_mov_tl(cpu_cc_src2, reg);
    tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
    tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
}

static inline void gen_op_testl_T0_T1_cc(void)
{
    tcg_gen_and_tl(cpu_cc_dst, cpu_T[0], cpu_T[1]);
}

static void gen_op_update_neg_cc(void)
{
    tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
    tcg_gen_neg_tl(cpu_cc_src, cpu_T[0]);
    tcg_gen_movi_tl(cpu_cc_srcT, 0);
}
/* compute all eflags to cc_src */
static void gen_compute_eflags(DisasContext *s)
{
    TCGv zero, dst, src1, src2;
    int live, dead;

    if (s->cc_op == CC_OP_EFLAGS) {
        return;
    }
    if (s->cc_op == CC_OP_CLR) {
        tcg_gen_movi_tl(cpu_cc_src, CC_Z | CC_P);
        set_cc_op(s, CC_OP_EFLAGS);
        return;
    }

    TCGV_UNUSED(zero);
    dst = cpu_cc_dst;
    src1 = cpu_cc_src;
    src2 = cpu_cc_src2;

    /* Take care to not read values that are not live.  */
    live = cc_op_live[s->cc_op] & ~USES_CC_SRCT;
    dead = live ^ (USES_CC_DST | USES_CC_SRC | USES_CC_SRC2);
    if (dead) {
        zero = tcg_const_tl(0);
        if (dead & USES_CC_DST) {
            dst = zero;
        }
        if (dead & USES_CC_SRC) {
            src1 = zero;
        }
        if (dead & USES_CC_SRC2) {
            src2 = zero;
        }
    }

    gen_update_cc_op(s);
    gen_helper_cc_compute_all(cpu_cc_src, dst, src1, src2, cpu_cc_op);
    set_cc_op(s, CC_OP_EFLAGS);

    if (dead) {
        tcg_temp_free(zero);
    }
}
typedef struct CCPrepare {
    TCGCond cond;
    TCGv reg;
    TCGv reg2;
    target_ulong imm;
    target_ulong mask;
    bool use_reg2;
    bool no_setcond;
} CCPrepare;
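
/* A CCPrepare describes how to test one condition: the condition holds
   when 'cond' compares 'reg' (optionally masked with 'mask') against
   'reg2' if use_reg2 is set, or against 'imm' otherwise.  no_setcond
   means 'reg' already holds the computed truth value, so no setcond is
   required to materialize it. */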
/* compute eflags.C to reg */
static CCPrepare gen_prepare_eflags_c(DisasContext *s, TCGv reg)
{
    TCGv t0, t1;
    int size, shift;

    switch (s->cc_op) {
    case CC_OP_SUBB ... CC_OP_SUBQ:
        /* (DATA_TYPE)CC_SRCT < (DATA_TYPE)CC_SRC */
        size = s->cc_op - CC_OP_SUBB;
        t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
        /* If no temporary was used, be careful not to alias t1 and t0.  */
        t0 = TCGV_EQUAL(t1, cpu_cc_src) ? cpu_tmp0 : reg;
        tcg_gen_mov_tl(t0, cpu_cc_srcT);
        gen_extu(size, t0);
        goto add_sub;

    case CC_OP_ADDB ... CC_OP_ADDQ:
        /* (DATA_TYPE)CC_DST < (DATA_TYPE)CC_SRC */
        size = s->cc_op - CC_OP_ADDB;
        t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
        t0 = gen_ext_tl(reg, cpu_cc_dst, size, false);
    add_sub:
        return (CCPrepare) { .cond = TCG_COND_LTU, .reg = t0,
                             .reg2 = t1, .mask = -1, .use_reg2 = true };

    case CC_OP_LOGICB ... CC_OP_LOGICQ:
    case CC_OP_CLR:
        return (CCPrepare) { .cond = TCG_COND_NEVER, .mask = -1 };

    case CC_OP_INCB ... CC_OP_INCQ:
    case CC_OP_DECB ... CC_OP_DECQ:
        return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
                             .mask = -1, .no_setcond = true };

    case CC_OP_SHLB ... CC_OP_SHLQ:
        /* (CC_SRC >> (DATA_BITS - 1)) & 1 */
        size = s->cc_op - CC_OP_SHLB;
        shift = (8 << size) - 1;
        return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
                             .mask = (target_ulong)1 << shift };

    case CC_OP_MULB ... CC_OP_MULQ:
        return (CCPrepare) { .cond = TCG_COND_NE,
                             .reg = cpu_cc_src, .mask = -1 };

    case CC_OP_BMILGB ... CC_OP_BMILGQ:
        size = s->cc_op - CC_OP_BMILGB;
        t0 = gen_ext_tl(reg, cpu_cc_src, size, false);
        return (CCPrepare) { .cond = TCG_COND_EQ, .reg = t0, .mask = -1 };

    case CC_OP_ADCX:
    case CC_OP_ADCOX:
        return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_dst,
                             .mask = -1, .no_setcond = true };

    case CC_OP_EFLAGS:
    case CC_OP_SARB ... CC_OP_SARQ:
        /* CC_SRC & 1 */
        return (CCPrepare) { .cond = TCG_COND_NE,
                             .reg = cpu_cc_src, .mask = CC_C };

    default:
        /* The need to compute only C from CC_OP_DYNAMIC is important
           in efficiently implementing e.g. INC at the start of a TB.  */
        gen_update_cc_op(s);
        gen_helper_cc_compute_c(reg, cpu_cc_dst, cpu_cc_src,
                                cpu_cc_src2, cpu_cc_op);
        return (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
                             .mask = -1, .no_setcond = true };
    }
}
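
/* For the SUB cases above, the carry flag is the borrow out of the
   subtraction: since cc_dst already holds the result, the original
   destination is preserved in cc_srcT so that C can be recomputed as
   the unsigned comparison (DATA_TYPE)CC_SRCT < (DATA_TYPE)CC_SRC. */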
/* compute eflags.P to reg */
static CCPrepare gen_prepare_eflags_p(DisasContext *s, TCGv reg)
{
    gen_compute_eflags(s);
    return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
                         .mask = CC_P };
}
/* compute eflags.S to reg */
static CCPrepare gen_prepare_eflags_s(DisasContext *s, TCGv reg)
{
    switch (s->cc_op) {
    case CC_OP_DYNAMIC:
        gen_compute_eflags(s);
        /* FALLTHRU */
    case CC_OP_EFLAGS:
    case CC_OP_ADCX:
    case CC_OP_ADOX:
    case CC_OP_ADCOX:
        return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
                             .mask = CC_S };
    case CC_OP_CLR:
        return (CCPrepare) { .cond = TCG_COND_NEVER, .mask = -1 };
    default:
        {
            TCGMemOp size = (s->cc_op - CC_OP_ADDB) & 3;
            TCGv t0 = gen_ext_tl(reg, cpu_cc_dst, size, true);
            return (CCPrepare) { .cond = TCG_COND_LT, .reg = t0, .mask = -1 };
        }
    }
}
/* compute eflags.O to reg */
static CCPrepare gen_prepare_eflags_o(DisasContext *s, TCGv reg)
{
    switch (s->cc_op) {
    case CC_OP_ADOX:
    case CC_OP_ADCOX:
        return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src2,
                             .mask = -1, .no_setcond = true };
    case CC_OP_CLR:
        return (CCPrepare) { .cond = TCG_COND_NEVER, .mask = -1 };
    default:
        gen_compute_eflags(s);
        return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
                             .mask = CC_O };
    }
}
/* compute eflags.Z to reg */
static CCPrepare gen_prepare_eflags_z(DisasContext *s, TCGv reg)
{
    switch (s->cc_op) {
    case CC_OP_DYNAMIC:
        gen_compute_eflags(s);
        /* FALLTHRU */
    case CC_OP_EFLAGS:
    case CC_OP_ADCX:
    case CC_OP_ADOX:
    case CC_OP_ADCOX:
        return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
                             .mask = CC_Z };
    case CC_OP_CLR:
        return (CCPrepare) { .cond = TCG_COND_ALWAYS, .mask = -1 };
    default:
        {
            TCGMemOp size = (s->cc_op - CC_OP_ADDB) & 3;
            TCGv t0 = gen_ext_tl(reg, cpu_cc_dst, size, false);
            return (CCPrepare) { .cond = TCG_COND_EQ, .reg = t0, .mask = -1 };
        }
    }
}
/* perform a conditional store into register 'reg' according to jump opcode
   value 'b'. In the fast case, T0 is guaranteed not to be used. */
static CCPrepare gen_prepare_cc(DisasContext *s, int b, TCGv reg)
{
    int inv, jcc_op, cond;
    TCGMemOp size;
    CCPrepare cc;
    TCGv t0;

    inv = b & 1;
    jcc_op = (b >> 1) & 7;

    switch (s->cc_op) {
    case CC_OP_SUBB ... CC_OP_SUBQ:
        /* We optimize relational operators for the cmp/jcc case.  */
        size = s->cc_op - CC_OP_SUBB;
        switch (jcc_op) {
        case JCC_BE:
            tcg_gen_mov_tl(cpu_tmp4, cpu_cc_srcT);
            gen_extu(size, cpu_tmp4);
            t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
            cc = (CCPrepare) { .cond = TCG_COND_LEU, .reg = cpu_tmp4,
                               .reg2 = t0, .mask = -1, .use_reg2 = true };
            break;

        case JCC_L:
            cond = TCG_COND_LT;
            goto fast_jcc_l;
        case JCC_LE:
            cond = TCG_COND_LE;
        fast_jcc_l:
            tcg_gen_mov_tl(cpu_tmp4, cpu_cc_srcT);
            gen_exts(size, cpu_tmp4);
            t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, true);
            cc = (CCPrepare) { .cond = cond, .reg = cpu_tmp4,
                               .reg2 = t0, .mask = -1, .use_reg2 = true };
            break;

        default:
            goto slow_jcc;
        }
        break;

    default:
    slow_jcc:
        /* This actually generates good code for JC, JZ and JS.  */
        switch (jcc_op) {
        case JCC_O:
            cc = gen_prepare_eflags_o(s, reg);
            break;
        case JCC_B:
            cc = gen_prepare_eflags_c(s, reg);
            break;
        case JCC_Z:
            cc = gen_prepare_eflags_z(s, reg);
            break;
        case JCC_BE:
            gen_compute_eflags(s);
            cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
                               .mask = CC_Z | CC_C };
            break;
        case JCC_S:
            cc = gen_prepare_eflags_s(s, reg);
            break;
        case JCC_P:
            cc = gen_prepare_eflags_p(s, reg);
            break;
        case JCC_L:
            gen_compute_eflags(s);
            if (TCGV_EQUAL(reg, cpu_cc_src)) {
                reg = cpu_tmp0;
            }
            tcg_gen_shri_tl(reg, cpu_cc_src, 4); /* CC_O -> CC_S */
            tcg_gen_xor_tl(reg, reg, cpu_cc_src);
            cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
                               .mask = CC_S };
            break;
        default:
        case JCC_LE:
            gen_compute_eflags(s);
            if (TCGV_EQUAL(reg, cpu_cc_src)) {
                reg = cpu_tmp0;
            }
            tcg_gen_shri_tl(reg, cpu_cc_src, 4); /* CC_O -> CC_S */
            tcg_gen_xor_tl(reg, reg, cpu_cc_src);
            cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
                               .mask = CC_S | CC_Z };
            break;
        }
        break;
    }

    if (inv) {
        cc.cond = tcg_invert_cond(cc.cond);
    }
    return cc;
}
static void gen_setcc1(DisasContext *s, int b, TCGv reg)
{
    CCPrepare cc = gen_prepare_cc(s, b, reg);

    if (cc.no_setcond) {
        if (cc.cond == TCG_COND_EQ) {
            tcg_gen_xori_tl(reg, cc.reg, 1);
        } else {
            tcg_gen_mov_tl(reg, cc.reg);
        }
        return;
    }

    if (cc.cond == TCG_COND_NE && !cc.use_reg2 && cc.imm == 0 &&
        cc.mask != 0 && (cc.mask & (cc.mask - 1)) == 0) {
        tcg_gen_shri_tl(reg, cc.reg, ctztl(cc.mask));
        tcg_gen_andi_tl(reg, reg, 1);
        return;
    }
    if (cc.mask != -1) {
        tcg_gen_andi_tl(reg, cc.reg, cc.mask);
        cc.reg = reg;
    }
    if (cc.use_reg2) {
        tcg_gen_setcond_tl(cc.cond, reg, cc.reg, cc.reg2);
    } else {
        tcg_gen_setcondi_tl(cc.cond, reg, cc.reg, cc.imm);
    }
}
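
/* Note the fast path above: a TCG_COND_NE test against a single-bit
   mask needs no setcond at all; the flag bit is simply shifted down to
   bit 0 and isolated with an AND. */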
static inline void gen_compute_eflags_c(DisasContext *s, TCGv reg)
{
    gen_setcc1(s, JCC_B << 1, reg);
}
/* generate a conditional jump to label 'l1' according to jump opcode
   value 'b'. In the fast case, T0 is guaranteed not to be used. */
static inline void gen_jcc1_noeob(DisasContext *s, int b, int l1)
{
    CCPrepare cc = gen_prepare_cc(s, b, cpu_T[0]);

    if (cc.mask != -1) {
        tcg_gen_andi_tl(cpu_T[0], cc.reg, cc.mask);
        cc.reg = cpu_T[0];
    }
    if (cc.use_reg2) {
        tcg_gen_brcond_tl(cc.cond, cc.reg, cc.reg2, l1);
    } else {
        tcg_gen_brcondi_tl(cc.cond, cc.reg, cc.imm, l1);
    }
}
/* Generate a conditional jump to label 'l1' according to jump opcode
   value 'b'. In the fast case, T0 is guaranteed not to be used.
   A translation block must end soon.  */
static inline void gen_jcc1(DisasContext *s, int b, int l1)
{
    CCPrepare cc = gen_prepare_cc(s, b, cpu_T[0]);

    gen_update_cc_op(s);
    if (cc.mask != -1) {
        tcg_gen_andi_tl(cpu_T[0], cc.reg, cc.mask);
        cc.reg = cpu_T[0];
    }
    set_cc_op(s, CC_OP_DYNAMIC);
    if (cc.use_reg2) {
        tcg_gen_brcond_tl(cc.cond, cc.reg, cc.reg2, l1);
    } else {
        tcg_gen_brcondi_tl(cc.cond, cc.reg, cc.imm, l1);
    }
}
/* XXX: does not work with gdbstub "ice" single step - not a
   serious problem */
static int gen_jz_ecx_string(DisasContext *s, target_ulong next_eip)
{
    int l1, l2;

    l1 = gen_new_label();
    l2 = gen_new_label();
    gen_op_jnz_ecx(s->aflag, l1);
    gen_set_label(l2);
    gen_jmp_tb(s, next_eip, 1);
    gen_set_label(l1);
    return l2;
}
static inline void gen_stos(DisasContext *s, TCGMemOp ot)
{
    gen_op_mov_v_reg(MO_32, cpu_T[0], R_EAX);
    gen_string_movl_A0_EDI(s);
    gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
    gen_op_movl_T0_Dshift(ot);
    gen_op_add_reg_T0(s->aflag, R_EDI);
}
static inline void gen_lods(DisasContext *s, TCGMemOp ot)
{
    gen_string_movl_A0_ESI(s);
    gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
    gen_op_mov_reg_v(ot, R_EAX, cpu_T[0]);
    gen_op_movl_T0_Dshift(ot);
    gen_op_add_reg_T0(s->aflag, R_ESI);
}

static inline void gen_scas(DisasContext *s, TCGMemOp ot)
{
    gen_string_movl_A0_EDI(s);
    gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
    gen_op(s, OP_CMPL, ot, R_EAX);
    gen_op_movl_T0_Dshift(ot);
    gen_op_add_reg_T0(s->aflag, R_EDI);
}

static inline void gen_cmps(DisasContext *s, TCGMemOp ot)
{
    gen_string_movl_A0_EDI(s);
    gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
    gen_string_movl_A0_ESI(s);
    gen_op(s, OP_CMPL, ot, OR_TMP0);
    gen_op_movl_T0_Dshift(ot);
    gen_op_add_reg_T0(s->aflag, R_ESI);
    gen_op_add_reg_T0(s->aflag, R_EDI);
}
static inline void gen_ins(DisasContext *s, TCGMemOp ot)
{
    if (use_icount) {
        gen_io_start();
    }
    gen_string_movl_A0_EDI(s);
    /* Note: we must do this dummy write first to be restartable in
       case of page fault. */
    tcg_gen_movi_tl(cpu_T[0], 0);
    gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
    tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_regs[R_EDX]);
    tcg_gen_andi_i32(cpu_tmp2_i32, cpu_tmp2_i32, 0xffff);
    gen_helper_in_func(ot, cpu_T[0], cpu_tmp2_i32);
    gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
    gen_op_movl_T0_Dshift(ot);
    gen_op_add_reg_T0(s->aflag, R_EDI);
    if (use_icount) {
        gen_io_end();
    }
}
static inline void gen_outs(DisasContext *s, TCGMemOp ot)
{
    if (use_icount) {
        gen_io_start();
    }
    gen_string_movl_A0_ESI(s);
    gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);

    tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_regs[R_EDX]);
    tcg_gen_andi_i32(cpu_tmp2_i32, cpu_tmp2_i32, 0xffff);
    tcg_gen_trunc_tl_i32(cpu_tmp3_i32, cpu_T[0]);
    gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);

    gen_op_movl_T0_Dshift(ot);
    gen_op_add_reg_T0(s->aflag, R_ESI);
    if (use_icount) {
        gen_io_end();
    }
}
/* same method as Valgrind : we generate jumps to current or next
   instruction */
#define GEN_REPZ(op)                                                          \
static inline void gen_repz_ ## op(DisasContext *s, TCGMemOp ot,              \
                                 target_ulong cur_eip, target_ulong next_eip) \
{                                                                             \
    int l2;                                                                   \
    gen_update_cc_op(s);                                                      \
    l2 = gen_jz_ecx_string(s, next_eip);                                      \
    gen_ ## op(s, ot);                                                        \
    gen_op_add_reg_im(s->aflag, R_ECX, -1);                                   \
    /* a loop would cause two single step exceptions if ECX = 1               \
       before rep string_insn */                                              \
    if (!s->jmp_opt)                                                          \
        gen_op_jz_ecx(s->aflag, l2);                                          \
    gen_jmp(s, cur_eip);                                                      \
}

#define GEN_REPZ2(op)                                                         \
static inline void gen_repz_ ## op(DisasContext *s, TCGMemOp ot,              \
                                   target_ulong cur_eip,                      \
                                   target_ulong next_eip,                     \
                                   int nz)                                    \
{                                                                             \
    int l2;                                                                   \
    gen_update_cc_op(s);                                                      \
    l2 = gen_jz_ecx_string(s, next_eip);                                      \
    gen_ ## op(s, ot);                                                        \
    gen_op_add_reg_im(s->aflag, R_ECX, -1);                                   \
    gen_update_cc_op(s);                                                      \
    gen_jcc1(s, (JCC_Z << 1) | (nz ^ 1), l2);                                 \
    if (!s->jmp_opt)                                                          \
        gen_op_jz_ecx(s->aflag, l2);                                          \
    gen_jmp(s, cur_eip);                                                      \
}
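
/* Each REP iteration is translated as a single pass: the generated code
   performs one string operation, decrements ECX, and jumps back to the
   current instruction, so the loop re-enters this same translation
   block; gen_jz_ecx_string() provides the exit to the next instruction
   once ECX reaches zero. */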
static void gen_helper_fp_arith_ST0_FT0(int op)
{
    switch (op) {
    case 0:
        gen_helper_fadd_ST0_FT0(cpu_env);
        break;
    case 1:
        gen_helper_fmul_ST0_FT0(cpu_env);
        break;
    case 2:
        gen_helper_fcom_ST0_FT0(cpu_env);
        break;
    case 3:
        gen_helper_fcom_ST0_FT0(cpu_env);
        break;
    case 4:
        gen_helper_fsub_ST0_FT0(cpu_env);
        break;
    case 5:
        gen_helper_fsubr_ST0_FT0(cpu_env);
        break;
    case 6:
        gen_helper_fdiv_ST0_FT0(cpu_env);
        break;
    case 7:
        gen_helper_fdivr_ST0_FT0(cpu_env);
        break;
    }
}
/* NOTE the exception in "r" op ordering */
static void gen_helper_fp_arith_STN_ST0(int op, int opreg)
{
    TCGv_i32 tmp = tcg_const_i32(opreg);
    switch (op) {
    case 0:
        gen_helper_fadd_STN_ST0(cpu_env, tmp);
        break;
    case 1:
        gen_helper_fmul_STN_ST0(cpu_env, tmp);
        break;
    case 4:
        gen_helper_fsubr_STN_ST0(cpu_env, tmp);
        break;
    case 5:
        gen_helper_fsub_STN_ST0(cpu_env, tmp);
        break;
    case 6:
        gen_helper_fdivr_STN_ST0(cpu_env, tmp);
        break;
    case 7:
        gen_helper_fdiv_STN_ST0(cpu_env, tmp);
        break;
    }
    tcg_temp_free_i32(tmp);
}
/* if d == OR_TMP0, it means memory operand (address in A0) */
static void gen_op(DisasContext *s1, int op, TCGMemOp ot, int d)
{
    if (d != OR_TMP0) {
        gen_op_mov_v_reg(ot, cpu_T[0], d);
    } else {
        gen_op_ld_v(s1, ot, cpu_T[0], cpu_A0);
    }
    switch(op) {
    case OP_ADCL:
        gen_compute_eflags_c(s1, cpu_tmp4);
        tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_tmp4);
        gen_op_st_rm_T0_A0(s1, ot, d);
        gen_op_update3_cc(cpu_tmp4);
        set_cc_op(s1, CC_OP_ADCB + ot);
        break;
    case OP_SBBL:
        gen_compute_eflags_c(s1, cpu_tmp4);
        tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_tmp4);
        gen_op_st_rm_T0_A0(s1, ot, d);
        gen_op_update3_cc(cpu_tmp4);
        set_cc_op(s1, CC_OP_SBBB + ot);
        break;
    case OP_ADDL:
        tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        gen_op_st_rm_T0_A0(s1, ot, d);
        gen_op_update2_cc();
        set_cc_op(s1, CC_OP_ADDB + ot);
        break;
    case OP_SUBL:
        tcg_gen_mov_tl(cpu_cc_srcT, cpu_T[0]);
        tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        gen_op_st_rm_T0_A0(s1, ot, d);
        gen_op_update2_cc();
        set_cc_op(s1, CC_OP_SUBB + ot);
        break;
    default:
    case OP_ANDL:
        tcg_gen_and_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        gen_op_st_rm_T0_A0(s1, ot, d);
        gen_op_update1_cc();
        set_cc_op(s1, CC_OP_LOGICB + ot);
        break;
    case OP_ORL:
        tcg_gen_or_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        gen_op_st_rm_T0_A0(s1, ot, d);
        gen_op_update1_cc();
        set_cc_op(s1, CC_OP_LOGICB + ot);
        break;
    case OP_XORL:
        tcg_gen_xor_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        gen_op_st_rm_T0_A0(s1, ot, d);
        gen_op_update1_cc();
        set_cc_op(s1, CC_OP_LOGICB + ot);
        break;
    case OP_CMPL:
        tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
        tcg_gen_mov_tl(cpu_cc_srcT, cpu_T[0]);
        tcg_gen_sub_tl(cpu_cc_dst, cpu_T[0], cpu_T[1]);
        set_cc_op(s1, CC_OP_SUBB + ot);
        break;
    }
}
/* if d == OR_TMP0, it means memory operand (address in A0) */
static void gen_inc(DisasContext *s1, TCGMemOp ot, int d, int c)
{
    if (d != OR_TMP0) {
        gen_op_mov_v_reg(ot, cpu_T[0], d);
    } else {
        gen_op_ld_v(s1, ot, cpu_T[0], cpu_A0);
    }
    gen_compute_eflags_c(s1, cpu_cc_src);
    if (c > 0) {
        tcg_gen_addi_tl(cpu_T[0], cpu_T[0], 1);
        set_cc_op(s1, CC_OP_INCB + ot);
    } else {
        tcg_gen_addi_tl(cpu_T[0], cpu_T[0], -1);
        set_cc_op(s1, CC_OP_DECB + ot);
    }
    gen_op_st_rm_T0_A0(s1, ot, d);
    tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
}
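
/* Unlike ADD/SUB, the INC/DEC instructions leave CF untouched, so the
   previous carry is computed into cc_src before the increment; the
   CC_OP_INC/CC_OP_DEC evaluators then reconstruct the other flags from
   the result while taking C from cc_src. */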
static void gen_shift_flags(DisasContext *s, TCGMemOp ot, TCGv result,
                            TCGv shm1, TCGv count, bool is_right)
{
    TCGv_i32 z32, s32, oldop;
    TCGv z_tl;

    /* Store the results into the CC variables.  If we know that the
       variable must be dead, store unconditionally.  Otherwise we'll
       need to not disrupt the current contents.  */
    z_tl = tcg_const_tl(0);
    if (cc_op_live[s->cc_op] & USES_CC_DST) {
        tcg_gen_movcond_tl(TCG_COND_NE, cpu_cc_dst, count, z_tl,
                           result, cpu_cc_dst);
    } else {
        tcg_gen_mov_tl(cpu_cc_dst, result);
    }
    if (cc_op_live[s->cc_op] & USES_CC_SRC) {
        tcg_gen_movcond_tl(TCG_COND_NE, cpu_cc_src, count, z_tl,
                           shm1, cpu_cc_src);
    } else {
        tcg_gen_mov_tl(cpu_cc_src, shm1);
    }
    tcg_temp_free(z_tl);

    /* Get the two potential CC_OP values into temporaries.  */
    tcg_gen_movi_i32(cpu_tmp2_i32, (is_right ? CC_OP_SARB : CC_OP_SHLB) + ot);
    if (s->cc_op == CC_OP_DYNAMIC) {
        oldop = cpu_cc_op;
    } else {
        tcg_gen_movi_i32(cpu_tmp3_i32, s->cc_op);
        oldop = cpu_tmp3_i32;
    }

    /* Conditionally store the CC_OP value.  */
    z32 = tcg_const_i32(0);
    s32 = tcg_temp_new_i32();
    tcg_gen_trunc_tl_i32(s32, count);
    tcg_gen_movcond_i32(TCG_COND_NE, cpu_cc_op, s32, z32, cpu_tmp2_i32, oldop);
    tcg_temp_free_i32(z32);
    tcg_temp_free_i32(s32);

    /* The CC_OP value is no longer predictable.  */
    set_cc_op(s, CC_OP_DYNAMIC);
}
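
/* All the movcond gymnastics above exist because an x86 shift by a
   count of zero must leave every flag (and therefore the recorded
   CC_OP) unchanged, and the count is only known at run time. */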
static void gen_shift_rm_T1(DisasContext *s, TCGMemOp ot, int op1,
                            int is_right, int is_arith)
{
    target_ulong mask = (ot == MO_64 ? 0x3f : 0x1f);

    /* load */
    if (op1 == OR_TMP0) {
        gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
    } else {
        gen_op_mov_v_reg(ot, cpu_T[0], op1);
    }

    tcg_gen_andi_tl(cpu_T[1], cpu_T[1], mask);
    tcg_gen_subi_tl(cpu_tmp0, cpu_T[1], 1);

    if (is_right) {
        if (is_arith) {
            gen_exts(ot, cpu_T[0]);
            tcg_gen_sar_tl(cpu_tmp0, cpu_T[0], cpu_tmp0);
            tcg_gen_sar_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        } else {
            gen_extu(ot, cpu_T[0]);
            tcg_gen_shr_tl(cpu_tmp0, cpu_T[0], cpu_tmp0);
            tcg_gen_shr_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        }
    } else {
        tcg_gen_shl_tl(cpu_tmp0, cpu_T[0], cpu_tmp0);
        tcg_gen_shl_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
    }

    /* store */
    gen_op_st_rm_T0_A0(s, ot, op1);

    gen_shift_flags(s, ot, cpu_T[0], cpu_tmp0, cpu_T[1], is_right);
}
static void gen_shift_rm_im(DisasContext *s, TCGMemOp ot, int op1, int op2,
                            int is_right, int is_arith)
{
    int mask = (ot == MO_64 ? 0x3f : 0x1f);

    /* load */
    if (op1 == OR_TMP0) {
        gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
    } else {
        gen_op_mov_v_reg(ot, cpu_T[0], op1);
    }

    op2 &= mask;
    if (op2 != 0) {
        if (is_right) {
            if (is_arith) {
                gen_exts(ot, cpu_T[0]);
                tcg_gen_sari_tl(cpu_tmp4, cpu_T[0], op2 - 1);
                tcg_gen_sari_tl(cpu_T[0], cpu_T[0], op2);
            } else {
                gen_extu(ot, cpu_T[0]);
                tcg_gen_shri_tl(cpu_tmp4, cpu_T[0], op2 - 1);
                tcg_gen_shri_tl(cpu_T[0], cpu_T[0], op2);
            }
        } else {
            tcg_gen_shli_tl(cpu_tmp4, cpu_T[0], op2 - 1);
            tcg_gen_shli_tl(cpu_T[0], cpu_T[0], op2);
        }
    }

    /* store */
    gen_op_st_rm_T0_A0(s, ot, op1);

    /* update eflags if non zero shift */
    if (op2 != 0) {
        tcg_gen_mov_tl(cpu_cc_src, cpu_tmp4);
        tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
        set_cc_op(s, (is_right ? CC_OP_SARB : CC_OP_SHLB) + ot);
    }
}
static inline void tcg_gen_lshift(TCGv ret, TCGv arg1, target_long arg2)
{
    if (arg2 >= 0)
        tcg_gen_shli_tl(ret, arg1, arg2);
    else
        tcg_gen_shri_tl(ret, arg1, -arg2);
}
static void gen_rot_rm_T1(DisasContext *s, TCGMemOp ot, int op1, int is_right)
{
    target_ulong mask = (ot == MO_64 ? 0x3f : 0x1f);
    TCGv_i32 t0, t1;

    /* load */
    if (op1 == OR_TMP0) {
        gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
    } else {
        gen_op_mov_v_reg(ot, cpu_T[0], op1);
    }

    tcg_gen_andi_tl(cpu_T[1], cpu_T[1], mask);

    switch (ot) {
    case MO_8:
        /* Replicate the 8-bit input so that a 32-bit rotate works.  */
        tcg_gen_ext8u_tl(cpu_T[0], cpu_T[0]);
        tcg_gen_muli_tl(cpu_T[0], cpu_T[0], 0x01010101);
        goto do_long;
    case MO_16:
        /* Replicate the 16-bit input so that a 32-bit rotate works.  */
        tcg_gen_deposit_tl(cpu_T[0], cpu_T[0], cpu_T[0], 16, 16);
        goto do_long;
    do_long:
#ifdef TARGET_X86_64
    case MO_32:
        tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
        tcg_gen_trunc_tl_i32(cpu_tmp3_i32, cpu_T[1]);
        if (is_right) {
            tcg_gen_rotr_i32(cpu_tmp2_i32, cpu_tmp2_i32, cpu_tmp3_i32);
        } else {
            tcg_gen_rotl_i32(cpu_tmp2_i32, cpu_tmp2_i32, cpu_tmp3_i32);
        }
        tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
        break;
#endif
    default:
        if (is_right) {
            tcg_gen_rotr_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        } else {
            tcg_gen_rotl_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        }
        break;
    }

    /* store */
    gen_op_st_rm_T0_A0(s, ot, op1);

    /* We'll need the flags computed into CC_SRC.  */
    gen_compute_eflags(s);

    /* The value that was "rotated out" is now present at the other end
       of the word.  Compute C into CC_DST and O into CC_SRC2.  Note that
       since we've computed the flags into CC_SRC, these variables are
       currently dead.  */
    if (is_right) {
        tcg_gen_shri_tl(cpu_cc_src2, cpu_T[0], mask - 1);
        tcg_gen_shri_tl(cpu_cc_dst, cpu_T[0], mask);
        tcg_gen_andi_tl(cpu_cc_dst, cpu_cc_dst, 1);
    } else {
        tcg_gen_shri_tl(cpu_cc_src2, cpu_T[0], mask);
        tcg_gen_andi_tl(cpu_cc_dst, cpu_T[0], 1);
    }
    tcg_gen_andi_tl(cpu_cc_src2, cpu_cc_src2, 1);
    tcg_gen_xor_tl(cpu_cc_src2, cpu_cc_src2, cpu_cc_dst);

    /* Now conditionally store the new CC_OP value.  If the shift count
       is 0 we keep the CC_OP_EFLAGS setting so that only CC_SRC is live.
       Otherwise reuse CC_OP_ADCOX which have the C and O flags split out
       exactly as we computed above.  */
    t0 = tcg_const_i32(0);
    t1 = tcg_temp_new_i32();
    tcg_gen_trunc_tl_i32(t1, cpu_T[1]);
    tcg_gen_movi_i32(cpu_tmp2_i32, CC_OP_ADCOX);
    tcg_gen_movi_i32(cpu_tmp3_i32, CC_OP_EFLAGS);
    tcg_gen_movcond_i32(TCG_COND_NE, cpu_cc_op, t1, t0,
                        cpu_tmp2_i32, cpu_tmp3_i32);
    tcg_temp_free_i32(t0);
    tcg_temp_free_i32(t1);

    /* The CC_OP value is no longer predictable.  */
    set_cc_op(s, CC_OP_DYNAMIC);
}
static void gen_rot_rm_im(DisasContext *s, TCGMemOp ot, int op1, int op2,
                          int is_right)
{
    int mask = (ot == MO_64 ? 0x3f : 0x1f);
    int shift;

    /* load */
    if (op1 == OR_TMP0) {
        gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
    } else {
        gen_op_mov_v_reg(ot, cpu_T[0], op1);
    }

    op2 &= mask;
    if (op2 != 0) {
        switch (ot) {
#ifdef TARGET_X86_64
        case MO_32:
            tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
            if (is_right) {
                tcg_gen_rotri_i32(cpu_tmp2_i32, cpu_tmp2_i32, op2);
            } else {
                tcg_gen_rotli_i32(cpu_tmp2_i32, cpu_tmp2_i32, op2);
            }
            tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
            break;
#endif
        default:
            if (is_right) {
                tcg_gen_rotri_tl(cpu_T[0], cpu_T[0], op2);
            } else {
                tcg_gen_rotli_tl(cpu_T[0], cpu_T[0], op2);
            }
            break;
        case MO_8:
            mask = 7;
            goto do_shifts;
        case MO_16:
            mask = 15;
        do_shifts:
            shift = op2 & mask;
            if (is_right) {
                shift = mask + 1 - shift;
            }
            gen_extu(ot, cpu_T[0]);
            tcg_gen_shli_tl(cpu_tmp0, cpu_T[0], shift);
            tcg_gen_shri_tl(cpu_T[0], cpu_T[0], mask + 1 - shift);
            tcg_gen_or_tl(cpu_T[0], cpu_T[0], cpu_tmp0);
            break;
        }
    }

    /* store */
    gen_op_st_rm_T0_A0(s, ot, op1);

    if (op2 != 0) {
        /* Compute the flags into CC_SRC.  */
        gen_compute_eflags(s);

        /* The value that was "rotated out" is now present at the other end
           of the word.  Compute C into CC_DST and O into CC_SRC2.  Note that
           since we've computed the flags into CC_SRC, these variables are
           currently dead.  */
        if (is_right) {
            tcg_gen_shri_tl(cpu_cc_src2, cpu_T[0], mask - 1);
            tcg_gen_shri_tl(cpu_cc_dst, cpu_T[0], mask);
            tcg_gen_andi_tl(cpu_cc_dst, cpu_cc_dst, 1);
        } else {
            tcg_gen_shri_tl(cpu_cc_src2, cpu_T[0], mask);
            tcg_gen_andi_tl(cpu_cc_dst, cpu_T[0], 1);
        }
        tcg_gen_andi_tl(cpu_cc_src2, cpu_cc_src2, 1);
        tcg_gen_xor_tl(cpu_cc_src2, cpu_cc_src2, cpu_cc_dst);
        set_cc_op(s, CC_OP_ADCOX);
    }
}
/* XXX: add faster immediate = 1 case */
static void gen_rotc_rm_T1(DisasContext *s, TCGMemOp ot, int op1,
                           int is_right)
{
    gen_compute_eflags(s);
    assert(s->cc_op == CC_OP_EFLAGS);

    /* load */
    if (op1 == OR_TMP0)
        gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
    else
        gen_op_mov_v_reg(ot, cpu_T[0], op1);

    if (is_right) {
        switch (ot) {
        case MO_8:
            gen_helper_rcrb(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
            break;
        case MO_16:
            gen_helper_rcrw(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
            break;
        case MO_32:
            gen_helper_rcrl(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
            break;
#ifdef TARGET_X86_64
        case MO_64:
            gen_helper_rcrq(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
            break;
#endif
        default:
            tcg_abort();
        }
    } else {
        switch (ot) {
        case MO_8:
            gen_helper_rclb(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
            break;
        case MO_16:
            gen_helper_rclw(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
            break;
        case MO_32:
            gen_helper_rcll(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
            break;
#ifdef TARGET_X86_64
        case MO_64:
            gen_helper_rclq(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
            break;
#endif
        default:
            tcg_abort();
        }
    }
    /* store */
    gen_op_st_rm_T0_A0(s, ot, op1);
}
/* XXX: add faster immediate case */
static void gen_shiftd_rm_T1(DisasContext *s, TCGMemOp ot, int op1,
                             bool is_right, TCGv count_in)
{
    target_ulong mask = (ot == MO_64 ? 63 : 31);
    TCGv count;

    /* load */
    if (op1 == OR_TMP0) {
        gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
    } else {
        gen_op_mov_v_reg(ot, cpu_T[0], op1);
    }

    count = tcg_temp_new();
    tcg_gen_andi_tl(count, count_in, mask);

    switch (ot) {
    case MO_16:
        /* Note: we implement the Intel behaviour for shift count > 16.
           This means "shrdw C, B, A" shifts A:B:A >> C.  Build the B:A
           portion by constructing it as a 32-bit value.  */
        if (is_right) {
            tcg_gen_deposit_tl(cpu_tmp0, cpu_T[0], cpu_T[1], 16, 16);
            tcg_gen_mov_tl(cpu_T[1], cpu_T[0]);
            tcg_gen_mov_tl(cpu_T[0], cpu_tmp0);
        } else {
            tcg_gen_deposit_tl(cpu_T[1], cpu_T[0], cpu_T[1], 16, 16);
        }
        /* FALLTHRU */
#ifdef TARGET_X86_64
    case MO_32:
        /* Concatenate the two 32-bit values and use a 64-bit shift.  */
        tcg_gen_subi_tl(cpu_tmp0, count, 1);
        if (is_right) {
            tcg_gen_concat_tl_i64(cpu_T[0], cpu_T[0], cpu_T[1]);
            tcg_gen_shr_i64(cpu_tmp0, cpu_T[0], cpu_tmp0);
            tcg_gen_shr_i64(cpu_T[0], cpu_T[0], count);
        } else {
            tcg_gen_concat_tl_i64(cpu_T[0], cpu_T[1], cpu_T[0]);
            tcg_gen_shl_i64(cpu_tmp0, cpu_T[0], cpu_tmp0);
            tcg_gen_shl_i64(cpu_T[0], cpu_T[0], count);
            tcg_gen_shri_i64(cpu_tmp0, cpu_tmp0, 32);
            tcg_gen_shri_i64(cpu_T[0], cpu_T[0], 32);
        }
        break;
#endif
    default:
        tcg_gen_subi_tl(cpu_tmp0, count, 1);
        if (is_right) {
            tcg_gen_shr_tl(cpu_tmp0, cpu_T[0], cpu_tmp0);

            tcg_gen_subfi_tl(cpu_tmp4, mask + 1, count);
            tcg_gen_shr_tl(cpu_T[0], cpu_T[0], count);
            tcg_gen_shl_tl(cpu_T[1], cpu_T[1], cpu_tmp4);
        } else {
            tcg_gen_shl_tl(cpu_tmp0, cpu_T[0], cpu_tmp0);
            if (ot == MO_16) {
                /* Only needed if count > 16, for Intel behaviour.  */
                tcg_gen_subfi_tl(cpu_tmp4, 33, count);
                tcg_gen_shr_tl(cpu_tmp4, cpu_T[1], cpu_tmp4);
                tcg_gen_or_tl(cpu_tmp0, cpu_tmp0, cpu_tmp4);
            }

            tcg_gen_subfi_tl(cpu_tmp4, mask + 1, count);
            tcg_gen_shl_tl(cpu_T[0], cpu_T[0], count);
            tcg_gen_shr_tl(cpu_T[1], cpu_T[1], cpu_tmp4);
        }
        tcg_gen_movi_tl(cpu_tmp4, 0);
        tcg_gen_movcond_tl(TCG_COND_EQ, cpu_T[1], count, cpu_tmp4,
                           cpu_tmp4, cpu_T[1]);
        tcg_gen_or_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
        break;
    }

    /* store */
    gen_op_st_rm_T0_A0(s, ot, op1);

    gen_shift_flags(s, ot, cpu_T[0], cpu_tmp0, count, is_right);
    tcg_temp_free(count);
}
static void gen_shift(DisasContext *s1, int op, TCGMemOp ot, int d, int s)
{
    if (s != OR_TMP1)
        gen_op_mov_v_reg(ot, cpu_T[1], s);
    switch(op) {
    case OP_ROL:
        gen_rot_rm_T1(s1, ot, d, 0);
        break;
    case OP_ROR:
        gen_rot_rm_T1(s1, ot, d, 1);
        break;
    case OP_SHL:
    case OP_SHL1:
        gen_shift_rm_T1(s1, ot, d, 0, 0);
        break;
    case OP_SHR:
        gen_shift_rm_T1(s1, ot, d, 1, 0);
        break;
    case OP_SAR:
        gen_shift_rm_T1(s1, ot, d, 1, 1);
        break;
    case OP_RCL:
        gen_rotc_rm_T1(s1, ot, d, 0);
        break;
    case OP_RCR:
        gen_rotc_rm_T1(s1, ot, d, 1);
        break;
    }
}
static void gen_shifti(DisasContext *s1, int op, TCGMemOp ot, int d, int c)
{
    switch(op) {
    case OP_ROL:
        gen_rot_rm_im(s1, ot, d, c, 0);
        break;
    case OP_ROR:
        gen_rot_rm_im(s1, ot, d, c, 1);
        break;
    case OP_SHL:
    case OP_SHL1:
        gen_shift_rm_im(s1, ot, d, c, 0, 0);
        break;
    case OP_SHR:
        gen_shift_rm_im(s1, ot, d, c, 1, 0);
        break;
    case OP_SAR:
        gen_shift_rm_im(s1, ot, d, c, 1, 1);
        break;
    default:
        /* currently not optimized */
        tcg_gen_movi_tl(cpu_T[1], c);
        gen_shift(s1, op, ot, d, OR_TMP1);
        break;
    }
}
static void gen_lea_modrm(CPUX86State *env, DisasContext *s, int modrm)
{
    target_long disp;
    int havesib;
    int base;
    int index;
    int scale;
    int mod, rm, code, override, must_add_seg;
    TCGv sum;

    override = s->override;
    must_add_seg = s->addseg;
    if (override >= 0)
        must_add_seg = 1;
    mod = (modrm >> 6) & 3;
    rm = modrm & 7;

    switch (s->aflag) {
    case MO_64:
    case MO_32:
        havesib = 0;
        base = rm;
        index = -1;
        scale = 0;

        if (base == 4) {
            havesib = 1;
            code = cpu_ldub_code(env, s->pc++);
            scale = (code >> 6) & 3;
            index = ((code >> 3) & 7) | REX_X(s);
            if (index == 4) {
                index = -1; /* no index */
            }
            base = (code & 7);
        }
        base |= REX_B(s);

        switch (mod) {
        case 0:
            if ((base & 7) == 5) {
                base = -1;
                disp = (int32_t)cpu_ldl_code(env, s->pc);
                s->pc += 4;
                if (CODE64(s) && !havesib) {
                    disp += s->pc + s->rip_offset;
                }
            } else {
                disp = 0;
            }
            break;
        case 1:
            disp = (int8_t)cpu_ldub_code(env, s->pc++);
            break;
        default:
        case 2:
            disp = (int32_t)cpu_ldl_code(env, s->pc);
            s->pc += 4;
            break;
        }

        /* For correct popl handling with esp.  */
        if (base == R_ESP && s->popl_esp_hack) {
            disp += s->popl_esp_hack;
        }

        /* Compute the address, with a minimum number of TCG ops.  */
        TCGV_UNUSED(sum);
        if (index >= 0) {
            if (scale == 0) {
                sum = cpu_regs[index];
            } else {
                tcg_gen_shli_tl(cpu_A0, cpu_regs[index], scale);
                sum = cpu_A0;
            }
            if (base >= 0) {
                tcg_gen_add_tl(cpu_A0, sum, cpu_regs[base]);
                sum = cpu_A0;
            }
        } else if (base >= 0) {
            sum = cpu_regs[base];
        }
        if (TCGV_IS_UNUSED(sum)) {
            tcg_gen_movi_tl(cpu_A0, disp);
        } else {
            tcg_gen_addi_tl(cpu_A0, sum, disp);
        }

        if (must_add_seg) {
            if (override < 0) {
                if (base == R_EBP || base == R_ESP) {
                    override = R_SS;
                } else {
                    override = R_DS;
                }
            }

            tcg_gen_ld_tl(cpu_tmp0, cpu_env,
                          offsetof(CPUX86State, segs[override].base));
            if (CODE64(s)) {
                if (s->aflag == MO_32) {
                    tcg_gen_ext32u_tl(cpu_A0, cpu_A0);
                }
                tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
                return;
            }

            tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
        }

        if (s->aflag == MO_32) {
            tcg_gen_ext32u_tl(cpu_A0, cpu_A0);
        }
        break;

    case MO_16:
        switch (mod) {
        case 0:
            if (rm == 6) {
                disp = cpu_lduw_code(env, s->pc);
                s->pc += 2;
                tcg_gen_movi_tl(cpu_A0, disp);
                rm = 0; /* avoid SS override */
                goto no_rm;
            } else {
                disp = 0;
            }
            break;
        case 1:
            disp = (int8_t)cpu_ldub_code(env, s->pc++);
            break;
        default:
        case 2:
            disp = (int16_t)cpu_lduw_code(env, s->pc);
            s->pc += 2;
            break;
        }

        sum = cpu_A0;
        switch (rm) {
        case 0:
            tcg_gen_add_tl(cpu_A0, cpu_regs[R_EBX], cpu_regs[R_ESI]);
            break;
        case 1:
            tcg_gen_add_tl(cpu_A0, cpu_regs[R_EBX], cpu_regs[R_EDI]);
            break;
        case 2:
            tcg_gen_add_tl(cpu_A0, cpu_regs[R_EBP], cpu_regs[R_ESI]);
            break;
        case 3:
            tcg_gen_add_tl(cpu_A0, cpu_regs[R_EBP], cpu_regs[R_EDI]);
            break;
        case 4:
            sum = cpu_regs[R_ESI];
            break;
        case 5:
            sum = cpu_regs[R_EDI];
            break;
        case 6:
            sum = cpu_regs[R_EBP];
            break;
        default:
        case 7:
            sum = cpu_regs[R_EBX];
            break;
        }
        tcg_gen_addi_tl(cpu_A0, sum, disp);
        tcg_gen_ext16u_tl(cpu_A0, cpu_A0);
    no_rm:
        if (must_add_seg) {
            if (override < 0) {
                if (rm == 2 || rm == 3 || rm == 6) {
                    override = R_SS;
                } else {
                    override = R_DS;
                }
            }
            gen_op_addl_A0_seg(s, override);
        }
        break;

    default:
        tcg_abort();
    }
}
static void gen_nop_modrm(CPUX86State *env, DisasContext *s, int modrm)
{
    int mod, rm, base, code;

    mod = (modrm >> 6) & 3;
    if (mod == 3)
        return;
    rm = modrm & 7;

    switch (s->aflag) {
    case MO_64:
    case MO_32:
        base = rm;
        if (base == 4) {
            code = cpu_ldub_code(env, s->pc++);
            base = (code & 7);
        }
        switch (mod) {
        case 0:
            if (base == 5) {
                s->pc += 4;
            }
            break;
        case 1:
            s->pc++;
            break;
        default:
        case 2:
            s->pc += 4;
            break;
        }
        break;

    case MO_16:
        switch (mod) {
        case 0:
            if (rm == 6) {
                s->pc += 2;
            }
            break;
        case 1:
            s->pc++;
            break;
        default:
        case 2:
            s->pc += 2;
            break;
        }
        break;

    default:
        tcg_abort();
    }
}
/* used for LEA and MOV AX, mem */
static void gen_add_A0_ds_seg(DisasContext *s)
{
    int override, must_add_seg;
    must_add_seg = s->addseg;
    override = R_DS;
    if (s->override >= 0) {
        override = s->override;
        must_add_seg = 1;
    }
    if (must_add_seg) {
#ifdef TARGET_X86_64
        if (CODE64(s)) {
            gen_op_addq_A0_seg(override);
        } else
#endif
        {
            gen_op_addl_A0_seg(s, override);
        }
    }
}
/* generate modrm memory load or store of 'reg'. TMP0 is used if reg ==
   OR_TMP0 */
static void gen_ldst_modrm(CPUX86State *env, DisasContext *s, int modrm,
                           TCGMemOp ot, int reg, int is_store)
{
    int mod, rm;

    mod = (modrm >> 6) & 3;
    rm = (modrm & 7) | REX_B(s);
    if (mod == 3) {
        if (is_store) {
            if (reg != OR_TMP0)
                gen_op_mov_v_reg(ot, cpu_T[0], reg);
            gen_op_mov_reg_v(ot, rm, cpu_T[0]);
        } else {
            gen_op_mov_v_reg(ot, cpu_T[0], rm);
            if (reg != OR_TMP0)
                gen_op_mov_reg_v(ot, reg, cpu_T[0]);
        }
    } else {
        gen_lea_modrm(env, s, modrm);
        if (is_store) {
            if (reg != OR_TMP0)
                gen_op_mov_v_reg(ot, cpu_T[0], reg);
            gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
        } else {
            gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
            if (reg != OR_TMP0)
                gen_op_mov_reg_v(ot, reg, cpu_T[0]);
        }
    }
}
static inline uint32_t insn_get(CPUX86State *env, DisasContext *s, TCGMemOp ot)
{
    uint32_t ret;

    switch (ot) {
    case MO_8:
        ret = cpu_ldub_code(env, s->pc);
        s->pc++;
        break;
    case MO_16:
        ret = cpu_lduw_code(env, s->pc);
        s->pc += 2;
        break;
    case MO_32:
#ifdef TARGET_X86_64
    case MO_64:
#endif
        ret = cpu_ldl_code(env, s->pc);
        s->pc += 4;
        break;
    default:
        tcg_abort();
    }
    return ret;
}
static inline int insn_const_size(TCGMemOp ot)
{
    if (ot <= MO_32) {
        return 1 << ot;
    } else {
        return 4;
    }
}
static inline void gen_goto_tb(DisasContext *s, int tb_num, target_ulong eip)
{
    TranslationBlock *tb;
    target_ulong pc;

    pc = s->cs_base + eip;
    tb = s->tb;
    /* NOTE: we handle the case where the TB spans two pages here */
    if ((pc & TARGET_PAGE_MASK) == (tb->pc & TARGET_PAGE_MASK) ||
        (pc & TARGET_PAGE_MASK) == ((s->pc - 1) & TARGET_PAGE_MASK)) {
        /* jump to same page: we can use a direct jump */
        tcg_gen_goto_tb(tb_num);
        gen_jmp_im(eip);
        tcg_gen_exit_tb((uintptr_t)tb + tb_num);
    } else {
        /* jump to another page: currently not optimized */
        gen_jmp_im(eip);
        gen_eob(s);
    }
}
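
/* Direct block chaining: tcg_gen_goto_tb() emits a patchable jump slot
   and tcg_gen_exit_tb() with (tb + tb_num) tells the execution loop
   which slot to patch once the destination TB is translated, so the
   two blocks end up linked without returning to the main loop. */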
static inline void gen_jcc(DisasContext *s, int b,
                           target_ulong val, target_ulong next_eip)
{
    int l1, l2;

    if (s->jmp_opt) {
        l1 = gen_new_label();
        gen_jcc1(s, b, l1);

        gen_goto_tb(s, 0, next_eip);

        gen_set_label(l1);
        gen_goto_tb(s, 1, val);
        s->is_jmp = DISAS_TB_JUMP;
    } else {
        l1 = gen_new_label();
        l2 = gen_new_label();
        gen_jcc1(s, b, l1);

        gen_jmp_im(next_eip);
        tcg_gen_br(l2);

        gen_set_label(l1);
        gen_jmp_im(val);
        gen_set_label(l2);
        gen_eob(s);
    }
}
static void gen_cmovcc1(CPUX86State *env, DisasContext *s, TCGMemOp ot, int b,
                        int modrm, int reg)
{
    CCPrepare cc;

    gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);

    cc = gen_prepare_cc(s, b, cpu_T[1]);
    if (cc.mask != -1) {
        TCGv t0 = tcg_temp_new();
        tcg_gen_andi_tl(t0, cc.reg, cc.mask);
        cc.reg = t0;
    }
    if (!cc.use_reg2) {
        cc.reg2 = tcg_const_tl(cc.imm);
    }

    tcg_gen_movcond_tl(cc.cond, cpu_T[0], cc.reg, cc.reg2,
                       cpu_T[0], cpu_regs[reg]);
    gen_op_mov_reg_v(ot, reg, cpu_T[0]);

    if (cc.mask != -1) {
        tcg_temp_free(cc.reg);
    }
    if (!cc.use_reg2) {
        tcg_temp_free(cc.reg2);
    }
}
static inline void gen_op_movl_T0_seg(int seg_reg)
{
    tcg_gen_ld32u_tl(cpu_T[0], cpu_env,
                     offsetof(CPUX86State,segs[seg_reg].selector));
}

static inline void gen_op_movl_seg_T0_vm(int seg_reg)
{
    tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xffff);
    tcg_gen_st32_tl(cpu_T[0], cpu_env,
                    offsetof(CPUX86State,segs[seg_reg].selector));
    tcg_gen_shli_tl(cpu_T[0], cpu_T[0], 4);
    tcg_gen_st_tl(cpu_T[0], cpu_env,
                  offsetof(CPUX86State,segs[seg_reg].base));
}
/* move T0 to seg_reg and compute if the CPU state may change. Never
   call this function with seg_reg == R_CS */
static void gen_movl_seg_T0(DisasContext *s, int seg_reg, target_ulong cur_eip)
{
    if (s->pe && !s->vm86) {
        /* XXX: optimize by finding processor state dynamically */
        gen_update_cc_op(s);
        gen_jmp_im(cur_eip);
        tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
        gen_helper_load_seg(cpu_env, tcg_const_i32(seg_reg), cpu_tmp2_i32);
        /* abort translation because the addseg value may change or
           because ss32 may change. For R_SS, translation must always
           stop as a special handling must be done to disable hardware
           interrupts for the next instruction */
        if (seg_reg == R_SS || (s->code32 && seg_reg < R_FS))
            s->is_jmp = DISAS_TB_JUMP;
    } else {
        gen_op_movl_seg_T0_vm(seg_reg);
        if (seg_reg == R_SS)
            s->is_jmp = DISAS_TB_JUMP;
    }
}
static inline int svm_is_rep(int prefixes)
{
    return ((prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) ? 8 : 0);
}
static inline void
gen_svm_check_intercept_param(DisasContext *s, target_ulong pc_start,
                              uint32_t type, uint64_t param)
{
    /* no SVM activated; fast case */
    if (likely(!(s->flags & HF_SVMI_MASK)))
        return;
    gen_update_cc_op(s);
    gen_jmp_im(pc_start - s->cs_base);
    gen_helper_svm_check_intercept_param(cpu_env, tcg_const_i32(type),
                                         tcg_const_i64(param));
}

static inline void
gen_svm_check_intercept(DisasContext *s, target_ulong pc_start, uint64_t type)
{
    gen_svm_check_intercept_param(s, pc_start, type, 0);
}
static inline void gen_stack_update(DisasContext *s, int addend)
{
#ifdef TARGET_X86_64
    if (CODE64(s)) {
        gen_op_add_reg_im(MO_64, R_ESP, addend);
    } else
#endif
    if (s->ss32) {
        gen_op_add_reg_im(MO_32, R_ESP, addend);
    } else {
        gen_op_add_reg_im(MO_16, R_ESP, addend);
    }
}
/* Generate a push. It depends on ss32, addseg and dflag.  */
static void gen_push_v(DisasContext *s, TCGv val)
{
    TCGMemOp a_ot, d_ot = mo_pushpop(s, s->dflag);
    int size = 1 << d_ot;
    TCGv new_esp = cpu_A0;

    tcg_gen_subi_tl(cpu_A0, cpu_regs[R_ESP], size);

    if (CODE64(s)) {
        a_ot = MO_64;
    } else if (s->ss32) {
        a_ot = MO_32;
        if (s->addseg) {
            new_esp = cpu_tmp4;
            tcg_gen_mov_tl(new_esp, cpu_A0);
            gen_op_addl_A0_seg(s, R_SS);
        } else {
            tcg_gen_ext32u_tl(cpu_A0, cpu_A0);
        }
    } else {
        a_ot = MO_16;
        new_esp = cpu_tmp4;
        tcg_gen_ext16u_tl(cpu_A0, cpu_A0);
        tcg_gen_mov_tl(new_esp, cpu_A0);
        gen_op_addl_A0_seg(s, R_SS);
    }

    gen_op_st_v(s, d_ot, val, cpu_A0);
    gen_op_mov_reg_v(a_ot, R_ESP, new_esp);
}
/* two step pop is necessary for precise exceptions */
static TCGMemOp gen_pop_T0(DisasContext *s)
{
    TCGMemOp d_ot = mo_pushpop(s, s->dflag);
    TCGv addr = cpu_A0;

    if (CODE64(s)) {
        addr = cpu_regs[R_ESP];
    } else if (!s->ss32) {
        tcg_gen_ext16u_tl(cpu_A0, cpu_regs[R_ESP]);
        gen_op_addl_A0_seg(s, R_SS);
    } else if (s->addseg) {
        tcg_gen_mov_tl(cpu_A0, cpu_regs[R_ESP]);
        gen_op_addl_A0_seg(s, R_SS);
    } else {
        tcg_gen_ext32u_tl(cpu_A0, cpu_regs[R_ESP]);
    }

    gen_op_ld_v(s, d_ot, cpu_T[0], addr);
    return d_ot;
}
static void gen_pop_update(DisasContext *s, TCGMemOp ot)
{
    gen_stack_update(s, 1 << ot);
}

static void gen_stack_A0(DisasContext *s)
{
    gen_op_movl_A0_reg(R_ESP);
    if (!s->ss32)
        tcg_gen_ext16u_tl(cpu_A0, cpu_A0);
    tcg_gen_mov_tl(cpu_T[1], cpu_A0);
    if (s->addseg)
        gen_op_addl_A0_seg(s, R_SS);
}
/* NOTE: wrap around in 16 bit not fully handled */
static void gen_pusha(DisasContext *s)
{
    int i;
    gen_op_movl_A0_reg(R_ESP);
    gen_op_addl_A0_im(-8 << s->dflag);
    if (!s->ss32)
        tcg_gen_ext16u_tl(cpu_A0, cpu_A0);
    tcg_gen_mov_tl(cpu_T[1], cpu_A0);
    if (s->addseg)
        gen_op_addl_A0_seg(s, R_SS);
    for(i = 0;i < 8; i++) {
        gen_op_mov_v_reg(MO_32, cpu_T[0], 7 - i);
        gen_op_st_v(s, s->dflag, cpu_T[0], cpu_A0);
        gen_op_addl_A0_im(1 << s->dflag);
    }
    gen_op_mov_reg_v(MO_16 + s->ss32, R_ESP, cpu_T[1]);
}
/* NOTE: wrap around in 16 bit not fully handled */
static void gen_popa(DisasContext *s)
{
    int i;
    gen_op_movl_A0_reg(R_ESP);
    if (!s->ss32)
        tcg_gen_ext16u_tl(cpu_A0, cpu_A0);
    tcg_gen_mov_tl(cpu_T[1], cpu_A0);
    tcg_gen_addi_tl(cpu_T[1], cpu_T[1], 8 << s->dflag);
    if (s->addseg)
        gen_op_addl_A0_seg(s, R_SS);
    for(i = 0;i < 8; i++) {
        /* ESP is not reloaded */
        if (i != 3) {
            gen_op_ld_v(s, s->dflag, cpu_T[0], cpu_A0);
            gen_op_mov_reg_v(s->dflag, 7 - i, cpu_T[0]);
        }
        gen_op_addl_A0_im(1 << s->dflag);
    }
    gen_op_mov_reg_v(MO_16 + s->ss32, R_ESP, cpu_T[1]);
}
static void gen_enter(DisasContext *s, int esp_addend, int level)
{
    TCGMemOp ot = mo_pushpop(s, s->dflag);
    int opsize = 1 << ot;

    level &= 0x1f;
#ifdef TARGET_X86_64
    if (CODE64(s)) {
        gen_op_movl_A0_reg(R_ESP);
        gen_op_addq_A0_im(-opsize);
        tcg_gen_mov_tl(cpu_T[1], cpu_A0);

        /* push bp */
        gen_op_mov_v_reg(MO_32, cpu_T[0], R_EBP);
        gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
        if (level) {
            /* XXX: must save state */
            gen_helper_enter64_level(cpu_env, tcg_const_i32(level),
                                     tcg_const_i32((ot == MO_64)),
                                     cpu_T[1]);
        }
        gen_op_mov_reg_v(ot, R_EBP, cpu_T[1]);
        tcg_gen_addi_tl(cpu_T[1], cpu_T[1], -esp_addend + (-opsize * level));
        gen_op_mov_reg_v(MO_64, R_ESP, cpu_T[1]);
    } else
#endif
    {
        gen_op_movl_A0_reg(R_ESP);
        gen_op_addl_A0_im(-opsize);
        if (!s->ss32)
            tcg_gen_ext16u_tl(cpu_A0, cpu_A0);
        tcg_gen_mov_tl(cpu_T[1], cpu_A0);
        if (s->addseg)
            gen_op_addl_A0_seg(s, R_SS);
        /* push bp */
        gen_op_mov_v_reg(MO_32, cpu_T[0], R_EBP);
        gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
        if (level) {
            /* XXX: must save state */
            gen_helper_enter_level(cpu_env, tcg_const_i32(level),
                                   tcg_const_i32(s->dflag - 1),
                                   cpu_T[1]);
        }
        gen_op_mov_reg_v(ot, R_EBP, cpu_T[1]);
        tcg_gen_addi_tl(cpu_T[1], cpu_T[1], -esp_addend + (-opsize * level));
        gen_op_mov_reg_v(MO_16 + s->ss32, R_ESP, cpu_T[1]);
    }
}
static void gen_exception(DisasContext *s, int trapno, target_ulong cur_eip)
{
    gen_update_cc_op(s);
    gen_jmp_im(cur_eip);
    gen_helper_raise_exception(cpu_env, tcg_const_i32(trapno));
    s->is_jmp = DISAS_TB_JUMP;
}
/* an interrupt is different from an exception because of the
   privilege checks */
static void gen_interrupt(DisasContext *s, int intno,
                          target_ulong cur_eip, target_ulong next_eip)
{
    gen_update_cc_op(s);
    gen_jmp_im(cur_eip);
    gen_helper_raise_interrupt(cpu_env, tcg_const_i32(intno),
                               tcg_const_i32(next_eip - cur_eip));
    s->is_jmp = DISAS_TB_JUMP;
}
static void gen_debug(DisasContext *s, target_ulong cur_eip)
{
    gen_update_cc_op(s);
    gen_jmp_im(cur_eip);
    gen_helper_debug(cpu_env);
    s->is_jmp = DISAS_TB_JUMP;
}
/* generate a generic end of block. Trace exception is also generated
   if needed */
static void gen_eob(DisasContext *s)
{
    gen_update_cc_op(s);
    if (s->tb->flags & HF_INHIBIT_IRQ_MASK) {
        gen_helper_reset_inhibit_irq(cpu_env);
    }
    if (s->tb->flags & HF_RF_MASK) {
        gen_helper_reset_rf(cpu_env);
    }
    if (s->singlestep_enabled) {
        gen_helper_debug(cpu_env);
    } else if (s->tf) {
        gen_helper_single_step(cpu_env);
    } else {
        tcg_gen_exit_tb(0);
    }
    s->is_jmp = DISAS_TB_JUMP;
}
/* generate a jump to eip. No segment change must happen before as a
   direct call to the next block may occur */
static void gen_jmp_tb(DisasContext *s, target_ulong eip, int tb_num)
{
    gen_update_cc_op(s);
    set_cc_op(s, CC_OP_DYNAMIC);
    if (s->jmp_opt) {
        gen_goto_tb(s, tb_num, eip);
        s->is_jmp = DISAS_TB_JUMP;
    } else {
        gen_jmp_im(eip);
        gen_eob(s);
    }
}

static void gen_jmp(DisasContext *s, target_ulong eip)
{
    gen_jmp_tb(s, eip, 0);
}
static inline void gen_ldq_env_A0(DisasContext *s, int offset)
{
    tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_A0, s->mem_index, MO_LEQ);
    tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset);
}

static inline void gen_stq_env_A0(DisasContext *s, int offset)
{
    tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset);
    tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_A0, s->mem_index, MO_LEQ);
}

static inline void gen_ldo_env_A0(DisasContext *s, int offset)
{
    int mem_index = s->mem_index;
    tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_A0, mem_index, MO_LEQ);
    tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(0)));
    tcg_gen_addi_tl(cpu_tmp0, cpu_A0, 8);
    tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_tmp0, mem_index, MO_LEQ);
    tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(1)));
}

static inline void gen_sto_env_A0(DisasContext *s, int offset)
{
    int mem_index = s->mem_index;
    tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(0)));
    tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_A0, mem_index, MO_LEQ);
    tcg_gen_addi_tl(cpu_tmp0, cpu_A0, 8);
    tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(1)));
    tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_tmp0, mem_index, MO_LEQ);
}
static inline void gen_op_movo(int d_offset, int s_offset)
{
    tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset);
    tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
    tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset + 8);
    tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset + 8);
}

static inline void gen_op_movq(int d_offset, int s_offset)
{
    tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset);
    tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
}

static inline void gen_op_movl(int d_offset, int s_offset)
{
    tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env, s_offset);
    tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, d_offset);
}

static inline void gen_op_movq_env_0(int d_offset)
{
    tcg_gen_movi_i64(cpu_tmp1_i64, 0);
    tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
}
typedef void (*SSEFunc_i_ep)(TCGv_i32 val, TCGv_ptr env, TCGv_ptr reg);
typedef void (*SSEFunc_l_ep)(TCGv_i64 val, TCGv_ptr env, TCGv_ptr reg);
typedef void (*SSEFunc_0_epi)(TCGv_ptr env, TCGv_ptr reg, TCGv_i32 val);
typedef void (*SSEFunc_0_epl)(TCGv_ptr env, TCGv_ptr reg, TCGv_i64 val);
typedef void (*SSEFunc_0_epp)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b);
typedef void (*SSEFunc_0_eppi)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
                               TCGv_i32 val);
typedef void (*SSEFunc_0_ppi)(TCGv_ptr reg_a, TCGv_ptr reg_b, TCGv_i32 val);
typedef void (*SSEFunc_0_eppt)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
                               TCGv val);
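/* Naming convention for the helper typedefs above (inferred from the
   signatures, not stated in the original): SSEFunc_<out>_<ins>, where
   0 means no output operand and each letter is one operand type:
   e = TCGv_ptr to the CPU env, p = TCGv_ptr into the env (an MMX or
   XMM register), i = TCGv_i32, l = TCGv_i64, t = target-sized TCGv.
   So SSEFunc_0_eppi is void fn(env, reg_a, reg_b, imm32), while
   SSEFunc_i_ep writes its 32-bit result through its first argument. */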
#define SSE_SPECIAL ((void *)1)
#define SSE_DUMMY ((void *)2)

#define MMX_OP2(x) { gen_helper_ ## x ## _mmx, gen_helper_ ## x ## _xmm }
#define SSE_FOP(x) { gen_helper_ ## x ## ps, gen_helper_ ## x ## pd, \
                     gen_helper_ ## x ## ss, gen_helper_ ## x ## sd, }
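/* For reference, MMX_OP2(psrlw) expands to
       { gen_helper_psrlw_mmx, gen_helper_psrlw_xmm }
   i.e. column 0 is the MMX form and column 1 the 66-prefixed XMM form,
   while SSE_FOP(add) fills all four prefix columns:
       { gen_helper_addps, gen_helper_addpd,
         gen_helper_addss, gen_helper_addsd }  */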
static const SSEFunc_0_epp sse_op_table1[256][4] = {
    /* 3DNow! extensions */
    [0x0e] = { SSE_DUMMY }, /* femms */
    [0x0f] = { SSE_DUMMY }, /* pf... */
    /* pure SSE operations */
    [0x10] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movups, movupd, movss, movsd */
    [0x11] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movups, movupd, movss, movsd */
    [0x12] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movlps, movlpd, movsldup, movddup */
    [0x13] = { SSE_SPECIAL, SSE_SPECIAL }, /* movlps, movlpd */
    [0x14] = { gen_helper_punpckldq_xmm, gen_helper_punpcklqdq_xmm },
    [0x15] = { gen_helper_punpckhdq_xmm, gen_helper_punpckhqdq_xmm },
    [0x16] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movhps, movhpd, movshdup */
    [0x17] = { SSE_SPECIAL, SSE_SPECIAL }, /* movhps, movhpd */

    [0x28] = { SSE_SPECIAL, SSE_SPECIAL }, /* movaps, movapd */
    [0x29] = { SSE_SPECIAL, SSE_SPECIAL }, /* movaps, movapd */
    [0x2a] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvtpi2ps, cvtpi2pd, cvtsi2ss, cvtsi2sd */
    [0x2b] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movntps, movntpd, movntss, movntsd */
    [0x2c] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvttps2pi, cvttpd2pi, cvttss2si, cvttsd2si */
    [0x2d] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvtps2pi, cvtpd2pi, cvtss2si, cvtsd2si */
    [0x2e] = { gen_helper_ucomiss, gen_helper_ucomisd },
    [0x2f] = { gen_helper_comiss, gen_helper_comisd },
    [0x50] = { SSE_SPECIAL, SSE_SPECIAL }, /* movmskps, movmskpd */
    [0x51] = SSE_FOP(sqrt),
    [0x52] = { gen_helper_rsqrtps, NULL, gen_helper_rsqrtss, NULL },
    [0x53] = { gen_helper_rcpps, NULL, gen_helper_rcpss, NULL },
    [0x54] = { gen_helper_pand_xmm, gen_helper_pand_xmm }, /* andps, andpd */
    [0x55] = { gen_helper_pandn_xmm, gen_helper_pandn_xmm }, /* andnps, andnpd */
    [0x56] = { gen_helper_por_xmm, gen_helper_por_xmm }, /* orps, orpd */
    [0x57] = { gen_helper_pxor_xmm, gen_helper_pxor_xmm }, /* xorps, xorpd */
    [0x58] = SSE_FOP(add),
    [0x59] = SSE_FOP(mul),
    [0x5a] = { gen_helper_cvtps2pd, gen_helper_cvtpd2ps,
               gen_helper_cvtss2sd, gen_helper_cvtsd2ss },
    [0x5b] = { gen_helper_cvtdq2ps, gen_helper_cvtps2dq, gen_helper_cvttps2dq },
    [0x5c] = SSE_FOP(sub),
    [0x5d] = SSE_FOP(min),
    [0x5e] = SSE_FOP(div),
    [0x5f] = SSE_FOP(max),

    [0xc2] = SSE_FOP(cmpeq),
    [0xc6] = { (SSEFunc_0_epp)gen_helper_shufps,
               (SSEFunc_0_epp)gen_helper_shufpd }, /* XXX: casts */

    /* SSSE3, SSE4, MOVBE, CRC32, BMI1, BMI2, ADX. */
    [0x38] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL },
    [0x3a] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL },

    /* MMX ops and their SSE extensions */
    [0x60] = MMX_OP2(punpcklbw),
    [0x61] = MMX_OP2(punpcklwd),
    [0x62] = MMX_OP2(punpckldq),
    [0x63] = MMX_OP2(packsswb),
    [0x64] = MMX_OP2(pcmpgtb),
    [0x65] = MMX_OP2(pcmpgtw),
    [0x66] = MMX_OP2(pcmpgtl),
    [0x67] = MMX_OP2(packuswb),
    [0x68] = MMX_OP2(punpckhbw),
    [0x69] = MMX_OP2(punpckhwd),
    [0x6a] = MMX_OP2(punpckhdq),
    [0x6b] = MMX_OP2(packssdw),
    [0x6c] = { NULL, gen_helper_punpcklqdq_xmm },
    [0x6d] = { NULL, gen_helper_punpckhqdq_xmm },
    [0x6e] = { SSE_SPECIAL, SSE_SPECIAL }, /* movd mm, ea */
    [0x6f] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movdqa, movdqu */
    [0x70] = { (SSEFunc_0_epp)gen_helper_pshufw_mmx,
               (SSEFunc_0_epp)gen_helper_pshufd_xmm,
               (SSEFunc_0_epp)gen_helper_pshufhw_xmm,
               (SSEFunc_0_epp)gen_helper_pshuflw_xmm }, /* XXX: casts */
    [0x71] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftw */
    [0x72] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftd */
    [0x73] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftq */
    [0x74] = MMX_OP2(pcmpeqb),
    [0x75] = MMX_OP2(pcmpeqw),
    [0x76] = MMX_OP2(pcmpeql),
    [0x77] = { SSE_DUMMY }, /* emms */
    [0x78] = { NULL, SSE_SPECIAL, NULL, SSE_SPECIAL }, /* extrq_i, insertq_i */
    [0x79] = { NULL, gen_helper_extrq_r, NULL, gen_helper_insertq_r },
    [0x7c] = { NULL, gen_helper_haddpd, NULL, gen_helper_haddps },
    [0x7d] = { NULL, gen_helper_hsubpd, NULL, gen_helper_hsubps },
    [0x7e] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movd, movd, movq */
    [0x7f] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movdqa, movdqu */
    [0xc4] = { SSE_SPECIAL, SSE_SPECIAL }, /* pinsrw */
    [0xc5] = { SSE_SPECIAL, SSE_SPECIAL }, /* pextrw */
    [0xd0] = { NULL, gen_helper_addsubpd, NULL, gen_helper_addsubps },
    [0xd1] = MMX_OP2(psrlw),
    [0xd2] = MMX_OP2(psrld),
    [0xd3] = MMX_OP2(psrlq),
    [0xd4] = MMX_OP2(paddq),
    [0xd5] = MMX_OP2(pmullw),
    [0xd6] = { NULL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL },
    [0xd7] = { SSE_SPECIAL, SSE_SPECIAL }, /* pmovmskb */
    [0xd8] = MMX_OP2(psubusb),
    [0xd9] = MMX_OP2(psubusw),
    [0xda] = MMX_OP2(pminub),
    [0xdb] = MMX_OP2(pand),
    [0xdc] = MMX_OP2(paddusb),
    [0xdd] = MMX_OP2(paddusw),
    [0xde] = MMX_OP2(pmaxub),
    [0xdf] = MMX_OP2(pandn),
    [0xe0] = MMX_OP2(pavgb),
    [0xe1] = MMX_OP2(psraw),
    [0xe2] = MMX_OP2(psrad),
    [0xe3] = MMX_OP2(pavgw),
    [0xe4] = MMX_OP2(pmulhuw),
    [0xe5] = MMX_OP2(pmulhw),
    [0xe6] = { NULL, gen_helper_cvttpd2dq, gen_helper_cvtdq2pd, gen_helper_cvtpd2dq },
    [0xe7] = { SSE_SPECIAL, SSE_SPECIAL }, /* movntq, movntdq */
    [0xe8] = MMX_OP2(psubsb),
    [0xe9] = MMX_OP2(psubsw),
    [0xea] = MMX_OP2(pminsw),
    [0xeb] = MMX_OP2(por),
    [0xec] = MMX_OP2(paddsb),
    [0xed] = MMX_OP2(paddsw),
    [0xee] = MMX_OP2(pmaxsw),
    [0xef] = MMX_OP2(pxor),
    [0xf0] = { NULL, NULL, NULL, SSE_SPECIAL }, /* lddqu */
    [0xf1] = MMX_OP2(psllw),
    [0xf2] = MMX_OP2(pslld),
    [0xf3] = MMX_OP2(psllq),
    [0xf4] = MMX_OP2(pmuludq),
    [0xf5] = MMX_OP2(pmaddwd),
    [0xf6] = MMX_OP2(psadbw),
    [0xf7] = { (SSEFunc_0_epp)gen_helper_maskmov_mmx,
               (SSEFunc_0_epp)gen_helper_maskmov_xmm }, /* XXX: casts */
    [0xf8] = MMX_OP2(psubb),
    [0xf9] = MMX_OP2(psubw),
    [0xfa] = MMX_OP2(psubl),
    [0xfb] = MMX_OP2(psubq),
    [0xfc] = MMX_OP2(paddb),
    [0xfd] = MMX_OP2(paddw),
    [0xfe] = MMX_OP2(paddl),
};
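/* sse_op_table1 is indexed as [b][b1], where b is the second opcode
   byte and b1 encodes the mandatory prefix (0 = none/MMX, 1 = 0x66,
   2 = 0xF3, 3 = 0xF2) -- see the decode at the top of gen_sse() below.
   NULL entries are illegal opcodes, SSE_SPECIAL entries are decoded by
   hand in gen_sse(), and SSE_DUMMY marks femms/emms, which are handled
   before the table dispatch. */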
static const SSEFunc_0_epp sse_op_table2[3 * 8][2] = {
    [0 + 2] = MMX_OP2(psrlw),
    [0 + 4] = MMX_OP2(psraw),
    [0 + 6] = MMX_OP2(psllw),
    [8 + 2] = MMX_OP2(psrld),
    [8 + 4] = MMX_OP2(psrad),
    [8 + 6] = MMX_OP2(pslld),
    [16 + 2] = MMX_OP2(psrlq),
    [16 + 3] = { NULL, gen_helper_psrldq_xmm },
    [16 + 6] = MMX_OP2(psllq),
    [16 + 7] = { NULL, gen_helper_pslldq_xmm },
};
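/* sse_op_table2 covers the immediate-form shift groups 0F 71/72/73.
   Presumably (the indexing code falls outside this excerpt) the row is
   8 * (shift group: w/d/q) plus the ModRM reg field, so e.g. [8 + 4]
   is the /4 encoding of group 0F 72, psrad; the column again selects
   the MMX or XMM helper. */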
static const SSEFunc_0_epi sse_op_table3ai[] = {
    gen_helper_cvtsi2ss,
    gen_helper_cvtsi2sd
};
#ifdef TARGET_X86_64
static const SSEFunc_0_epl sse_op_table3aq[] = {
    gen_helper_cvtsq2ss,
    gen_helper_cvtsq2sd
};
#endif
static const SSEFunc_i_ep sse_op_table3bi[] = {
    gen_helper_cvttss2si,
    gen_helper_cvtss2si,
    gen_helper_cvttsd2si,
    gen_helper_cvtsd2si
};
#ifdef TARGET_X86_64
static const SSEFunc_l_ep sse_op_table3bq[] = {
    gen_helper_cvttss2sq,
    gen_helper_cvtss2sq,
    gen_helper_cvttsd2sq,
    gen_helper_cvtsd2sq
};
#endif
static const SSEFunc_0_epp sse_op_table4[8][4] = {
    SSE_FOP(cmpeq),
    SSE_FOP(cmplt),
    SSE_FOP(cmple),
    SSE_FOP(cmpunord),
    SSE_FOP(cmpneq),
    SSE_FOP(cmpnlt),
    SSE_FOP(cmpnle),
    SSE_FOP(cmpord),
};
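/* sse_op_table4 maps the 3-bit immediate of the cmp{ps,pd,ss,sd}
   instructions (opcode 0xc2 in sse_op_table1 above) to one predicate
   per row, in the standard SSE predicate order; the column again
   selects the ps/pd/ss/sd form. */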
static const SSEFunc_0_epp sse_op_table5[256] = {
    [0x0c] = gen_helper_pi2fw,
    [0x0d] = gen_helper_pi2fd,
    [0x1c] = gen_helper_pf2iw,
    [0x1d] = gen_helper_pf2id,
    [0x8a] = gen_helper_pfnacc,
    [0x8e] = gen_helper_pfpnacc,
    [0x90] = gen_helper_pfcmpge,
    [0x94] = gen_helper_pfmin,
    [0x96] = gen_helper_pfrcp,
    [0x97] = gen_helper_pfrsqrt,
    [0x9a] = gen_helper_pfsub,
    [0x9e] = gen_helper_pfadd,
    [0xa0] = gen_helper_pfcmpgt,
    [0xa4] = gen_helper_pfmax,
    [0xa6] = gen_helper_movq, /* pfrcpit1; no need to actually increase precision */
    [0xa7] = gen_helper_movq, /* pfrsqit1 */
    [0xaa] = gen_helper_pfsubr,
    [0xae] = gen_helper_pfacc,
    [0xb0] = gen_helper_pfcmpeq,
    [0xb4] = gen_helper_pfmul,
    [0xb6] = gen_helper_movq, /* pfrcpit2 */
    [0xb7] = gen_helper_pmulhrw_mmx,
    [0xbb] = gen_helper_pswapd,
    [0xbf] = gen_helper_pavgb_mmx /* pavgusb */
};
struct SSEOpHelper_epp {
    SSEFunc_0_epp op[2];
    uint32_t ext_mask;
};

struct SSEOpHelper_eppi {
    SSEFunc_0_eppi op[2];
    uint32_t ext_mask;
};
#define SSSE3_OP(x) { MMX_OP2(x), CPUID_EXT_SSSE3 }
#define SSE41_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE41 }
#define SSE42_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE42 }
#define SSE41_SPECIAL { { NULL, SSE_SPECIAL }, CPUID_EXT_SSE41 }
#define PCLMULQDQ_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, \
                          CPUID_EXT_PCLMULQDQ }
#define AESNI_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_AES }
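/* Each entry built by the macros above pairs a helper pair with the
   CPUID feature bit that gates it, e.g. SSE41_OP(ptest) expands to
       { { NULL, gen_helper_ptest_xmm }, CPUID_EXT_SSE41 }
   (no MMX form, hence the NULL in column 0).  The decoder is then
   expected to check ext_mask against the guest's CPUID features
   before dispatching. */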
static const struct SSEOpHelper_epp sse_op_table6[256] = {
    [0x00] = SSSE3_OP(pshufb),
    [0x01] = SSSE3_OP(phaddw),
    [0x02] = SSSE3_OP(phaddd),
    [0x03] = SSSE3_OP(phaddsw),
    [0x04] = SSSE3_OP(pmaddubsw),
    [0x05] = SSSE3_OP(phsubw),
    [0x06] = SSSE3_OP(phsubd),
    [0x07] = SSSE3_OP(phsubsw),
    [0x08] = SSSE3_OP(psignb),
    [0x09] = SSSE3_OP(psignw),
    [0x0a] = SSSE3_OP(psignd),
    [0x0b] = SSSE3_OP(pmulhrsw),
    [0x10] = SSE41_OP(pblendvb),
    [0x14] = SSE41_OP(blendvps),
    [0x15] = SSE41_OP(blendvpd),
    [0x17] = SSE41_OP(ptest),
    [0x1c] = SSSE3_OP(pabsb),
    [0x1d] = SSSE3_OP(pabsw),
    [0x1e] = SSSE3_OP(pabsd),
    [0x20] = SSE41_OP(pmovsxbw),
    [0x21] = SSE41_OP(pmovsxbd),
    [0x22] = SSE41_OP(pmovsxbq),
    [0x23] = SSE41_OP(pmovsxwd),
    [0x24] = SSE41_OP(pmovsxwq),
    [0x25] = SSE41_OP(pmovsxdq),
    [0x28] = SSE41_OP(pmuldq),
    [0x29] = SSE41_OP(pcmpeqq),
    [0x2a] = SSE41_SPECIAL, /* movntdqa */
    [0x2b] = SSE41_OP(packusdw),
    [0x30] = SSE41_OP(pmovzxbw),
    [0x31] = SSE41_OP(pmovzxbd),
    [0x32] = SSE41_OP(pmovzxbq),
    [0x33] = SSE41_OP(pmovzxwd),
    [0x34] = SSE41_OP(pmovzxwq),
    [0x35] = SSE41_OP(pmovzxdq),
    [0x37] = SSE42_OP(pcmpgtq),
    [0x38] = SSE41_OP(pminsb),
    [0x39] = SSE41_OP(pminsd),
    [0x3a] = SSE41_OP(pminuw),
    [0x3b] = SSE41_OP(pminud),
    [0x3c] = SSE41_OP(pmaxsb),
    [0x3d] = SSE41_OP(pmaxsd),
    [0x3e] = SSE41_OP(pmaxuw),
    [0x3f] = SSE41_OP(pmaxud),
    [0x40] = SSE41_OP(pmulld),
    [0x41] = SSE41_OP(phminposuw),
    [0xdb] = AESNI_OP(aesimc),
    [0xdc] = AESNI_OP(aesenc),
    [0xdd] = AESNI_OP(aesenclast),
    [0xde] = AESNI_OP(aesdec),
    [0xdf] = AESNI_OP(aesdeclast),
};
static const struct SSEOpHelper_eppi sse_op_table7[256] = {
    [0x08] = SSE41_OP(roundps),
    [0x09] = SSE41_OP(roundpd),
    [0x0a] = SSE41_OP(roundss),
    [0x0b] = SSE41_OP(roundsd),
    [0x0c] = SSE41_OP(blendps),
    [0x0d] = SSE41_OP(blendpd),
    [0x0e] = SSE41_OP(pblendw),
    [0x0f] = SSSE3_OP(palignr),
    [0x14] = SSE41_SPECIAL, /* pextrb */
    [0x15] = SSE41_SPECIAL, /* pextrw */
    [0x16] = SSE41_SPECIAL, /* pextrd/pextrq */
    [0x17] = SSE41_SPECIAL, /* extractps */
    [0x20] = SSE41_SPECIAL, /* pinsrb */
    [0x21] = SSE41_SPECIAL, /* insertps */
    [0x22] = SSE41_SPECIAL, /* pinsrd/pinsrq */
    [0x40] = SSE41_OP(dpps),
    [0x41] = SSE41_OP(dppd),
    [0x42] = SSE41_OP(mpsadbw),
    [0x44] = PCLMULQDQ_OP(pclmulqdq),
    [0x60] = SSE42_OP(pcmpestrm),
    [0x61] = SSE42_OP(pcmpestri),
    [0x62] = SSE42_OP(pcmpistrm),
    [0x63] = SSE42_OP(pcmpistri),
    [0xdf] = AESNI_OP(aeskeygenassist),
};
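/* Both tables are indexed by the third opcode byte: sse_op_table6
   appears to hold the 0F 38 group, whose SSEFunc_0_epp helpers take
   no immediate, while sse_op_table7 holds the 0F 3A group, whose
   SSEFunc_0_eppi helpers consume a trailing imm8 (rounding mode,
   blend mask, compare control, and so on). */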
static void gen_sse(CPUX86State *env, DisasContext *s, int b,
                    target_ulong pc_start, int rex_r)
{
    int b1, op1_offset, op2_offset, is_xmm, val;
    int modrm, mod, rm, reg;
    SSEFunc_0_epp sse_fn_epp;
    SSEFunc_0_eppi sse_fn_eppi;
    SSEFunc_0_ppi sse_fn_ppi;
    SSEFunc_0_eppt sse_fn_eppt;
    TCGMemOp ot;
    b &= 0xff;
    if (s->prefix & PREFIX_DATA)
        b1 = 1;
    else if (s->prefix & PREFIX_REPZ)
        b1 = 2;
    else if (s->prefix & PREFIX_REPNZ)
        b1 = 3;
    else
        b1 = 0;
    sse_fn_epp = sse_op_table1[b][b1];
    if (!sse_fn_epp) {
        goto illegal_op;
    }
    if ((b <= 0x5f && b >= 0x10) || b == 0xc6 || b == 0xc2) {
        is_xmm = 1;
    } else {
        if (b1 == 0) {
            /* MMX case */
            is_xmm = 0;
        } else {
            is_xmm = 1;
        }
    }
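    /* Worked example of the dispatch above: for 66 0F 58 (addpd),
       b is 0x58 and PREFIX_DATA gives b1 = 1, so sse_fn_epp becomes
       gen_helper_addpd via the SSE_FOP(add) row of sse_op_table1. */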
    /* simple MMX/SSE operation */
    if (s->flags & HF_TS_MASK) {
        gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
        return;
    }
    if (s->flags & HF_EM_MASK) {
    illegal_op:
        gen_exception(s, EXCP06_ILLOP, pc_start - s->cs_base);
        return;
    }
    if (is_xmm && !(s->flags & HF_OSFXSR_MASK))
        if ((b != 0x38 && b != 0x3a) || (s->prefix & PREFIX_DATA))
            goto illegal_op;
    if (b == 0x0e) {
        if (!(s->cpuid_ext2_features & CPUID_EXT2_3DNOW))
            goto illegal_op;
        /* femms */
        gen_helper_emms(cpu_env);
        return;
    }
    if (b == 0x77) {
        /* emms */
        gen_helper_emms(cpu_env);
        return;
    }
    /* prepare MMX state (XXX: optimize by storing fptt and fptags in
       the static cpu state) */
    if (!is_xmm) {
        gen_helper_enter_mmx(cpu_env);
    }
    modrm = cpu_ldub_code(env, s->pc++);
    reg = ((modrm >> 3) & 7);
    if (is_xmm)
        reg |= rex_r;
    mod = (modrm >> 6) & 3;
    if (sse_fn_epp == SSE_SPECIAL) {
        b |= (b1 << 8);
        switch(b) {
        case 0x0e7: /* movntq */
            if (mod == 3)
                goto illegal_op;
            gen_lea_modrm(env, s, modrm);
            gen_stq_env_A0(s, offsetof(CPUX86State, fpregs[reg].mmx));
            break;
        case 0x1e7: /* movntdq */
        case 0x02b: /* movntps */
        case 0x12b: /* movntpd */
            if (mod == 3)
                goto illegal_op;
            gen_lea_modrm(env, s, modrm);
            gen_sto_env_A0(s, offsetof(CPUX86State, xmm_regs[reg]));
            break;
        case 0x3f0: /* lddqu */
            if (mod == 3)
                goto illegal_op;
            gen_lea_modrm(env, s, modrm);
            gen_ldo_env_A0(s, offsetof(CPUX86State, xmm_regs[reg]));
            break;
        case 0x22b: /* movntss */
        case 0x32b: /* movntsd */
            if (mod == 3)
                goto illegal_op;
            gen_lea_modrm(env, s, modrm);
            if (b1 & 1) {
                gen_stq_env_A0(s, offsetof(CPUX86State, xmm_regs[reg]));
            } else {
                tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
                    xmm_regs[reg].XMM_L(0)));
                gen_op_st_v(s, MO_32, cpu_T[0], cpu_A0);
            }
            break;
        case 0x6e: /* movd mm, ea */
#ifdef TARGET_X86_64
            if (s->dflag == MO_64) {
                gen_ldst_modrm(env, s, modrm, MO_64, OR_TMP0, 0);
                tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,fpregs[reg].mmx));
            } else
#endif
            {
                gen_ldst_modrm(env, s, modrm, MO_32, OR_TMP0, 0);
                tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
                                 offsetof(CPUX86State,fpregs[reg].mmx));
                tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
                gen_helper_movl_mm_T0_mmx(cpu_ptr0, cpu_tmp2_i32);
            }
            break;
        case 0x16e: /* movd xmm, ea */
#ifdef TARGET_X86_64
            if (s->dflag == MO_64) {
                gen_ldst_modrm(env, s, modrm, MO_64, OR_TMP0, 0);
                tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
                                 offsetof(CPUX86State,xmm_regs[reg]));
                gen_helper_movq_mm_T0_xmm(cpu_ptr0, cpu_T[0]);
            } else
#endif
            {
                gen_ldst_modrm(env, s, modrm, MO_32, OR_TMP0, 0);
                tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
                                 offsetof(CPUX86State,xmm_regs[reg]));
                tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
                gen_helper_movl_mm_T0_xmm(cpu_ptr0, cpu_tmp2_i32);
            }
            break;
        case 0x6f: /* movq mm, ea */
            if (mod != 3) {
                gen_lea_modrm(env, s, modrm);
                gen_ldq_env_A0(s, offsetof(CPUX86State, fpregs[reg].mmx));
            } else {
                rm = (modrm & 7);
                tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env,
                               offsetof(CPUX86State,fpregs[rm].mmx));
                tcg_gen_st_i64(cpu_tmp1_i64, cpu_env,
                               offsetof(CPUX86State,fpregs[reg].mmx));
            }
            break;
        case 0x010: /* movups */
        case 0x110: /* movupd */
        case 0x028: /* movaps */
        case 0x128: /* movapd */
        case 0x16f: /* movdqa xmm, ea */
        case 0x26f: /* movdqu xmm, ea */
            if (mod != 3) {
                gen_lea_modrm(env, s, modrm);
                gen_ldo_env_A0(s, offsetof(CPUX86State, xmm_regs[reg]));
            } else {
                rm = (modrm & 7) | REX_B(s);
                gen_op_movo(offsetof(CPUX86State,xmm_regs[reg]),
                            offsetof(CPUX86State,xmm_regs[rm]));
            }
            break;
        case 0x210: /* movss xmm, ea */
            if (mod != 3) {
                gen_lea_modrm(env, s, modrm);
                gen_op_ld_v(s, MO_32, cpu_T[0], cpu_A0);
                tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
                tcg_gen_movi_tl(cpu_T[0], 0);
                tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)));
                tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)));
                tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)));
            } else {
                rm = (modrm & 7) | REX_B(s);
                gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)),