Bug Summary

File:target-i386/translate.c
Location:line 1900, column 13
Description:Value stored to 'havesib' is never read

Annotated Source Code

1/*
2 * i386 translation
3 *
4 * Copyright (c) 2003 Fabrice Bellard
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
10 *
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
18 */
19#include <stdarg.h>
20#include <stdlib.h>
21#include <stdio.h>
22#include <string.h>
23#include <inttypes.h>
24#include <signal.h>
25
26#include "qemu/host-utils.h"
27#include "cpu.h"
28#include "disas/disas.h"
29#include "tcg-op.h"
30
31#include "helper.h"
32#define GEN_HELPER 1
33#include "helper.h"
34
35#define PREFIX_REPZ0x01 0x01
36#define PREFIX_REPNZ0x02 0x02
37#define PREFIX_LOCK0x04 0x04
38#define PREFIX_DATA0x08 0x08
39#define PREFIX_ADR0x10 0x10
40#define PREFIX_VEX0x20 0x20
41
42#ifdef TARGET_X86_64
43#define CODE64(s)0 ((s)->code64)
44#define REX_X(s)0 ((s)->rex_x)
45#define REX_B(s)0 ((s)->rex_b)
46#else
47#define CODE64(s)0 0
48#define REX_X(s)0 0
49#define REX_B(s)0 0
50#endif
51
52#ifdef TARGET_X86_64
53# define ctztlctz32 ctz64
54# define clztlclz32 clz64
55#else
56# define ctztlctz32 ctz32
57# define clztlclz32 clz32
58#endif
59
60//#define MACRO_TEST 1
61
62/* global register indexes */
63static TCGv_ptr cpu_env;
64static TCGvTCGv_i32 cpu_A0;
65static TCGvTCGv_i32 cpu_cc_dst, cpu_cc_src, cpu_cc_src2, cpu_cc_srcT;
66static TCGv_i32 cpu_cc_op;
67static TCGvTCGv_i32 cpu_regs[CPU_NB_REGS8];
68/* local temps */
69static TCGvTCGv_i32 cpu_T[2];
70/* local register indexes (only used inside old micro ops) */
71static TCGvTCGv_i32 cpu_tmp0, cpu_tmp4;
72static TCGv_ptr cpu_ptr0, cpu_ptr1;
73static TCGv_i32 cpu_tmp2_i32, cpu_tmp3_i32;
74static TCGv_i64 cpu_tmp1_i64;
75
76static uint8_t gen_opc_cc_op[OPC_BUF_SIZE640];
77
78#include "exec/gen-icount.h"
79
80#ifdef TARGET_X86_64
81static int x86_64_hregs;
82#endif
83
84typedef struct DisasContext {
85 /* current insn context */
86 int override; /* -1 if no override */
87 int prefix;
88 TCGMemOp aflag;
89 TCGMemOp dflag;
90 target_ulong pc; /* pc = eip + cs_base */
91 int is_jmp; /* 1 = means jump (stop translation), 2 means CPU
92 static state change (stop translation) */
93 /* current block context */
94 target_ulong cs_base; /* base of CS segment */
95 int pe; /* protected mode */
96 int code32; /* 32 bit code segment */
97#ifdef TARGET_X86_64
98 int lma; /* long mode active */
99 int code64; /* 64 bit code segment */
100 int rex_x, rex_b;
101#endif
102 int vex_l; /* vex vector length */
103 int vex_v; /* vex vvvv register, without 1's compliment. */
104 int ss32; /* 32 bit stack segment */
105 CCOp cc_op; /* current CC operation */
106 bool_Bool cc_op_dirty;
107 int addseg; /* non zero if either DS/ES/SS have a non zero base */
108 int f_st; /* currently unused */
109 int vm86; /* vm86 mode */
110 int cpl;
111 int iopl;
112 int tf; /* TF cpu flag */
113 int singlestep_enabled; /* "hardware" single step enabled */
114 int jmp_opt; /* use direct block chaining for direct jumps */
115 int mem_index; /* select memory access functions */
116 uint64_t flags; /* all execution flags */
117 struct TranslationBlock *tb;
118 int popl_esp_hack; /* for correct popl with esp base handling */
119 int rip_offset; /* only used in x86_64, but left for simplicity */
120 int cpuid_features;
121 int cpuid_ext_features;
122 int cpuid_ext2_features;
123 int cpuid_ext3_features;
124 int cpuid_7_0_ebx_features;
125} DisasContext;
126
127static void gen_eob(DisasContext *s);
128static void gen_jmp(DisasContext *s, target_ulong eip);
129static void gen_jmp_tb(DisasContext *s, target_ulong eip, int tb_num);
130static void gen_op(DisasContext *s1, int op, TCGMemOp ot, int d);
131
132/* i386 arith/logic operations */
133enum {
134 OP_ADDL,
135 OP_ORL,
136 OP_ADCL,
137 OP_SBBL,
138 OP_ANDL,
139 OP_SUBL,
140 OP_XORL,
141 OP_CMPL,
142};
143
144/* i386 shift ops */
145enum {
146 OP_ROL,
147 OP_ROR,
148 OP_RCL,
149 OP_RCR,
150 OP_SHL,
151 OP_SHR,
152 OP_SHL1, /* undocumented */
153 OP_SAR = 7,
154};
155
156enum {
157 JCC_O,
158 JCC_B,
159 JCC_Z,
160 JCC_BE,
161 JCC_S,
162 JCC_P,
163 JCC_L,
164 JCC_LE,
165};
166
167enum {
168 /* I386 int registers */
169 OR_EAX, /* MUST be even numbered */
170 OR_ECX,
171 OR_EDX,
172 OR_EBX,
173 OR_ESP,
174 OR_EBP,
175 OR_ESI,
176 OR_EDI,
177
178 OR_TMP0 = 16, /* temporary operand register */
179 OR_TMP1,
180 OR_A0, /* temporary register used when doing address evaluation */
181};
182
183enum {
184 USES_CC_DST = 1,
185 USES_CC_SRC = 2,
186 USES_CC_SRC2 = 4,
187 USES_CC_SRCT = 8,
188};
189
190/* Bit set if the global variable is live after setting CC_OP to X. */
191static const uint8_t cc_op_live[CC_OP_NB] = {
192 [CC_OP_DYNAMIC] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
193 [CC_OP_EFLAGS] = USES_CC_SRC,
194 [CC_OP_MULB ... CC_OP_MULQ] = USES_CC_DST | USES_CC_SRC,
195 [CC_OP_ADDB ... CC_OP_ADDQ] = USES_CC_DST | USES_CC_SRC,
196 [CC_OP_ADCB ... CC_OP_ADCQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
197 [CC_OP_SUBB ... CC_OP_SUBQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRCT,
198 [CC_OP_SBBB ... CC_OP_SBBQ] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
199 [CC_OP_LOGICB ... CC_OP_LOGICQ] = USES_CC_DST,
200 [CC_OP_INCB ... CC_OP_INCQ] = USES_CC_DST | USES_CC_SRC,
201 [CC_OP_DECB ... CC_OP_DECQ] = USES_CC_DST | USES_CC_SRC,
202 [CC_OP_SHLB ... CC_OP_SHLQ] = USES_CC_DST | USES_CC_SRC,
203 [CC_OP_SARB ... CC_OP_SARQ] = USES_CC_DST | USES_CC_SRC,
204 [CC_OP_BMILGB ... CC_OP_BMILGQ] = USES_CC_DST | USES_CC_SRC,
205 [CC_OP_ADCX] = USES_CC_DST | USES_CC_SRC,
206 [CC_OP_ADOX] = USES_CC_SRC | USES_CC_SRC2,
207 [CC_OP_ADCOX] = USES_CC_DST | USES_CC_SRC | USES_CC_SRC2,
208 [CC_OP_CLR] = 0,
209};
210
211static void set_cc_op(DisasContext *s, CCOp op)
212{
213 int dead;
214
215 if (s->cc_op == op) {
216 return;
217 }
218
219 /* Discard CC computation that will no longer be used. */
220 dead = cc_op_live[s->cc_op] & ~cc_op_live[op];
221 if (dead & USES_CC_DST) {
222 tcg_gen_discard_tltcg_gen_discard_i32(cpu_cc_dst);
223 }
224 if (dead & USES_CC_SRC) {
225 tcg_gen_discard_tltcg_gen_discard_i32(cpu_cc_src);
226 }
227 if (dead & USES_CC_SRC2) {
228 tcg_gen_discard_tltcg_gen_discard_i32(cpu_cc_src2);
229 }
230 if (dead & USES_CC_SRCT) {
231 tcg_gen_discard_tltcg_gen_discard_i32(cpu_cc_srcT);
232 }
233
234 if (op == CC_OP_DYNAMIC) {
235 /* The DYNAMIC setting is translator only, and should never be
236 stored. Thus we always consider it clean. */
237 s->cc_op_dirty = false0;
238 } else {
239 /* Discard any computed CC_OP value (see shifts). */
240 if (s->cc_op == CC_OP_DYNAMIC) {
241 tcg_gen_discard_i32(cpu_cc_op);
242 }
243 s->cc_op_dirty = true1;
244 }
245 s->cc_op = op;
246}
247
248static void gen_update_cc_op(DisasContext *s)
249{
250 if (s->cc_op_dirty) {
251 tcg_gen_movi_i32(cpu_cc_op, s->cc_op);
252 s->cc_op_dirty = false0;
253 }
254}
255
256#ifdef TARGET_X86_64
257
258#define NB_OP_SIZES3 4
259
260#else /* !TARGET_X86_64 */
261
262#define NB_OP_SIZES3 3
263
264#endif /* !TARGET_X86_64 */
265
266#if defined(HOST_WORDS_BIGENDIAN)
267#define REG_B_OFFSET0 (sizeof(target_ulong) - 1)
268#define REG_H_OFFSET1 (sizeof(target_ulong) - 2)
269#define REG_W_OFFSET0 (sizeof(target_ulong) - 2)
270#define REG_L_OFFSET0 (sizeof(target_ulong) - 4)
271#define REG_LH_OFFSET4 (sizeof(target_ulong) - 8)
272#else
273#define REG_B_OFFSET0 0
274#define REG_H_OFFSET1 1
275#define REG_W_OFFSET0 0
276#define REG_L_OFFSET0 0
277#define REG_LH_OFFSET4 4
278#endif
279
280/* In instruction encodings for byte register accesses the
281 * register number usually indicates "low 8 bits of register N";
282 * however there are some special cases where N 4..7 indicates
283 * [AH, CH, DH, BH], ie "bits 15..8 of register N-4". Return
284 * true for this special case, false otherwise.
285 */
286static inline bool_Bool byte_reg_is_xH(int reg)
287{
288 if (reg < 4) {
289 return false0;
290 }
291#ifdef TARGET_X86_64
292 if (reg >= 8 || x86_64_hregs) {
293 return false0;
294 }
295#endif
296 return true1;
297}
298
299/* Select the size of a push/pop operation. */
300static inline TCGMemOp mo_pushpop(DisasContext *s, TCGMemOp ot)
301{
302 if (CODE64(s)0) {
303 return ot == MO_16 ? MO_16 : MO_64;
304 } else {
305 return ot;
306 }
307}
308
309/* Select only size 64 else 32. Used for SSE operand sizes. */
310static inline TCGMemOp mo_64_32(TCGMemOp ot)
311{
312#ifdef TARGET_X86_64
313 return ot == MO_64 ? MO_64 : MO_32;
314#else
315 return MO_32;
316#endif
317}
318
319/* Select size 8 if lsb of B is clear, else OT. Used for decoding
320 byte vs word opcodes. */
321static inline TCGMemOp mo_b_d(int b, TCGMemOp ot)
322{
323 return b & 1 ? ot : MO_8;
324}
325
326/* Select size 8 if lsb of B is clear, else OT capped at 32.
327 Used for decoding operand size of port opcodes. */
328static inline TCGMemOp mo_b_d32(int b, TCGMemOp ot)
329{
330 return b & 1 ? (ot == MO_16 ? MO_16 : MO_32) : MO_8;
331}
332
333static void gen_op_mov_reg_v(TCGMemOp ot, int reg, TCGvTCGv_i32 t0)
334{
335 switch(ot) {
336 case MO_8:
337 if (!byte_reg_is_xH(reg)) {
338 tcg_gen_deposit_tltcg_gen_deposit_i32(cpu_regs[reg], cpu_regs[reg], t0, 0, 8);
339 } else {
340 tcg_gen_deposit_tltcg_gen_deposit_i32(cpu_regs[reg - 4], cpu_regs[reg - 4], t0, 8, 8);
341 }
342 break;
343 case MO_16:
344 tcg_gen_deposit_tltcg_gen_deposit_i32(cpu_regs[reg], cpu_regs[reg], t0, 0, 16);
345 break;
346 case MO_32:
347 /* For x86_64, this sets the higher half of register to zero.
348 For i386, this is equivalent to a mov. */
349 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_regs[reg], t0);
350 break;
351#ifdef TARGET_X86_64
352 case MO_64:
353 tcg_gen_mov_tltcg_gen_mov_i32(cpu_regs[reg], t0);
354 break;
355#endif
356 default:
357 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 357); abort();} while (0)
;
358 }
359}
360
361static inline void gen_op_mov_v_reg(TCGMemOp ot, TCGvTCGv_i32 t0, int reg)
362{
363 if (ot == MO_8 && byte_reg_is_xH(reg)) {
364 tcg_gen_shri_tltcg_gen_shri_i32(t0, cpu_regs[reg - 4], 8);
365 tcg_gen_ext8u_tltcg_gen_ext8u_i32(t0, t0);
366 } else {
367 tcg_gen_mov_tltcg_gen_mov_i32(t0, cpu_regs[reg]);
368 }
369}
370
371static inline void gen_op_movl_A0_reg(int reg)
372{
373 tcg_gen_mov_tltcg_gen_mov_i32(cpu_A0, cpu_regs[reg]);
374}
375
376static inline void gen_op_addl_A0_im(int32_t val)
377{
378 tcg_gen_addi_tltcg_gen_addi_i32(cpu_A0, cpu_A0, val);
379#ifdef TARGET_X86_64
380 tcg_gen_andi_tltcg_gen_andi_i32(cpu_A0, cpu_A0, 0xffffffff);
381#endif
382}
383
384#ifdef TARGET_X86_64
385static inline void gen_op_addq_A0_im(int64_t val)
386{
387 tcg_gen_addi_tltcg_gen_addi_i32(cpu_A0, cpu_A0, val);
388}
389#endif
390
391static void gen_add_A0_im(DisasContext *s, int val)
392{
393#ifdef TARGET_X86_64
394 if (CODE64(s)0)
395 gen_op_addq_A0_im(val);
396 else
397#endif
398 gen_op_addl_A0_im(val);
399}
400
401static inline void gen_op_jmp_v(TCGvTCGv_i32 dest)
402{
403 tcg_gen_st_tltcg_gen_st_i32(dest, cpu_env, offsetof(CPUX86State, eip)__builtin_offsetof(CPUX86State, eip));
404}
405
406static inline void gen_op_add_reg_im(TCGMemOp size, int reg, int32_t val)
407{
408 tcg_gen_addi_tltcg_gen_addi_i32(cpu_tmp0, cpu_regs[reg], val);
409 gen_op_mov_reg_v(size, reg, cpu_tmp0);
410}
411
412static inline void gen_op_add_reg_T0(TCGMemOp size, int reg)
413{
414 tcg_gen_add_tltcg_gen_add_i32(cpu_tmp0, cpu_regs[reg], cpu_T[0]);
415 gen_op_mov_reg_v(size, reg, cpu_tmp0);
416}
417
418static inline void gen_op_addl_A0_reg_sN(int shift, int reg)
419{
420 tcg_gen_mov_tltcg_gen_mov_i32(cpu_tmp0, cpu_regs[reg]);
421 if (shift != 0)
422 tcg_gen_shli_tltcg_gen_shli_i32(cpu_tmp0, cpu_tmp0, shift);
423 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
424 /* For x86_64, this sets the higher half of register to zero.
425 For i386, this is equivalent to a nop. */
426 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_A0, cpu_A0);
427}
428
429static inline void gen_op_movl_A0_seg(int reg)
430{
431 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_A0, cpu_env, offsetof(CPUX86State, segs[reg].base)__builtin_offsetof(CPUX86State, segs[reg].base) + REG_L_OFFSET0);
432}
433
434static inline void gen_op_addl_A0_seg(DisasContext *s, int reg)
435{
436 tcg_gen_ld_tltcg_gen_ld_i32(cpu_tmp0, cpu_env, offsetof(CPUX86State, segs[reg].base)__builtin_offsetof(CPUX86State, segs[reg].base));
437#ifdef TARGET_X86_64
438 if (CODE64(s)0) {
439 tcg_gen_andi_tltcg_gen_andi_i32(cpu_A0, cpu_A0, 0xffffffff);
440 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
441 } else {
442 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
443 tcg_gen_andi_tltcg_gen_andi_i32(cpu_A0, cpu_A0, 0xffffffff);
444 }
445#else
446 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
447#endif
448}
449
450#ifdef TARGET_X86_64
451static inline void gen_op_movq_A0_seg(int reg)
452{
453 tcg_gen_ld_tltcg_gen_ld_i32(cpu_A0, cpu_env, offsetof(CPUX86State, segs[reg].base)__builtin_offsetof(CPUX86State, segs[reg].base));
454}
455
456static inline void gen_op_addq_A0_seg(int reg)
457{
458 tcg_gen_ld_tltcg_gen_ld_i32(cpu_tmp0, cpu_env, offsetof(CPUX86State, segs[reg].base)__builtin_offsetof(CPUX86State, segs[reg].base));
459 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
460}
461
462static inline void gen_op_movq_A0_reg(int reg)
463{
464 tcg_gen_mov_tltcg_gen_mov_i32(cpu_A0, cpu_regs[reg]);
465}
466
467static inline void gen_op_addq_A0_reg_sN(int shift, int reg)
468{
469 tcg_gen_mov_tltcg_gen_mov_i32(cpu_tmp0, cpu_regs[reg]);
470 if (shift != 0)
471 tcg_gen_shli_tltcg_gen_shli_i32(cpu_tmp0, cpu_tmp0, shift);
472 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
473}
474#endif
475
476static inline void gen_op_ld_v(DisasContext *s, int idx, TCGvTCGv_i32 t0, TCGvTCGv_i32 a0)
477{
478 tcg_gen_qemu_ld_tltcg_gen_qemu_ld_i32(t0, a0, s->mem_index, idx | MO_LE);
479}
480
481static inline void gen_op_st_v(DisasContext *s, int idx, TCGvTCGv_i32 t0, TCGvTCGv_i32 a0)
482{
483 tcg_gen_qemu_st_tltcg_gen_qemu_st_i32(t0, a0, s->mem_index, idx | MO_LE);
484}
485
486static inline void gen_op_st_rm_T0_A0(DisasContext *s, int idx, int d)
487{
488 if (d == OR_TMP0) {
489 gen_op_st_v(s, idx, cpu_T[0], cpu_A0);
490 } else {
491 gen_op_mov_reg_v(idx, d, cpu_T[0]);
492 }
493}
494
495static inline void gen_jmp_im(target_ulong pc)
496{
497 tcg_gen_movi_tltcg_gen_movi_i32(cpu_tmp0, pc);
498 gen_op_jmp_v(cpu_tmp0);
499}
500
501static inline void gen_string_movl_A0_ESI(DisasContext *s)
502{
503 int override;
504
505 override = s->override;
506 switch (s->aflag) {
507#ifdef TARGET_X86_64
508 case MO_64:
509 if (override >= 0) {
510 gen_op_movq_A0_seg(override);
511 gen_op_addq_A0_reg_sN(0, R_ESI6);
512 } else {
513 gen_op_movq_A0_reg(R_ESI6);
514 }
515 break;
516#endif
517 case MO_32:
518 /* 32 bit address */
519 if (s->addseg && override < 0)
520 override = R_DS3;
521 if (override >= 0) {
522 gen_op_movl_A0_seg(override);
523 gen_op_addl_A0_reg_sN(0, R_ESI6);
524 } else {
525 gen_op_movl_A0_reg(R_ESI6);
526 }
527 break;
528 case MO_16:
529 /* 16 address, always override */
530 if (override < 0)
531 override = R_DS3;
532 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_regs[R_ESI6]);
533 gen_op_addl_A0_seg(s, override);
534 break;
535 default:
536 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 536); abort();} while (0)
;
537 }
538}
539
540static inline void gen_string_movl_A0_EDI(DisasContext *s)
541{
542 switch (s->aflag) {
543#ifdef TARGET_X86_64
544 case MO_64:
545 gen_op_movq_A0_reg(R_EDI7);
546 break;
547#endif
548 case MO_32:
549 if (s->addseg) {
550 gen_op_movl_A0_seg(R_ES0);
551 gen_op_addl_A0_reg_sN(0, R_EDI7);
552 } else {
553 gen_op_movl_A0_reg(R_EDI7);
554 }
555 break;
556 case MO_16:
557 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_regs[R_EDI7]);
558 gen_op_addl_A0_seg(s, R_ES0);
559 break;
560 default:
561 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 561); abort();} while (0)
;
562 }
563}
564
565static inline void gen_op_movl_T0_Dshift(TCGMemOp ot)
566{
567 tcg_gen_ld32s_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State, df)__builtin_offsetof(CPUX86State, df));
568 tcg_gen_shli_tltcg_gen_shli_i32(cpu_T[0], cpu_T[0], ot);
569};
570
571static TCGvTCGv_i32 gen_ext_tl(TCGvTCGv_i32 dst, TCGvTCGv_i32 src, TCGMemOp size, bool_Bool sign)
572{
573 switch (size) {
574 case MO_8:
575 if (sign) {
576 tcg_gen_ext8s_tltcg_gen_ext8s_i32(dst, src);
577 } else {
578 tcg_gen_ext8u_tltcg_gen_ext8u_i32(dst, src);
579 }
580 return dst;
581 case MO_16:
582 if (sign) {
583 tcg_gen_ext16s_tltcg_gen_ext16s_i32(dst, src);
584 } else {
585 tcg_gen_ext16u_tltcg_gen_ext16u_i32(dst, src);
586 }
587 return dst;
588#ifdef TARGET_X86_64
589 case MO_32:
590 if (sign) {
591 tcg_gen_ext32s_tltcg_gen_mov_i32(dst, src);
592 } else {
593 tcg_gen_ext32u_tltcg_gen_mov_i32(dst, src);
594 }
595 return dst;
596#endif
597 default:
598 return src;
599 }
600}
601
602static void gen_extu(TCGMemOp ot, TCGvTCGv_i32 reg)
603{
604 gen_ext_tl(reg, reg, ot, false0);
605}
606
607static void gen_exts(TCGMemOp ot, TCGvTCGv_i32 reg)
608{
609 gen_ext_tl(reg, reg, ot, true1);
610}
611
612static inline void gen_op_jnz_ecx(TCGMemOp size, int label1)
613{
614 tcg_gen_mov_tltcg_gen_mov_i32(cpu_tmp0, cpu_regs[R_ECX1]);
615 gen_extu(size, cpu_tmp0);
616 tcg_gen_brcondi_tltcg_gen_brcondi_i32(TCG_COND_NE, cpu_tmp0, 0, label1);
617}
618
619static inline void gen_op_jz_ecx(TCGMemOp size, int label1)
620{
621 tcg_gen_mov_tltcg_gen_mov_i32(cpu_tmp0, cpu_regs[R_ECX1]);
622 gen_extu(size, cpu_tmp0);
623 tcg_gen_brcondi_tltcg_gen_brcondi_i32(TCG_COND_EQ, cpu_tmp0, 0, label1);
624}
625
626static void gen_helper_in_func(TCGMemOp ot, TCGvTCGv_i32 v, TCGv_i32 n)
627{
628 switch (ot) {
629 case MO_8:
630 gen_helper_inb(v, n);
631 break;
632 case MO_16:
633 gen_helper_inw(v, n);
634 break;
635 case MO_32:
636 gen_helper_inl(v, n);
637 break;
638 default:
639 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 639); abort();} while (0)
;
640 }
641}
642
643static void gen_helper_out_func(TCGMemOp ot, TCGv_i32 v, TCGv_i32 n)
644{
645 switch (ot) {
646 case MO_8:
647 gen_helper_outb(v, n);
648 break;
649 case MO_16:
650 gen_helper_outw(v, n);
651 break;
652 case MO_32:
653 gen_helper_outl(v, n);
654 break;
655 default:
656 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 656); abort();} while (0)
;
657 }
658}
659
660static void gen_check_io(DisasContext *s, TCGMemOp ot, target_ulong cur_eip,
661 uint32_t svm_flags)
662{
663 int state_saved;
664 target_ulong next_eip;
665
666 state_saved = 0;
667 if (s->pe && (s->cpl > s->iopl || s->vm86)) {
668 gen_update_cc_op(s);
669 gen_jmp_im(cur_eip);
670 state_saved = 1;
671 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
672 switch (ot) {
673 case MO_8:
674 gen_helper_check_iob(cpu_env, cpu_tmp2_i32);
675 break;
676 case MO_16:
677 gen_helper_check_iow(cpu_env, cpu_tmp2_i32);
678 break;
679 case MO_32:
680 gen_helper_check_iol(cpu_env, cpu_tmp2_i32);
681 break;
682 default:
683 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 683); abort();} while (0)
;
684 }
685 }
686 if(s->flags & HF_SVMI_MASK(1 << 21)) {
687 if (!state_saved) {
688 gen_update_cc_op(s);
689 gen_jmp_im(cur_eip);
690 }
691 svm_flags |= (1 << (4 + ot));
692 next_eip = s->pc - s->cs_base;
693 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
694 gen_helper_svm_check_io(cpu_env, cpu_tmp2_i32,
695 tcg_const_i32(svm_flags),
696 tcg_const_i32(next_eip - cur_eip));
697 }
698}
699
700static inline void gen_movs(DisasContext *s, TCGMemOp ot)
701{
702 gen_string_movl_A0_ESI(s);
703 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
704 gen_string_movl_A0_EDI(s);
705 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
706 gen_op_movl_T0_Dshift(ot);
707 gen_op_add_reg_T0(s->aflag, R_ESI6);
708 gen_op_add_reg_T0(s->aflag, R_EDI7);
709}
710
711static void gen_op_update1_cc(void)
712{
713 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
714}
715
716static void gen_op_update2_cc(void)
717{
718 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_T[1]);
719 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
720}
721
722static void gen_op_update3_cc(TCGvTCGv_i32 reg)
723{
724 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src2, reg);
725 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_T[1]);
726 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
727}
728
729static inline void gen_op_testl_T0_T1_cc(void)
730{
731 tcg_gen_and_tltcg_gen_and_i32(cpu_cc_dst, cpu_T[0], cpu_T[1]);
732}
733
734static void gen_op_update_neg_cc(void)
735{
736 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
737 tcg_gen_neg_tltcg_gen_neg_i32(cpu_cc_src, cpu_T[0]);
738 tcg_gen_movi_tltcg_gen_movi_i32(cpu_cc_srcT, 0);
739}
740
741/* compute all eflags to cc_src */
742static void gen_compute_eflags(DisasContext *s)
743{
744 TCGvTCGv_i32 zero, dst, src1, src2;
745 int live, dead;
746
747 if (s->cc_op == CC_OP_EFLAGS) {
748 return;
749 }
750 if (s->cc_op == CC_OP_CLR) {
751 tcg_gen_movi_tltcg_gen_movi_i32(cpu_cc_src, CC_Z0x0040);
752 set_cc_op(s, CC_OP_EFLAGS);
753 return;
754 }
755
756 TCGV_UNUSED(zero)zero = __extension__ ({ TCGv_i32 make_tcgv_tmp = {-1}; make_tcgv_tmp
;})
;
757 dst = cpu_cc_dst;
758 src1 = cpu_cc_src;
759 src2 = cpu_cc_src2;
760
761 /* Take care to not read values that are not live. */
762 live = cc_op_live[s->cc_op] & ~USES_CC_SRCT;
763 dead = live ^ (USES_CC_DST | USES_CC_SRC | USES_CC_SRC2);
764 if (dead) {
765 zero = tcg_const_tltcg_const_i32(0);
766 if (dead & USES_CC_DST) {
767 dst = zero;
768 }
769 if (dead & USES_CC_SRC) {
770 src1 = zero;
771 }
772 if (dead & USES_CC_SRC2) {
773 src2 = zero;
774 }
775 }
776
777 gen_update_cc_op(s);
778 gen_helper_cc_compute_all(cpu_cc_src, dst, src1, src2, cpu_cc_op);
779 set_cc_op(s, CC_OP_EFLAGS);
780
781 if (dead) {
782 tcg_temp_freetcg_temp_free_i32(zero);
783 }
784}
785
786typedef struct CCPrepare {
787 TCGCond cond;
788 TCGvTCGv_i32 reg;
789 TCGvTCGv_i32 reg2;
790 target_ulong imm;
791 target_ulong mask;
792 bool_Bool use_reg2;
793 bool_Bool no_setcond;
794} CCPrepare;
795
796/* compute eflags.C to reg */
797static CCPrepare gen_prepare_eflags_c(DisasContext *s, TCGvTCGv_i32 reg)
798{
799 TCGvTCGv_i32 t0, t1;
800 int size, shift;
801
802 switch (s->cc_op) {
803 case CC_OP_SUBB ... CC_OP_SUBQ:
804 /* (DATA_TYPE)CC_SRCT < (DATA_TYPE)CC_SRC */
805 size = s->cc_op - CC_OP_SUBB;
806 t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false0);
807 /* If no temporary was used, be careful not to alias t1 and t0. */
808 t0 = TCGV_EQUAL(t1, cpu_cc_src)(((t1).i32) == ((cpu_cc_src).i32)) ? cpu_tmp0 : reg;
809 tcg_gen_mov_tltcg_gen_mov_i32(t0, cpu_cc_srcT);
810 gen_extu(size, t0);
811 goto add_sub;
812
813 case CC_OP_ADDB ... CC_OP_ADDQ:
814 /* (DATA_TYPE)CC_DST < (DATA_TYPE)CC_SRC */
815 size = s->cc_op - CC_OP_ADDB;
816 t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false0);
817 t0 = gen_ext_tl(reg, cpu_cc_dst, size, false0);
818 add_sub:
819 return (CCPrepare) { .cond = TCG_COND_LTU, .reg = t0,
820 .reg2 = t1, .mask = -1, .use_reg2 = true1 };
821
822 case CC_OP_LOGICB ... CC_OP_LOGICQ:
823 case CC_OP_CLR:
824 return (CCPrepare) { .cond = TCG_COND_NEVER, .mask = -1 };
825
826 case CC_OP_INCB ... CC_OP_INCQ:
827 case CC_OP_DECB ... CC_OP_DECQ:
828 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
829 .mask = -1, .no_setcond = true1 };
830
831 case CC_OP_SHLB ... CC_OP_SHLQ:
832 /* (CC_SRC >> (DATA_BITS - 1)) & 1 */
833 size = s->cc_op - CC_OP_SHLB;
834 shift = (8 << size) - 1;
835 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
836 .mask = (target_ulong)1 << shift };
837
838 case CC_OP_MULB ... CC_OP_MULQ:
839 return (CCPrepare) { .cond = TCG_COND_NE,
840 .reg = cpu_cc_src, .mask = -1 };
841
842 case CC_OP_BMILGB ... CC_OP_BMILGQ:
843 size = s->cc_op - CC_OP_BMILGB;
844 t0 = gen_ext_tl(reg, cpu_cc_src, size, false0);
845 return (CCPrepare) { .cond = TCG_COND_EQ, .reg = t0, .mask = -1 };
846
847 case CC_OP_ADCX:
848 case CC_OP_ADCOX:
849 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_dst,
850 .mask = -1, .no_setcond = true1 };
851
852 case CC_OP_EFLAGS:
853 case CC_OP_SARB ... CC_OP_SARQ:
854 /* CC_SRC & 1 */
855 return (CCPrepare) { .cond = TCG_COND_NE,
856 .reg = cpu_cc_src, .mask = CC_C0x0001 };
857
858 default:
859 /* The need to compute only C from CC_OP_DYNAMIC is important
860 in efficiently implementing e.g. INC at the start of a TB. */
861 gen_update_cc_op(s);
862 gen_helper_cc_compute_c(reg, cpu_cc_dst, cpu_cc_src,
863 cpu_cc_src2, cpu_cc_op);
864 return (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
865 .mask = -1, .no_setcond = true1 };
866 }
867}
868
869/* compute eflags.P to reg */
870static CCPrepare gen_prepare_eflags_p(DisasContext *s, TCGvTCGv_i32 reg)
871{
872 gen_compute_eflags(s);
873 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
874 .mask = CC_P0x0004 };
875}
876
877/* compute eflags.S to reg */
878static CCPrepare gen_prepare_eflags_s(DisasContext *s, TCGvTCGv_i32 reg)
879{
880 switch (s->cc_op) {
881 case CC_OP_DYNAMIC:
882 gen_compute_eflags(s);
883 /* FALLTHRU */
884 case CC_OP_EFLAGS:
885 case CC_OP_ADCX:
886 case CC_OP_ADOX:
887 case CC_OP_ADCOX:
888 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
889 .mask = CC_S0x0080 };
890 case CC_OP_CLR:
891 return (CCPrepare) { .cond = TCG_COND_NEVER, .mask = -1 };
892 default:
893 {
894 TCGMemOp size = (s->cc_op - CC_OP_ADDB) & 3;
895 TCGvTCGv_i32 t0 = gen_ext_tl(reg, cpu_cc_dst, size, true1);
896 return (CCPrepare) { .cond = TCG_COND_LT, .reg = t0, .mask = -1 };
897 }
898 }
899}
900
901/* compute eflags.O to reg */
902static CCPrepare gen_prepare_eflags_o(DisasContext *s, TCGvTCGv_i32 reg)
903{
904 switch (s->cc_op) {
905 case CC_OP_ADOX:
906 case CC_OP_ADCOX:
907 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src2,
908 .mask = -1, .no_setcond = true1 };
909 case CC_OP_CLR:
910 return (CCPrepare) { .cond = TCG_COND_NEVER, .mask = -1 };
911 default:
912 gen_compute_eflags(s);
913 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
914 .mask = CC_O0x0800 };
915 }
916}
917
918/* compute eflags.Z to reg */
919static CCPrepare gen_prepare_eflags_z(DisasContext *s, TCGvTCGv_i32 reg)
920{
921 switch (s->cc_op) {
922 case CC_OP_DYNAMIC:
923 gen_compute_eflags(s);
924 /* FALLTHRU */
925 case CC_OP_EFLAGS:
926 case CC_OP_ADCX:
927 case CC_OP_ADOX:
928 case CC_OP_ADCOX:
929 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
930 .mask = CC_Z0x0040 };
931 case CC_OP_CLR:
932 return (CCPrepare) { .cond = TCG_COND_ALWAYS, .mask = -1 };
933 default:
934 {
935 TCGMemOp size = (s->cc_op - CC_OP_ADDB) & 3;
936 TCGvTCGv_i32 t0 = gen_ext_tl(reg, cpu_cc_dst, size, false0);
937 return (CCPrepare) { .cond = TCG_COND_EQ, .reg = t0, .mask = -1 };
938 }
939 }
940}
941
942/* perform a conditional store into register 'reg' according to jump opcode
943 value 'b'. In the fast case, T0 is guaranted not to be used. */
944static CCPrepare gen_prepare_cc(DisasContext *s, int b, TCGvTCGv_i32 reg)
945{
946 int inv, jcc_op, cond;
947 TCGMemOp size;
948 CCPrepare cc;
949 TCGvTCGv_i32 t0;
950
951 inv = b & 1;
952 jcc_op = (b >> 1) & 7;
953
954 switch (s->cc_op) {
955 case CC_OP_SUBB ... CC_OP_SUBQ:
956 /* We optimize relational operators for the cmp/jcc case. */
957 size = s->cc_op - CC_OP_SUBB;
958 switch (jcc_op) {
959 case JCC_BE:
960 tcg_gen_mov_tltcg_gen_mov_i32(cpu_tmp4, cpu_cc_srcT);
961 gen_extu(size, cpu_tmp4);
962 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false0);
963 cc = (CCPrepare) { .cond = TCG_COND_LEU, .reg = cpu_tmp4,
964 .reg2 = t0, .mask = -1, .use_reg2 = true1 };
965 break;
966
967 case JCC_L:
968 cond = TCG_COND_LT;
969 goto fast_jcc_l;
970 case JCC_LE:
971 cond = TCG_COND_LE;
972 fast_jcc_l:
973 tcg_gen_mov_tltcg_gen_mov_i32(cpu_tmp4, cpu_cc_srcT);
974 gen_exts(size, cpu_tmp4);
975 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, true1);
976 cc = (CCPrepare) { .cond = cond, .reg = cpu_tmp4,
977 .reg2 = t0, .mask = -1, .use_reg2 = true1 };
978 break;
979
980 default:
981 goto slow_jcc;
982 }
983 break;
984
985 default:
986 slow_jcc:
987 /* This actually generates good code for JC, JZ and JS. */
988 switch (jcc_op) {
989 case JCC_O:
990 cc = gen_prepare_eflags_o(s, reg);
991 break;
992 case JCC_B:
993 cc = gen_prepare_eflags_c(s, reg);
994 break;
995 case JCC_Z:
996 cc = gen_prepare_eflags_z(s, reg);
997 break;
998 case JCC_BE:
999 gen_compute_eflags(s);
1000 cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1001 .mask = CC_Z0x0040 | CC_C0x0001 };
1002 break;
1003 case JCC_S:
1004 cc = gen_prepare_eflags_s(s, reg);
1005 break;
1006 case JCC_P:
1007 cc = gen_prepare_eflags_p(s, reg);
1008 break;
1009 case JCC_L:
1010 gen_compute_eflags(s);
1011 if (TCGV_EQUAL(reg, cpu_cc_src)(((reg).i32) == ((cpu_cc_src).i32))) {
1012 reg = cpu_tmp0;
1013 }
1014 tcg_gen_shri_tltcg_gen_shri_i32(reg, cpu_cc_src, 4); /* CC_O -> CC_S */
1015 tcg_gen_xor_tltcg_gen_xor_i32(reg, reg, cpu_cc_src);
1016 cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
1017 .mask = CC_S0x0080 };
1018 break;
1019 default:
1020 case JCC_LE:
1021 gen_compute_eflags(s);
1022 if (TCGV_EQUAL(reg, cpu_cc_src)(((reg).i32) == ((cpu_cc_src).i32))) {
1023 reg = cpu_tmp0;
1024 }
1025 tcg_gen_shri_tltcg_gen_shri_i32(reg, cpu_cc_src, 4); /* CC_O -> CC_S */
1026 tcg_gen_xor_tltcg_gen_xor_i32(reg, reg, cpu_cc_src);
1027 cc = (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
1028 .mask = CC_S0x0080 | CC_Z0x0040 };
1029 break;
1030 }
1031 break;
1032 }
1033
1034 if (inv) {
1035 cc.cond = tcg_invert_cond(cc.cond);
1036 }
1037 return cc;
1038}
1039
1040static void gen_setcc1(DisasContext *s, int b, TCGvTCGv_i32 reg)
1041{
1042 CCPrepare cc = gen_prepare_cc(s, b, reg);
1043
1044 if (cc.no_setcond) {
1045 if (cc.cond == TCG_COND_EQ) {
1046 tcg_gen_xori_tltcg_gen_xori_i32(reg, cc.reg, 1);
1047 } else {
1048 tcg_gen_mov_tltcg_gen_mov_i32(reg, cc.reg);
1049 }
1050 return;
1051 }
1052
1053 if (cc.cond == TCG_COND_NE && !cc.use_reg2 && cc.imm == 0 &&
1054 cc.mask != 0 && (cc.mask & (cc.mask - 1)) == 0) {
1055 tcg_gen_shri_tltcg_gen_shri_i32(reg, cc.reg, ctztlctz32(cc.mask));
1056 tcg_gen_andi_tltcg_gen_andi_i32(reg, reg, 1);
1057 return;
1058 }
1059 if (cc.mask != -1) {
1060 tcg_gen_andi_tltcg_gen_andi_i32(reg, cc.reg, cc.mask);
1061 cc.reg = reg;
1062 }
1063 if (cc.use_reg2) {
1064 tcg_gen_setcond_tltcg_gen_setcond_i32(cc.cond, reg, cc.reg, cc.reg2);
1065 } else {
1066 tcg_gen_setcondi_tltcg_gen_setcondi_i32(cc.cond, reg, cc.reg, cc.imm);
1067 }
1068}
1069
1070static inline void gen_compute_eflags_c(DisasContext *s, TCGvTCGv_i32 reg)
1071{
1072 gen_setcc1(s, JCC_B << 1, reg);
1073}
1074
1075/* generate a conditional jump to label 'l1' according to jump opcode
1076 value 'b'. In the fast case, T0 is guaranted not to be used. */
1077static inline void gen_jcc1_noeob(DisasContext *s, int b, int l1)
1078{
1079 CCPrepare cc = gen_prepare_cc(s, b, cpu_T[0]);
1080
1081 if (cc.mask != -1) {
1082 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[0], cc.reg, cc.mask);
1083 cc.reg = cpu_T[0];
1084 }
1085 if (cc.use_reg2) {
1086 tcg_gen_brcond_tltcg_gen_brcond_i32(cc.cond, cc.reg, cc.reg2, l1);
1087 } else {
1088 tcg_gen_brcondi_tltcg_gen_brcondi_i32(cc.cond, cc.reg, cc.imm, l1);
1089 }
1090}
1091
1092/* Generate a conditional jump to label 'l1' according to jump opcode
1093 value 'b'. In the fast case, T0 is guaranted not to be used.
1094 A translation block must end soon. */
1095static inline void gen_jcc1(DisasContext *s, int b, int l1)
1096{
1097 CCPrepare cc = gen_prepare_cc(s, b, cpu_T[0]);
1098
1099 gen_update_cc_op(s);
1100 if (cc.mask != -1) {
1101 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[0], cc.reg, cc.mask);
1102 cc.reg = cpu_T[0];
1103 }
1104 set_cc_op(s, CC_OP_DYNAMIC);
1105 if (cc.use_reg2) {
1106 tcg_gen_brcond_tltcg_gen_brcond_i32(cc.cond, cc.reg, cc.reg2, l1);
1107 } else {
1108 tcg_gen_brcondi_tltcg_gen_brcondi_i32(cc.cond, cc.reg, cc.imm, l1);
1109 }
1110}
1111
1112/* XXX: does not work with gdbstub "ice" single step - not a
1113 serious problem */
1114static int gen_jz_ecx_string(DisasContext *s, target_ulong next_eip)
1115{
1116 int l1, l2;
1117
1118 l1 = gen_new_label();
1119 l2 = gen_new_label();
1120 gen_op_jnz_ecx(s->aflag, l1);
1121 gen_set_label(l2);
1122 gen_jmp_tb(s, next_eip, 1);
1123 gen_set_label(l1);
1124 return l2;
1125}
1126
1127static inline void gen_stos(DisasContext *s, TCGMemOp ot)
1128{
1129 gen_op_mov_v_reg(MO_32, cpu_T[0], R_EAX0);
1130 gen_string_movl_A0_EDI(s);
1131 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
1132 gen_op_movl_T0_Dshift(ot);
1133 gen_op_add_reg_T0(s->aflag, R_EDI7);
1134}
1135
1136static inline void gen_lods(DisasContext *s, TCGMemOp ot)
1137{
1138 gen_string_movl_A0_ESI(s);
1139 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
1140 gen_op_mov_reg_v(ot, R_EAX0, cpu_T[0]);
1141 gen_op_movl_T0_Dshift(ot);
1142 gen_op_add_reg_T0(s->aflag, R_ESI6);
1143}
1144
1145static inline void gen_scas(DisasContext *s, TCGMemOp ot)
1146{
1147 gen_string_movl_A0_EDI(s);
1148 gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
1149 gen_op(s, OP_CMPL, ot, R_EAX0);
1150 gen_op_movl_T0_Dshift(ot);
1151 gen_op_add_reg_T0(s->aflag, R_EDI7);
1152}
1153
1154static inline void gen_cmps(DisasContext *s, TCGMemOp ot)
1155{
1156 gen_string_movl_A0_EDI(s);
1157 gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
1158 gen_string_movl_A0_ESI(s);
1159 gen_op(s, OP_CMPL, ot, OR_TMP0);
1160 gen_op_movl_T0_Dshift(ot);
1161 gen_op_add_reg_T0(s->aflag, R_ESI6);
1162 gen_op_add_reg_T0(s->aflag, R_EDI7);
1163}
1164
1165static inline void gen_ins(DisasContext *s, TCGMemOp ot)
1166{
1167 if (use_icount)
1168 gen_io_start();
1169 gen_string_movl_A0_EDI(s);
1170 /* Note: we must do this dummy write first to be restartable in
1171 case of page fault. */
1172 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], 0);
1173 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
1174 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_regs[R_EDX2]);
1175 tcg_gen_andi_i32(cpu_tmp2_i32, cpu_tmp2_i32, 0xffff);
1176 gen_helper_in_func(ot, cpu_T[0], cpu_tmp2_i32);
1177 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
1178 gen_op_movl_T0_Dshift(ot);
1179 gen_op_add_reg_T0(s->aflag, R_EDI7);
1180 if (use_icount)
1181 gen_io_end();
1182}
1183
1184static inline void gen_outs(DisasContext *s, TCGMemOp ot)
1185{
1186 if (use_icount)
1187 gen_io_start();
1188 gen_string_movl_A0_ESI(s);
1189 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
1190
1191 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_regs[R_EDX2]);
1192 tcg_gen_andi_i32(cpu_tmp2_i32, cpu_tmp2_i32, 0xffff);
1193 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp3_i32, cpu_T[0]);
1194 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
1195
1196 gen_op_movl_T0_Dshift(ot);
1197 gen_op_add_reg_T0(s->aflag, R_ESI6);
1198 if (use_icount)
1199 gen_io_end();
1200}
1201
1202/* same method as Valgrind : we generate jumps to current or next
1203 instruction */
1204#define GEN_REPZ(op)static inline void gen_repz_op(DisasContext *s, TCGMemOp ot, target_ulong
cur_eip, target_ulong next_eip) { int l2; gen_update_cc_op(s
); l2 = gen_jz_ecx_string(s, next_eip); gen_op(s, ot); gen_op_add_reg_im
(s->aflag, 1, -1); if (!s->jmp_opt) gen_op_jz_ecx(s->
aflag, l2); gen_jmp(s, cur_eip); }
\
1205static inline void gen_repz_ ## op(DisasContext *s, TCGMemOp ot, \
1206 target_ulong cur_eip, target_ulong next_eip) \
1207{ \
1208 int l2;\
1209 gen_update_cc_op(s); \
1210 l2 = gen_jz_ecx_string(s, next_eip); \
1211 gen_ ## op(s, ot); \
1212 gen_op_add_reg_im(s->aflag, R_ECX1, -1); \
1213 /* a loop would cause two single step exceptions if ECX = 1 \
1214 before rep string_insn */ \
1215 if (!s->jmp_opt) \
1216 gen_op_jz_ecx(s->aflag, l2); \
1217 gen_jmp(s, cur_eip); \
1218}
1219
1220#define GEN_REPZ2(op)static inline void gen_repz_op(DisasContext *s, TCGMemOp ot, target_ulong
cur_eip, target_ulong next_eip, int nz) { int l2; gen_update_cc_op
(s); l2 = gen_jz_ecx_string(s, next_eip); gen_op(s, ot); gen_op_add_reg_im
(s->aflag, 1, -1); gen_update_cc_op(s); gen_jcc1(s, (JCC_Z
<< 1) | (nz ^ 1), l2); if (!s->jmp_opt) gen_op_jz_ecx
(s->aflag, l2); gen_jmp(s, cur_eip); }
\
1221static inline void gen_repz_ ## op(DisasContext *s, TCGMemOp ot, \
1222 target_ulong cur_eip, \
1223 target_ulong next_eip, \
1224 int nz) \
1225{ \
1226 int l2;\
1227 gen_update_cc_op(s); \
1228 l2 = gen_jz_ecx_string(s, next_eip); \
1229 gen_ ## op(s, ot); \
1230 gen_op_add_reg_im(s->aflag, R_ECX1, -1); \
1231 gen_update_cc_op(s); \
1232 gen_jcc1(s, (JCC_Z << 1) | (nz ^ 1), l2); \
1233 if (!s->jmp_opt) \
1234 gen_op_jz_ecx(s->aflag, l2); \
1235 gen_jmp(s, cur_eip); \
1236}
1237
1238GEN_REPZ(movs)static inline void gen_repz_movs(DisasContext *s, TCGMemOp ot
, target_ulong cur_eip, target_ulong next_eip) { int l2; gen_update_cc_op
(s); l2 = gen_jz_ecx_string(s, next_eip); gen_movs(s, ot); gen_op_add_reg_im
(s->aflag, 1, -1); if (!s->jmp_opt) gen_op_jz_ecx(s->
aflag, l2); gen_jmp(s, cur_eip); }
1239GEN_REPZ(stos)static inline void gen_repz_stos(DisasContext *s, TCGMemOp ot
, target_ulong cur_eip, target_ulong next_eip) { int l2; gen_update_cc_op
(s); l2 = gen_jz_ecx_string(s, next_eip); gen_stos(s, ot); gen_op_add_reg_im
(s->aflag, 1, -1); if (!s->jmp_opt) gen_op_jz_ecx(s->
aflag, l2); gen_jmp(s, cur_eip); }
1240GEN_REPZ(lods)static inline void gen_repz_lods(DisasContext *s, TCGMemOp ot
, target_ulong cur_eip, target_ulong next_eip) { int l2; gen_update_cc_op
(s); l2 = gen_jz_ecx_string(s, next_eip); gen_lods(s, ot); gen_op_add_reg_im
(s->aflag, 1, -1); if (!s->jmp_opt) gen_op_jz_ecx(s->
aflag, l2); gen_jmp(s, cur_eip); }
1241GEN_REPZ(ins)static inline void gen_repz_ins(DisasContext *s, TCGMemOp ot,
target_ulong cur_eip, target_ulong next_eip) { int l2; gen_update_cc_op
(s); l2 = gen_jz_ecx_string(s, next_eip); gen_ins(s, ot); gen_op_add_reg_im
(s->aflag, 1, -1); if (!s->jmp_opt) gen_op_jz_ecx(s->
aflag, l2); gen_jmp(s, cur_eip); }
1242GEN_REPZ(outs)static inline void gen_repz_outs(DisasContext *s, TCGMemOp ot
, target_ulong cur_eip, target_ulong next_eip) { int l2; gen_update_cc_op
(s); l2 = gen_jz_ecx_string(s, next_eip); gen_outs(s, ot); gen_op_add_reg_im
(s->aflag, 1, -1); if (!s->jmp_opt) gen_op_jz_ecx(s->
aflag, l2); gen_jmp(s, cur_eip); }
1243GEN_REPZ2(scas)static inline void gen_repz_scas(DisasContext *s, TCGMemOp ot
, target_ulong cur_eip, target_ulong next_eip, int nz) { int l2
; gen_update_cc_op(s); l2 = gen_jz_ecx_string(s, next_eip); gen_scas
(s, ot); gen_op_add_reg_im(s->aflag, 1, -1); gen_update_cc_op
(s); gen_jcc1(s, (JCC_Z << 1) | (nz ^ 1), l2); if (!s->
jmp_opt) gen_op_jz_ecx(s->aflag, l2); gen_jmp(s, cur_eip);
}
1244GEN_REPZ2(cmps)static inline void gen_repz_cmps(DisasContext *s, TCGMemOp ot
, target_ulong cur_eip, target_ulong next_eip, int nz) { int l2
; gen_update_cc_op(s); l2 = gen_jz_ecx_string(s, next_eip); gen_cmps
(s, ot); gen_op_add_reg_im(s->aflag, 1, -1); gen_update_cc_op
(s); gen_jcc1(s, (JCC_Z << 1) | (nz ^ 1), l2); if (!s->
jmp_opt) gen_op_jz_ecx(s->aflag, l2); gen_jmp(s, cur_eip);
}
1245
1246static void gen_helper_fp_arith_ST0_FT0(int op)
1247{
1248 switch (op) {
1249 case 0:
1250 gen_helper_fadd_ST0_FT0(cpu_env);
1251 break;
1252 case 1:
1253 gen_helper_fmul_ST0_FT0(cpu_env);
1254 break;
1255 case 2:
1256 gen_helper_fcom_ST0_FT0(cpu_env);
1257 break;
1258 case 3:
1259 gen_helper_fcom_ST0_FT0(cpu_env);
1260 break;
1261 case 4:
1262 gen_helper_fsub_ST0_FT0(cpu_env);
1263 break;
1264 case 5:
1265 gen_helper_fsubr_ST0_FT0(cpu_env);
1266 break;
1267 case 6:
1268 gen_helper_fdiv_ST0_FT0(cpu_env);
1269 break;
1270 case 7:
1271 gen_helper_fdivr_ST0_FT0(cpu_env);
1272 break;
1273 }
1274}
1275
1276/* NOTE the exception in "r" op ordering */
1277static void gen_helper_fp_arith_STN_ST0(int op, int opreg)
1278{
1279 TCGv_i32 tmp = tcg_const_i32(opreg);
1280 switch (op) {
1281 case 0:
1282 gen_helper_fadd_STN_ST0(cpu_env, tmp);
1283 break;
1284 case 1:
1285 gen_helper_fmul_STN_ST0(cpu_env, tmp);
1286 break;
1287 case 4:
1288 gen_helper_fsubr_STN_ST0(cpu_env, tmp);
1289 break;
1290 case 5:
1291 gen_helper_fsub_STN_ST0(cpu_env, tmp);
1292 break;
1293 case 6:
1294 gen_helper_fdivr_STN_ST0(cpu_env, tmp);
1295 break;
1296 case 7:
1297 gen_helper_fdiv_STN_ST0(cpu_env, tmp);
1298 break;
1299 }
1300}
1301
1302/* if d == OR_TMP0, it means memory operand (address in A0) */
1303static void gen_op(DisasContext *s1, int op, TCGMemOp ot, int d)
1304{
1305 if (d != OR_TMP0) {
1306 gen_op_mov_v_reg(ot, cpu_T[0], d);
1307 } else {
1308 gen_op_ld_v(s1, ot, cpu_T[0], cpu_A0);
1309 }
1310 switch(op) {
1311 case OP_ADCL:
1312 gen_compute_eflags_c(s1, cpu_tmp4);
1313 tcg_gen_add_tltcg_gen_add_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1314 tcg_gen_add_tltcg_gen_add_i32(cpu_T[0], cpu_T[0], cpu_tmp4);
1315 gen_op_st_rm_T0_A0(s1, ot, d);
1316 gen_op_update3_cc(cpu_tmp4);
1317 set_cc_op(s1, CC_OP_ADCB + ot);
1318 break;
1319 case OP_SBBL:
1320 gen_compute_eflags_c(s1, cpu_tmp4);
1321 tcg_gen_sub_tltcg_gen_sub_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1322 tcg_gen_sub_tltcg_gen_sub_i32(cpu_T[0], cpu_T[0], cpu_tmp4);
1323 gen_op_st_rm_T0_A0(s1, ot, d);
1324 gen_op_update3_cc(cpu_tmp4);
1325 set_cc_op(s1, CC_OP_SBBB + ot);
1326 break;
1327 case OP_ADDL:
1328 tcg_gen_add_tltcg_gen_add_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1329 gen_op_st_rm_T0_A0(s1, ot, d);
1330 gen_op_update2_cc();
1331 set_cc_op(s1, CC_OP_ADDB + ot);
1332 break;
1333 case OP_SUBL:
1334 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_srcT, cpu_T[0]);
1335 tcg_gen_sub_tltcg_gen_sub_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1336 gen_op_st_rm_T0_A0(s1, ot, d);
1337 gen_op_update2_cc();
1338 set_cc_op(s1, CC_OP_SUBB + ot);
1339 break;
1340 default:
1341 case OP_ANDL:
1342 tcg_gen_and_tltcg_gen_and_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1343 gen_op_st_rm_T0_A0(s1, ot, d);
1344 gen_op_update1_cc();
1345 set_cc_op(s1, CC_OP_LOGICB + ot);
1346 break;
1347 case OP_ORL:
1348 tcg_gen_or_tltcg_gen_or_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1349 gen_op_st_rm_T0_A0(s1, ot, d);
1350 gen_op_update1_cc();
1351 set_cc_op(s1, CC_OP_LOGICB + ot);
1352 break;
1353 case OP_XORL:
1354 tcg_gen_xor_tltcg_gen_xor_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1355 gen_op_st_rm_T0_A0(s1, ot, d);
1356 gen_op_update1_cc();
1357 set_cc_op(s1, CC_OP_LOGICB + ot);
1358 break;
1359 case OP_CMPL:
1360 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_T[1]);
1361 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_srcT, cpu_T[0]);
1362 tcg_gen_sub_tltcg_gen_sub_i32(cpu_cc_dst, cpu_T[0], cpu_T[1]);
1363 set_cc_op(s1, CC_OP_SUBB + ot);
1364 break;
1365 }
1366}
1367
1368/* if d == OR_TMP0, it means memory operand (address in A0) */
1369static void gen_inc(DisasContext *s1, TCGMemOp ot, int d, int c)
1370{
1371 if (d != OR_TMP0) {
1372 gen_op_mov_v_reg(ot, cpu_T[0], d);
1373 } else {
1374 gen_op_ld_v(s1, ot, cpu_T[0], cpu_A0);
1375 }
1376 gen_compute_eflags_c(s1, cpu_cc_src);
1377 if (c > 0) {
1378 tcg_gen_addi_tltcg_gen_addi_i32(cpu_T[0], cpu_T[0], 1);
1379 set_cc_op(s1, CC_OP_INCB + ot);
1380 } else {
1381 tcg_gen_addi_tltcg_gen_addi_i32(cpu_T[0], cpu_T[0], -1);
1382 set_cc_op(s1, CC_OP_DECB + ot);
1383 }
1384 gen_op_st_rm_T0_A0(s1, ot, d);
1385 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
1386}
1387
1388static void gen_shift_flags(DisasContext *s, TCGMemOp ot, TCGvTCGv_i32 result,
1389 TCGvTCGv_i32 shm1, TCGvTCGv_i32 count, bool_Bool is_right)
1390{
1391 TCGv_i32 z32, s32, oldop;
1392 TCGvTCGv_i32 z_tl;
1393
1394 /* Store the results into the CC variables. If we know that the
1395 variable must be dead, store unconditionally. Otherwise we'll
1396 need to not disrupt the current contents. */
1397 z_tl = tcg_const_tltcg_const_i32(0);
1398 if (cc_op_live[s->cc_op] & USES_CC_DST) {
1399 tcg_gen_movcond_tltcg_gen_movcond_i32(TCG_COND_NE, cpu_cc_dst, count, z_tl,
1400 result, cpu_cc_dst);
1401 } else {
1402 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, result);
1403 }
1404 if (cc_op_live[s->cc_op] & USES_CC_SRC) {
1405 tcg_gen_movcond_tltcg_gen_movcond_i32(TCG_COND_NE, cpu_cc_src, count, z_tl,
1406 shm1, cpu_cc_src);
1407 } else {
1408 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, shm1);
1409 }
1410 tcg_temp_freetcg_temp_free_i32(z_tl);
1411
1412 /* Get the two potential CC_OP values into temporaries. */
1413 tcg_gen_movi_i32(cpu_tmp2_i32, (is_right ? CC_OP_SARB : CC_OP_SHLB) + ot);
1414 if (s->cc_op == CC_OP_DYNAMIC) {
1415 oldop = cpu_cc_op;
1416 } else {
1417 tcg_gen_movi_i32(cpu_tmp3_i32, s->cc_op);
1418 oldop = cpu_tmp3_i32;
1419 }
1420
1421 /* Conditionally store the CC_OP value. */
1422 z32 = tcg_const_i32(0);
1423 s32 = tcg_temp_new_i32();
1424 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(s32, count);
1425 tcg_gen_movcond_i32(TCG_COND_NE, cpu_cc_op, s32, z32, cpu_tmp2_i32, oldop);
1426 tcg_temp_free_i32(z32);
1427 tcg_temp_free_i32(s32);
1428
1429 /* The CC_OP value is no longer predictable. */
1430 set_cc_op(s, CC_OP_DYNAMIC);
1431}
1432
1433static void gen_shift_rm_T1(DisasContext *s, TCGMemOp ot, int op1,
1434 int is_right, int is_arith)
1435{
1436 target_ulong mask = (ot == MO_64 ? 0x3f : 0x1f);
1437
1438 /* load */
1439 if (op1 == OR_TMP0) {
1440 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
1441 } else {
1442 gen_op_mov_v_reg(ot, cpu_T[0], op1);
1443 }
1444
1445 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[1], cpu_T[1], mask);
1446 tcg_gen_subi_tltcg_gen_subi_i32(cpu_tmp0, cpu_T[1], 1);
1447
1448 if (is_right) {
1449 if (is_arith) {
1450 gen_exts(ot, cpu_T[0]);
1451 tcg_gen_sar_tltcg_gen_sar_i32(cpu_tmp0, cpu_T[0], cpu_tmp0);
1452 tcg_gen_sar_tltcg_gen_sar_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1453 } else {
1454 gen_extu(ot, cpu_T[0]);
1455 tcg_gen_shr_tltcg_gen_shr_i32(cpu_tmp0, cpu_T[0], cpu_tmp0);
1456 tcg_gen_shr_tltcg_gen_shr_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1457 }
1458 } else {
1459 tcg_gen_shl_tltcg_gen_shl_i32(cpu_tmp0, cpu_T[0], cpu_tmp0);
1460 tcg_gen_shl_tltcg_gen_shl_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1461 }
1462
1463 /* store */
1464 gen_op_st_rm_T0_A0(s, ot, op1);
1465
1466 gen_shift_flags(s, ot, cpu_T[0], cpu_tmp0, cpu_T[1], is_right);
1467}
1468
1469static void gen_shift_rm_im(DisasContext *s, TCGMemOp ot, int op1, int op2,
1470 int is_right, int is_arith)
1471{
1472 int mask = (ot == MO_64 ? 0x3f : 0x1f);
1473
1474 /* load */
1475 if (op1 == OR_TMP0)
1476 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
1477 else
1478 gen_op_mov_v_reg(ot, cpu_T[0], op1);
1479
1480 op2 &= mask;
1481 if (op2 != 0) {
1482 if (is_right) {
1483 if (is_arith) {
1484 gen_exts(ot, cpu_T[0]);
1485 tcg_gen_sari_tltcg_gen_sari_i32(cpu_tmp4, cpu_T[0], op2 - 1);
1486 tcg_gen_sari_tltcg_gen_sari_i32(cpu_T[0], cpu_T[0], op2);
1487 } else {
1488 gen_extu(ot, cpu_T[0]);
1489 tcg_gen_shri_tltcg_gen_shri_i32(cpu_tmp4, cpu_T[0], op2 - 1);
1490 tcg_gen_shri_tltcg_gen_shri_i32(cpu_T[0], cpu_T[0], op2);
1491 }
1492 } else {
1493 tcg_gen_shli_tltcg_gen_shli_i32(cpu_tmp4, cpu_T[0], op2 - 1);
1494 tcg_gen_shli_tltcg_gen_shli_i32(cpu_T[0], cpu_T[0], op2);
1495 }
1496 }
1497
1498 /* store */
1499 gen_op_st_rm_T0_A0(s, ot, op1);
1500
1501 /* update eflags if non zero shift */
1502 if (op2 != 0) {
1503 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_tmp4);
1504 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
1505 set_cc_op(s, (is_right ? CC_OP_SARB : CC_OP_SHLB) + ot);
1506 }
1507}
1508
1509static inline void tcg_gen_lshift(TCGvTCGv_i32 ret, TCGvTCGv_i32 arg1, target_long arg2)
1510{
1511 if (arg2 >= 0)
1512 tcg_gen_shli_tltcg_gen_shli_i32(ret, arg1, arg2);
1513 else
1514 tcg_gen_shri_tltcg_gen_shri_i32(ret, arg1, -arg2);
1515}
1516
1517static void gen_rot_rm_T1(DisasContext *s, TCGMemOp ot, int op1, int is_right)
1518{
1519 target_ulong mask = (ot == MO_64 ? 0x3f : 0x1f);
1520 TCGv_i32 t0, t1;
1521
1522 /* load */
1523 if (op1 == OR_TMP0) {
1524 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
1525 } else {
1526 gen_op_mov_v_reg(ot, cpu_T[0], op1);
1527 }
1528
1529 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[1], cpu_T[1], mask);
1530
1531 switch (ot) {
1532 case MO_8:
1533 /* Replicate the 8-bit input so that a 32-bit rotate works. */
1534 tcg_gen_ext8u_tltcg_gen_ext8u_i32(cpu_T[0], cpu_T[0]);
1535 tcg_gen_muli_tltcg_gen_muli_i32(cpu_T[0], cpu_T[0], 0x01010101);
1536 goto do_long;
1537 case MO_16:
1538 /* Replicate the 16-bit input so that a 32-bit rotate works. */
1539 tcg_gen_deposit_tltcg_gen_deposit_i32(cpu_T[0], cpu_T[0], cpu_T[0], 16, 16);
1540 goto do_long;
1541 do_long:
1542#ifdef TARGET_X86_64
1543 case MO_32:
1544 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
1545 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp3_i32, cpu_T[1]);
1546 if (is_right) {
1547 tcg_gen_rotr_i32(cpu_tmp2_i32, cpu_tmp2_i32, cpu_tmp3_i32);
1548 } else {
1549 tcg_gen_rotl_i32(cpu_tmp2_i32, cpu_tmp2_i32, cpu_tmp3_i32);
1550 }
1551 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_T[0], cpu_tmp2_i32);
1552 break;
1553#endif
1554 default:
1555 if (is_right) {
1556 tcg_gen_rotr_tltcg_gen_rotr_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1557 } else {
1558 tcg_gen_rotl_tltcg_gen_rotl_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1559 }
1560 break;
1561 }
1562
1563 /* store */
1564 gen_op_st_rm_T0_A0(s, ot, op1);
1565
1566 /* We'll need the flags computed into CC_SRC. */
1567 gen_compute_eflags(s);
1568
1569 /* The value that was "rotated out" is now present at the other end
1570 of the word. Compute C into CC_DST and O into CC_SRC2. Note that
1571 since we've computed the flags into CC_SRC, these variables are
1572 currently dead. */
1573 if (is_right) {
1574 tcg_gen_shri_tltcg_gen_shri_i32(cpu_cc_src2, cpu_T[0], mask - 1);
1575 tcg_gen_shri_tltcg_gen_shri_i32(cpu_cc_dst, cpu_T[0], mask);
1576 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_dst, cpu_cc_dst, 1);
1577 } else {
1578 tcg_gen_shri_tltcg_gen_shri_i32(cpu_cc_src2, cpu_T[0], mask);
1579 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_dst, cpu_T[0], 1);
1580 }
1581 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_src2, cpu_cc_src2, 1);
1582 tcg_gen_xor_tltcg_gen_xor_i32(cpu_cc_src2, cpu_cc_src2, cpu_cc_dst);
1583
1584 /* Now conditionally store the new CC_OP value. If the shift count
1585 is 0 we keep the CC_OP_EFLAGS setting so that only CC_SRC is live.
1586 Otherwise reuse CC_OP_ADCOX which have the C and O flags split out
1587 exactly as we computed above. */
1588 t0 = tcg_const_i32(0);
1589 t1 = tcg_temp_new_i32();
1590 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(t1, cpu_T[1]);
1591 tcg_gen_movi_i32(cpu_tmp2_i32, CC_OP_ADCOX);
1592 tcg_gen_movi_i32(cpu_tmp3_i32, CC_OP_EFLAGS);
1593 tcg_gen_movcond_i32(TCG_COND_NE, cpu_cc_op, t1, t0,
1594 cpu_tmp2_i32, cpu_tmp3_i32);
1595 tcg_temp_free_i32(t0);
1596 tcg_temp_free_i32(t1);
1597
1598 /* The CC_OP value is no longer predictable. */
1599 set_cc_op(s, CC_OP_DYNAMIC);
1600}
1601
1602static void gen_rot_rm_im(DisasContext *s, TCGMemOp ot, int op1, int op2,
1603 int is_right)
1604{
1605 int mask = (ot == MO_64 ? 0x3f : 0x1f);
1606 int shift;
1607
1608 /* load */
1609 if (op1 == OR_TMP0) {
1610 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
1611 } else {
1612 gen_op_mov_v_reg(ot, cpu_T[0], op1);
1613 }
1614
1615 op2 &= mask;
1616 if (op2 != 0) {
1617 switch (ot) {
1618#ifdef TARGET_X86_64
1619 case MO_32:
1620 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
1621 if (is_right) {
1622 tcg_gen_rotri_i32(cpu_tmp2_i32, cpu_tmp2_i32, op2);
1623 } else {
1624 tcg_gen_rotli_i32(cpu_tmp2_i32, cpu_tmp2_i32, op2);
1625 }
1626 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_T[0], cpu_tmp2_i32);
1627 break;
1628#endif
1629 default:
1630 if (is_right) {
1631 tcg_gen_rotri_tltcg_gen_rotri_i32(cpu_T[0], cpu_T[0], op2);
1632 } else {
1633 tcg_gen_rotli_tltcg_gen_rotli_i32(cpu_T[0], cpu_T[0], op2);
1634 }
1635 break;
1636 case MO_8:
1637 mask = 7;
1638 goto do_shifts;
1639 case MO_16:
1640 mask = 15;
1641 do_shifts:
1642 shift = op2 & mask;
1643 if (is_right) {
1644 shift = mask + 1 - shift;
1645 }
1646 gen_extu(ot, cpu_T[0]);
1647 tcg_gen_shli_tltcg_gen_shli_i32(cpu_tmp0, cpu_T[0], shift);
1648 tcg_gen_shri_tltcg_gen_shri_i32(cpu_T[0], cpu_T[0], mask + 1 - shift);
1649 tcg_gen_or_tltcg_gen_or_i32(cpu_T[0], cpu_T[0], cpu_tmp0);
1650 break;
1651 }
1652 }
1653
1654 /* store */
1655 gen_op_st_rm_T0_A0(s, ot, op1);
1656
1657 if (op2 != 0) {
1658 /* Compute the flags into CC_SRC. */
1659 gen_compute_eflags(s);
1660
1661 /* The value that was "rotated out" is now present at the other end
1662 of the word. Compute C into CC_DST and O into CC_SRC2. Note that
1663 since we've computed the flags into CC_SRC, these variables are
1664 currently dead. */
1665 if (is_right) {
1666 tcg_gen_shri_tltcg_gen_shri_i32(cpu_cc_src2, cpu_T[0], mask - 1);
1667 tcg_gen_shri_tltcg_gen_shri_i32(cpu_cc_dst, cpu_T[0], mask);
1668 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_dst, cpu_cc_dst, 1);
1669 } else {
1670 tcg_gen_shri_tltcg_gen_shri_i32(cpu_cc_src2, cpu_T[0], mask);
1671 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_dst, cpu_T[0], 1);
1672 }
1673 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_src2, cpu_cc_src2, 1);
1674 tcg_gen_xor_tltcg_gen_xor_i32(cpu_cc_src2, cpu_cc_src2, cpu_cc_dst);
1675 set_cc_op(s, CC_OP_ADCOX);
1676 }
1677}
1678
1679/* XXX: add faster immediate = 1 case */
1680static void gen_rotc_rm_T1(DisasContext *s, TCGMemOp ot, int op1,
1681 int is_right)
1682{
1683 gen_compute_eflags(s);
1684 assert(s->cc_op == CC_OP_EFLAGS)((s->cc_op == CC_OP_EFLAGS) ? (void) (0) : __assert_fail (
"s->cc_op == CC_OP_EFLAGS", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 1684, __PRETTY_FUNCTION__))
;
1685
1686 /* load */
1687 if (op1 == OR_TMP0)
1688 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
1689 else
1690 gen_op_mov_v_reg(ot, cpu_T[0], op1);
1691
1692 if (is_right) {
1693 switch (ot) {
1694 case MO_8:
1695 gen_helper_rcrb(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1696 break;
1697 case MO_16:
1698 gen_helper_rcrw(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1699 break;
1700 case MO_32:
1701 gen_helper_rcrl(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1702 break;
1703#ifdef TARGET_X86_64
1704 case MO_64:
1705 gen_helper_rcrq(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1706 break;
1707#endif
1708 default:
1709 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 1709); abort();} while (0)
;
1710 }
1711 } else {
1712 switch (ot) {
1713 case MO_8:
1714 gen_helper_rclb(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1715 break;
1716 case MO_16:
1717 gen_helper_rclw(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1718 break;
1719 case MO_32:
1720 gen_helper_rcll(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1721 break;
1722#ifdef TARGET_X86_64
1723 case MO_64:
1724 gen_helper_rclq(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1725 break;
1726#endif
1727 default:
1728 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 1728); abort();} while (0)
;
1729 }
1730 }
1731 /* store */
1732 gen_op_st_rm_T0_A0(s, ot, op1);
1733}
1734
1735/* XXX: add faster immediate case */
1736static void gen_shiftd_rm_T1(DisasContext *s, TCGMemOp ot, int op1,
1737 bool_Bool is_right, TCGvTCGv_i32 count_in)
1738{
1739 target_ulong mask = (ot == MO_64 ? 63 : 31);
1740 TCGvTCGv_i32 count;
1741
1742 /* load */
1743 if (op1 == OR_TMP0) {
1744 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
1745 } else {
1746 gen_op_mov_v_reg(ot, cpu_T[0], op1);
1747 }
1748
1749 count = tcg_temp_new()tcg_temp_new_i32();
1750 tcg_gen_andi_tltcg_gen_andi_i32(count, count_in, mask);
1751
1752 switch (ot) {
1753 case MO_16:
1754 /* Note: we implement the Intel behaviour for shift count > 16.
1755 This means "shrdw C, B, A" shifts A:B:A >> C. Build the B:A
1756 portion by constructing it as a 32-bit value. */
1757 if (is_right) {
1758 tcg_gen_deposit_tltcg_gen_deposit_i32(cpu_tmp0, cpu_T[0], cpu_T[1], 16, 16);
1759 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[1], cpu_T[0]);
1760 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[0], cpu_tmp0);
1761 } else {
1762 tcg_gen_deposit_tltcg_gen_deposit_i32(cpu_T[1], cpu_T[0], cpu_T[1], 16, 16);
1763 }
1764 /* FALLTHRU */
1765#ifdef TARGET_X86_64
1766 case MO_32:
1767 /* Concatenate the two 32-bit values and use a 64-bit shift. */
1768 tcg_gen_subi_tltcg_gen_subi_i32(cpu_tmp0, count, 1);
1769 if (is_right) {
1770 tcg_gen_concat_tl_i64tcg_gen_concat_i32_i64(cpu_T[0], cpu_T[0], cpu_T[1]);
1771 tcg_gen_shr_i64(cpu_tmp0, cpu_T[0], cpu_tmp0);
1772 tcg_gen_shr_i64(cpu_T[0], cpu_T[0], count);
1773 } else {
1774 tcg_gen_concat_tl_i64tcg_gen_concat_i32_i64(cpu_T[0], cpu_T[1], cpu_T[0]);
1775 tcg_gen_shl_i64(cpu_tmp0, cpu_T[0], cpu_tmp0);
1776 tcg_gen_shl_i64(cpu_T[0], cpu_T[0], count);
1777 tcg_gen_shri_i64(cpu_tmp0, cpu_tmp0, 32);
1778 tcg_gen_shri_i64(cpu_T[0], cpu_T[0], 32);
1779 }
1780 break;
1781#endif
1782 default:
1783 tcg_gen_subi_tltcg_gen_subi_i32(cpu_tmp0, count, 1);
1784 if (is_right) {
1785 tcg_gen_shr_tltcg_gen_shr_i32(cpu_tmp0, cpu_T[0], cpu_tmp0);
1786
1787 tcg_gen_subfi_tltcg_gen_subfi_i32(cpu_tmp4, mask + 1, count);
1788 tcg_gen_shr_tltcg_gen_shr_i32(cpu_T[0], cpu_T[0], count);
1789 tcg_gen_shl_tltcg_gen_shl_i32(cpu_T[1], cpu_T[1], cpu_tmp4);
1790 } else {
1791 tcg_gen_shl_tltcg_gen_shl_i32(cpu_tmp0, cpu_T[0], cpu_tmp0);
1792 if (ot == MO_16) {
1793 /* Only needed if count > 16, for Intel behaviour. */
1794 tcg_gen_subfi_tltcg_gen_subfi_i32(cpu_tmp4, 33, count);
1795 tcg_gen_shr_tltcg_gen_shr_i32(cpu_tmp4, cpu_T[1], cpu_tmp4);
1796 tcg_gen_or_tltcg_gen_or_i32(cpu_tmp0, cpu_tmp0, cpu_tmp4);
1797 }
1798
1799 tcg_gen_subfi_tltcg_gen_subfi_i32(cpu_tmp4, mask + 1, count);
1800 tcg_gen_shl_tltcg_gen_shl_i32(cpu_T[0], cpu_T[0], count);
1801 tcg_gen_shr_tltcg_gen_shr_i32(cpu_T[1], cpu_T[1], cpu_tmp4);
1802 }
1803 tcg_gen_movi_tltcg_gen_movi_i32(cpu_tmp4, 0);
1804 tcg_gen_movcond_tltcg_gen_movcond_i32(TCG_COND_EQ, cpu_T[1], count, cpu_tmp4,
1805 cpu_tmp4, cpu_T[1]);
1806 tcg_gen_or_tltcg_gen_or_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
1807 break;
1808 }
1809
1810 /* store */
1811 gen_op_st_rm_T0_A0(s, ot, op1);
1812
1813 gen_shift_flags(s, ot, cpu_T[0], cpu_tmp0, count, is_right);
1814 tcg_temp_freetcg_temp_free_i32(count);
1815}
1816
1817static void gen_shift(DisasContext *s1, int op, TCGMemOp ot, int d, int s)
1818{
1819 if (s != OR_TMP1)
1820 gen_op_mov_v_reg(ot, cpu_T[1], s);
1821 switch(op) {
1822 case OP_ROL:
1823 gen_rot_rm_T1(s1, ot, d, 0);
1824 break;
1825 case OP_ROR:
1826 gen_rot_rm_T1(s1, ot, d, 1);
1827 break;
1828 case OP_SHL:
1829 case OP_SHL1:
1830 gen_shift_rm_T1(s1, ot, d, 0, 0);
1831 break;
1832 case OP_SHR:
1833 gen_shift_rm_T1(s1, ot, d, 1, 0);
1834 break;
1835 case OP_SAR:
1836 gen_shift_rm_T1(s1, ot, d, 1, 1);
1837 break;
1838 case OP_RCL:
1839 gen_rotc_rm_T1(s1, ot, d, 0);
1840 break;
1841 case OP_RCR:
1842 gen_rotc_rm_T1(s1, ot, d, 1);
1843 break;
1844 }
1845}
1846
1847static void gen_shifti(DisasContext *s1, int op, TCGMemOp ot, int d, int c)
1848{
1849 switch(op) {
1850 case OP_ROL:
1851 gen_rot_rm_im(s1, ot, d, c, 0);
1852 break;
1853 case OP_ROR:
1854 gen_rot_rm_im(s1, ot, d, c, 1);
1855 break;
1856 case OP_SHL:
1857 case OP_SHL1:
1858 gen_shift_rm_im(s1, ot, d, c, 0, 0);
1859 break;
1860 case OP_SHR:
1861 gen_shift_rm_im(s1, ot, d, c, 1, 0);
1862 break;
1863 case OP_SAR:
1864 gen_shift_rm_im(s1, ot, d, c, 1, 1);
1865 break;
1866 default:
1867 /* currently not optimized */
1868 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], c);
1869 gen_shift(s1, op, ot, d, OR_TMP1);
1870 break;
1871 }
1872}
1873
1874static void gen_lea_modrm(CPUX86State *env, DisasContext *s, int modrm)
1875{
1876 target_long disp;
1877 int havesib;
1878 int base;
1879 int index;
1880 int scale;
1881 int mod, rm, code, override, must_add_seg;
1882 TCGvTCGv_i32 sum;
1883
1884 override = s->override;
1885 must_add_seg = s->addseg;
1886 if (override >= 0)
1887 must_add_seg = 1;
1888 mod = (modrm >> 6) & 3;
1889 rm = modrm & 7;
1890
1891 switch (s->aflag) {
1892 case MO_64:
1893 case MO_32:
1894 havesib = 0;
1895 base = rm;
1896 index = -1;
1897 scale = 0;
1898
1899 if (base == 4) {
1900 havesib = 1;
Value stored to 'havesib' is never read
1901 code = cpu_ldub_code(env, s->pc++);
1902 scale = (code >> 6) & 3;
1903 index = ((code >> 3) & 7) | REX_X(s)0;
1904 if (index == 4) {
1905 index = -1; /* no index */
1906 }
1907 base = (code & 7);
1908 }
1909 base |= REX_B(s)0;
1910
1911 switch (mod) {
1912 case 0:
1913 if ((base & 7) == 5) {
1914 base = -1;
1915 disp = (int32_t)cpu_ldl_code(env, s->pc);
1916 s->pc += 4;
1917 if (CODE64(s)0 && !havesib) {
1918 disp += s->pc + s->rip_offset;
1919 }
1920 } else {
1921 disp = 0;
1922 }
1923 break;
1924 case 1:
1925 disp = (int8_t)cpu_ldub_code(env, s->pc++);
1926 break;
1927 default:
1928 case 2:
1929 disp = (int32_t)cpu_ldl_code(env, s->pc);
1930 s->pc += 4;
1931 break;
1932 }
1933
1934 /* For correct popl handling with esp. */
1935 if (base == R_ESP4 && s->popl_esp_hack) {
1936 disp += s->popl_esp_hack;
1937 }
1938
1939 /* Compute the address, with a minimum number of TCG ops. */
1940 TCGV_UNUSED(sum)sum = __extension__ ({ TCGv_i32 make_tcgv_tmp = {-1}; make_tcgv_tmp
;})
;
1941 if (index >= 0) {
1942 if (scale == 0) {
1943 sum = cpu_regs[index];
1944 } else {
1945 tcg_gen_shli_tltcg_gen_shli_i32(cpu_A0, cpu_regs[index], scale);
1946 sum = cpu_A0;
1947 }
1948 if (base >= 0) {
1949 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, sum, cpu_regs[base]);
1950 sum = cpu_A0;
1951 }
1952 } else if (base >= 0) {
1953 sum = cpu_regs[base];
1954 }
1955 if (TCGV_IS_UNUSED(sum)(((sum).i32) == -1)) {
1956 tcg_gen_movi_tltcg_gen_movi_i32(cpu_A0, disp);
1957 } else {
1958 tcg_gen_addi_tltcg_gen_addi_i32(cpu_A0, sum, disp);
1959 }
1960
1961 if (must_add_seg) {
1962 if (override < 0) {
1963 if (base == R_EBP5 || base == R_ESP4) {
1964 override = R_SS2;
1965 } else {
1966 override = R_DS3;
1967 }
1968 }
1969
1970 tcg_gen_ld_tltcg_gen_ld_i32(cpu_tmp0, cpu_env,
1971 offsetof(CPUX86State, segs[override].base)__builtin_offsetof(CPUX86State, segs[override].base));
1972 if (CODE64(s)0) {
1973 if (s->aflag == MO_32) {
1974 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_A0, cpu_A0);
1975 }
1976 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
1977 return;
1978 }
1979
1980 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
1981 }
1982
1983 if (s->aflag == MO_32) {
1984 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_A0, cpu_A0);
1985 }
1986 break;
1987
1988 case MO_16:
1989 switch (mod) {
1990 case 0:
1991 if (rm == 6) {
1992 disp = cpu_lduw_code(env, s->pc);
1993 s->pc += 2;
1994 tcg_gen_movi_tltcg_gen_movi_i32(cpu_A0, disp);
1995 rm = 0; /* avoid SS override */
1996 goto no_rm;
1997 } else {
1998 disp = 0;
1999 }
2000 break;
2001 case 1:
2002 disp = (int8_t)cpu_ldub_code(env, s->pc++);
2003 break;
2004 default:
2005 case 2:
2006 disp = (int16_t)cpu_lduw_code(env, s->pc);
2007 s->pc += 2;
2008 break;
2009 }
2010
2011 sum = cpu_A0;
2012 switch (rm) {
2013 case 0:
2014 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_regs[R_EBX3], cpu_regs[R_ESI6]);
2015 break;
2016 case 1:
2017 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_regs[R_EBX3], cpu_regs[R_EDI7]);
2018 break;
2019 case 2:
2020 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_regs[R_EBP5], cpu_regs[R_ESI6]);
2021 break;
2022 case 3:
2023 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_regs[R_EBP5], cpu_regs[R_EDI7]);
2024 break;
2025 case 4:
2026 sum = cpu_regs[R_ESI6];
2027 break;
2028 case 5:
2029 sum = cpu_regs[R_EDI7];
2030 break;
2031 case 6:
2032 sum = cpu_regs[R_EBP5];
2033 break;
2034 default:
2035 case 7:
2036 sum = cpu_regs[R_EBX3];
2037 break;
2038 }
2039 tcg_gen_addi_tltcg_gen_addi_i32(cpu_A0, sum, disp);
2040 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_A0);
2041 no_rm:
2042 if (must_add_seg) {
2043 if (override < 0) {
2044 if (rm == 2 || rm == 3 || rm == 6) {
2045 override = R_SS2;
2046 } else {
2047 override = R_DS3;
2048 }
2049 }
2050 gen_op_addl_A0_seg(s, override);
2051 }
2052 break;
2053
2054 default:
2055 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 2055); abort();} while (0)
;
2056 }
2057}
2058
2059static void gen_nop_modrm(CPUX86State *env, DisasContext *s, int modrm)
2060{
2061 int mod, rm, base, code;
2062
2063 mod = (modrm >> 6) & 3;
2064 if (mod == 3)
2065 return;
2066 rm = modrm & 7;
2067
2068 switch (s->aflag) {
2069 case MO_64:
2070 case MO_32:
2071 base = rm;
2072
2073 if (base == 4) {
2074 code = cpu_ldub_code(env, s->pc++);
2075 base = (code & 7);
2076 }
2077
2078 switch (mod) {
2079 case 0:
2080 if (base == 5) {
2081 s->pc += 4;
2082 }
2083 break;
2084 case 1:
2085 s->pc++;
2086 break;
2087 default:
2088 case 2:
2089 s->pc += 4;
2090 break;
2091 }
2092 break;
2093
2094 case MO_16:
2095 switch (mod) {
2096 case 0:
2097 if (rm == 6) {
2098 s->pc += 2;
2099 }
2100 break;
2101 case 1:
2102 s->pc++;
2103 break;
2104 default:
2105 case 2:
2106 s->pc += 2;
2107 break;
2108 }
2109 break;
2110
2111 default:
2112 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 2112); abort();} while (0)
;
2113 }
2114}
2115
2116/* used for LEA and MOV AX, mem */
2117static void gen_add_A0_ds_seg(DisasContext *s)
2118{
2119 int override, must_add_seg;
2120 must_add_seg = s->addseg;
2121 override = R_DS3;
2122 if (s->override >= 0) {
2123 override = s->override;
2124 must_add_seg = 1;
2125 }
2126 if (must_add_seg) {
2127#ifdef TARGET_X86_64
2128 if (CODE64(s)0) {
2129 gen_op_addq_A0_seg(override);
2130 } else
2131#endif
2132 {
2133 gen_op_addl_A0_seg(s, override);
2134 }
2135 }
2136}
2137
2138/* generate modrm memory load or store of 'reg'. TMP0 is used if reg ==
2139 OR_TMP0 */
2140static void gen_ldst_modrm(CPUX86State *env, DisasContext *s, int modrm,
2141 TCGMemOp ot, int reg, int is_store)
2142{
2143 int mod, rm;
2144
2145 mod = (modrm >> 6) & 3;
2146 rm = (modrm & 7) | REX_B(s)0;
2147 if (mod == 3) {
2148 if (is_store) {
2149 if (reg != OR_TMP0)
2150 gen_op_mov_v_reg(ot, cpu_T[0], reg);
2151 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
2152 } else {
2153 gen_op_mov_v_reg(ot, cpu_T[0], rm);
2154 if (reg != OR_TMP0)
2155 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
2156 }
2157 } else {
2158 gen_lea_modrm(env, s, modrm);
2159 if (is_store) {
2160 if (reg != OR_TMP0)
2161 gen_op_mov_v_reg(ot, cpu_T[0], reg);
2162 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
2163 } else {
2164 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
2165 if (reg != OR_TMP0)
2166 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
2167 }
2168 }
2169}
2170
2171static inline uint32_t insn_get(CPUX86State *env, DisasContext *s, TCGMemOp ot)
2172{
2173 uint32_t ret;
2174
2175 switch (ot) {
2176 case MO_8:
2177 ret = cpu_ldub_code(env, s->pc);
2178 s->pc++;
2179 break;
2180 case MO_16:
2181 ret = cpu_lduw_code(env, s->pc);
2182 s->pc += 2;
2183 break;
2184 case MO_32:
2185#ifdef TARGET_X86_64
2186 case MO_64:
2187#endif
2188 ret = cpu_ldl_code(env, s->pc);
2189 s->pc += 4;
2190 break;
2191 default:
2192 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 2192); abort();} while (0)
;
2193 }
2194 return ret;
2195}
2196
2197static inline int insn_const_size(TCGMemOp ot)
2198{
2199 if (ot <= MO_32) {
2200 return 1 << ot;
2201 } else {
2202 return 4;
2203 }
2204}
2205
2206static inline void gen_goto_tb(DisasContext *s, int tb_num, target_ulong eip)
2207{
2208 TranslationBlock *tb;
2209 target_ulong pc;
2210
2211 pc = s->cs_base + eip;
2212 tb = s->tb;
2213 /* NOTE: we handle the case where the TB spans two pages here */
2214 if ((pc & TARGET_PAGE_MASK~((1 << 12) - 1)) == (tb->pc & TARGET_PAGE_MASK~((1 << 12) - 1)) ||
2215 (pc & TARGET_PAGE_MASK~((1 << 12) - 1)) == ((s->pc - 1) & TARGET_PAGE_MASK~((1 << 12) - 1))) {
2216 /* jump to same page: we can use a direct jump */
2217 tcg_gen_goto_tb(tb_num);
2218 gen_jmp_im(eip);
2219 tcg_gen_exit_tb((uintptr_t)tb + tb_num);
2220 } else {
2221 /* jump to another page: currently not optimized */
2222 gen_jmp_im(eip);
2223 gen_eob(s);
2224 }
2225}
2226
2227static inline void gen_jcc(DisasContext *s, int b,
2228 target_ulong val, target_ulong next_eip)
2229{
2230 int l1, l2;
2231
2232 if (s->jmp_opt) {
2233 l1 = gen_new_label();
2234 gen_jcc1(s, b, l1);
2235
2236 gen_goto_tb(s, 0, next_eip);
2237
2238 gen_set_label(l1);
2239 gen_goto_tb(s, 1, val);
2240 s->is_jmp = DISAS_TB_JUMP3;
2241 } else {
2242 l1 = gen_new_label();
2243 l2 = gen_new_label();
2244 gen_jcc1(s, b, l1);
2245
2246 gen_jmp_im(next_eip);
2247 tcg_gen_br(l2);
2248
2249 gen_set_label(l1);
2250 gen_jmp_im(val);
2251 gen_set_label(l2);
2252 gen_eob(s);
2253 }
2254}
2255
2256static void gen_cmovcc1(CPUX86State *env, DisasContext *s, TCGMemOp ot, int b,
2257 int modrm, int reg)
2258{
2259 CCPrepare cc;
2260
2261 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
2262
2263 cc = gen_prepare_cc(s, b, cpu_T[1]);
2264 if (cc.mask != -1) {
2265 TCGvTCGv_i32 t0 = tcg_temp_new()tcg_temp_new_i32();
2266 tcg_gen_andi_tltcg_gen_andi_i32(t0, cc.reg, cc.mask);
2267 cc.reg = t0;
2268 }
2269 if (!cc.use_reg2) {
2270 cc.reg2 = tcg_const_tltcg_const_i32(cc.imm);
2271 }
2272
2273 tcg_gen_movcond_tltcg_gen_movcond_i32(cc.cond, cpu_T[0], cc.reg, cc.reg2,
2274 cpu_T[0], cpu_regs[reg]);
2275 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
2276
2277 if (cc.mask != -1) {
2278 tcg_temp_freetcg_temp_free_i32(cc.reg);
2279 }
2280 if (!cc.use_reg2) {
2281 tcg_temp_freetcg_temp_free_i32(cc.reg2);
2282 }
2283}
2284
2285static inline void gen_op_movl_T0_seg(int seg_reg)
2286{
2287 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env,
2288 offsetof(CPUX86State,segs[seg_reg].selector)__builtin_offsetof(CPUX86State, segs[seg_reg].selector));
2289}
2290
2291static inline void gen_op_movl_seg_T0_vm(int seg_reg)
2292{
2293 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[0], cpu_T[0], 0xffff);
2294 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env,
2295 offsetof(CPUX86State,segs[seg_reg].selector)__builtin_offsetof(CPUX86State, segs[seg_reg].selector));
2296 tcg_gen_shli_tltcg_gen_shli_i32(cpu_T[0], cpu_T[0], 4);
2297 tcg_gen_st_tltcg_gen_st_i32(cpu_T[0], cpu_env,
2298 offsetof(CPUX86State,segs[seg_reg].base)__builtin_offsetof(CPUX86State, segs[seg_reg].base));
2299}
2300
2301/* move T0 to seg_reg and compute if the CPU state may change. Never
2302 call this function with seg_reg == R_CS */
2303static void gen_movl_seg_T0(DisasContext *s, int seg_reg, target_ulong cur_eip)
2304{
2305 if (s->pe && !s->vm86) {
2306 /* XXX: optimize by finding processor state dynamically */
2307 gen_update_cc_op(s);
2308 gen_jmp_im(cur_eip);
2309 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
2310 gen_helper_load_seg(cpu_env, tcg_const_i32(seg_reg), cpu_tmp2_i32);
2311 /* abort translation because the addseg value may change or
2312 because ss32 may change. For R_SS, translation must always
2313 stop as a special handling must be done to disable hardware
2314 interrupts for the next instruction */
2315 if (seg_reg == R_SS2 || (s->code32 && seg_reg < R_FS4))
2316 s->is_jmp = DISAS_TB_JUMP3;
2317 } else {
2318 gen_op_movl_seg_T0_vm(seg_reg);
2319 if (seg_reg == R_SS2)
2320 s->is_jmp = DISAS_TB_JUMP3;
2321 }
2322}
2323
2324static inline int svm_is_rep(int prefixes)
2325{
2326 return ((prefixes & (PREFIX_REPZ0x01 | PREFIX_REPNZ0x02)) ? 8 : 0);
2327}
2328
2329static inline void
2330gen_svm_check_intercept_param(DisasContext *s, target_ulong pc_start,
2331 uint32_t type, uint64_t param)
2332{
2333 /* no SVM activated; fast case */
2334 if (likely(!(s->flags & HF_SVMI_MASK))__builtin_expect(!!(!(s->flags & (1 << 21))), 1))
2335 return;
2336 gen_update_cc_op(s);
2337 gen_jmp_im(pc_start - s->cs_base);
2338 gen_helper_svm_check_intercept_param(cpu_env, tcg_const_i32(type),
2339 tcg_const_i64(param));
2340}
2341
2342static inline void
2343gen_svm_check_intercept(DisasContext *s, target_ulong pc_start, uint64_t type)
2344{
2345 gen_svm_check_intercept_param(s, pc_start, type, 0);
2346}
2347
2348static inline void gen_stack_update(DisasContext *s, int addend)
2349{
2350#ifdef TARGET_X86_64
2351 if (CODE64(s)0) {
2352 gen_op_add_reg_im(MO_64, R_ESP4, addend);
2353 } else
2354#endif
2355 if (s->ss32) {
2356 gen_op_add_reg_im(MO_32, R_ESP4, addend);
2357 } else {
2358 gen_op_add_reg_im(MO_16, R_ESP4, addend);
2359 }
2360}
2361
2362/* Generate a push. It depends on ss32, addseg and dflag. */
2363static void gen_push_v(DisasContext *s, TCGvTCGv_i32 val)
2364{
2365 TCGMemOp a_ot, d_ot = mo_pushpop(s, s->dflag);
2366 int size = 1 << d_ot;
2367 TCGvTCGv_i32 new_esp = cpu_A0;
2368
2369 tcg_gen_subi_tltcg_gen_subi_i32(cpu_A0, cpu_regs[R_ESP4], size);
2370
2371 if (CODE64(s)0) {
2372 a_ot = MO_64;
2373 } else if (s->ss32) {
2374 a_ot = MO_32;
2375 if (s->addseg) {
2376 new_esp = cpu_tmp4;
2377 tcg_gen_mov_tltcg_gen_mov_i32(new_esp, cpu_A0);
2378 gen_op_addl_A0_seg(s, R_SS2);
2379 } else {
2380 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_A0, cpu_A0);
2381 }
2382 } else {
2383 a_ot = MO_16;
2384 new_esp = cpu_tmp4;
2385 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_A0);
2386 tcg_gen_mov_tltcg_gen_mov_i32(new_esp, cpu_A0);
2387 gen_op_addl_A0_seg(s, R_SS2);
2388 }
2389
2390 gen_op_st_v(s, d_ot, val, cpu_A0);
2391 gen_op_mov_reg_v(a_ot, R_ESP4, new_esp);
2392}
2393
2394/* two step pop is necessary for precise exceptions */
2395static TCGMemOp gen_pop_T0(DisasContext *s)
2396{
2397 TCGMemOp d_ot = mo_pushpop(s, s->dflag);
2398 TCGvTCGv_i32 addr = cpu_A0;
2399
2400 if (CODE64(s)0) {
2401 addr = cpu_regs[R_ESP4];
2402 } else if (!s->ss32) {
2403 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_regs[R_ESP4]);
2404 gen_op_addl_A0_seg(s, R_SS2);
2405 } else if (s->addseg) {
2406 tcg_gen_mov_tltcg_gen_mov_i32(cpu_A0, cpu_regs[R_ESP4]);
2407 gen_op_addl_A0_seg(s, R_SS2);
2408 } else {
2409 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_A0, cpu_regs[R_ESP4]);
2410 }
2411
2412 gen_op_ld_v(s, d_ot, cpu_T[0], addr);
2413 return d_ot;
2414}
2415
2416static void gen_pop_update(DisasContext *s, TCGMemOp ot)
2417{
2418 gen_stack_update(s, 1 << ot);
2419}
2420
2421static void gen_stack_A0(DisasContext *s)
2422{
2423 gen_op_movl_A0_reg(R_ESP4);
2424 if (!s->ss32)
2425 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_A0);
2426 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[1], cpu_A0);
2427 if (s->addseg)
2428 gen_op_addl_A0_seg(s, R_SS2);
2429}
2430
2431/* NOTE: wrap around in 16 bit not fully handled */
2432static void gen_pusha(DisasContext *s)
2433{
2434 int i;
2435 gen_op_movl_A0_reg(R_ESP4);
2436 gen_op_addl_A0_im(-8 << s->dflag);
2437 if (!s->ss32)
2438 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_A0);
2439 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[1], cpu_A0);
2440 if (s->addseg)
2441 gen_op_addl_A0_seg(s, R_SS2);
2442 for(i = 0;i < 8; i++) {
2443 gen_op_mov_v_reg(MO_32, cpu_T[0], 7 - i);
2444 gen_op_st_v(s, s->dflag, cpu_T[0], cpu_A0);
2445 gen_op_addl_A0_im(1 << s->dflag);
2446 }
2447 gen_op_mov_reg_v(MO_16 + s->ss32, R_ESP4, cpu_T[1]);
2448}
2449
2450/* NOTE: wrap around in 16 bit not fully handled */
2451static void gen_popa(DisasContext *s)
2452{
2453 int i;
2454 gen_op_movl_A0_reg(R_ESP4);
2455 if (!s->ss32)
2456 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_A0);
2457 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[1], cpu_A0);
2458 tcg_gen_addi_tltcg_gen_addi_i32(cpu_T[1], cpu_T[1], 8 << s->dflag);
2459 if (s->addseg)
2460 gen_op_addl_A0_seg(s, R_SS2);
2461 for(i = 0;i < 8; i++) {
2462 /* ESP is not reloaded */
2463 if (i != 3) {
2464 gen_op_ld_v(s, s->dflag, cpu_T[0], cpu_A0);
2465 gen_op_mov_reg_v(s->dflag, 7 - i, cpu_T[0]);
2466 }
2467 gen_op_addl_A0_im(1 << s->dflag);
2468 }
2469 gen_op_mov_reg_v(MO_16 + s->ss32, R_ESP4, cpu_T[1]);
2470}
2471
2472static void gen_enter(DisasContext *s, int esp_addend, int level)
2473{
2474 TCGMemOp ot = mo_pushpop(s, s->dflag);
2475 int opsize = 1 << ot;
2476
2477 level &= 0x1f;
2478#ifdef TARGET_X86_64
2479 if (CODE64(s)0) {
2480 gen_op_movl_A0_reg(R_ESP4);
2481 gen_op_addq_A0_im(-opsize);
2482 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[1], cpu_A0);
2483
2484 /* push bp */
2485 gen_op_mov_v_reg(MO_32, cpu_T[0], R_EBP5);
2486 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
2487 if (level) {
2488 /* XXX: must save state */
2489 gen_helper_enter64_level(cpu_env, tcg_const_i32(level),
2490 tcg_const_i32((ot == MO_64)),
2491 cpu_T[1]);
2492 }
2493 gen_op_mov_reg_v(ot, R_EBP5, cpu_T[1]);
2494 tcg_gen_addi_tltcg_gen_addi_i32(cpu_T[1], cpu_T[1], -esp_addend + (-opsize * level));
2495 gen_op_mov_reg_v(MO_64, R_ESP4, cpu_T[1]);
2496 } else
2497#endif
2498 {
2499 gen_op_movl_A0_reg(R_ESP4);
2500 gen_op_addl_A0_im(-opsize);
2501 if (!s->ss32)
2502 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_A0, cpu_A0);
2503 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[1], cpu_A0);
2504 if (s->addseg)
2505 gen_op_addl_A0_seg(s, R_SS2);
2506 /* push bp */
2507 gen_op_mov_v_reg(MO_32, cpu_T[0], R_EBP5);
2508 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
2509 if (level) {
2510 /* XXX: must save state */
2511 gen_helper_enter_level(cpu_env, tcg_const_i32(level),
2512 tcg_const_i32(s->dflag - 1),
2513 cpu_T[1]);
2514 }
2515 gen_op_mov_reg_v(ot, R_EBP5, cpu_T[1]);
2516 tcg_gen_addi_tltcg_gen_addi_i32(cpu_T[1], cpu_T[1], -esp_addend + (-opsize * level));
2517 gen_op_mov_reg_v(MO_16 + s->ss32, R_ESP4, cpu_T[1]);
2518 }
2519}
2520
2521static void gen_exception(DisasContext *s, int trapno, target_ulong cur_eip)
2522{
2523 gen_update_cc_op(s);
2524 gen_jmp_im(cur_eip);
2525 gen_helper_raise_exception(cpu_env, tcg_const_i32(trapno));
2526 s->is_jmp = DISAS_TB_JUMP3;
2527}
2528
2529/* an interrupt is different from an exception because of the
2530 privilege checks */
2531static void gen_interrupt(DisasContext *s, int intno,
2532 target_ulong cur_eip, target_ulong next_eip)
2533{
2534 gen_update_cc_op(s);
2535 gen_jmp_im(cur_eip);
2536 gen_helper_raise_interrupt(cpu_env, tcg_const_i32(intno),
2537 tcg_const_i32(next_eip - cur_eip));
2538 s->is_jmp = DISAS_TB_JUMP3;
2539}
2540
2541static void gen_debug(DisasContext *s, target_ulong cur_eip)
2542{
2543 gen_update_cc_op(s);
2544 gen_jmp_im(cur_eip);
2545 gen_helper_debug(cpu_env);
2546 s->is_jmp = DISAS_TB_JUMP3;
2547}
2548
2549/* generate a generic end of block. Trace exception is also generated
2550 if needed */
2551static void gen_eob(DisasContext *s)
2552{
2553 gen_update_cc_op(s);
2554 if (s->tb->flags & HF_INHIBIT_IRQ_MASK(1 << 3)) {
2555 gen_helper_reset_inhibit_irq(cpu_env);
2556 }
2557 if (s->tb->flags & HF_RF_MASK(1 << 16)) {
2558 gen_helper_reset_rf(cpu_env);
2559 }
2560 if (s->singlestep_enabled) {
2561 gen_helper_debug(cpu_env);
2562 } else if (s->tf) {
2563 gen_helper_single_step(cpu_env);
2564 } else {
2565 tcg_gen_exit_tb(0);
2566 }
2567 s->is_jmp = DISAS_TB_JUMP3;
2568}
2569
2570/* generate a jump to eip. No segment change must happen before as a
2571 direct call to the next block may occur */
2572static void gen_jmp_tb(DisasContext *s, target_ulong eip, int tb_num)
2573{
2574 gen_update_cc_op(s);
2575 set_cc_op(s, CC_OP_DYNAMIC);
2576 if (s->jmp_opt) {
2577 gen_goto_tb(s, tb_num, eip);
2578 s->is_jmp = DISAS_TB_JUMP3;
2579 } else {
2580 gen_jmp_im(eip);
2581 gen_eob(s);
2582 }
2583}
2584
2585static void gen_jmp(DisasContext *s, target_ulong eip)
2586{
2587 gen_jmp_tb(s, eip, 0);
2588}
2589
2590static inline void gen_ldq_env_A0(DisasContext *s, int offset)
2591{
2592 tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_A0, s->mem_index, MO_LEQ);
2593 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset);
2594}
2595
2596static inline void gen_stq_env_A0(DisasContext *s, int offset)
2597{
2598 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset);
2599 tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_A0, s->mem_index, MO_LEQ);
2600}
2601
2602static inline void gen_ldo_env_A0(DisasContext *s, int offset)
2603{
2604 int mem_index = s->mem_index;
2605 tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_A0, mem_index, MO_LEQ);
2606 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(0))__builtin_offsetof(XMMReg, _q[0]));
2607 tcg_gen_addi_tltcg_gen_addi_i32(cpu_tmp0, cpu_A0, 8);
2608 tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_tmp0, mem_index, MO_LEQ);
2609 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(1))__builtin_offsetof(XMMReg, _q[1]));
2610}
2611
2612static inline void gen_sto_env_A0(DisasContext *s, int offset)
2613{
2614 int mem_index = s->mem_index;
2615 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(0))__builtin_offsetof(XMMReg, _q[0]));
2616 tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_A0, mem_index, MO_LEQ);
2617 tcg_gen_addi_tltcg_gen_addi_i32(cpu_tmp0, cpu_A0, 8);
2618 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(1))__builtin_offsetof(XMMReg, _q[1]));
2619 tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_tmp0, mem_index, MO_LEQ);
2620}
2621
2622static inline void gen_op_movo(int d_offset, int s_offset)
2623{
2624 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset);
2625 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2626 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset + 8);
2627 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset + 8);
2628}
2629
2630static inline void gen_op_movq(int d_offset, int s_offset)
2631{
2632 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset);
2633 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2634}
2635
2636static inline void gen_op_movl(int d_offset, int s_offset)
2637{
2638 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env, s_offset);
2639 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, d_offset);
2640}
2641
2642static inline void gen_op_movq_env_0(int d_offset)
2643{
2644 tcg_gen_movi_i64(cpu_tmp1_i64, 0);
2645 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2646}
2647
2648typedef void (*SSEFunc_i_ep)(TCGv_i32 val, TCGv_ptr env, TCGv_ptr reg);
2649typedef void (*SSEFunc_l_ep)(TCGv_i64 val, TCGv_ptr env, TCGv_ptr reg);
2650typedef void (*SSEFunc_0_epi)(TCGv_ptr env, TCGv_ptr reg, TCGv_i32 val);
2651typedef void (*SSEFunc_0_epl)(TCGv_ptr env, TCGv_ptr reg, TCGv_i64 val);
2652typedef void (*SSEFunc_0_epp)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b);
2653typedef void (*SSEFunc_0_eppi)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
2654 TCGv_i32 val);
2655typedef void (*SSEFunc_0_ppi)(TCGv_ptr reg_a, TCGv_ptr reg_b, TCGv_i32 val);
2656typedef void (*SSEFunc_0_eppt)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
2657 TCGvTCGv_i32 val);
2658
2659#define SSE_SPECIAL((void *)1) ((void *)1)
2660#define SSE_DUMMY((void *)2) ((void *)2)
2661
2662#define MMX_OP2(x){ gen_helper_x_mmx, gen_helper_x_xmm } { gen_helper_ ## x ## _mmx, gen_helper_ ## x ## _xmm }
2663#define SSE_FOP(x){ gen_helper_xps, gen_helper_xpd, gen_helper_xss, gen_helper_xsd
, }
{ gen_helper_ ## x ## ps, gen_helper_ ## x ## pd, \
2664 gen_helper_ ## x ## ss, gen_helper_ ## x ## sd, }
2665
2666static const SSEFunc_0_epp sse_op_table1[256][4] = {
2667 /* 3DNow! extensions */
2668 [0x0e] = { SSE_DUMMY((void *)2) }, /* femms */
2669 [0x0f] = { SSE_DUMMY((void *)2) }, /* pf... */
2670 /* pure SSE operations */
2671 [0x10] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movups, movupd, movss, movsd */
2672 [0x11] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movups, movupd, movss, movsd */
2673 [0x12] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movlps, movlpd, movsldup, movddup */
2674 [0x13] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movlps, movlpd */
2675 [0x14] = { gen_helper_punpckldq_xmm, gen_helper_punpcklqdq_xmm },
2676 [0x15] = { gen_helper_punpckhdq_xmm, gen_helper_punpckhqdq_xmm },
2677 [0x16] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movhps, movhpd, movshdup */
2678 [0x17] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movhps, movhpd */
2679
2680 [0x28] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movaps, movapd */
2681 [0x29] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movaps, movapd */
2682 [0x2a] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* cvtpi2ps, cvtpi2pd, cvtsi2ss, cvtsi2sd */
2683 [0x2b] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movntps, movntpd, movntss, movntsd */
2684 [0x2c] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* cvttps2pi, cvttpd2pi, cvttsd2si, cvttss2si */
2685 [0x2d] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* cvtps2pi, cvtpd2pi, cvtsd2si, cvtss2si */
2686 [0x2e] = { gen_helper_ucomiss, gen_helper_ucomisd },
2687 [0x2f] = { gen_helper_comiss, gen_helper_comisd },
2688 [0x50] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movmskps, movmskpd */
2689 [0x51] = SSE_FOP(sqrt){ gen_helper_sqrtps, gen_helper_sqrtpd, gen_helper_sqrtss, gen_helper_sqrtsd
, }
,
2690 [0x52] = { gen_helper_rsqrtps, NULL((void*)0), gen_helper_rsqrtss, NULL((void*)0) },
2691 [0x53] = { gen_helper_rcpps, NULL((void*)0), gen_helper_rcpss, NULL((void*)0) },
2692 [0x54] = { gen_helper_pand_xmm, gen_helper_pand_xmm }, /* andps, andpd */
2693 [0x55] = { gen_helper_pandn_xmm, gen_helper_pandn_xmm }, /* andnps, andnpd */
2694 [0x56] = { gen_helper_por_xmm, gen_helper_por_xmm }, /* orps, orpd */
2695 [0x57] = { gen_helper_pxor_xmm, gen_helper_pxor_xmm }, /* xorps, xorpd */
2696 [0x58] = SSE_FOP(add){ gen_helper_addps, gen_helper_addpd, gen_helper_addss, gen_helper_addsd
, }
,
2697 [0x59] = SSE_FOP(mul){ gen_helper_mulps, gen_helper_mulpd, gen_helper_mulss, gen_helper_mulsd
, }
,
2698 [0x5a] = { gen_helper_cvtps2pd, gen_helper_cvtpd2ps,
2699 gen_helper_cvtss2sd, gen_helper_cvtsd2ss },
2700 [0x5b] = { gen_helper_cvtdq2ps, gen_helper_cvtps2dq, gen_helper_cvttps2dq },
2701 [0x5c] = SSE_FOP(sub){ gen_helper_subps, gen_helper_subpd, gen_helper_subss, gen_helper_subsd
, }
,
2702 [0x5d] = SSE_FOP(min){ gen_helper_minps, gen_helper_minpd, gen_helper_minss, gen_helper_minsd
, }
,
2703 [0x5e] = SSE_FOP(div){ gen_helper_divps, gen_helper_divpd, gen_helper_divss, gen_helper_divsd
, }
,
2704 [0x5f] = SSE_FOP(max){ gen_helper_maxps, gen_helper_maxpd, gen_helper_maxss, gen_helper_maxsd
, }
,
2705
2706 [0xc2] = SSE_FOP(cmpeq){ gen_helper_cmpeqps, gen_helper_cmpeqpd, gen_helper_cmpeqss,
gen_helper_cmpeqsd, }
,
2707 [0xc6] = { (SSEFunc_0_epp)gen_helper_shufps,
2708 (SSEFunc_0_epp)gen_helper_shufpd }, /* XXX: casts */
2709
2710 /* SSSE3, SSE4, MOVBE, CRC32, BMI1, BMI2, ADX. */
2711 [0x38] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) },
2712 [0x3a] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) },
2713
2714 /* MMX ops and their SSE extensions */
2715 [0x60] = MMX_OP2(punpcklbw){ gen_helper_punpcklbw_mmx, gen_helper_punpcklbw_xmm },
2716 [0x61] = MMX_OP2(punpcklwd){ gen_helper_punpcklwd_mmx, gen_helper_punpcklwd_xmm },
2717 [0x62] = MMX_OP2(punpckldq){ gen_helper_punpckldq_mmx, gen_helper_punpckldq_xmm },
2718 [0x63] = MMX_OP2(packsswb){ gen_helper_packsswb_mmx, gen_helper_packsswb_xmm },
2719 [0x64] = MMX_OP2(pcmpgtb){ gen_helper_pcmpgtb_mmx, gen_helper_pcmpgtb_xmm },
2720 [0x65] = MMX_OP2(pcmpgtw){ gen_helper_pcmpgtw_mmx, gen_helper_pcmpgtw_xmm },
2721 [0x66] = MMX_OP2(pcmpgtl){ gen_helper_pcmpgtl_mmx, gen_helper_pcmpgtl_xmm },
2722 [0x67] = MMX_OP2(packuswb){ gen_helper_packuswb_mmx, gen_helper_packuswb_xmm },
2723 [0x68] = MMX_OP2(punpckhbw){ gen_helper_punpckhbw_mmx, gen_helper_punpckhbw_xmm },
2724 [0x69] = MMX_OP2(punpckhwd){ gen_helper_punpckhwd_mmx, gen_helper_punpckhwd_xmm },
2725 [0x6a] = MMX_OP2(punpckhdq){ gen_helper_punpckhdq_mmx, gen_helper_punpckhdq_xmm },
2726 [0x6b] = MMX_OP2(packssdw){ gen_helper_packssdw_mmx, gen_helper_packssdw_xmm },
2727 [0x6c] = { NULL((void*)0), gen_helper_punpcklqdq_xmm },
2728 [0x6d] = { NULL((void*)0), gen_helper_punpckhqdq_xmm },
2729 [0x6e] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movd mm, ea */
2730 [0x6f] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movq, movdqa, , movqdu */
2731 [0x70] = { (SSEFunc_0_epp)gen_helper_pshufw_mmx,
2732 (SSEFunc_0_epp)gen_helper_pshufd_xmm,
2733 (SSEFunc_0_epp)gen_helper_pshufhw_xmm,
2734 (SSEFunc_0_epp)gen_helper_pshuflw_xmm }, /* XXX: casts */
2735 [0x71] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* shiftw */
2736 [0x72] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* shiftd */
2737 [0x73] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* shiftq */
2738 [0x74] = MMX_OP2(pcmpeqb){ gen_helper_pcmpeqb_mmx, gen_helper_pcmpeqb_xmm },
2739 [0x75] = MMX_OP2(pcmpeqw){ gen_helper_pcmpeqw_mmx, gen_helper_pcmpeqw_xmm },
2740 [0x76] = MMX_OP2(pcmpeql){ gen_helper_pcmpeql_mmx, gen_helper_pcmpeql_xmm },
2741 [0x77] = { SSE_DUMMY((void *)2) }, /* emms */
2742 [0x78] = { NULL((void*)0), SSE_SPECIAL((void *)1), NULL((void*)0), SSE_SPECIAL((void *)1) }, /* extrq_i, insertq_i */
2743 [0x79] = { NULL((void*)0), gen_helper_extrq_r, NULL((void*)0), gen_helper_insertq_r },
2744 [0x7c] = { NULL((void*)0), gen_helper_haddpd, NULL((void*)0), gen_helper_haddps },
2745 [0x7d] = { NULL((void*)0), gen_helper_hsubpd, NULL((void*)0), gen_helper_hsubps },
2746 [0x7e] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movd, movd, , movq */
2747 [0x7f] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* movq, movdqa, movdqu */
2748 [0xc4] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* pinsrw */
2749 [0xc5] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* pextrw */
2750 [0xd0] = { NULL((void*)0), gen_helper_addsubpd, NULL((void*)0), gen_helper_addsubps },
2751 [0xd1] = MMX_OP2(psrlw){ gen_helper_psrlw_mmx, gen_helper_psrlw_xmm },
2752 [0xd2] = MMX_OP2(psrld){ gen_helper_psrld_mmx, gen_helper_psrld_xmm },
2753 [0xd3] = MMX_OP2(psrlq){ gen_helper_psrlq_mmx, gen_helper_psrlq_xmm },
2754 [0xd4] = MMX_OP2(paddq){ gen_helper_paddq_mmx, gen_helper_paddq_xmm },
2755 [0xd5] = MMX_OP2(pmullw){ gen_helper_pmullw_mmx, gen_helper_pmullw_xmm },
2756 [0xd6] = { NULL((void*)0), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) },
2757 [0xd7] = { SSE_SPECIAL((void *)1), SSE_SPECIAL((void *)1) }, /* pmovmskb */
2758 [0xd8] = MMX_OP2(psubusb){ gen_helper_psubusb_mmx, gen_helper_psubusb_xmm },
2759 [0xd9] = MMX_OP2(psubusw){ gen_helper_psubusw_mmx, gen_helper_psubusw_xmm },
2760 [0xda] = MMX_OP2(pminub){ gen_helper_pminub_mmx, gen_helper_pminub_xmm },
2761 [0xdb] = MMX_OP2(pand){ gen_helper_pand_mmx, gen_helper_pand_xmm },
2762 [0xdc] = MMX_OP2(paddusb){ gen_helper_paddusb_mmx, gen_helper_paddusb_xmm },
2763 [0xdd] = MMX_OP2(paddusw){ gen_helper_paddusw_mmx, gen_helper_paddusw_xmm },
2764 [0xde] = MMX_OP2(pmaxub){ gen_helper_pmaxub_mmx, gen_helper_pmaxub_xmm },
2765 [0xdf] = MMX_OP2(pandn){ gen_helper_pandn_mmx, gen_helper_pandn_xmm },
2766 [0xe0] = MMX_OP2(pavgb){ gen_helper_pavgb_mmx, gen_helper_pavgb_xmm },
2767 [0xe1] = MMX_OP2(psraw){ gen_helper_psraw_mmx, gen_helper_psraw_xmm },
2768 [0xe2] = MMX_OP2(psrad){ gen_helper_psrad_mmx, gen_helper_psrad_xmm },
2769 [0xe3] = MMX_OP2(pavgw){ gen_helper_pavgw_mmx, gen_helper_pavgw_xmm },
2770 [0xe4] = MMX_OP2(pmulhuw){ gen_helper_pmulhuw_mmx, gen_helper_pmulhuw_xmm },
2771 [0xe5] = MMX_OP2(pmulhw){ gen_helper_pmulhw_mmx, gen_helper_pmulhw_xmm },
2772 [0xe6] = { NULL((void*)0), gen_helper_cvttpd2dq, gen_helper_cvtdq2pd, gen_helper_cvtpd2dq },
2773 [0xe7] = { SSE_SPECIAL((void *)1) , SSE_SPECIAL((void *)1) }, /* movntq, movntq */
2774 [0xe8] = MMX_OP2(psubsb){ gen_helper_psubsb_mmx, gen_helper_psubsb_xmm },
2775 [0xe9] = MMX_OP2(psubsw){ gen_helper_psubsw_mmx, gen_helper_psubsw_xmm },
2776 [0xea] = MMX_OP2(pminsw){ gen_helper_pminsw_mmx, gen_helper_pminsw_xmm },
2777 [0xeb] = MMX_OP2(por){ gen_helper_por_mmx, gen_helper_por_xmm },
2778 [0xec] = MMX_OP2(paddsb){ gen_helper_paddsb_mmx, gen_helper_paddsb_xmm },
2779 [0xed] = MMX_OP2(paddsw){ gen_helper_paddsw_mmx, gen_helper_paddsw_xmm },
2780 [0xee] = MMX_OP2(pmaxsw){ gen_helper_pmaxsw_mmx, gen_helper_pmaxsw_xmm },
2781 [0xef] = MMX_OP2(pxor){ gen_helper_pxor_mmx, gen_helper_pxor_xmm },
2782 [0xf0] = { NULL((void*)0), NULL((void*)0), NULL((void*)0), SSE_SPECIAL((void *)1) }, /* lddqu */
2783 [0xf1] = MMX_OP2(psllw){ gen_helper_psllw_mmx, gen_helper_psllw_xmm },
2784 [0xf2] = MMX_OP2(pslld){ gen_helper_pslld_mmx, gen_helper_pslld_xmm },
2785 [0xf3] = MMX_OP2(psllq){ gen_helper_psllq_mmx, gen_helper_psllq_xmm },
2786 [0xf4] = MMX_OP2(pmuludq){ gen_helper_pmuludq_mmx, gen_helper_pmuludq_xmm },
2787 [0xf5] = MMX_OP2(pmaddwd){ gen_helper_pmaddwd_mmx, gen_helper_pmaddwd_xmm },
2788 [0xf6] = MMX_OP2(psadbw){ gen_helper_psadbw_mmx, gen_helper_psadbw_xmm },
2789 [0xf7] = { (SSEFunc_0_epp)gen_helper_maskmov_mmx,
2790 (SSEFunc_0_epp)gen_helper_maskmov_xmm }, /* XXX: casts */
2791 [0xf8] = MMX_OP2(psubb){ gen_helper_psubb_mmx, gen_helper_psubb_xmm },
2792 [0xf9] = MMX_OP2(psubw){ gen_helper_psubw_mmx, gen_helper_psubw_xmm },
2793 [0xfa] = MMX_OP2(psubl){ gen_helper_psubl_mmx, gen_helper_psubl_xmm },
2794 [0xfb] = MMX_OP2(psubq){ gen_helper_psubq_mmx, gen_helper_psubq_xmm },
2795 [0xfc] = MMX_OP2(paddb){ gen_helper_paddb_mmx, gen_helper_paddb_xmm },
2796 [0xfd] = MMX_OP2(paddw){ gen_helper_paddw_mmx, gen_helper_paddw_xmm },
2797 [0xfe] = MMX_OP2(paddl){ gen_helper_paddl_mmx, gen_helper_paddl_xmm },
2798};
2799
2800static const SSEFunc_0_epp sse_op_table2[3 * 8][2] = {
2801 [0 + 2] = MMX_OP2(psrlw){ gen_helper_psrlw_mmx, gen_helper_psrlw_xmm },
2802 [0 + 4] = MMX_OP2(psraw){ gen_helper_psraw_mmx, gen_helper_psraw_xmm },
2803 [0 + 6] = MMX_OP2(psllw){ gen_helper_psllw_mmx, gen_helper_psllw_xmm },
2804 [8 + 2] = MMX_OP2(psrld){ gen_helper_psrld_mmx, gen_helper_psrld_xmm },
2805 [8 + 4] = MMX_OP2(psrad){ gen_helper_psrad_mmx, gen_helper_psrad_xmm },
2806 [8 + 6] = MMX_OP2(pslld){ gen_helper_pslld_mmx, gen_helper_pslld_xmm },
2807 [16 + 2] = MMX_OP2(psrlq){ gen_helper_psrlq_mmx, gen_helper_psrlq_xmm },
2808 [16 + 3] = { NULL((void*)0), gen_helper_psrldq_xmm },
2809 [16 + 6] = MMX_OP2(psllq){ gen_helper_psllq_mmx, gen_helper_psllq_xmm },
2810 [16 + 7] = { NULL((void*)0), gen_helper_pslldq_xmm },
2811};
2812
2813static const SSEFunc_0_epi sse_op_table3ai[] = {
2814 gen_helper_cvtsi2ss,
2815 gen_helper_cvtsi2sd
2816};
2817
2818#ifdef TARGET_X86_64
2819static const SSEFunc_0_epl sse_op_table3aq[] = {
2820 gen_helper_cvtsq2ss,
2821 gen_helper_cvtsq2sd
2822};
2823#endif
2824
2825static const SSEFunc_i_ep sse_op_table3bi[] = {
2826 gen_helper_cvttss2si,
2827 gen_helper_cvtss2si,
2828 gen_helper_cvttsd2si,
2829 gen_helper_cvtsd2si
2830};
2831
2832#ifdef TARGET_X86_64
2833static const SSEFunc_l_ep sse_op_table3bq[] = {
2834 gen_helper_cvttss2sq,
2835 gen_helper_cvtss2sq,
2836 gen_helper_cvttsd2sq,
2837 gen_helper_cvtsd2sq
2838};
2839#endif
2840
2841static const SSEFunc_0_epp sse_op_table4[8][4] = {
2842 SSE_FOP(cmpeq){ gen_helper_cmpeqps, gen_helper_cmpeqpd, gen_helper_cmpeqss,
gen_helper_cmpeqsd, }
,
2843 SSE_FOP(cmplt){ gen_helper_cmpltps, gen_helper_cmpltpd, gen_helper_cmpltss,
gen_helper_cmpltsd, }
,
2844 SSE_FOP(cmple){ gen_helper_cmpleps, gen_helper_cmplepd, gen_helper_cmpless,
gen_helper_cmplesd, }
,
2845 SSE_FOP(cmpunord){ gen_helper_cmpunordps, gen_helper_cmpunordpd, gen_helper_cmpunordss
, gen_helper_cmpunordsd, }
,
2846 SSE_FOP(cmpneq){ gen_helper_cmpneqps, gen_helper_cmpneqpd, gen_helper_cmpneqss
, gen_helper_cmpneqsd, }
,
2847 SSE_FOP(cmpnlt){ gen_helper_cmpnltps, gen_helper_cmpnltpd, gen_helper_cmpnltss
, gen_helper_cmpnltsd, }
,
2848 SSE_FOP(cmpnle){ gen_helper_cmpnleps, gen_helper_cmpnlepd, gen_helper_cmpnless
, gen_helper_cmpnlesd, }
,
2849 SSE_FOP(cmpord){ gen_helper_cmpordps, gen_helper_cmpordpd, gen_helper_cmpordss
, gen_helper_cmpordsd, }
,
2850};
2851
2852static const SSEFunc_0_epp sse_op_table5[256] = {
2853 [0x0c] = gen_helper_pi2fw,
2854 [0x0d] = gen_helper_pi2fd,
2855 [0x1c] = gen_helper_pf2iw,
2856 [0x1d] = gen_helper_pf2id,
2857 [0x8a] = gen_helper_pfnacc,
2858 [0x8e] = gen_helper_pfpnacc,
2859 [0x90] = gen_helper_pfcmpge,
2860 [0x94] = gen_helper_pfmin,
2861 [0x96] = gen_helper_pfrcp,
2862 [0x97] = gen_helper_pfrsqrt,
2863 [0x9a] = gen_helper_pfsub,
2864 [0x9e] = gen_helper_pfadd,
2865 [0xa0] = gen_helper_pfcmpgt,
2866 [0xa4] = gen_helper_pfmax,
2867 [0xa6] = gen_helper_movq, /* pfrcpit1; no need to actually increase precision */
2868 [0xa7] = gen_helper_movq, /* pfrsqit1 */
2869 [0xaa] = gen_helper_pfsubr,
2870 [0xae] = gen_helper_pfacc,
2871 [0xb0] = gen_helper_pfcmpeq,
2872 [0xb4] = gen_helper_pfmul,
2873 [0xb6] = gen_helper_movq, /* pfrcpit2 */
2874 [0xb7] = gen_helper_pmulhrw_mmx,
2875 [0xbb] = gen_helper_pswapd,
2876 [0xbf] = gen_helper_pavgb_mmx /* pavgusb */
2877};
2878
2879struct SSEOpHelper_epp {
2880 SSEFunc_0_epp op[2];
2881 uint32_t ext_mask;
2882};
2883
2884struct SSEOpHelper_eppi {
2885 SSEFunc_0_eppi op[2];
2886 uint32_t ext_mask;
2887};
2888
2889#define SSSE3_OP(x){ { gen_helper_x_mmx, gen_helper_x_xmm }, (1 << 9) } { MMX_OP2(x){ gen_helper_x_mmx, gen_helper_x_xmm }, CPUID_EXT_SSSE3(1 << 9) }
2890#define SSE41_OP(x){ { ((void*)0), gen_helper_x_xmm }, (1 << 19) } { { NULL((void*)0), gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE41(1 << 19) }
2891#define SSE42_OP(x){ { ((void*)0), gen_helper_x_xmm }, (1 << 20) } { { NULL((void*)0), gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE42(1 << 20) }
2892#define SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) } { { NULL((void*)0), SSE_SPECIAL((void *)1) }, CPUID_EXT_SSE41(1 << 19) }
2893#define PCLMULQDQ_OP(x){ { ((void*)0), gen_helper_x_xmm }, (1 << 1) } { { NULL((void*)0), gen_helper_ ## x ## _xmm }, \
2894 CPUID_EXT_PCLMULQDQ(1 << 1) }
2895#define AESNI_OP(x){ { ((void*)0), gen_helper_x_xmm }, (1 << 25) } { { NULL((void*)0), gen_helper_ ## x ## _xmm }, CPUID_EXT_AES(1 << 25) }
2896
2897static const struct SSEOpHelper_epp sse_op_table6[256] = {
2898 [0x00] = SSSE3_OP(pshufb){ { gen_helper_pshufb_mmx, gen_helper_pshufb_xmm }, (1 <<
9) }
,
2899 [0x01] = SSSE3_OP(phaddw){ { gen_helper_phaddw_mmx, gen_helper_phaddw_xmm }, (1 <<
9) }
,
2900 [0x02] = SSSE3_OP(phaddd){ { gen_helper_phaddd_mmx, gen_helper_phaddd_xmm }, (1 <<
9) }
,
2901 [0x03] = SSSE3_OP(phaddsw){ { gen_helper_phaddsw_mmx, gen_helper_phaddsw_xmm }, (1 <<
9) }
,
2902 [0x04] = SSSE3_OP(pmaddubsw){ { gen_helper_pmaddubsw_mmx, gen_helper_pmaddubsw_xmm }, (1 <<
9) }
,
2903 [0x05] = SSSE3_OP(phsubw){ { gen_helper_phsubw_mmx, gen_helper_phsubw_xmm }, (1 <<
9) }
,
2904 [0x06] = SSSE3_OP(phsubd){ { gen_helper_phsubd_mmx, gen_helper_phsubd_xmm }, (1 <<
9) }
,
2905 [0x07] = SSSE3_OP(phsubsw){ { gen_helper_phsubsw_mmx, gen_helper_phsubsw_xmm }, (1 <<
9) }
,
2906 [0x08] = SSSE3_OP(psignb){ { gen_helper_psignb_mmx, gen_helper_psignb_xmm }, (1 <<
9) }
,
2907 [0x09] = SSSE3_OP(psignw){ { gen_helper_psignw_mmx, gen_helper_psignw_xmm }, (1 <<
9) }
,
2908 [0x0a] = SSSE3_OP(psignd){ { gen_helper_psignd_mmx, gen_helper_psignd_xmm }, (1 <<
9) }
,
2909 [0x0b] = SSSE3_OP(pmulhrsw){ { gen_helper_pmulhrsw_mmx, gen_helper_pmulhrsw_xmm }, (1 <<
9) }
,
2910 [0x10] = SSE41_OP(pblendvb){ { ((void*)0), gen_helper_pblendvb_xmm }, (1 << 19) },
2911 [0x14] = SSE41_OP(blendvps){ { ((void*)0), gen_helper_blendvps_xmm }, (1 << 19) },
2912 [0x15] = SSE41_OP(blendvpd){ { ((void*)0), gen_helper_blendvpd_xmm }, (1 << 19) },
2913 [0x17] = SSE41_OP(ptest){ { ((void*)0), gen_helper_ptest_xmm }, (1 << 19) },
2914 [0x1c] = SSSE3_OP(pabsb){ { gen_helper_pabsb_mmx, gen_helper_pabsb_xmm }, (1 <<
9) }
,
2915 [0x1d] = SSSE3_OP(pabsw){ { gen_helper_pabsw_mmx, gen_helper_pabsw_xmm }, (1 <<
9) }
,
2916 [0x1e] = SSSE3_OP(pabsd){ { gen_helper_pabsd_mmx, gen_helper_pabsd_xmm }, (1 <<
9) }
,
2917 [0x20] = SSE41_OP(pmovsxbw){ { ((void*)0), gen_helper_pmovsxbw_xmm }, (1 << 19) },
2918 [0x21] = SSE41_OP(pmovsxbd){ { ((void*)0), gen_helper_pmovsxbd_xmm }, (1 << 19) },
2919 [0x22] = SSE41_OP(pmovsxbq){ { ((void*)0), gen_helper_pmovsxbq_xmm }, (1 << 19) },
2920 [0x23] = SSE41_OP(pmovsxwd){ { ((void*)0), gen_helper_pmovsxwd_xmm }, (1 << 19) },
2921 [0x24] = SSE41_OP(pmovsxwq){ { ((void*)0), gen_helper_pmovsxwq_xmm }, (1 << 19) },
2922 [0x25] = SSE41_OP(pmovsxdq){ { ((void*)0), gen_helper_pmovsxdq_xmm }, (1 << 19) },
2923 [0x28] = SSE41_OP(pmuldq){ { ((void*)0), gen_helper_pmuldq_xmm }, (1 << 19) },
2924 [0x29] = SSE41_OP(pcmpeqq){ { ((void*)0), gen_helper_pcmpeqq_xmm }, (1 << 19) },
2925 [0x2a] = SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) }, /* movntqda */
2926 [0x2b] = SSE41_OP(packusdw){ { ((void*)0), gen_helper_packusdw_xmm }, (1 << 19) },
2927 [0x30] = SSE41_OP(pmovzxbw){ { ((void*)0), gen_helper_pmovzxbw_xmm }, (1 << 19) },
2928 [0x31] = SSE41_OP(pmovzxbd){ { ((void*)0), gen_helper_pmovzxbd_xmm }, (1 << 19) },
2929 [0x32] = SSE41_OP(pmovzxbq){ { ((void*)0), gen_helper_pmovzxbq_xmm }, (1 << 19) },
2930 [0x33] = SSE41_OP(pmovzxwd){ { ((void*)0), gen_helper_pmovzxwd_xmm }, (1 << 19) },
2931 [0x34] = SSE41_OP(pmovzxwq){ { ((void*)0), gen_helper_pmovzxwq_xmm }, (1 << 19) },
2932 [0x35] = SSE41_OP(pmovzxdq){ { ((void*)0), gen_helper_pmovzxdq_xmm }, (1 << 19) },
2933 [0x37] = SSE42_OP(pcmpgtq){ { ((void*)0), gen_helper_pcmpgtq_xmm }, (1 << 20) },
2934 [0x38] = SSE41_OP(pminsb){ { ((void*)0), gen_helper_pminsb_xmm }, (1 << 19) },
2935 [0x39] = SSE41_OP(pminsd){ { ((void*)0), gen_helper_pminsd_xmm }, (1 << 19) },
2936 [0x3a] = SSE41_OP(pminuw){ { ((void*)0), gen_helper_pminuw_xmm }, (1 << 19) },
2937 [0x3b] = SSE41_OP(pminud){ { ((void*)0), gen_helper_pminud_xmm }, (1 << 19) },
2938 [0x3c] = SSE41_OP(pmaxsb){ { ((void*)0), gen_helper_pmaxsb_xmm }, (1 << 19) },
2939 [0x3d] = SSE41_OP(pmaxsd){ { ((void*)0), gen_helper_pmaxsd_xmm }, (1 << 19) },
2940 [0x3e] = SSE41_OP(pmaxuw){ { ((void*)0), gen_helper_pmaxuw_xmm }, (1 << 19) },
2941 [0x3f] = SSE41_OP(pmaxud){ { ((void*)0), gen_helper_pmaxud_xmm }, (1 << 19) },
2942 [0x40] = SSE41_OP(pmulld){ { ((void*)0), gen_helper_pmulld_xmm }, (1 << 19) },
2943 [0x41] = SSE41_OP(phminposuw){ { ((void*)0), gen_helper_phminposuw_xmm }, (1 << 19) },
2944 [0xdb] = AESNI_OP(aesimc){ { ((void*)0), gen_helper_aesimc_xmm }, (1 << 25) },
2945 [0xdc] = AESNI_OP(aesenc){ { ((void*)0), gen_helper_aesenc_xmm }, (1 << 25) },
2946 [0xdd] = AESNI_OP(aesenclast){ { ((void*)0), gen_helper_aesenclast_xmm }, (1 << 25) },
2947 [0xde] = AESNI_OP(aesdec){ { ((void*)0), gen_helper_aesdec_xmm }, (1 << 25) },
2948 [0xdf] = AESNI_OP(aesdeclast){ { ((void*)0), gen_helper_aesdeclast_xmm }, (1 << 25) },
2949};
2950
2951static const struct SSEOpHelper_eppi sse_op_table7[256] = {
2952 [0x08] = SSE41_OP(roundps){ { ((void*)0), gen_helper_roundps_xmm }, (1 << 19) },
2953 [0x09] = SSE41_OP(roundpd){ { ((void*)0), gen_helper_roundpd_xmm }, (1 << 19) },
2954 [0x0a] = SSE41_OP(roundss){ { ((void*)0), gen_helper_roundss_xmm }, (1 << 19) },
2955 [0x0b] = SSE41_OP(roundsd){ { ((void*)0), gen_helper_roundsd_xmm }, (1 << 19) },
2956 [0x0c] = SSE41_OP(blendps){ { ((void*)0), gen_helper_blendps_xmm }, (1 << 19) },
2957 [0x0d] = SSE41_OP(blendpd){ { ((void*)0), gen_helper_blendpd_xmm }, (1 << 19) },
2958 [0x0e] = SSE41_OP(pblendw){ { ((void*)0), gen_helper_pblendw_xmm }, (1 << 19) },
2959 [0x0f] = SSSE3_OP(palignr){ { gen_helper_palignr_mmx, gen_helper_palignr_xmm }, (1 <<
9) }
,
2960 [0x14] = SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) }, /* pextrb */
2961 [0x15] = SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) }, /* pextrw */
2962 [0x16] = SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) }, /* pextrd/pextrq */
2963 [0x17] = SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) }, /* extractps */
2964 [0x20] = SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) }, /* pinsrb */
2965 [0x21] = SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) }, /* insertps */
2966 [0x22] = SSE41_SPECIAL{ { ((void*)0), ((void *)1) }, (1 << 19) }, /* pinsrd/pinsrq */
2967 [0x40] = SSE41_OP(dpps){ { ((void*)0), gen_helper_dpps_xmm }, (1 << 19) },
2968 [0x41] = SSE41_OP(dppd){ { ((void*)0), gen_helper_dppd_xmm }, (1 << 19) },
2969 [0x42] = SSE41_OP(mpsadbw){ { ((void*)0), gen_helper_mpsadbw_xmm }, (1 << 19) },
2970 [0x44] = PCLMULQDQ_OP(pclmulqdq){ { ((void*)0), gen_helper_pclmulqdq_xmm }, (1 << 1) },
2971 [0x60] = SSE42_OP(pcmpestrm){ { ((void*)0), gen_helper_pcmpestrm_xmm }, (1 << 20) },
2972 [0x61] = SSE42_OP(pcmpestri){ { ((void*)0), gen_helper_pcmpestri_xmm }, (1 << 20) },
2973 [0x62] = SSE42_OP(pcmpistrm){ { ((void*)0), gen_helper_pcmpistrm_xmm }, (1 << 20) },
2974 [0x63] = SSE42_OP(pcmpistri){ { ((void*)0), gen_helper_pcmpistri_xmm }, (1 << 20) },
2975 [0xdf] = AESNI_OP(aeskeygenassist){ { ((void*)0), gen_helper_aeskeygenassist_xmm }, (1 <<
25) }
,
2976};
2977
2978static void gen_sse(CPUX86State *env, DisasContext *s, int b,
2979 target_ulong pc_start, int rex_r)
2980{
2981 int b1, op1_offset, op2_offset, is_xmm, val;
2982 int modrm, mod, rm, reg;
2983 SSEFunc_0_epp sse_fn_epp;
2984 SSEFunc_0_eppi sse_fn_eppi;
2985 SSEFunc_0_ppi sse_fn_ppi;
2986 SSEFunc_0_eppt sse_fn_eppt;
2987 TCGMemOp ot;
2988
2989 b &= 0xff;
2990 if (s->prefix & PREFIX_DATA0x08)
2991 b1 = 1;
2992 else if (s->prefix & PREFIX_REPZ0x01)
2993 b1 = 2;
2994 else if (s->prefix & PREFIX_REPNZ0x02)
2995 b1 = 3;
2996 else
2997 b1 = 0;
2998 sse_fn_epp = sse_op_table1[b][b1];
2999 if (!sse_fn_epp) {
3000 goto illegal_op;
3001 }
3002 if ((b <= 0x5f && b >= 0x10) || b == 0xc6 || b == 0xc2) {
3003 is_xmm = 1;
3004 } else {
3005 if (b1 == 0) {
3006 /* MMX case */
3007 is_xmm = 0;
3008 } else {
3009 is_xmm = 1;
3010 }
3011 }
3012 /* simple MMX/SSE operation */
3013 if (s->flags & HF_TS_MASK(1 << 11)) {
3014 gen_exception(s, EXCP07_PREX7, pc_start - s->cs_base);
3015 return;
3016 }
3017 if (s->flags & HF_EM_MASK(1 << 10)) {
3018 illegal_op:
3019 gen_exception(s, EXCP06_ILLOP6, pc_start - s->cs_base);
3020 return;
3021 }
3022 if (is_xmm && !(s->flags & HF_OSFXSR_MASK(1 << 22)))
3023 if ((b != 0x38 && b != 0x3a) || (s->prefix & PREFIX_DATA0x08))
3024 goto illegal_op;
3025 if (b == 0x0e) {
3026 if (!(s->cpuid_ext2_features & CPUID_EXT2_3DNOW(1 << 31)))
3027 goto illegal_op;
3028 /* femms */
3029 gen_helper_emms(cpu_env);
3030 return;
3031 }
3032 if (b == 0x77) {
3033 /* emms */
3034 gen_helper_emms(cpu_env);
3035 return;
3036 }
3037 /* prepare MMX state (XXX: optimize by storing fptt and fptags in
3038 the static cpu state) */
3039 if (!is_xmm) {
3040 gen_helper_enter_mmx(cpu_env);
3041 }
3042
3043 modrm = cpu_ldub_code(env, s->pc++);
3044 reg = ((modrm >> 3) & 7);
3045 if (is_xmm)
3046 reg |= rex_r;
3047 mod = (modrm >> 6) & 3;
3048 if (sse_fn_epp == SSE_SPECIAL((void *)1)) {
3049 b |= (b1 << 8);
3050 switch(b) {
3051 case 0x0e7: /* movntq */
3052 if (mod == 3)
3053 goto illegal_op;
3054 gen_lea_modrm(env, s, modrm);
3055 gen_stq_env_A0(s, offsetof(CPUX86State, fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx));
3056 break;
3057 case 0x1e7: /* movntdq */
3058 case 0x02b: /* movntps */
3059 case 0x12b: /* movntps */
3060 if (mod == 3)
3061 goto illegal_op;
3062 gen_lea_modrm(env, s, modrm);
3063 gen_sto_env_A0(s, offsetof(CPUX86State, xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]));
3064 break;
3065 case 0x3f0: /* lddqu */
3066 if (mod == 3)
3067 goto illegal_op;
3068 gen_lea_modrm(env, s, modrm);
3069 gen_ldo_env_A0(s, offsetof(CPUX86State, xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]));
3070 break;
3071 case 0x22b: /* movntss */
3072 case 0x32b: /* movntsd */
3073 if (mod == 3)
3074 goto illegal_op;
3075 gen_lea_modrm(env, s, modrm);
3076 if (b1 & 1) {
3077 gen_stq_env_A0(s, offsetof(CPUX86State, xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]));
3078 } else {
3079 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0])
3080 xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]));
3081 gen_op_st_v(s, MO_32, cpu_T[0], cpu_A0);
3082 }
3083 break;
3084 case 0x6e: /* movd mm, ea */
3085#ifdef TARGET_X86_64
3086 if (s->dflag == MO_64) {
3087 gen_ldst_modrm(env, s, modrm, MO_64, OR_TMP0, 0);
3088 tcg_gen_st_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx));
3089 } else
3090#endif
3091 {
3092 gen_ldst_modrm(env, s, modrm, MO_32, OR_TMP0, 0);
3093 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, fpregs[reg].mmx)))
3094 offsetof(CPUX86State,fpregs[reg].mmx))tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, fpregs[reg].mmx)))
;
3095 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
3096 gen_helper_movl_mm_T0_mmx(cpu_ptr0, cpu_tmp2_i32);
3097 }
3098 break;
3099 case 0x16e: /* movd xmm, ea */
3100#ifdef TARGET_X86_64
3101 if (s->dflag == MO_64) {
3102 gen_ldst_modrm(env, s, modrm, MO_64, OR_TMP0, 0);
3103 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[reg])))
3104 offsetof(CPUX86State,xmm_regs[reg]))tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[reg])))
;
3105 gen_helper_movq_mm_T0_xmm(cpu_ptr0, cpu_T[0]);
3106 } else
3107#endif
3108 {
3109 gen_ldst_modrm(env, s, modrm, MO_32, OR_TMP0, 0);
3110 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[reg])))
3111 offsetof(CPUX86State,xmm_regs[reg]))tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[reg])))
;
3112 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
3113 gen_helper_movl_mm_T0_xmm(cpu_ptr0, cpu_tmp2_i32);
3114 }
3115 break;
3116 case 0x6f: /* movq mm, ea */
3117 if (mod != 3) {
3118 gen_lea_modrm(env, s, modrm);
3119 gen_ldq_env_A0(s, offsetof(CPUX86State, fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx));
3120 } else {
3121 rm = (modrm & 7);
3122 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env,
3123 offsetof(CPUX86State,fpregs[rm].mmx)__builtin_offsetof(CPUX86State, fpregs[rm].mmx));
3124 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env,
3125 offsetof(CPUX86State,fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx));
3126 }
3127 break;
3128 case 0x010: /* movups */
3129 case 0x110: /* movupd */
3130 case 0x028: /* movaps */
3131 case 0x128: /* movapd */
3132 case 0x16f: /* movdqa xmm, ea */
3133 case 0x26f: /* movdqu xmm, ea */
3134 if (mod != 3) {
3135 gen_lea_modrm(env, s, modrm);
3136 gen_ldo_env_A0(s, offsetof(CPUX86State, xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]));
3137 } else {
3138 rm = (modrm & 7) | REX_B(s)0;
3139 gen_op_movo(offsetof(CPUX86State,xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]),
3140 offsetof(CPUX86State,xmm_regs[rm])__builtin_offsetof(CPUX86State, xmm_regs[rm]));
3141 }
3142 break;
3143 case 0x210: /* movss xmm, ea */
3144 if (mod != 3) {
3145 gen_lea_modrm(env, s, modrm);
3146 gen_op_ld_v(s, MO_32, cpu_T[0], cpu_A0);
3147 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]));
3148 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], 0);
3149 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[1]));
3150 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(2))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[2]));
3151 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[3]));
3152 } else {
3153 rm = (modrm & 7) | REX_B(s)0;
3154 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]),
3155 offsetof(CPUX86State,xmm_regs[rm].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._l[0]));
3156 }
3157 break;
3158 case 0x310: /* movsd xmm, ea */
3159 if (mod != 3) {
3160 gen_lea_modrm(env, s, modrm);
3161 gen_ldq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0])
3162 xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3163 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], 0);
3164 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(2))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[2]));
3165 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[3]));
3166 } else {
3167 rm = (modrm & 7) | REX_B(s)0;
3168 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]),
3169 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[0]));
3170 }
3171 break;
3172 case 0x012: /* movlps */
3173 case 0x112: /* movlpd */
3174 if (mod != 3) {
3175 gen_lea_modrm(env, s, modrm);
3176 gen_ldq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0])
3177 xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3178 } else {
3179 /* movhlps */
3180 rm = (modrm & 7) | REX_B(s)0;
3181 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]),
3182 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(1))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[1]));
3183 }
3184 break;
3185 case 0x212: /* movsldup */
3186 if (mod != 3) {
3187 gen_lea_modrm(env, s, modrm);
3188 gen_ldo_env_A0(s, offsetof(CPUX86State, xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]));
3189 } else {
3190 rm = (modrm & 7) | REX_B(s)0;
3191 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]),
3192 offsetof(CPUX86State,xmm_regs[rm].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._l[0]));
3193 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(2))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[2]),
3194 offsetof(CPUX86State,xmm_regs[rm].XMM_L(2))__builtin_offsetof(CPUX86State, xmm_regs[rm]._l[2]));
3195 }
3196 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[1]),
3197 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]));
3198 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[3]),
3199 offsetof(CPUX86State,xmm_regs[reg].XMM_L(2))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[2]));
3200 break;
3201 case 0x312: /* movddup */
3202 if (mod != 3) {
3203 gen_lea_modrm(env, s, modrm);
3204 gen_ldq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0])
3205 xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3206 } else {
3207 rm = (modrm & 7) | REX_B(s)0;
3208 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]),
3209 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[0]));
3210 }
3211 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[1]),
3212 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3213 break;
3214 case 0x016: /* movhps */
3215 case 0x116: /* movhpd */
3216 if (mod != 3) {
3217 gen_lea_modrm(env, s, modrm);
3218 gen_ldq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[1])
3219 xmm_regs[reg].XMM_Q(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[1]));
3220 } else {
3221 /* movlhps */
3222 rm = (modrm & 7) | REX_B(s)0;
3223 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[1]),
3224 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[0]));
3225 }
3226 break;
3227 case 0x216: /* movshdup */
3228 if (mod != 3) {
3229 gen_lea_modrm(env, s, modrm);
3230 gen_ldo_env_A0(s, offsetof(CPUX86State, xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]));
3231 } else {
3232 rm = (modrm & 7) | REX_B(s)0;
3233 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[1]),
3234 offsetof(CPUX86State,xmm_regs[rm].XMM_L(1))__builtin_offsetof(CPUX86State, xmm_regs[rm]._l[1]));
3235 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[3]),
3236 offsetof(CPUX86State,xmm_regs[rm].XMM_L(3))__builtin_offsetof(CPUX86State, xmm_regs[rm]._l[3]));
3237 }
3238 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]),
3239 offsetof(CPUX86State,xmm_regs[reg].XMM_L(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[1]));
3240 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(2))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[2]),
3241 offsetof(CPUX86State,xmm_regs[reg].XMM_L(3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[3]));
3242 break;
3243 case 0x178:
3244 case 0x378:
3245 {
3246 int bit_index, field_length;
3247
3248 if (b1 == 1 && reg != 0)
3249 goto illegal_op;
3250 field_length = cpu_ldub_code(env, s->pc++) & 0x3F;
3251 bit_index = cpu_ldub_code(env, s->pc++) & 0x3F;
3252 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[reg])))
3253 offsetof(CPUX86State,xmm_regs[reg]))tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[reg])))
;
3254 if (b1 == 1)
3255 gen_helper_extrq_i(cpu_env, cpu_ptr0,
3256 tcg_const_i32(bit_index),
3257 tcg_const_i32(field_length));
3258 else
3259 gen_helper_insertq_i(cpu_env, cpu_ptr0,
3260 tcg_const_i32(bit_index),
3261 tcg_const_i32(field_length));
3262 }
3263 break;
3264 case 0x7e: /* movd ea, mm */
3265#ifdef TARGET_X86_64
3266 if (s->dflag == MO_64) {
3267 tcg_gen_ld_i64(cpu_T[0], cpu_env,
3268 offsetof(CPUX86State,fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx));
3269 gen_ldst_modrm(env, s, modrm, MO_64, OR_TMP0, 1);
3270 } else
3271#endif
3272 {
3273 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env,
3274 offsetof(CPUX86State,fpregs[reg].mmx.MMX_L(0))__builtin_offsetof(CPUX86State, fpregs[reg].mmx._l[0]));
3275 gen_ldst_modrm(env, s, modrm, MO_32, OR_TMP0, 1);
3276 }
3277 break;
3278 case 0x17e: /* movd ea, xmm */
3279#ifdef TARGET_X86_64
3280 if (s->dflag == MO_64) {
3281 tcg_gen_ld_i64(cpu_T[0], cpu_env,
3282 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3283 gen_ldst_modrm(env, s, modrm, MO_64, OR_TMP0, 1);
3284 } else
3285#endif
3286 {
3287 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env,
3288 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]));
3289 gen_ldst_modrm(env, s, modrm, MO_32, OR_TMP0, 1);
3290 }
3291 break;
3292 case 0x27e: /* movq xmm, ea */
3293 if (mod != 3) {
3294 gen_lea_modrm(env, s, modrm);
3295 gen_ldq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0])
3296 xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3297 } else {
3298 rm = (modrm & 7) | REX_B(s)0;
3299 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]),
3300 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[0]));
3301 }
3302 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[1]));
3303 break;
3304 case 0x7f: /* movq ea, mm */
3305 if (mod != 3) {
3306 gen_lea_modrm(env, s, modrm);
3307 gen_stq_env_A0(s, offsetof(CPUX86State, fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx));
3308 } else {
3309 rm = (modrm & 7);
3310 gen_op_movq(offsetof(CPUX86State,fpregs[rm].mmx)__builtin_offsetof(CPUX86State, fpregs[rm].mmx),
3311 offsetof(CPUX86State,fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx));
3312 }
3313 break;
3314 case 0x011: /* movups */
3315 case 0x111: /* movupd */
3316 case 0x029: /* movaps */
3317 case 0x129: /* movapd */
3318 case 0x17f: /* movdqa ea, xmm */
3319 case 0x27f: /* movdqu ea, xmm */
3320 if (mod != 3) {
3321 gen_lea_modrm(env, s, modrm);
3322 gen_sto_env_A0(s, offsetof(CPUX86State, xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]));
3323 } else {
3324 rm = (modrm & 7) | REX_B(s)0;
3325 gen_op_movo(offsetof(CPUX86State,xmm_regs[rm])__builtin_offsetof(CPUX86State, xmm_regs[rm]),
3326 offsetof(CPUX86State,xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]));
3327 }
3328 break;
3329 case 0x211: /* movss ea, xmm */
3330 if (mod != 3) {
3331 gen_lea_modrm(env, s, modrm);
3332 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]));
3333 gen_op_st_v(s, MO_32, cpu_T[0], cpu_A0);
3334 } else {
3335 rm = (modrm & 7) | REX_B(s)0;
3336 gen_op_movl(offsetof(CPUX86State,xmm_regs[rm].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._l[0]),
3337 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]));
3338 }
3339 break;
3340 case 0x311: /* movsd ea, xmm */
3341 if (mod != 3) {
3342 gen_lea_modrm(env, s, modrm);
3343 gen_stq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0])
3344 xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3345 } else {
3346 rm = (modrm & 7) | REX_B(s)0;
3347 gen_op_movq(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[0]),
3348 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3349 }
3350 break;
3351 case 0x013: /* movlps */
3352 case 0x113: /* movlpd */
3353 if (mod != 3) {
3354 gen_lea_modrm(env, s, modrm);
3355 gen_stq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0])
3356 xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3357 } else {
3358 goto illegal_op;
3359 }
3360 break;
3361 case 0x017: /* movhps */
3362 case 0x117: /* movhpd */
3363 if (mod != 3) {
3364 gen_lea_modrm(env, s, modrm);
3365 gen_stq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[1])
3366 xmm_regs[reg].XMM_Q(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[1]));
3367 } else {
3368 goto illegal_op;
3369 }
3370 break;
3371 case 0x71: /* shift mm, im */
3372 case 0x72:
3373 case 0x73:
3374 case 0x171: /* shift xmm, im */
3375 case 0x172:
3376 case 0x173:
3377 if (b1 >= 2) {
3378 goto illegal_op;
3379 }
3380 val = cpu_ldub_code(env, s->pc++);
3381 if (is_xmm) {
3382 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], val);
3383 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0))__builtin_offsetof(CPUX86State, xmm_t0._l[0]));
3384 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], 0);
3385 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(1))__builtin_offsetof(CPUX86State, xmm_t0._l[1]));
3386 op1_offset = offsetof(CPUX86State,xmm_t0)__builtin_offsetof(CPUX86State, xmm_t0);
3387 } else {
3388 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], val);
3389 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,mmx_t0.MMX_L(0))__builtin_offsetof(CPUX86State, mmx_t0._l[0]));
3390 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], 0);
3391 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,mmx_t0.MMX_L(1))__builtin_offsetof(CPUX86State, mmx_t0._l[1]));
3392 op1_offset = offsetof(CPUX86State,mmx_t0)__builtin_offsetof(CPUX86State, mmx_t0);
3393 }
3394 sse_fn_epp = sse_op_table2[((b - 1) & 3) * 8 +
3395 (((modrm >> 3)) & 7)][b1];
3396 if (!sse_fn_epp) {
3397 goto illegal_op;
3398 }
3399 if (is_xmm) {
3400 rm = (modrm & 7) | REX_B(s)0;
3401 op2_offset = offsetof(CPUX86State,xmm_regs[rm])__builtin_offsetof(CPUX86State, xmm_regs[rm]);
3402 } else {
3403 rm = (modrm & 7);
3404 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx)__builtin_offsetof(CPUX86State, fpregs[rm].mmx);
3405 }
3406 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
3407 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
3408 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
3409 break;
3410 case 0x050: /* movmskps */
3411 rm = (modrm & 7) | REX_B(s)0;
3412 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[rm])))
3413 offsetof(CPUX86State,xmm_regs[rm]))tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[rm])))
;
3414 gen_helper_movmskps(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3415 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[reg], cpu_tmp2_i32);
3416 break;
3417 case 0x150: /* movmskpd */
3418 rm = (modrm & 7) | REX_B(s)0;
3419 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[rm])))
3420 offsetof(CPUX86State,xmm_regs[rm]))tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[rm])))
;
3421 gen_helper_movmskpd(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3422 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[reg], cpu_tmp2_i32);
3423 break;
3424 case 0x02a: /* cvtpi2ps */
3425 case 0x12a: /* cvtpi2pd */
3426 gen_helper_enter_mmx(cpu_env);
3427 if (mod != 3) {
3428 gen_lea_modrm(env, s, modrm);
3429 op2_offset = offsetof(CPUX86State,mmx_t0)__builtin_offsetof(CPUX86State, mmx_t0);
3430 gen_ldq_env_A0(s, op2_offset);
3431 } else {
3432 rm = (modrm & 7);
3433 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx)__builtin_offsetof(CPUX86State, fpregs[rm].mmx);
3434 }
3435 op1_offset = offsetof(CPUX86State,xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]);
3436 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
3437 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
3438 switch(b >> 8) {
3439 case 0x0:
3440 gen_helper_cvtpi2ps(cpu_env, cpu_ptr0, cpu_ptr1);
3441 break;
3442 default:
3443 case 0x1:
3444 gen_helper_cvtpi2pd(cpu_env, cpu_ptr0, cpu_ptr1);
3445 break;
3446 }
3447 break;
3448 case 0x22a: /* cvtsi2ss */
3449 case 0x32a: /* cvtsi2sd */
3450 ot = mo_64_32(s->dflag);
3451 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3452 op1_offset = offsetof(CPUX86State,xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]);
3453 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
3454 if (ot == MO_32) {
3455 SSEFunc_0_epi sse_fn_epi = sse_op_table3ai[(b >> 8) & 1];
3456 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
3457 sse_fn_epi(cpu_env, cpu_ptr0, cpu_tmp2_i32);
3458 } else {
3459#ifdef TARGET_X86_64
3460 SSEFunc_0_epl sse_fn_epl = sse_op_table3aq[(b >> 8) & 1];
3461 sse_fn_epl(cpu_env, cpu_ptr0, cpu_T[0]);
3462#else
3463 goto illegal_op;
3464#endif
3465 }
3466 break;
3467 case 0x02c: /* cvttps2pi */
3468 case 0x12c: /* cvttpd2pi */
3469 case 0x02d: /* cvtps2pi */
3470 case 0x12d: /* cvtpd2pi */
3471 gen_helper_enter_mmx(cpu_env);
3472 if (mod != 3) {
3473 gen_lea_modrm(env, s, modrm);
3474 op2_offset = offsetof(CPUX86State,xmm_t0)__builtin_offsetof(CPUX86State, xmm_t0);
3475 gen_ldo_env_A0(s, op2_offset);
3476 } else {
3477 rm = (modrm & 7) | REX_B(s)0;
3478 op2_offset = offsetof(CPUX86State,xmm_regs[rm])__builtin_offsetof(CPUX86State, xmm_regs[rm]);
3479 }
3480 op1_offset = offsetof(CPUX86State,fpregs[reg & 7].mmx)__builtin_offsetof(CPUX86State, fpregs[reg & 7].mmx);
3481 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
3482 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
3483 switch(b) {
3484 case 0x02c:
3485 gen_helper_cvttps2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3486 break;
3487 case 0x12c:
3488 gen_helper_cvttpd2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3489 break;
3490 case 0x02d:
3491 gen_helper_cvtps2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3492 break;
3493 case 0x12d:
3494 gen_helper_cvtpd2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3495 break;
3496 }
3497 break;
3498 case 0x22c: /* cvttss2si */
3499 case 0x32c: /* cvttsd2si */
3500 case 0x22d: /* cvtss2si */
3501 case 0x32d: /* cvtsd2si */
3502 ot = mo_64_32(s->dflag);
3503 if (mod != 3) {
3504 gen_lea_modrm(env, s, modrm);
3505 if ((b >> 8) & 1) {
3506 gen_ldq_env_A0(s, offsetof(CPUX86State, xmm_t0.XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_t0._q[0]));
3507 } else {
3508 gen_op_ld_v(s, MO_32, cpu_T[0], cpu_A0);
3509 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0))__builtin_offsetof(CPUX86State, xmm_t0._l[0]));
3510 }
3511 op2_offset = offsetof(CPUX86State,xmm_t0)__builtin_offsetof(CPUX86State, xmm_t0);
3512 } else {
3513 rm = (modrm & 7) | REX_B(s)0;
3514 op2_offset = offsetof(CPUX86State,xmm_regs[rm])__builtin_offsetof(CPUX86State, xmm_regs[rm]);
3515 }
3516 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
3517 if (ot == MO_32) {
3518 SSEFunc_i_ep sse_fn_i_ep =
3519 sse_op_table3bi[((b >> 7) & 2) | (b & 1)];
3520 sse_fn_i_ep(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3521 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_T[0], cpu_tmp2_i32);
3522 } else {
3523#ifdef TARGET_X86_64
3524 SSEFunc_l_ep sse_fn_l_ep =
3525 sse_op_table3bq[((b >> 7) & 2) | (b & 1)];
3526 sse_fn_l_ep(cpu_T[0], cpu_env, cpu_ptr0);
3527#else
3528 goto illegal_op;
3529#endif
3530 }
3531 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
3532 break;
3533 case 0xc4: /* pinsrw */
3534 case 0x1c4:
3535 s->rip_offset = 1;
3536 gen_ldst_modrm(env, s, modrm, MO_16, OR_TMP0, 0);
3537 val = cpu_ldub_code(env, s->pc++);
3538 if (b1) {
3539 val &= 7;
3540 tcg_gen_st16_tltcg_gen_st16_i32(cpu_T[0], cpu_env,
3541 offsetof(CPUX86State,xmm_regs[reg].XMM_W(val))__builtin_offsetof(CPUX86State, xmm_regs[reg]._w[val]));
3542 } else {
3543 val &= 3;
3544 tcg_gen_st16_tltcg_gen_st16_i32(cpu_T[0], cpu_env,
3545 offsetof(CPUX86State,fpregs[reg].mmx.MMX_W(val))__builtin_offsetof(CPUX86State, fpregs[reg].mmx._w[val]));
3546 }
3547 break;
3548 case 0xc5: /* pextrw */
3549 case 0x1c5:
3550 if (mod != 3)
3551 goto illegal_op;
3552 ot = mo_64_32(s->dflag);
3553 val = cpu_ldub_code(env, s->pc++);
3554 if (b1) {
3555 val &= 7;
3556 rm = (modrm & 7) | REX_B(s)0;
3557 tcg_gen_ld16u_tltcg_gen_ld16u_i32(cpu_T[0], cpu_env,
3558 offsetof(CPUX86State,xmm_regs[rm].XMM_W(val))__builtin_offsetof(CPUX86State, xmm_regs[rm]._w[val]));
3559 } else {
3560 val &= 3;
3561 rm = (modrm & 7);
3562 tcg_gen_ld16u_tltcg_gen_ld16u_i32(cpu_T[0], cpu_env,
3563 offsetof(CPUX86State,fpregs[rm].mmx.MMX_W(val))__builtin_offsetof(CPUX86State, fpregs[rm].mmx._w[val]));
3564 }
3565 reg = ((modrm >> 3) & 7) | rex_r;
3566 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
3567 break;
3568 case 0x1d6: /* movq ea, xmm */
3569 if (mod != 3) {
3570 gen_lea_modrm(env, s, modrm);
3571 gen_stq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0])
3572 xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3573 } else {
3574 rm = (modrm & 7) | REX_B(s)0;
3575 gen_op_movq(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[0]),
3576 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]));
3577 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(1))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[1]));
3578 }
3579 break;
3580 case 0x2d6: /* movq2dq */
3581 gen_helper_enter_mmx(cpu_env);
3582 rm = (modrm & 7);
3583 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[0]),
3584 offsetof(CPUX86State,fpregs[rm].mmx)__builtin_offsetof(CPUX86State, fpregs[rm].mmx));
3585 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[1]));
3586 break;
3587 case 0x3d6: /* movdq2q */
3588 gen_helper_enter_mmx(cpu_env);
3589 rm = (modrm & 7) | REX_B(s)0;
3590 gen_op_movq(offsetof(CPUX86State,fpregs[reg & 7].mmx)__builtin_offsetof(CPUX86State, fpregs[reg & 7].mmx),
3591 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0))__builtin_offsetof(CPUX86State, xmm_regs[rm]._q[0]));
3592 break;
3593 case 0xd7: /* pmovmskb */
3594 case 0x1d7:
3595 if (mod != 3)
3596 goto illegal_op;
3597 if (b1) {
3598 rm = (modrm & 7) | REX_B(s)0;
3599 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, offsetof(CPUX86State,xmm_regs[rm]))tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, xmm_regs[rm])))
;
3600 gen_helper_pmovmskb_xmm(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3601 } else {
3602 rm = (modrm & 7);
3603 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, offsetof(CPUX86State,fpregs[rm].mmx))tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (__builtin_offsetof
(CPUX86State, fpregs[rm].mmx)))
;
3604 gen_helper_pmovmskb_mmx(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3605 }
3606 reg = ((modrm >> 3) & 7) | rex_r;
3607 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[reg], cpu_tmp2_i32);
3608 break;
3609
3610 case 0x138:
3611 case 0x038:
3612 b = modrm;
3613 if ((b & 0xf0) == 0xf0) {
3614 goto do_0f_38_fx;
3615 }
3616 modrm = cpu_ldub_code(env, s->pc++);
3617 rm = modrm & 7;
3618 reg = ((modrm >> 3) & 7) | rex_r;
3619 mod = (modrm >> 6) & 3;
3620 if (b1 >= 2) {
3621 goto illegal_op;
3622 }
3623
3624 sse_fn_epp = sse_op_table6[b].op[b1];
3625 if (!sse_fn_epp) {
3626 goto illegal_op;
3627 }
3628 if (!(s->cpuid_ext_features & sse_op_table6[b].ext_mask))
3629 goto illegal_op;
3630
3631 if (b1) {
3632 op1_offset = offsetof(CPUX86State,xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]);
3633 if (mod == 3) {
3634 op2_offset = offsetof(CPUX86State,xmm_regs[rm | REX_B(s)])__builtin_offsetof(CPUX86State, xmm_regs[rm | 0]);
3635 } else {
3636 op2_offset = offsetof(CPUX86State,xmm_t0)__builtin_offsetof(CPUX86State, xmm_t0);
3637 gen_lea_modrm(env, s, modrm);
3638 switch (b) {
3639 case 0x20: case 0x30: /* pmovsxbw, pmovzxbw */
3640 case 0x23: case 0x33: /* pmovsxwd, pmovzxwd */
3641 case 0x25: case 0x35: /* pmovsxdq, pmovzxdq */
3642 gen_ldq_env_A0(s, op2_offset +
3643 offsetof(XMMReg, XMM_Q(0))__builtin_offsetof(XMMReg, _q[0]));
3644 break;
3645 case 0x21: case 0x31: /* pmovsxbd, pmovzxbd */
3646 case 0x24: case 0x34: /* pmovsxwq, pmovzxwq */
3647 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
3648 s->mem_index, MO_LEUL);
3649 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, op2_offset +
3650 offsetof(XMMReg, XMM_L(0))__builtin_offsetof(XMMReg, _l[0]));
3651 break;
3652 case 0x22: case 0x32: /* pmovsxbq, pmovzxbq */
3653 tcg_gen_qemu_ld_tltcg_gen_qemu_ld_i32(cpu_tmp0, cpu_A0,
3654 s->mem_index, MO_LEUW);
3655 tcg_gen_st16_tltcg_gen_st16_i32(cpu_tmp0, cpu_env, op2_offset +
3656 offsetof(XMMReg, XMM_W(0))__builtin_offsetof(XMMReg, _w[0]));
3657 break;
3658 case 0x2a: /* movntqda */
3659 gen_ldo_env_A0(s, op1_offset);
3660 return;
3661 default:
3662 gen_ldo_env_A0(s, op2_offset);
3663 }
3664 }
3665 } else {
3666 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx);
3667 if (mod == 3) {
3668 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx)__builtin_offsetof(CPUX86State, fpregs[rm].mmx);
3669 } else {
3670 op2_offset = offsetof(CPUX86State,mmx_t0)__builtin_offsetof(CPUX86State, mmx_t0);
3671 gen_lea_modrm(env, s, modrm);
3672 gen_ldq_env_A0(s, op2_offset);
3673 }
3674 }
3675 if (sse_fn_epp == SSE_SPECIAL((void *)1)) {
3676 goto illegal_op;
3677 }
3678
3679 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
3680 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
3681 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
3682
3683 if (b == 0x17) {
3684 set_cc_op(s, CC_OP_EFLAGS);
3685 }
3686 break;
3687
3688 case 0x238:
3689 case 0x338:
3690 do_0f_38_fx:
3691 /* Various integer extensions at 0f 38 f[0-f]. */
3692 b = modrm | (b1 << 8);
3693 modrm = cpu_ldub_code(env, s->pc++);
3694 reg = ((modrm >> 3) & 7) | rex_r;
3695
3696 switch (b) {
3697 case 0x3f0: /* crc32 Gd,Eb */
3698 case 0x3f1: /* crc32 Gd,Ey */
3699 do_crc32:
3700 if (!(s->cpuid_ext_features & CPUID_EXT_SSE42(1 << 20))) {
3701 goto illegal_op;
3702 }
3703 if ((b & 0xff) == 0xf0) {
3704 ot = MO_8;
3705 } else if (s->dflag != MO_64) {
3706 ot = (s->prefix & PREFIX_DATA0x08 ? MO_16 : MO_32);
3707 } else {
3708 ot = MO_64;
3709 }
3710
3711 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_regs[reg]);
3712 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3713 gen_helper_crc32(cpu_T[0], cpu_tmp2_i32,
3714 cpu_T[0], tcg_const_i32(8 << ot));
3715
3716 ot = mo_64_32(s->dflag);
3717 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
3718 break;
3719
3720 case 0x1f0: /* crc32 or movbe */
3721 case 0x1f1:
3722 /* For these insns, the f3 prefix is supposed to have priority
3723 over the 66 prefix, but that's not what we implement above
3724 setting b1. */
3725 if (s->prefix & PREFIX_REPNZ0x02) {
3726 goto do_crc32;
3727 }
3728 /* FALLTHRU */
3729 case 0x0f0: /* movbe Gy,My */
3730 case 0x0f1: /* movbe My,Gy */
3731 if (!(s->cpuid_ext_features & CPUID_EXT_MOVBE(1 << 22))) {
3732 goto illegal_op;
3733 }
3734 if (s->dflag != MO_64) {
3735 ot = (s->prefix & PREFIX_DATA0x08 ? MO_16 : MO_32);
3736 } else {
3737 ot = MO_64;
3738 }
3739
3740 gen_lea_modrm(env, s, modrm);
3741 if ((b & 1) == 0) {
3742 tcg_gen_qemu_ld_tltcg_gen_qemu_ld_i32(cpu_T[0], cpu_A0,
3743 s->mem_index, ot | MO_BE);
3744 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
3745 } else {
3746 tcg_gen_qemu_st_tltcg_gen_qemu_st_i32(cpu_regs[reg], cpu_A0,
3747 s->mem_index, ot | MO_BE);
3748 }
3749 break;
3750
3751 case 0x0f2: /* andn Gy, By, Ey */
3752 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI1(1 << 3))
3753 || !(s->prefix & PREFIX_VEX0x20)
3754 || s->vex_l != 0) {
3755 goto illegal_op;
3756 }
3757 ot = mo_64_32(s->dflag);
3758 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3759 tcg_gen_andc_tltcg_gen_andc_i32(cpu_T[0], cpu_regs[s->vex_v], cpu_T[0]);
3760 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
3761 gen_op_update1_cc();
3762 set_cc_op(s, CC_OP_LOGICB + ot);
3763 break;
3764
3765 case 0x0f7: /* bextr Gy, Ey, By */
3766 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI1(1 << 3))
3767 || !(s->prefix & PREFIX_VEX0x20)
3768 || s->vex_l != 0) {
3769 goto illegal_op;
3770 }
3771 ot = mo_64_32(s->dflag);
3772 {
3773 TCGvTCGv_i32 bound, zero;
3774
3775 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3776 /* Extract START, and shift the operand.
3777 Shifts larger than operand size get zeros. */
3778 tcg_gen_ext8u_tltcg_gen_ext8u_i32(cpu_A0, cpu_regs[s->vex_v]);
3779 tcg_gen_shr_tltcg_gen_shr_i32(cpu_T[0], cpu_T[0], cpu_A0);
3780
3781 bound = tcg_const_tltcg_const_i32(ot == MO_64 ? 63 : 31);
3782 zero = tcg_const_tltcg_const_i32(0);
3783 tcg_gen_movcond_tltcg_gen_movcond_i32(TCG_COND_LEU, cpu_T[0], cpu_A0, bound,
3784 cpu_T[0], zero);
3785 tcg_temp_freetcg_temp_free_i32(zero);
3786
3787 /* Extract the LEN into a mask. Lengths larger than
3788 operand size get all ones. */
3789 tcg_gen_shri_tltcg_gen_shri_i32(cpu_A0, cpu_regs[s->vex_v], 8);
3790 tcg_gen_ext8u_tltcg_gen_ext8u_i32(cpu_A0, cpu_A0);
3791 tcg_gen_movcond_tltcg_gen_movcond_i32(TCG_COND_LEU, cpu_A0, cpu_A0, bound,
3792 cpu_A0, bound);
3793 tcg_temp_freetcg_temp_free_i32(bound);
3794 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], 1);
3795 tcg_gen_shl_tltcg_gen_shl_i32(cpu_T[1], cpu_T[1], cpu_A0);
3796 tcg_gen_subi_tltcg_gen_subi_i32(cpu_T[1], cpu_T[1], 1);
3797 tcg_gen_and_tltcg_gen_and_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
3798
3799 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
3800 gen_op_update1_cc();
3801 set_cc_op(s, CC_OP_LOGICB + ot);
3802 }
3803 break;
3804
3805 case 0x0f5: /* bzhi Gy, Ey, By */
3806 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI2(1 << 8))
3807 || !(s->prefix & PREFIX_VEX0x20)
3808 || s->vex_l != 0) {
3809 goto illegal_op;
3810 }
3811 ot = mo_64_32(s->dflag);
3812 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3813 tcg_gen_ext8u_tltcg_gen_ext8u_i32(cpu_T[1], cpu_regs[s->vex_v]);
3814 {
3815 TCGvTCGv_i32 bound = tcg_const_tltcg_const_i32(ot == MO_64 ? 63 : 31);
3816 /* Note that since we're using BMILG (in order to get O
3817 cleared) we need to store the inverse into C. */
3818 tcg_gen_setcond_tltcg_gen_setcond_i32(TCG_COND_LT, cpu_cc_src,
3819 cpu_T[1], bound);
3820 tcg_gen_movcond_tltcg_gen_movcond_i32(TCG_COND_GT, cpu_T[1], cpu_T[1],
3821 bound, bound, cpu_T[1]);
3822 tcg_temp_freetcg_temp_free_i32(bound);
3823 }
3824 tcg_gen_movi_tltcg_gen_movi_i32(cpu_A0, -1);
3825 tcg_gen_shl_tltcg_gen_shl_i32(cpu_A0, cpu_A0, cpu_T[1]);
3826 tcg_gen_andc_tltcg_gen_andc_i32(cpu_T[0], cpu_T[0], cpu_A0);
3827 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
3828 gen_op_update1_cc();
3829 set_cc_op(s, CC_OP_BMILGB + ot);
3830 break;
3831
3832 case 0x3f6: /* mulx By, Gy, rdx, Ey */
3833 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI2(1 << 8))
3834 || !(s->prefix & PREFIX_VEX0x20)
3835 || s->vex_l != 0) {
3836 goto illegal_op;
3837 }
3838 ot = mo_64_32(s->dflag);
3839 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3840 switch (ot) {
3841 default:
3842 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
3843 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp3_i32, cpu_regs[R_EDX2]);
3844 tcg_gen_mulu2_i32(cpu_tmp2_i32, cpu_tmp3_i32,
3845 cpu_tmp2_i32, cpu_tmp3_i32);
3846 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[s->vex_v], cpu_tmp2_i32);
3847 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[reg], cpu_tmp3_i32);
3848 break;
3849#ifdef TARGET_X86_64
3850 case MO_64:
3851 tcg_gen_mulu2_i64(cpu_regs[s->vex_v], cpu_regs[reg],
3852 cpu_T[0], cpu_regs[R_EDX2]);
3853 break;
3854#endif
3855 }
3856 break;
3857
3858 case 0x3f5: /* pdep Gy, By, Ey */
3859 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI2(1 << 8))
3860 || !(s->prefix & PREFIX_VEX0x20)
3861 || s->vex_l != 0) {
3862 goto illegal_op;
3863 }
3864 ot = mo_64_32(s->dflag);
3865 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3866 /* Note that by zero-extending the mask operand, we
3867 automatically handle zero-extending the result. */
3868 if (ot == MO_64) {
3869 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[1], cpu_regs[s->vex_v]);
3870 } else {
3871 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_T[1], cpu_regs[s->vex_v]);
3872 }
3873 gen_helper_pdep(cpu_regs[reg], cpu_T[0], cpu_T[1]);
3874 break;
3875
3876 case 0x2f5: /* pext Gy, By, Ey */
3877 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI2(1 << 8))
3878 || !(s->prefix & PREFIX_VEX0x20)
3879 || s->vex_l != 0) {
3880 goto illegal_op;
3881 }
3882 ot = mo_64_32(s->dflag);
3883 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3884 /* Note that by zero-extending the mask operand, we
3885 automatically handle zero-extending the result. */
3886 if (ot == MO_64) {
3887 tcg_gen_mov_tltcg_gen_mov_i32(cpu_T[1], cpu_regs[s->vex_v]);
3888 } else {
3889 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_T[1], cpu_regs[s->vex_v]);
3890 }
3891 gen_helper_pext(cpu_regs[reg], cpu_T[0], cpu_T[1]);
3892 break;
3893
3894 case 0x1f6: /* adcx Gy, Ey */
3895 case 0x2f6: /* adox Gy, Ey */
3896 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_ADX(1 << 19))) {
3897 goto illegal_op;
3898 } else {
3899 TCGvTCGv_i32 carry_in, carry_out, zero;
3900 int end_op;
3901
3902 ot = mo_64_32(s->dflag);
3903 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3904
3905 /* Re-use the carry-out from a previous round. */
3906 TCGV_UNUSED(carry_in)carry_in = __extension__ ({ TCGv_i32 make_tcgv_tmp = {-1}; make_tcgv_tmp
;})
;
3907 carry_out = (b == 0x1f6 ? cpu_cc_dst : cpu_cc_src2);
3908 switch (s->cc_op) {
3909 case CC_OP_ADCX:
3910 if (b == 0x1f6) {
3911 carry_in = cpu_cc_dst;
3912 end_op = CC_OP_ADCX;
3913 } else {
3914 end_op = CC_OP_ADCOX;
3915 }
3916 break;
3917 case CC_OP_ADOX:
3918 if (b == 0x1f6) {
3919 end_op = CC_OP_ADCOX;
3920 } else {
3921 carry_in = cpu_cc_src2;
3922 end_op = CC_OP_ADOX;
3923 }
3924 break;
3925 case CC_OP_ADCOX:
3926 end_op = CC_OP_ADCOX;
3927 carry_in = carry_out;
3928 break;
3929 default:
3930 end_op = (b == 0x1f6 ? CC_OP_ADCX : CC_OP_ADOX);
3931 break;
3932 }
3933 /* If we can't reuse carry-out, get it out of EFLAGS. */
3934 if (TCGV_IS_UNUSED(carry_in)(((carry_in).i32) == -1)) {
3935 if (s->cc_op != CC_OP_ADCX && s->cc_op != CC_OP_ADOX) {
3936 gen_compute_eflags(s);
3937 }
3938 carry_in = cpu_tmp0;
3939 tcg_gen_shri_tltcg_gen_shri_i32(carry_in, cpu_cc_src,
3940 ctz32(b == 0x1f6 ? CC_C0x0001 : CC_O0x0800));
3941 tcg_gen_andi_tltcg_gen_andi_i32(carry_in, carry_in, 1);
3942 }
3943
3944 switch (ot) {
3945#ifdef TARGET_X86_64
3946 case MO_32:
3947 /* If we know TL is 64-bit, and we want a 32-bit
3948 result, just do everything in 64-bit arithmetic. */
3949 tcg_gen_ext32u_i64(cpu_regs[reg], cpu_regs[reg]);
3950 tcg_gen_ext32u_i64(cpu_T[0], cpu_T[0]);
3951 tcg_gen_add_i64(cpu_T[0], cpu_T[0], cpu_regs[reg]);
3952 tcg_gen_add_i64(cpu_T[0], cpu_T[0], carry_in);
3953 tcg_gen_ext32u_i64(cpu_regs[reg], cpu_T[0]);
3954 tcg_gen_shri_i64(carry_out, cpu_T[0], 32);
3955 break;
3956#endif
3957 default:
3958 /* Otherwise compute the carry-out in two steps. */
3959 zero = tcg_const_tltcg_const_i32(0);
3960 tcg_gen_add2_tltcg_gen_add2_i32(cpu_T[0], carry_out,
3961 cpu_T[0], zero,
3962 carry_in, zero);
3963 tcg_gen_add2_tltcg_gen_add2_i32(cpu_regs[reg], carry_out,
3964 cpu_regs[reg], carry_out,
3965 cpu_T[0], zero);
3966 tcg_temp_freetcg_temp_free_i32(zero);
3967 break;
3968 }
3969 set_cc_op(s, end_op);
3970 }
3971 break;
3972
3973 case 0x1f7: /* shlx Gy, Ey, By */
3974 case 0x2f7: /* sarx Gy, Ey, By */
3975 case 0x3f7: /* shrx Gy, Ey, By */
3976 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI2(1 << 8))
3977 || !(s->prefix & PREFIX_VEX0x20)
3978 || s->vex_l != 0) {
3979 goto illegal_op;
3980 }
3981 ot = mo_64_32(s->dflag);
3982 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3983 if (ot == MO_64) {
3984 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[1], cpu_regs[s->vex_v], 63);
3985 } else {
3986 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[1], cpu_regs[s->vex_v], 31);
3987 }
3988 if (b == 0x1f7) {
3989 tcg_gen_shl_tltcg_gen_shl_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
3990 } else if (b == 0x2f7) {
3991 if (ot != MO_64) {
3992 tcg_gen_ext32s_tltcg_gen_mov_i32(cpu_T[0], cpu_T[0]);
3993 }
3994 tcg_gen_sar_tltcg_gen_sar_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
3995 } else {
3996 if (ot != MO_64) {
3997 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_T[0], cpu_T[0]);
3998 }
3999 tcg_gen_shr_tltcg_gen_shr_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
4000 }
4001 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
4002 break;
4003
4004 case 0x0f3:
4005 case 0x1f3:
4006 case 0x2f3:
4007 case 0x3f3: /* Group 17 */
4008 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI1(1 << 3))
4009 || !(s->prefix & PREFIX_VEX0x20)
4010 || s->vex_l != 0) {
4011 goto illegal_op;
4012 }
4013 ot = mo_64_32(s->dflag);
4014 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
4015
4016 switch (reg & 7) {
4017 case 1: /* blsr By,Ey */
4018 tcg_gen_neg_tltcg_gen_neg_i32(cpu_T[1], cpu_T[0]);
4019 tcg_gen_and_tltcg_gen_and_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
4020 gen_op_mov_reg_v(ot, s->vex_v, cpu_T[0]);
4021 gen_op_update2_cc();
4022 set_cc_op(s, CC_OP_BMILGB + ot);
4023 break;
4024
4025 case 2: /* blsmsk By,Ey */
4026 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_T[0]);
4027 tcg_gen_subi_tltcg_gen_subi_i32(cpu_T[0], cpu_T[0], 1);
4028 tcg_gen_xor_tltcg_gen_xor_i32(cpu_T[0], cpu_T[0], cpu_cc_src);
4029 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
4030 set_cc_op(s, CC_OP_BMILGB + ot);
4031 break;
4032
4033 case 3: /* blsi By, Ey */
4034 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_T[0]);
4035 tcg_gen_subi_tltcg_gen_subi_i32(cpu_T[0], cpu_T[0], 1);
4036 tcg_gen_and_tltcg_gen_and_i32(cpu_T[0], cpu_T[0], cpu_cc_src);
4037 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
4038 set_cc_op(s, CC_OP_BMILGB + ot);
4039 break;
4040
4041 default:
4042 goto illegal_op;
4043 }
4044 break;
4045
4046 default:
4047 goto illegal_op;
4048 }
4049 break;
4050
4051 case 0x03a:
4052 case 0x13a:
4053 b = modrm;
4054 modrm = cpu_ldub_code(env, s->pc++);
4055 rm = modrm & 7;
4056 reg = ((modrm >> 3) & 7) | rex_r;
4057 mod = (modrm >> 6) & 3;
4058 if (b1 >= 2) {
4059 goto illegal_op;
4060 }
4061
4062 sse_fn_eppi = sse_op_table7[b].op[b1];
4063 if (!sse_fn_eppi) {
4064 goto illegal_op;
4065 }
4066 if (!(s->cpuid_ext_features & sse_op_table7[b].ext_mask))
4067 goto illegal_op;
4068
4069 if (sse_fn_eppi == SSE_SPECIAL((void *)1)) {
4070 ot = mo_64_32(s->dflag);
4071 rm = (modrm & 7) | REX_B(s)0;
4072 if (mod != 3)
4073 gen_lea_modrm(env, s, modrm);
4074 reg = ((modrm >> 3) & 7) | rex_r;
4075 val = cpu_ldub_code(env, s->pc++);
4076 switch (b) {
4077 case 0x14: /* pextrb */
4078 tcg_gen_ld8u_tltcg_gen_ld8u_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._b[val & 15
])
4079 xmm_regs[reg].XMM_B(val & 15))__builtin_offsetof(CPUX86State, xmm_regs[reg]._b[val & 15
])
);
4080 if (mod == 3) {
4081 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
4082 } else {
4083 tcg_gen_qemu_st_tltcg_gen_qemu_st_i32(cpu_T[0], cpu_A0,
4084 s->mem_index, MO_UB);
4085 }
4086 break;
4087 case 0x15: /* pextrw */
4088 tcg_gen_ld16u_tltcg_gen_ld16u_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._w[val & 7]
)
4089 xmm_regs[reg].XMM_W(val & 7))__builtin_offsetof(CPUX86State, xmm_regs[reg]._w[val & 7]
)
);
4090 if (mod == 3) {
4091 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
4092 } else {
4093 tcg_gen_qemu_st_tltcg_gen_qemu_st_i32(cpu_T[0], cpu_A0,
4094 s->mem_index, MO_LEUW);
4095 }
4096 break;
4097 case 0x16:
4098 if (ot == MO_32) { /* pextrd */
4099 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env,
4100 offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[val & 3]
)
4101 xmm_regs[reg].XMM_L(val & 3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[val & 3]
)
);
4102 if (mod == 3) {
4103 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[rm], cpu_tmp2_i32);
4104 } else {
4105 tcg_gen_qemu_st_i32(cpu_tmp2_i32, cpu_A0,
4106 s->mem_index, MO_LEUL);
4107 }
4108 } else { /* pextrq */
4109#ifdef TARGET_X86_64
4110 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env,
4111 offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[val & 1]
)
4112 xmm_regs[reg].XMM_Q(val & 1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[val & 1]
)
);
4113 if (mod == 3) {
4114 tcg_gen_mov_i64(cpu_regs[rm], cpu_tmp1_i64);
4115 } else {
4116 tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_A0,
4117 s->mem_index, MO_LEQ);
4118 }
4119#else
4120 goto illegal_op;
4121#endif
4122 }
4123 break;
4124 case 0x17: /* extractps */
4125 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[val & 3]
)
4126 xmm_regs[reg].XMM_L(val & 3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[val & 3]
)
);
4127 if (mod == 3) {
4128 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
4129 } else {
4130 tcg_gen_qemu_st_tltcg_gen_qemu_st_i32(cpu_T[0], cpu_A0,
4131 s->mem_index, MO_LEUL);
4132 }
4133 break;
4134 case 0x20: /* pinsrb */
4135 if (mod == 3) {
4136 gen_op_mov_v_reg(MO_32, cpu_T[0], rm);
4137 } else {
4138 tcg_gen_qemu_ld_tltcg_gen_qemu_ld_i32(cpu_T[0], cpu_A0,
4139 s->mem_index, MO_UB);
4140 }
4141 tcg_gen_st8_tltcg_gen_st8_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._b[val & 15
])
4142 xmm_regs[reg].XMM_B(val & 15))__builtin_offsetof(CPUX86State, xmm_regs[reg]._b[val & 15
])
);
4143 break;
4144 case 0x21: /* insertps */
4145 if (mod == 3) {
4146 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env,
4147 offsetof(CPUX86State,xmm_regs[rm]__builtin_offsetof(CPUX86State, xmm_regs[rm] ._l[(val >>
6) & 3])
4148 .XMM_L((val >> 6) & 3))__builtin_offsetof(CPUX86State, xmm_regs[rm] ._l[(val >>
6) & 3])
);
4149 } else {
4150 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
4151 s->mem_index, MO_LEUL);
4152 }
4153 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env,
4154 offsetof(CPUX86State,xmm_regs[reg]__builtin_offsetof(CPUX86State, xmm_regs[reg] ._l[(val >>
4) & 3])
4155 .XMM_L((val >> 4) & 3))__builtin_offsetof(CPUX86State, xmm_regs[reg] ._l[(val >>
4) & 3])
);
4156 if ((val >> 0) & 1)
4157 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4158 cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0])
4159 xmm_regs[reg].XMM_L(0))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[0]));
4160 if ((val >> 1) & 1)
4161 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4162 cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[1])
4163 xmm_regs[reg].XMM_L(1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[1]));
4164 if ((val >> 2) & 1)
4165 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4166 cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[2])
4167 xmm_regs[reg].XMM_L(2))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[2]));
4168 if ((val >> 3) & 1)
4169 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4170 cpu_env, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[3])
4171 xmm_regs[reg].XMM_L(3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[3]));
4172 break;
4173 case 0x22:
4174 if (ot == MO_32) { /* pinsrd */
4175 if (mod == 3) {
4176 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_regs[rm]);
4177 } else {
4178 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
4179 s->mem_index, MO_LEUL);
4180 }
4181 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env,
4182 offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[val & 3]
)
4183 xmm_regs[reg].XMM_L(val & 3))__builtin_offsetof(CPUX86State, xmm_regs[reg]._l[val & 3]
)
);
4184 } else { /* pinsrq */
4185#ifdef TARGET_X86_64
4186 if (mod == 3) {
4187 gen_op_mov_v_reg(ot, cpu_tmp1_i64, rm);
4188 } else {
4189 tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_A0,
4190 s->mem_index, MO_LEQ);
4191 }
4192 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env,
4193 offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[val & 1]
)
4194 xmm_regs[reg].XMM_Q(val & 1))__builtin_offsetof(CPUX86State, xmm_regs[reg]._q[val & 1]
)
);
4195#else
4196 goto illegal_op;
4197#endif
4198 }
4199 break;
4200 }
4201 return;
4202 }
4203
4204 if (b1) {
4205 op1_offset = offsetof(CPUX86State,xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]);
4206 if (mod == 3) {
4207 op2_offset = offsetof(CPUX86State,xmm_regs[rm | REX_B(s)])__builtin_offsetof(CPUX86State, xmm_regs[rm | 0]);
4208 } else {
4209 op2_offset = offsetof(CPUX86State,xmm_t0)__builtin_offsetof(CPUX86State, xmm_t0);
4210 gen_lea_modrm(env, s, modrm);
4211 gen_ldo_env_A0(s, op2_offset);
4212 }
4213 } else {
4214 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx);
4215 if (mod == 3) {
4216 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx)__builtin_offsetof(CPUX86State, fpregs[rm].mmx);
4217 } else {
4218 op2_offset = offsetof(CPUX86State,mmx_t0)__builtin_offsetof(CPUX86State, mmx_t0);
4219 gen_lea_modrm(env, s, modrm);
4220 gen_ldq_env_A0(s, op2_offset);
4221 }
4222 }
4223 val = cpu_ldub_code(env, s->pc++);
4224
4225 if ((b & 0xfc) == 0x60) { /* pcmpXstrX */
4226 set_cc_op(s, CC_OP_EFLAGS);
4227
4228 if (s->dflag == MO_64) {
4229 /* The helper must use entire 64-bit gp registers */
4230 val |= 1 << 8;
4231 }
4232 }
4233
4234 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
4235 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
4236 sse_fn_eppi(cpu_env, cpu_ptr0, cpu_ptr1, tcg_const_i32(val));
4237 break;
4238
4239 case 0x33a:
4240 /* Various integer extensions at 0f 3a f[0-f]. */
4241 b = modrm | (b1 << 8);
4242 modrm = cpu_ldub_code(env, s->pc++);
4243 reg = ((modrm >> 3) & 7) | rex_r;
4244
4245 switch (b) {
4246 case 0x3f0: /* rorx Gy,Ey, Ib */
4247 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI2(1 << 8))
4248 || !(s->prefix & PREFIX_VEX0x20)
4249 || s->vex_l != 0) {
4250 goto illegal_op;
4251 }
4252 ot = mo_64_32(s->dflag);
4253 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
4254 b = cpu_ldub_code(env, s->pc++);
4255 if (ot == MO_64) {
4256 tcg_gen_rotri_tltcg_gen_rotri_i32(cpu_T[0], cpu_T[0], b & 63);
4257 } else {
4258 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
4259 tcg_gen_rotri_i32(cpu_tmp2_i32, cpu_tmp2_i32, b & 31);
4260 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_T[0], cpu_tmp2_i32);
4261 }
4262 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
4263 break;
4264
4265 default:
4266 goto illegal_op;
4267 }
4268 break;
4269
4270 default:
4271 goto illegal_op;
4272 }
4273 } else {
4274 /* generic MMX or SSE operation */
4275 switch(b) {
4276 case 0x70: /* pshufx insn */
4277 case 0xc6: /* pshufx insn */
4278 case 0xc2: /* compare insns */
4279 s->rip_offset = 1;
4280 break;
4281 default:
4282 break;
4283 }
4284 if (is_xmm) {
4285 op1_offset = offsetof(CPUX86State,xmm_regs[reg])__builtin_offsetof(CPUX86State, xmm_regs[reg]);
4286 if (mod != 3) {
4287 gen_lea_modrm(env, s, modrm);
4288 op2_offset = offsetof(CPUX86State,xmm_t0)__builtin_offsetof(CPUX86State, xmm_t0);
4289 if (b1 >= 2 && ((b >= 0x50 && b <= 0x5f && b != 0x5b) ||
4290 b == 0xc2)) {
4291 /* specific case for SSE single instructions */
4292 if (b1 == 2) {
4293 /* 32 bit access */
4294 gen_op_ld_v(s, MO_32, cpu_T[0], cpu_A0);
4295 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0))__builtin_offsetof(CPUX86State, xmm_t0._l[0]));
4296 } else {
4297 /* 64 bit access */
4298 gen_ldq_env_A0(s, offsetof(CPUX86State,__builtin_offsetof(CPUX86State, xmm_t0._d[0])
4299 xmm_t0.XMM_D(0))__builtin_offsetof(CPUX86State, xmm_t0._d[0]));
4300 }
4301 } else {
4302 gen_ldo_env_A0(s, op2_offset);
4303 }
4304 } else {
4305 rm = (modrm & 7) | REX_B(s)0;
4306 op2_offset = offsetof(CPUX86State,xmm_regs[rm])__builtin_offsetof(CPUX86State, xmm_regs[rm]);
4307 }
4308 } else {
4309 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx)__builtin_offsetof(CPUX86State, fpregs[reg].mmx);
4310 if (mod != 3) {
4311 gen_lea_modrm(env, s, modrm);
4312 op2_offset = offsetof(CPUX86State,mmx_t0)__builtin_offsetof(CPUX86State, mmx_t0);
4313 gen_ldq_env_A0(s, op2_offset);
4314 } else {
4315 rm = (modrm & 7);
4316 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx)__builtin_offsetof(CPUX86State, fpregs[rm].mmx);
4317 }
4318 }
4319 switch(b) {
4320 case 0x0f: /* 3DNow! data insns */
4321 if (!(s->cpuid_ext2_features & CPUID_EXT2_3DNOW(1 << 31)))
4322 goto illegal_op;
4323 val = cpu_ldub_code(env, s->pc++);
4324 sse_fn_epp = sse_op_table5[val];
4325 if (!sse_fn_epp) {
4326 goto illegal_op;
4327 }
4328 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
4329 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
4330 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4331 break;
4332 case 0x70: /* pshufx insn */
4333 case 0xc6: /* pshufx insn */
4334 val = cpu_ldub_code(env, s->pc++);
4335 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
4336 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
4337 /* XXX: introduce a new table? */
4338 sse_fn_ppi = (SSEFunc_0_ppi)sse_fn_epp;
4339 sse_fn_ppi(cpu_ptr0, cpu_ptr1, tcg_const_i32(val));
4340 break;
4341 case 0xc2:
4342 /* compare insns */
4343 val = cpu_ldub_code(env, s->pc++);
4344 if (val >= 8)
4345 goto illegal_op;
4346 sse_fn_epp = sse_op_table4[val][b1];
4347
4348 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
4349 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
4350 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4351 break;
4352 case 0xf7:
4353 /* maskmov : we must prepare A0 */
4354 if (mod != 3)
4355 goto illegal_op;
4356 tcg_gen_mov_tltcg_gen_mov_i32(cpu_A0, cpu_regs[R_EDI7]);
4357 gen_extu(s->aflag, cpu_A0);
4358 gen_add_A0_ds_seg(s);
4359
4360 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
4361 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
4362 /* XXX: introduce a new table? */
4363 sse_fn_eppt = (SSEFunc_0_eppt)sse_fn_epp;
4364 sse_fn_eppt(cpu_env, cpu_ptr0, cpu_ptr1, cpu_A0);
4365 break;
4366 default:
4367 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr0).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op1_offset
))
;
4368 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset)tcg_gen_addi_i64(__extension__ ({ TCGv_i64 make_tcgv_tmp = {(
(cpu_ptr1).iptr)}; make_tcgv_tmp;}), __extension__ ({ TCGv_i64
make_tcgv_tmp = {((cpu_env).iptr)}; make_tcgv_tmp;}), (op2_offset
))
;
4369 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4370 break;
4371 }
4372 if (b == 0x2e || b == 0x2f) {
4373 set_cc_op(s, CC_OP_EFLAGS);
4374 }
4375 }
4376}
4377
4378/* convert one instruction. s->is_jmp is set if the translation must
4379 be stopped. Return the next pc value */
4380static target_ulong disas_insn(CPUX86State *env, DisasContext *s,
4381 target_ulong pc_start)
4382{
4383 int b, prefixes;
4384 int shift;
4385 TCGMemOp ot, aflag, dflag;
4386 int modrm, reg, rm, mod, op, opreg, val;
4387 target_ulong next_eip, tval;
4388 int rex_w, rex_r;
4389
4390 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP | CPU_LOG_TB_OP_OPT))__builtin_expect(!!(qemu_loglevel_mask((1 << 2) | (1 <<
3))), 0)
) {
4391 tcg_gen_debug_insn_start(pc_start);
4392 }
4393 s->pc = pc_start;
4394 prefixes = 0;
4395 s->override = -1;
4396 rex_w = -1;
4397 rex_r = 0;
4398#ifdef TARGET_X86_64
4399 s->rex_x = 0;
4400 s->rex_b = 0;
4401 x86_64_hregs = 0;
4402#endif
4403 s->rip_offset = 0; /* for relative ip address */
4404 s->vex_l = 0;
4405 s->vex_v = 0;
4406 next_byte:
4407 b = cpu_ldub_code(env, s->pc);
4408 s->pc++;
4409 /* Collect prefixes. */
4410 switch (b) {
4411 case 0xf3:
4412 prefixes |= PREFIX_REPZ0x01;
4413 goto next_byte;
4414 case 0xf2:
4415 prefixes |= PREFIX_REPNZ0x02;
4416 goto next_byte;
4417 case 0xf0:
4418 prefixes |= PREFIX_LOCK0x04;
4419 goto next_byte;
4420 case 0x2e:
4421 s->override = R_CS1;
4422 goto next_byte;
4423 case 0x36:
4424 s->override = R_SS2;
4425 goto next_byte;
4426 case 0x3e:
4427 s->override = R_DS3;
4428 goto next_byte;
4429 case 0x26:
4430 s->override = R_ES0;
4431 goto next_byte;
4432 case 0x64:
4433 s->override = R_FS4;
4434 goto next_byte;
4435 case 0x65:
4436 s->override = R_GS5;
4437 goto next_byte;
4438 case 0x66:
4439 prefixes |= PREFIX_DATA0x08;
4440 goto next_byte;
4441 case 0x67:
4442 prefixes |= PREFIX_ADR0x10;
4443 goto next_byte;
4444#ifdef TARGET_X86_64
4445 case 0x40 ... 0x4f:
4446 if (CODE64(s)0) {
4447 /* REX prefix */
4448 rex_w = (b >> 3) & 1;
4449 rex_r = (b & 0x4) << 1;
4450 s->rex_x = (b & 0x2) << 2;
4451 REX_B(s)0 = (b & 0x1) << 3;
4452 x86_64_hregs = 1; /* select uniform byte register addressing */
4453 goto next_byte;
4454 }
4455 break;
4456#endif
4457 case 0xc5: /* 2-byte VEX */
4458 case 0xc4: /* 3-byte VEX */
4459 /* VEX prefixes cannot be used except in 32-bit mode.
4460 Otherwise the instruction is LES or LDS. */
4461 if (s->code32 && !s->vm86) {
4462 static const int pp_prefix[4] = {
4463 0, PREFIX_DATA0x08, PREFIX_REPZ0x01, PREFIX_REPNZ0x02
4464 };
4465 int vex3, vex2 = cpu_ldub_code(env, s->pc);
4466
4467 if (!CODE64(s)0 && (vex2 & 0xc0) != 0xc0) {
4468 /* 4.1.4.6: In 32-bit mode, bits [7:6] must be 11b,
4469 otherwise the instruction is LES or LDS. */
4470 break;
4471 }
4472 s->pc++;
4473
4474 /* 4.1.1-4.1.3: No preceding lock, 66, f2, f3, or rex prefixes. */
4475 if (prefixes & (PREFIX_REPZ0x01 | PREFIX_REPNZ0x02
4476 | PREFIX_LOCK0x04 | PREFIX_DATA0x08)) {
4477 goto illegal_op;
4478 }
4479#ifdef TARGET_X86_64
4480 if (x86_64_hregs) {
4481 goto illegal_op;
4482 }
4483#endif
4484 rex_r = (~vex2 >> 4) & 8;
4485 if (b == 0xc5) {
4486 vex3 = vex2;
4487 b = cpu_ldub_code(env, s->pc++);
4488 } else {
4489#ifdef TARGET_X86_64
4490 s->rex_x = (~vex2 >> 3) & 8;
4491 s->rex_b = (~vex2 >> 2) & 8;
4492#endif
4493 vex3 = cpu_ldub_code(env, s->pc++);
4494 rex_w = (vex3 >> 7) & 1;
4495 switch (vex2 & 0x1f) {
4496 case 0x01: /* Implied 0f leading opcode bytes. */
4497 b = cpu_ldub_code(env, s->pc++) | 0x100;
4498 break;
4499 case 0x02: /* Implied 0f 38 leading opcode bytes. */
4500 b = 0x138;
4501 break;
4502 case 0x03: /* Implied 0f 3a leading opcode bytes. */
4503 b = 0x13a;
4504 break;
4505 default: /* Reserved for future use. */
4506 goto illegal_op;
4507 }
4508 }
4509 s->vex_v = (~vex3 >> 3) & 0xf;
4510 s->vex_l = (vex3 >> 2) & 1;
4511 prefixes |= pp_prefix[vex3 & 3] | PREFIX_VEX0x20;
4512 }
4513 break;
4514 }
4515
4516 /* Post-process prefixes. */
4517 if (CODE64(s)0) {
4518 /* In 64-bit mode, the default data size is 32-bit. Select 64-bit
4519 data with rex_w, and 16-bit data with 0x66; rex_w takes precedence
4520 over 0x66 if both are present. */
4521 dflag = (rex_w > 0 ? MO_64 : prefixes & PREFIX_DATA0x08 ? MO_16 : MO_32);
4522 /* In 64-bit mode, 0x67 selects 32-bit addressing. */
4523 aflag = (prefixes & PREFIX_ADR0x10 ? MO_32 : MO_64);
4524 } else {
4525 /* In 16/32-bit mode, 0x66 selects the opposite data size. */
4526 if (s->code32 ^ ((prefixes & PREFIX_DATA0x08) != 0)) {
4527 dflag = MO_32;
4528 } else {
4529 dflag = MO_16;
4530 }
4531 /* In 16/32-bit mode, 0x67 selects the opposite addressing. */
4532 if (s->code32 ^ ((prefixes & PREFIX_ADR0x10) != 0)) {
4533 aflag = MO_32;
4534 } else {
4535 aflag = MO_16;
4536 }
4537 }
4538
4539 s->prefix = prefixes;
4540 s->aflag = aflag;
4541 s->dflag = dflag;
4542
4543 /* lock generation */
4544 if (prefixes & PREFIX_LOCK0x04)
4545 gen_helper_lock();
4546
4547 /* now check op code */
4548 reswitch:
4549 switch(b) {
4550 case 0x0f:
4551 /**************************/
4552 /* extended op code */
4553 b = cpu_ldub_code(env, s->pc++) | 0x100;
4554 goto reswitch;
4555
4556 /**************************/
4557 /* arith & logic */
4558 case 0x00 ... 0x05:
4559 case 0x08 ... 0x0d:
4560 case 0x10 ... 0x15:
4561 case 0x18 ... 0x1d:
4562 case 0x20 ... 0x25:
4563 case 0x28 ... 0x2d:
4564 case 0x30 ... 0x35:
4565 case 0x38 ... 0x3d:
4566 {
4567 int op, f, val;
4568 op = (b >> 3) & 7;
4569 f = (b >> 1) & 3;
4570
4571 ot = mo_b_d(b, dflag);
4572
4573 switch(f) {
4574 case 0: /* OP Ev, Gv */
4575 modrm = cpu_ldub_code(env, s->pc++);
4576 reg = ((modrm >> 3) & 7) | rex_r;
4577 mod = (modrm >> 6) & 3;
4578 rm = (modrm & 7) | REX_B(s)0;
4579 if (mod != 3) {
4580 gen_lea_modrm(env, s, modrm);
4581 opreg = OR_TMP0;
4582 } else if (op == OP_XORL && rm == reg) {
4583 xor_zero:
4584 /* xor reg, reg optimisation */
4585 set_cc_op(s, CC_OP_CLR);
4586 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], 0);
4587 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
4588 break;
4589 } else {
4590 opreg = rm;
4591 }
4592 gen_op_mov_v_reg(ot, cpu_T[1], reg);
4593 gen_op(s, op, ot, opreg);
4594 break;
4595 case 1: /* OP Gv, Ev */
4596 modrm = cpu_ldub_code(env, s->pc++);
4597 mod = (modrm >> 6) & 3;
4598 reg = ((modrm >> 3) & 7) | rex_r;
4599 rm = (modrm & 7) | REX_B(s)0;
4600 if (mod != 3) {
4601 gen_lea_modrm(env, s, modrm);
4602 gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
4603 } else if (op == OP_XORL && rm == reg) {
4604 goto xor_zero;
4605 } else {
4606 gen_op_mov_v_reg(ot, cpu_T[1], rm);
4607 }
4608 gen_op(s, op, ot, reg);
4609 break;
4610 case 2: /* OP A, Iv */
4611 val = insn_get(env, s, ot);
4612 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], val);
4613 gen_op(s, op, ot, OR_EAX);
4614 break;
4615 }
4616 }
4617 break;
4618
4619 case 0x82:
4620 if (CODE64(s)0)
4621 goto illegal_op;
4622 case 0x80: /* GRP1 */
4623 case 0x81:
4624 case 0x83:
4625 {
4626 int val;
4627
4628 ot = mo_b_d(b, dflag);
4629
4630 modrm = cpu_ldub_code(env, s->pc++);
4631 mod = (modrm >> 6) & 3;
4632 rm = (modrm & 7) | REX_B(s)0;
4633 op = (modrm >> 3) & 7;
4634
4635 if (mod != 3) {
4636 if (b == 0x83)
4637 s->rip_offset = 1;
4638 else
4639 s->rip_offset = insn_const_size(ot);
4640 gen_lea_modrm(env, s, modrm);
4641 opreg = OR_TMP0;
4642 } else {
4643 opreg = rm;
4644 }
4645
4646 switch(b) {
4647 default:
4648 case 0x80:
4649 case 0x81:
4650 case 0x82:
4651 val = insn_get(env, s, ot);
4652 break;
4653 case 0x83:
4654 val = (int8_t)insn_get(env, s, MO_8);
4655 break;
4656 }
4657 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], val);
4658 gen_op(s, op, ot, opreg);
4659 }
4660 break;
4661
4662 /**************************/
4663 /* inc, dec, and other misc arith */
4664 case 0x40 ... 0x47: /* inc Gv */
4665 ot = dflag;
4666 gen_inc(s, ot, OR_EAX + (b & 7), 1);
4667 break;
4668 case 0x48 ... 0x4f: /* dec Gv */
4669 ot = dflag;
4670 gen_inc(s, ot, OR_EAX + (b & 7), -1);
4671 break;
4672 case 0xf6: /* GRP3 */
4673 case 0xf7:
4674 ot = mo_b_d(b, dflag);
4675
4676 modrm = cpu_ldub_code(env, s->pc++);
4677 mod = (modrm >> 6) & 3;
4678 rm = (modrm & 7) | REX_B(s)0;
4679 op = (modrm >> 3) & 7;
4680 if (mod != 3) {
4681 if (op == 0)
4682 s->rip_offset = insn_const_size(ot);
4683 gen_lea_modrm(env, s, modrm);
4684 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
4685 } else {
4686 gen_op_mov_v_reg(ot, cpu_T[0], rm);
4687 }
4688
4689 switch(op) {
4690 case 0: /* test */
4691 val = insn_get(env, s, ot);
4692 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], val);
4693 gen_op_testl_T0_T1_cc();
4694 set_cc_op(s, CC_OP_LOGICB + ot);
4695 break;
4696 case 2: /* not */
4697 tcg_gen_not_tltcg_gen_not_i32(cpu_T[0], cpu_T[0]);
4698 if (mod != 3) {
4699 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
4700 } else {
4701 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
4702 }
4703 break;
4704 case 3: /* neg */
4705 tcg_gen_neg_tltcg_gen_neg_i32(cpu_T[0], cpu_T[0]);
4706 if (mod != 3) {
4707 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
4708 } else {
4709 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
4710 }
4711 gen_op_update_neg_cc();
4712 set_cc_op(s, CC_OP_SUBB + ot);
4713 break;
4714 case 4: /* mul */
4715 switch(ot) {
4716 case MO_8:
4717 gen_op_mov_v_reg(MO_8, cpu_T[1], R_EAX0);
4718 tcg_gen_ext8u_tltcg_gen_ext8u_i32(cpu_T[0], cpu_T[0]);
4719 tcg_gen_ext8u_tltcg_gen_ext8u_i32(cpu_T[1], cpu_T[1]);
4720 /* XXX: use 32 bit mul which could be faster */
4721 tcg_gen_mul_tltcg_gen_mul_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
4722 gen_op_mov_reg_v(MO_16, R_EAX0, cpu_T[0]);
4723 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
4724 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_src, cpu_T[0], 0xff00);
4725 set_cc_op(s, CC_OP_MULB);
4726 break;
4727 case MO_16:
4728 gen_op_mov_v_reg(MO_16, cpu_T[1], R_EAX0);
4729 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[0], cpu_T[0]);
4730 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[1], cpu_T[1]);
4731 /* XXX: use 32 bit mul which could be faster */
4732 tcg_gen_mul_tltcg_gen_mul_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
4733 gen_op_mov_reg_v(MO_16, R_EAX0, cpu_T[0]);
4734 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
4735 tcg_gen_shri_tltcg_gen_shri_i32(cpu_T[0], cpu_T[0], 16);
4736 gen_op_mov_reg_v(MO_16, R_EDX2, cpu_T[0]);
4737 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_T[0]);
4738 set_cc_op(s, CC_OP_MULW);
4739 break;
4740 default:
4741 case MO_32:
4742 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
4743 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp3_i32, cpu_regs[R_EAX0]);
4744 tcg_gen_mulu2_i32(cpu_tmp2_i32, cpu_tmp3_i32,
4745 cpu_tmp2_i32, cpu_tmp3_i32);
4746 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[R_EAX0], cpu_tmp2_i32);
4747 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[R_EDX2], cpu_tmp3_i32);
4748 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_regs[R_EAX0]);
4749 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_regs[R_EDX2]);
4750 set_cc_op(s, CC_OP_MULL);
4751 break;
4752#ifdef TARGET_X86_64
4753 case MO_64:
4754 tcg_gen_mulu2_i64(cpu_regs[R_EAX0], cpu_regs[R_EDX2],
4755 cpu_T[0], cpu_regs[R_EAX0]);
4756 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_regs[R_EAX0]);
4757 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_regs[R_EDX2]);
4758 set_cc_op(s, CC_OP_MULQ);
4759 break;
4760#endif
4761 }
4762 break;
4763 case 5: /* imul */
4764 switch(ot) {
4765 case MO_8:
4766 gen_op_mov_v_reg(MO_8, cpu_T[1], R_EAX0);
4767 tcg_gen_ext8s_tltcg_gen_ext8s_i32(cpu_T[0], cpu_T[0]);
4768 tcg_gen_ext8s_tltcg_gen_ext8s_i32(cpu_T[1], cpu_T[1]);
4769 /* XXX: use 32 bit mul which could be faster */
4770 tcg_gen_mul_tltcg_gen_mul_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
4771 gen_op_mov_reg_v(MO_16, R_EAX0, cpu_T[0]);
4772 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
4773 tcg_gen_ext8s_tltcg_gen_ext8s_i32(cpu_tmp0, cpu_T[0]);
4774 tcg_gen_sub_tltcg_gen_sub_i32(cpu_cc_src, cpu_T[0], cpu_tmp0);
4775 set_cc_op(s, CC_OP_MULB);
4776 break;
4777 case MO_16:
4778 gen_op_mov_v_reg(MO_16, cpu_T[1], R_EAX0);
4779 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_T[0], cpu_T[0]);
4780 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_T[1], cpu_T[1]);
4781 /* XXX: use 32 bit mul which could be faster */
4782 tcg_gen_mul_tltcg_gen_mul_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
4783 gen_op_mov_reg_v(MO_16, R_EAX0, cpu_T[0]);
4784 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
4785 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_tmp0, cpu_T[0]);
4786 tcg_gen_sub_tltcg_gen_sub_i32(cpu_cc_src, cpu_T[0], cpu_tmp0);
4787 tcg_gen_shri_tltcg_gen_shri_i32(cpu_T[0], cpu_T[0], 16);
4788 gen_op_mov_reg_v(MO_16, R_EDX2, cpu_T[0]);
4789 set_cc_op(s, CC_OP_MULW);
4790 break;
4791 default:
4792 case MO_32:
4793 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
4794 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp3_i32, cpu_regs[R_EAX0]);
4795 tcg_gen_muls2_i32(cpu_tmp2_i32, cpu_tmp3_i32,
4796 cpu_tmp2_i32, cpu_tmp3_i32);
4797 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[R_EAX0], cpu_tmp2_i32);
4798 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[R_EDX2], cpu_tmp3_i32);
4799 tcg_gen_sari_i32(cpu_tmp2_i32, cpu_tmp2_i32, 31);
4800 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_regs[R_EAX0]);
4801 tcg_gen_sub_i32(cpu_tmp2_i32, cpu_tmp2_i32, cpu_tmp3_i32);
4802 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_cc_src, cpu_tmp2_i32);
4803 set_cc_op(s, CC_OP_MULL);
4804 break;
4805#ifdef TARGET_X86_64
4806 case MO_64:
4807 tcg_gen_muls2_i64(cpu_regs[R_EAX0], cpu_regs[R_EDX2],
4808 cpu_T[0], cpu_regs[R_EAX0]);
4809 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_regs[R_EAX0]);
4810 tcg_gen_sari_tltcg_gen_sari_i32(cpu_cc_src, cpu_regs[R_EAX0], 63);
4811 tcg_gen_sub_tltcg_gen_sub_i32(cpu_cc_src, cpu_cc_src, cpu_regs[R_EDX2]);
4812 set_cc_op(s, CC_OP_MULQ);
4813 break;
4814#endif
4815 }
4816 break;
4817 case 6: /* div */
4818 switch(ot) {
4819 case MO_8:
4820 gen_jmp_im(pc_start - s->cs_base);
4821 gen_helper_divb_AL(cpu_env, cpu_T[0]);
4822 break;
4823 case MO_16:
4824 gen_jmp_im(pc_start - s->cs_base);
4825 gen_helper_divw_AX(cpu_env, cpu_T[0]);
4826 break;
4827 default:
4828 case MO_32:
4829 gen_jmp_im(pc_start - s->cs_base);
4830 gen_helper_divl_EAX(cpu_env, cpu_T[0]);
4831 break;
4832#ifdef TARGET_X86_64
4833 case MO_64:
4834 gen_jmp_im(pc_start - s->cs_base);
4835 gen_helper_divq_EAX(cpu_env, cpu_T[0]);
4836 break;
4837#endif
4838 }
4839 break;
4840 case 7: /* idiv */
4841 switch(ot) {
4842 case MO_8:
4843 gen_jmp_im(pc_start - s->cs_base);
4844 gen_helper_idivb_AL(cpu_env, cpu_T[0]);
4845 break;
4846 case MO_16:
4847 gen_jmp_im(pc_start - s->cs_base);
4848 gen_helper_idivw_AX(cpu_env, cpu_T[0]);
4849 break;
4850 default:
4851 case MO_32:
4852 gen_jmp_im(pc_start - s->cs_base);
4853 gen_helper_idivl_EAX(cpu_env, cpu_T[0]);
4854 break;
4855#ifdef TARGET_X86_64
4856 case MO_64:
4857 gen_jmp_im(pc_start - s->cs_base);
4858 gen_helper_idivq_EAX(cpu_env, cpu_T[0]);
4859 break;
4860#endif
4861 }
4862 break;
4863 default:
4864 goto illegal_op;
4865 }
4866 break;
4867
4868 case 0xfe: /* GRP4 */
4869 case 0xff: /* GRP5 */
4870 ot = mo_b_d(b, dflag);
4871
4872 modrm = cpu_ldub_code(env, s->pc++);
4873 mod = (modrm >> 6) & 3;
4874 rm = (modrm & 7) | REX_B(s)0;
4875 op = (modrm >> 3) & 7;
4876 if (op >= 2 && b == 0xfe) {
4877 goto illegal_op;
4878 }
4879 if (CODE64(s)0) {
4880 if (op == 2 || op == 4) {
4881 /* operand size for jumps is 64 bit */
4882 ot = MO_64;
4883 } else if (op == 3 || op == 5) {
4884 ot = dflag != MO_16 ? MO_32 + (rex_w == 1) : MO_16;
4885 } else if (op == 6) {
4886 /* default push size is 64 bit */
4887 ot = mo_pushpop(s, dflag);
4888 }
4889 }
4890 if (mod != 3) {
4891 gen_lea_modrm(env, s, modrm);
4892 if (op >= 2 && op != 3 && op != 5)
4893 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
4894 } else {
4895 gen_op_mov_v_reg(ot, cpu_T[0], rm);
4896 }
4897
4898 switch(op) {
4899 case 0: /* inc Ev */
4900 if (mod != 3)
4901 opreg = OR_TMP0;
4902 else
4903 opreg = rm;
4904 gen_inc(s, ot, opreg, 1);
4905 break;
4906 case 1: /* dec Ev */
4907 if (mod != 3)
4908 opreg = OR_TMP0;
4909 else
4910 opreg = rm;
4911 gen_inc(s, ot, opreg, -1);
4912 break;
4913 case 2: /* call Ev */
4914 /* XXX: optimize if memory (no 'and' is necessary) */
4915 if (dflag == MO_16) {
4916 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[0], cpu_T[0]);
4917 }
4918 next_eip = s->pc - s->cs_base;
4919 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], next_eip);
4920 gen_push_v(s, cpu_T[1]);
4921 gen_op_jmp_v(cpu_T[0]);
4922 gen_eob(s);
4923 break;
4924 case 3: /* lcall Ev */
4925 gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
4926 gen_add_A0_im(s, 1 << ot);
4927 gen_op_ld_v(s, MO_16, cpu_T[0], cpu_A0);
4928 do_lcall:
4929 if (s->pe && !s->vm86) {
4930 gen_update_cc_op(s);
4931 gen_jmp_im(pc_start - s->cs_base);
4932 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
4933 gen_helper_lcall_protected(cpu_env, cpu_tmp2_i32, cpu_T[1],
4934 tcg_const_i32(dflag - 1),
4935 tcg_const_i32(s->pc - pc_start));
4936 } else {
4937 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
4938 gen_helper_lcall_real(cpu_env, cpu_tmp2_i32, cpu_T[1],
4939 tcg_const_i32(dflag - 1),
4940 tcg_const_i32(s->pc - s->cs_base));
4941 }
4942 gen_eob(s);
4943 break;
4944 case 4: /* jmp Ev */
4945 if (dflag == MO_16) {
4946 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[0], cpu_T[0]);
4947 }
4948 gen_op_jmp_v(cpu_T[0]);
4949 gen_eob(s);
4950 break;
4951 case 5: /* ljmp Ev */
4952 gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
4953 gen_add_A0_im(s, 1 << ot);
4954 gen_op_ld_v(s, MO_16, cpu_T[0], cpu_A0);
4955 do_ljmp:
4956 if (s->pe && !s->vm86) {
4957 gen_update_cc_op(s);
4958 gen_jmp_im(pc_start - s->cs_base);
4959 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
4960 gen_helper_ljmp_protected(cpu_env, cpu_tmp2_i32, cpu_T[1],
4961 tcg_const_i32(s->pc - pc_start));
4962 } else {
4963 gen_op_movl_seg_T0_vm(R_CS1);
4964 gen_op_jmp_v(cpu_T[1]);
4965 }
4966 gen_eob(s);
4967 break;
4968 case 6: /* push Ev */
4969 gen_push_v(s, cpu_T[0]);
4970 break;
4971 default:
4972 goto illegal_op;
4973 }
4974 break;
4975
4976 case 0x84: /* test Ev, Gv */
4977 case 0x85:
4978 ot = mo_b_d(b, dflag);
4979
4980 modrm = cpu_ldub_code(env, s->pc++);
4981 reg = ((modrm >> 3) & 7) | rex_r;
4982
4983 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
4984 gen_op_mov_v_reg(ot, cpu_T[1], reg);
4985 gen_op_testl_T0_T1_cc();
4986 set_cc_op(s, CC_OP_LOGICB + ot);
4987 break;
4988
4989 case 0xa8: /* test eAX, Iv */
4990 case 0xa9:
4991 ot = mo_b_d(b, dflag);
4992 val = insn_get(env, s, ot);
4993
4994 gen_op_mov_v_reg(ot, cpu_T[0], OR_EAX);
4995 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], val);
4996 gen_op_testl_T0_T1_cc();
4997 set_cc_op(s, CC_OP_LOGICB + ot);
4998 break;
4999
5000 case 0x98: /* CWDE/CBW */
5001 switch (dflag) {
5002#ifdef TARGET_X86_64
5003 case MO_64:
5004 gen_op_mov_v_reg(MO_32, cpu_T[0], R_EAX0);
5005 tcg_gen_ext32s_tltcg_gen_mov_i32(cpu_T[0], cpu_T[0]);
5006 gen_op_mov_reg_v(MO_64, R_EAX0, cpu_T[0]);
5007 break;
5008#endif
5009 case MO_32:
5010 gen_op_mov_v_reg(MO_16, cpu_T[0], R_EAX0);
5011 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_T[0], cpu_T[0]);
5012 gen_op_mov_reg_v(MO_32, R_EAX0, cpu_T[0]);
5013 break;
5014 case MO_16:
5015 gen_op_mov_v_reg(MO_8, cpu_T[0], R_EAX0);
5016 tcg_gen_ext8s_tltcg_gen_ext8s_i32(cpu_T[0], cpu_T[0]);
5017 gen_op_mov_reg_v(MO_16, R_EAX0, cpu_T[0]);
5018 break;
5019 default:
5020 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 5020); abort();} while (0)
;
5021 }
5022 break;
5023 case 0x99: /* CDQ/CWD */
5024 switch (dflag) {
5025#ifdef TARGET_X86_64
5026 case MO_64:
5027 gen_op_mov_v_reg(MO_64, cpu_T[0], R_EAX0);
5028 tcg_gen_sari_tltcg_gen_sari_i32(cpu_T[0], cpu_T[0], 63);
5029 gen_op_mov_reg_v(MO_64, R_EDX2, cpu_T[0]);
5030 break;
5031#endif
5032 case MO_32:
5033 gen_op_mov_v_reg(MO_32, cpu_T[0], R_EAX0);
5034 tcg_gen_ext32s_tltcg_gen_mov_i32(cpu_T[0], cpu_T[0]);
5035 tcg_gen_sari_tltcg_gen_sari_i32(cpu_T[0], cpu_T[0], 31);
5036 gen_op_mov_reg_v(MO_32, R_EDX2, cpu_T[0]);
5037 break;
5038 case MO_16:
5039 gen_op_mov_v_reg(MO_16, cpu_T[0], R_EAX0);
5040 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_T[0], cpu_T[0]);
5041 tcg_gen_sari_tltcg_gen_sari_i32(cpu_T[0], cpu_T[0], 15);
5042 gen_op_mov_reg_v(MO_16, R_EDX2, cpu_T[0]);
5043 break;
5044 default:
5045 tcg_abort()do { fprintf(stderr, "%s:%d: tcg fatal error\n", "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 5045); abort();} while (0)
;
5046 }
5047 break;
5048 case 0x1af: /* imul Gv, Ev */
5049 case 0x69: /* imul Gv, Ev, I */
5050 case 0x6b:
5051 ot = dflag;
5052 modrm = cpu_ldub_code(env, s->pc++);
5053 reg = ((modrm >> 3) & 7) | rex_r;
5054 if (b == 0x69)
5055 s->rip_offset = insn_const_size(ot);
5056 else if (b == 0x6b)
5057 s->rip_offset = 1;
5058 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
5059 if (b == 0x69) {
5060 val = insn_get(env, s, ot);
5061 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], val);
5062 } else if (b == 0x6b) {
5063 val = (int8_t)insn_get(env, s, MO_8);
5064 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], val);
5065 } else {
5066 gen_op_mov_v_reg(ot, cpu_T[1], reg);
5067 }
5068 switch (ot) {
5069#ifdef TARGET_X86_64
5070 case MO_64:
5071 tcg_gen_muls2_i64(cpu_regs[reg], cpu_T[1], cpu_T[0], cpu_T[1]);
5072 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_regs[reg]);
5073 tcg_gen_sari_tltcg_gen_sari_i32(cpu_cc_src, cpu_cc_dst, 63);
5074 tcg_gen_sub_tltcg_gen_sub_i32(cpu_cc_src, cpu_cc_src, cpu_T[1]);
5075 break;
5076#endif
5077 case MO_32:
5078 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
5079 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp3_i32, cpu_T[1]);
5080 tcg_gen_muls2_i32(cpu_tmp2_i32, cpu_tmp3_i32,
5081 cpu_tmp2_i32, cpu_tmp3_i32);
5082 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_regs[reg], cpu_tmp2_i32);
5083 tcg_gen_sari_i32(cpu_tmp2_i32, cpu_tmp2_i32, 31);
5084 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_regs[reg]);
5085 tcg_gen_sub_i32(cpu_tmp2_i32, cpu_tmp2_i32, cpu_tmp3_i32);
5086 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_cc_src, cpu_tmp2_i32);
5087 break;
5088 default:
5089 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_T[0], cpu_T[0]);
5090 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_T[1], cpu_T[1]);
5091 /* XXX: use 32 bit mul which could be faster */
5092 tcg_gen_mul_tltcg_gen_mul_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
5093 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
5094 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_tmp0, cpu_T[0]);
5095 tcg_gen_sub_tltcg_gen_sub_i32(cpu_cc_src, cpu_T[0], cpu_tmp0);
5096 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
5097 break;
5098 }
5099 set_cc_op(s, CC_OP_MULB + ot);
5100 break;
5101 case 0x1c0:
5102 case 0x1c1: /* xadd Ev, Gv */
5103 ot = mo_b_d(b, dflag);
5104 modrm = cpu_ldub_code(env, s->pc++);
5105 reg = ((modrm >> 3) & 7) | rex_r;
5106 mod = (modrm >> 6) & 3;
5107 if (mod == 3) {
5108 rm = (modrm & 7) | REX_B(s)0;
5109 gen_op_mov_v_reg(ot, cpu_T[0], reg);
5110 gen_op_mov_v_reg(ot, cpu_T[1], rm);
5111 tcg_gen_add_tltcg_gen_add_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
5112 gen_op_mov_reg_v(ot, reg, cpu_T[1]);
5113 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
5114 } else {
5115 gen_lea_modrm(env, s, modrm);
5116 gen_op_mov_v_reg(ot, cpu_T[0], reg);
5117 gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
5118 tcg_gen_add_tltcg_gen_add_i32(cpu_T[0], cpu_T[0], cpu_T[1]);
5119 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
5120 gen_op_mov_reg_v(ot, reg, cpu_T[1]);
5121 }
5122 gen_op_update2_cc();
5123 set_cc_op(s, CC_OP_ADDB + ot);
5124 break;
5125 case 0x1b0:
5126 case 0x1b1: /* cmpxchg Ev, Gv */
5127 {
5128 int label1, label2;
5129 TCGvTCGv_i32 t0, t1, t2, a0;
5130
5131 ot = mo_b_d(b, dflag);
5132 modrm = cpu_ldub_code(env, s->pc++);
5133 reg = ((modrm >> 3) & 7) | rex_r;
5134 mod = (modrm >> 6) & 3;
5135 t0 = tcg_temp_local_new()tcg_temp_local_new_i32();
5136 t1 = tcg_temp_local_new()tcg_temp_local_new_i32();
5137 t2 = tcg_temp_local_new()tcg_temp_local_new_i32();
5138 a0 = tcg_temp_local_new()tcg_temp_local_new_i32();
5139 gen_op_mov_v_reg(ot, t1, reg);
5140 if (mod == 3) {
5141 rm = (modrm & 7) | REX_B(s)0;
5142 gen_op_mov_v_reg(ot, t0, rm);
5143 } else {
5144 gen_lea_modrm(env, s, modrm);
5145 tcg_gen_mov_tltcg_gen_mov_i32(a0, cpu_A0);
5146 gen_op_ld_v(s, ot, t0, a0);
5147 rm = 0; /* avoid warning */
5148 }
5149 label1 = gen_new_label();
5150 tcg_gen_mov_tltcg_gen_mov_i32(t2, cpu_regs[R_EAX0]);
5151 gen_extu(ot, t0);
5152 gen_extu(ot, t2);
5153 tcg_gen_brcond_tltcg_gen_brcond_i32(TCG_COND_EQ, t2, t0, label1);
5154 label2 = gen_new_label();
5155 if (mod == 3) {
5156 gen_op_mov_reg_v(ot, R_EAX0, t0);
5157 tcg_gen_br(label2);
5158 gen_set_label(label1);
5159 gen_op_mov_reg_v(ot, rm, t1);
5160 } else {
5161 /* perform no-op store cycle like physical cpu; must be
5162 before changing accumulator to ensure idempotency if
5163 the store faults and the instruction is restarted */
5164 gen_op_st_v(s, ot, t0, a0);
5165 gen_op_mov_reg_v(ot, R_EAX0, t0);
5166 tcg_gen_br(label2);
5167 gen_set_label(label1);
5168 gen_op_st_v(s, ot, t1, a0);
5169 }
5170 gen_set_label(label2);
5171 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, t0);
5172 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_srcT, t2);
5173 tcg_gen_sub_tltcg_gen_sub_i32(cpu_cc_dst, t2, t0);
5174 set_cc_op(s, CC_OP_SUBB + ot);
5175 tcg_temp_freetcg_temp_free_i32(t0);
5176 tcg_temp_freetcg_temp_free_i32(t1);
5177 tcg_temp_freetcg_temp_free_i32(t2);
5178 tcg_temp_freetcg_temp_free_i32(a0);
5179 }
5180 break;
5181 case 0x1c7: /* cmpxchg8b */
5182 modrm = cpu_ldub_code(env, s->pc++);
5183 mod = (modrm >> 6) & 3;
5184 if ((mod == 3) || ((modrm & 0x38) != 0x8))
5185 goto illegal_op;
5186#ifdef TARGET_X86_64
5187 if (dflag == MO_64) {
5188 if (!(s->cpuid_ext_features & CPUID_EXT_CX16(1 << 13)))
5189 goto illegal_op;
5190 gen_jmp_im(pc_start - s->cs_base);
5191 gen_update_cc_op(s);
5192 gen_lea_modrm(env, s, modrm);
5193 gen_helper_cmpxchg16b(cpu_env, cpu_A0);
5194 } else
5195#endif
5196 {
5197 if (!(s->cpuid_features & CPUID_CX8(1 << 8)))
5198 goto illegal_op;
5199 gen_jmp_im(pc_start - s->cs_base);
5200 gen_update_cc_op(s);
5201 gen_lea_modrm(env, s, modrm);
5202 gen_helper_cmpxchg8b(cpu_env, cpu_A0);
5203 }
5204 set_cc_op(s, CC_OP_EFLAGS);
5205 break;
5206
5207 /**************************/
5208 /* push/pop */
5209 case 0x50 ... 0x57: /* push */
5210 gen_op_mov_v_reg(MO_32, cpu_T[0], (b & 7) | REX_B(s)0);
5211 gen_push_v(s, cpu_T[0]);
5212 break;
5213 case 0x58 ... 0x5f: /* pop */
5214 ot = gen_pop_T0(s);
5215 /* NOTE: order is important for pop %sp */
5216 gen_pop_update(s, ot);
5217 gen_op_mov_reg_v(ot, (b & 7) | REX_B(s)0, cpu_T[0]);
5218 break;
5219 case 0x60: /* pusha */
5220 if (CODE64(s)0)
5221 goto illegal_op;
5222 gen_pusha(s);
5223 break;
5224 case 0x61: /* popa */
5225 if (CODE64(s)0)
5226 goto illegal_op;
5227 gen_popa(s);
5228 break;
5229 case 0x68: /* push Iv */
5230 case 0x6a:
5231 ot = mo_pushpop(s, dflag);
5232 if (b == 0x68)
5233 val = insn_get(env, s, ot);
5234 else
5235 val = (int8_t)insn_get(env, s, MO_8);
5236 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], val);
5237 gen_push_v(s, cpu_T[0]);
5238 break;
5239 case 0x8f: /* pop Ev */
5240 modrm = cpu_ldub_code(env, s->pc++);
5241 mod = (modrm >> 6) & 3;
5242 ot = gen_pop_T0(s);
5243 if (mod == 3) {
5244 /* NOTE: order is important for pop %sp */
5245 gen_pop_update(s, ot);
5246 rm = (modrm & 7) | REX_B(s)0;
5247 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
5248 } else {
5249 /* NOTE: order is important too for MMU exceptions */
5250 s->popl_esp_hack = 1 << ot;
5251 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
5252 s->popl_esp_hack = 0;
5253 gen_pop_update(s, ot);
5254 }
5255 break;
5256 case 0xc8: /* enter */
5257 {
5258 int level;
5259 val = cpu_lduw_code(env, s->pc);
5260 s->pc += 2;
5261 level = cpu_ldub_code(env, s->pc++);
5262 gen_enter(s, val, level);
5263 }
5264 break;
5265 case 0xc9: /* leave */
5266 /* XXX: exception not precise (ESP is updated before potential exception) */
5267 if (CODE64(s)0) {
5268 gen_op_mov_v_reg(MO_64, cpu_T[0], R_EBP5);
5269 gen_op_mov_reg_v(MO_64, R_ESP4, cpu_T[0]);
5270 } else if (s->ss32) {
5271 gen_op_mov_v_reg(MO_32, cpu_T[0], R_EBP5);
5272 gen_op_mov_reg_v(MO_32, R_ESP4, cpu_T[0]);
5273 } else {
5274 gen_op_mov_v_reg(MO_16, cpu_T[0], R_EBP5);
5275 gen_op_mov_reg_v(MO_16, R_ESP4, cpu_T[0]);
5276 }
5277 ot = gen_pop_T0(s);
5278 gen_op_mov_reg_v(ot, R_EBP5, cpu_T[0]);
5279 gen_pop_update(s, ot);
5280 break;
5281 case 0x06: /* push es */
5282 case 0x0e: /* push cs */
5283 case 0x16: /* push ss */
5284 case 0x1e: /* push ds */
5285 if (CODE64(s)0)
5286 goto illegal_op;
5287 gen_op_movl_T0_seg(b >> 3);
5288 gen_push_v(s, cpu_T[0]);
5289 break;
5290 case 0x1a0: /* push fs */
5291 case 0x1a8: /* push gs */
5292 gen_op_movl_T0_seg((b >> 3) & 7);
5293 gen_push_v(s, cpu_T[0]);
5294 break;
5295 case 0x07: /* pop es */
5296 case 0x17: /* pop ss */
5297 case 0x1f: /* pop ds */
5298 if (CODE64(s)0)
5299 goto illegal_op;
5300 reg = b >> 3;
5301 ot = gen_pop_T0(s);
5302 gen_movl_seg_T0(s, reg, pc_start - s->cs_base);
5303 gen_pop_update(s, ot);
5304 if (reg == R_SS2) {
5305 /* if reg == SS, inhibit interrupts/trace. */
5306 /* If several instructions disable interrupts, only the
5307 _first_ does it */
5308 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK(1 << 3)))
5309 gen_helper_set_inhibit_irq(cpu_env);
5310 s->tf = 0;
5311 }
5312 if (s->is_jmp) {
5313 gen_jmp_im(s->pc - s->cs_base);
5314 gen_eob(s);
5315 }
5316 break;
5317 case 0x1a1: /* pop fs */
5318 case 0x1a9: /* pop gs */
5319 ot = gen_pop_T0(s);
5320 gen_movl_seg_T0(s, (b >> 3) & 7, pc_start - s->cs_base);
5321 gen_pop_update(s, ot);
5322 if (s->is_jmp) {
5323 gen_jmp_im(s->pc - s->cs_base);
5324 gen_eob(s);
5325 }
5326 break;
5327
5328 /**************************/
5329 /* mov */
5330 case 0x88:
5331 case 0x89: /* mov Gv, Ev */
5332 ot = mo_b_d(b, dflag);
5333 modrm = cpu_ldub_code(env, s->pc++);
5334 reg = ((modrm >> 3) & 7) | rex_r;
5335
5336 /* generate a generic store */
5337 gen_ldst_modrm(env, s, modrm, ot, reg, 1);
5338 break;
5339 case 0xc6:
5340 case 0xc7: /* mov Ev, Iv */
5341 ot = mo_b_d(b, dflag);
5342 modrm = cpu_ldub_code(env, s->pc++);
5343 mod = (modrm >> 6) & 3;
5344 if (mod != 3) {
5345 s->rip_offset = insn_const_size(ot);
5346 gen_lea_modrm(env, s, modrm);
5347 }
5348 val = insn_get(env, s, ot);
5349 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], val);
5350 if (mod != 3) {
5351 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
5352 } else {
5353 gen_op_mov_reg_v(ot, (modrm & 7) | REX_B(s)0, cpu_T[0]);
5354 }
5355 break;
5356 case 0x8a:
5357 case 0x8b: /* mov Ev, Gv */
5358 ot = mo_b_d(b, dflag);
5359 modrm = cpu_ldub_code(env, s->pc++);
5360 reg = ((modrm >> 3) & 7) | rex_r;
5361
5362 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
5363 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
5364 break;
5365 case 0x8e: /* mov seg, Gv */
5366 modrm = cpu_ldub_code(env, s->pc++);
5367 reg = (modrm >> 3) & 7;
5368 if (reg >= 6 || reg == R_CS1)
5369 goto illegal_op;
5370 gen_ldst_modrm(env, s, modrm, MO_16, OR_TMP0, 0);
5371 gen_movl_seg_T0(s, reg, pc_start - s->cs_base);
5372 if (reg == R_SS2) {
5373 /* if reg == SS, inhibit interrupts/trace */
5374 /* If several instructions disable interrupts, only the
5375 _first_ does it */
5376 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK(1 << 3)))
5377 gen_helper_set_inhibit_irq(cpu_env);
5378 s->tf = 0;
5379 }
5380 if (s->is_jmp) {
5381 gen_jmp_im(s->pc - s->cs_base);
5382 gen_eob(s);
5383 }
5384 break;
5385 case 0x8c: /* mov Gv, seg */
5386 modrm = cpu_ldub_code(env, s->pc++);
5387 reg = (modrm >> 3) & 7;
5388 mod = (modrm >> 6) & 3;
5389 if (reg >= 6)
5390 goto illegal_op;
5391 gen_op_movl_T0_seg(reg);
5392 ot = mod == 3 ? dflag : MO_16;
5393 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
5394 break;
5395
5396 case 0x1b6: /* movzbS Gv, Eb */
5397 case 0x1b7: /* movzwS Gv, Eb */
5398 case 0x1be: /* movsbS Gv, Eb */
5399 case 0x1bf: /* movswS Gv, Eb */
5400 {
5401 TCGMemOp d_ot;
5402 TCGMemOp s_ot;
5403
5404 /* d_ot is the size of destination */
5405 d_ot = dflag;
5406 /* ot is the size of source */
5407 ot = (b & 1) + MO_8;
5408 /* s_ot is the sign+size of source */
5409 s_ot = b & 8 ? MO_SIGN | ot : ot;
5410
5411 modrm = cpu_ldub_code(env, s->pc++);
5412 reg = ((modrm >> 3) & 7) | rex_r;
5413 mod = (modrm >> 6) & 3;
5414 rm = (modrm & 7) | REX_B(s)0;
5415
5416 if (mod == 3) {
5417 gen_op_mov_v_reg(ot, cpu_T[0], rm);
5418 switch (s_ot) {
5419 case MO_UB:
5420 tcg_gen_ext8u_tltcg_gen_ext8u_i32(cpu_T[0], cpu_T[0]);
5421 break;
5422 case MO_SB:
5423 tcg_gen_ext8s_tltcg_gen_ext8s_i32(cpu_T[0], cpu_T[0]);
5424 break;
5425 case MO_UW:
5426 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[0], cpu_T[0]);
5427 break;
5428 default:
5429 case MO_SW:
5430 tcg_gen_ext16s_tltcg_gen_ext16s_i32(cpu_T[0], cpu_T[0]);
5431 break;
5432 }
5433 gen_op_mov_reg_v(d_ot, reg, cpu_T[0]);
5434 } else {
5435 gen_lea_modrm(env, s, modrm);
5436 gen_op_ld_v(s, s_ot, cpu_T[0], cpu_A0);
5437 gen_op_mov_reg_v(d_ot, reg, cpu_T[0]);
5438 }
5439 }
5440 break;
5441
5442 case 0x8d: /* lea */
5443 ot = dflag;
5444 modrm = cpu_ldub_code(env, s->pc++);
5445 mod = (modrm >> 6) & 3;
5446 if (mod == 3)
5447 goto illegal_op;
5448 reg = ((modrm >> 3) & 7) | rex_r;
5449 /* we must ensure that no segment is added */
5450 s->override = -1;
5451 val = s->addseg;
5452 s->addseg = 0;
5453 gen_lea_modrm(env, s, modrm);
5454 s->addseg = val;
5455 gen_op_mov_reg_v(ot, reg, cpu_A0);
5456 break;
5457
5458 case 0xa0: /* mov EAX, Ov */
5459 case 0xa1:
5460 case 0xa2: /* mov Ov, EAX */
5461 case 0xa3:
5462 {
5463 target_ulong offset_addr;
5464
5465 ot = mo_b_d(b, dflag);
5466 switch (s->aflag) {
5467#ifdef TARGET_X86_64
5468 case MO_64:
5469 offset_addr = cpu_ldq_code(env, s->pc);
5470 s->pc += 8;
5471 break;
5472#endif
5473 default:
5474 offset_addr = insn_get(env, s, s->aflag);
5475 break;
5476 }
5477 tcg_gen_movi_tltcg_gen_movi_i32(cpu_A0, offset_addr);
5478 gen_add_A0_ds_seg(s);
5479 if ((b & 2) == 0) {
5480 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
5481 gen_op_mov_reg_v(ot, R_EAX0, cpu_T[0]);
5482 } else {
5483 gen_op_mov_v_reg(ot, cpu_T[0], R_EAX0);
5484 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
5485 }
5486 }
5487 break;
5488 case 0xd7: /* xlat */
5489 tcg_gen_mov_tltcg_gen_mov_i32(cpu_A0, cpu_regs[R_EBX3]);
5490 tcg_gen_ext8u_tltcg_gen_ext8u_i32(cpu_T[0], cpu_regs[R_EAX0]);
5491 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_T[0]);
5492 gen_extu(s->aflag, cpu_A0);
5493 gen_add_A0_ds_seg(s);
5494 gen_op_ld_v(s, MO_8, cpu_T[0], cpu_A0);
5495 gen_op_mov_reg_v(MO_8, R_EAX0, cpu_T[0]);
5496 break;
5497 case 0xb0 ... 0xb7: /* mov R, Ib */
5498 val = insn_get(env, s, MO_8);
5499 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], val);
5500 gen_op_mov_reg_v(MO_8, (b & 7) | REX_B(s)0, cpu_T[0]);
5501 break;
5502 case 0xb8 ... 0xbf: /* mov R, Iv */
5503#ifdef TARGET_X86_64
5504 if (dflag == MO_64) {
5505 uint64_t tmp;
5506 /* 64 bit case */
5507 tmp = cpu_ldq_code(env, s->pc);
5508 s->pc += 8;
5509 reg = (b & 7) | REX_B(s)0;
5510 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], tmp);
5511 gen_op_mov_reg_v(MO_64, reg, cpu_T[0]);
5512 } else
5513#endif
5514 {
5515 ot = dflag;
5516 val = insn_get(env, s, ot);
5517 reg = (b & 7) | REX_B(s)0;
5518 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], val);
5519 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
5520 }
5521 break;
5522
5523 case 0x91 ... 0x97: /* xchg R, EAX */
5524 do_xchg_reg_eax:
5525 ot = dflag;
5526 reg = (b & 7) | REX_B(s)0;
5527 rm = R_EAX0;
5528 goto do_xchg_reg;
5529 case 0x86:
5530 case 0x87: /* xchg Ev, Gv */
5531 ot = mo_b_d(b, dflag);
5532 modrm = cpu_ldub_code(env, s->pc++);
5533 reg = ((modrm >> 3) & 7) | rex_r;
5534 mod = (modrm >> 6) & 3;
5535 if (mod == 3) {
5536 rm = (modrm & 7) | REX_B(s)0;
5537 do_xchg_reg:
5538 gen_op_mov_v_reg(ot, cpu_T[0], reg);
5539 gen_op_mov_v_reg(ot, cpu_T[1], rm);
5540 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
5541 gen_op_mov_reg_v(ot, reg, cpu_T[1]);
5542 } else {
5543 gen_lea_modrm(env, s, modrm);
5544 gen_op_mov_v_reg(ot, cpu_T[0], reg);
5545 /* for xchg, lock is implicit */
5546 if (!(prefixes & PREFIX_LOCK0x04))
5547 gen_helper_lock();
5548 gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
5549 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
5550 if (!(prefixes & PREFIX_LOCK0x04))
5551 gen_helper_unlock();
5552 gen_op_mov_reg_v(ot, reg, cpu_T[1]);
5553 }
5554 break;
5555 case 0xc4: /* les Gv */
5556 /* In CODE64 this is VEX3; see above. */
5557 op = R_ES0;
5558 goto do_lxx;
5559 case 0xc5: /* lds Gv */
5560 /* In CODE64 this is VEX2; see above. */
5561 op = R_DS3;
5562 goto do_lxx;
5563 case 0x1b2: /* lss Gv */
5564 op = R_SS2;
5565 goto do_lxx;
5566 case 0x1b4: /* lfs Gv */
5567 op = R_FS4;
5568 goto do_lxx;
5569 case 0x1b5: /* lgs Gv */
5570 op = R_GS5;
5571 do_lxx:
5572 ot = dflag != MO_16 ? MO_32 : MO_16;
5573 modrm = cpu_ldub_code(env, s->pc++);
5574 reg = ((modrm >> 3) & 7) | rex_r;
5575 mod = (modrm >> 6) & 3;
5576 if (mod == 3)
5577 goto illegal_op;
5578 gen_lea_modrm(env, s, modrm);
5579 gen_op_ld_v(s, ot, cpu_T[1], cpu_A0);
5580 gen_add_A0_im(s, 1 << ot);
5581 /* load the segment first to handle exceptions properly */
5582 gen_op_ld_v(s, MO_16, cpu_T[0], cpu_A0);
5583 gen_movl_seg_T0(s, op, pc_start - s->cs_base);
5584 /* then put the data */
5585 gen_op_mov_reg_v(ot, reg, cpu_T[1]);
5586 if (s->is_jmp) {
5587 gen_jmp_im(s->pc - s->cs_base);
5588 gen_eob(s);
5589 }
5590 break;
5591
5592 /************************/
5593 /* shifts */
5594 case 0xc0:
5595 case 0xc1:
5596 /* shift Ev,Ib */
5597 shift = 2;
5598 grp2:
5599 {
5600 ot = mo_b_d(b, dflag);
5601 modrm = cpu_ldub_code(env, s->pc++);
5602 mod = (modrm >> 6) & 3;
5603 op = (modrm >> 3) & 7;
5604
5605 if (mod != 3) {
5606 if (shift == 2) {
5607 s->rip_offset = 1;
5608 }
5609 gen_lea_modrm(env, s, modrm);
5610 opreg = OR_TMP0;
5611 } else {
5612 opreg = (modrm & 7) | REX_B(s)0;
5613 }
5614
5615 /* simpler op */
5616 if (shift == 0) {
5617 gen_shift(s, op, ot, opreg, OR_ECX);
5618 } else {
5619 if (shift == 2) {
5620 shift = cpu_ldub_code(env, s->pc++);
5621 }
5622 gen_shifti(s, op, ot, opreg, shift);
5623 }
5624 }
5625 break;
5626 case 0xd0:
5627 case 0xd1:
5628 /* shift Ev,1 */
5629 shift = 1;
5630 goto grp2;
5631 case 0xd2:
5632 case 0xd3:
5633 /* shift Ev,cl */
5634 shift = 0;
5635 goto grp2;
5636
5637 case 0x1a4: /* shld imm */
5638 op = 0;
5639 shift = 1;
5640 goto do_shiftd;
5641 case 0x1a5: /* shld cl */
5642 op = 0;
5643 shift = 0;
5644 goto do_shiftd;
5645 case 0x1ac: /* shrd imm */
5646 op = 1;
5647 shift = 1;
5648 goto do_shiftd;
5649 case 0x1ad: /* shrd cl */
5650 op = 1;
5651 shift = 0;
5652 do_shiftd:
5653 ot = dflag;
5654 modrm = cpu_ldub_code(env, s->pc++);
5655 mod = (modrm >> 6) & 3;
5656 rm = (modrm & 7) | REX_B(s)0;
5657 reg = ((modrm >> 3) & 7) | rex_r;
5658 if (mod != 3) {
5659 gen_lea_modrm(env, s, modrm);
5660 opreg = OR_TMP0;
5661 } else {
5662 opreg = rm;
5663 }
5664 gen_op_mov_v_reg(ot, cpu_T[1], reg);
5665
5666 if (shift) {
5667 TCGvTCGv_i32 imm = tcg_const_tltcg_const_i32(cpu_ldub_code(env, s->pc++));
5668 gen_shiftd_rm_T1(s, ot, opreg, op, imm);
5669 tcg_temp_freetcg_temp_free_i32(imm);
5670 } else {
5671 gen_shiftd_rm_T1(s, ot, opreg, op, cpu_regs[R_ECX1]);
5672 }
5673 break;
5674
5675 /************************/
5676 /* floats */
5677 case 0xd8 ... 0xdf:
5678 if (s->flags & (HF_EM_MASK(1 << 10) | HF_TS_MASK(1 << 11))) {
5679 /* if CR0.EM or CR0.TS are set, generate an FPU exception */
5680 /* XXX: what to do if illegal op ? */
5681 gen_exception(s, EXCP07_PREX7, pc_start - s->cs_base);
5682 break;
5683 }
5684 modrm = cpu_ldub_code(env, s->pc++);
5685 mod = (modrm >> 6) & 3;
5686 rm = modrm & 7;
5687 op = ((b & 7) << 3) | ((modrm >> 3) & 7);
5688 if (mod != 3) {
5689 /* memory op */
5690 gen_lea_modrm(env, s, modrm);
5691 switch(op) {
5692 case 0x00 ... 0x07: /* fxxxs */
5693 case 0x10 ... 0x17: /* fixxxl */
5694 case 0x20 ... 0x27: /* fxxxl */
5695 case 0x30 ... 0x37: /* fixxx */
5696 {
5697 int op1;
5698 op1 = op & 7;
5699
5700 switch(op >> 4) {
5701 case 0:
5702 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
5703 s->mem_index, MO_LEUL);
5704 gen_helper_flds_FT0(cpu_env, cpu_tmp2_i32);
5705 break;
5706 case 1:
5707 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
5708 s->mem_index, MO_LEUL);
5709 gen_helper_fildl_FT0(cpu_env, cpu_tmp2_i32);
5710 break;
5711 case 2:
5712 tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_A0,
5713 s->mem_index, MO_LEQ);
5714 gen_helper_fldl_FT0(cpu_env, cpu_tmp1_i64);
5715 break;
5716 case 3:
5717 default:
5718 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
5719 s->mem_index, MO_LESW);
5720 gen_helper_fildl_FT0(cpu_env, cpu_tmp2_i32);
5721 break;
5722 }
5723
5724 gen_helper_fp_arith_ST0_FT0(op1);
5725 if (op1 == 3) {
5726 /* fcomp needs pop */
5727 gen_helper_fpop(cpu_env);
5728 }
5729 }
5730 break;
5731 case 0x08: /* flds */
5732 case 0x0a: /* fsts */
5733 case 0x0b: /* fstps */
5734 case 0x18 ... 0x1b: /* fildl, fisttpl, fistl, fistpl */
5735 case 0x28 ... 0x2b: /* fldl, fisttpll, fstl, fstpl */
5736 case 0x38 ... 0x3b: /* filds, fisttps, fists, fistps */
5737 switch(op & 7) {
5738 case 0:
5739 switch(op >> 4) {
5740 case 0:
5741 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
5742 s->mem_index, MO_LEUL);
5743 gen_helper_flds_ST0(cpu_env, cpu_tmp2_i32);
5744 break;
5745 case 1:
5746 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
5747 s->mem_index, MO_LEUL);
5748 gen_helper_fildl_ST0(cpu_env, cpu_tmp2_i32);
5749 break;
5750 case 2:
5751 tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_A0,
5752 s->mem_index, MO_LEQ);
5753 gen_helper_fldl_ST0(cpu_env, cpu_tmp1_i64);
5754 break;
5755 case 3:
5756 default:
5757 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
5758 s->mem_index, MO_LESW);
5759 gen_helper_fildl_ST0(cpu_env, cpu_tmp2_i32);
5760 break;
5761 }
5762 break;
5763 case 1:
5764 /* XXX: the corresponding CPUID bit must be tested ! */
5765 switch(op >> 4) {
5766 case 1:
5767 gen_helper_fisttl_ST0(cpu_tmp2_i32, cpu_env);
5768 tcg_gen_qemu_st_i32(cpu_tmp2_i32, cpu_A0,
5769 s->mem_index, MO_LEUL);
5770 break;
5771 case 2:
5772 gen_helper_fisttll_ST0(cpu_tmp1_i64, cpu_env);
5773 tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_A0,
5774 s->mem_index, MO_LEQ);
5775 break;
5776 case 3:
5777 default:
5778 gen_helper_fistt_ST0(cpu_tmp2_i32, cpu_env);
5779 tcg_gen_qemu_st_i32(cpu_tmp2_i32, cpu_A0,
5780 s->mem_index, MO_LEUW);
5781 break;
5782 }
5783 gen_helper_fpop(cpu_env);
5784 break;
5785 default:
5786 switch(op >> 4) {
5787 case 0:
5788 gen_helper_fsts_ST0(cpu_tmp2_i32, cpu_env);
5789 tcg_gen_qemu_st_i32(cpu_tmp2_i32, cpu_A0,
5790 s->mem_index, MO_LEUL);
5791 break;
5792 case 1:
5793 gen_helper_fistl_ST0(cpu_tmp2_i32, cpu_env);
5794 tcg_gen_qemu_st_i32(cpu_tmp2_i32, cpu_A0,
5795 s->mem_index, MO_LEUL);
5796 break;
5797 case 2:
5798 gen_helper_fstl_ST0(cpu_tmp1_i64, cpu_env);
5799 tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_A0,
5800 s->mem_index, MO_LEQ);
5801 break;
5802 case 3:
5803 default:
5804 gen_helper_fist_ST0(cpu_tmp2_i32, cpu_env);
5805 tcg_gen_qemu_st_i32(cpu_tmp2_i32, cpu_A0,
5806 s->mem_index, MO_LEUW);
5807 break;
5808 }
5809 if ((op & 7) == 3)
5810 gen_helper_fpop(cpu_env);
5811 break;
5812 }
5813 break;
5814 case 0x0c: /* fldenv mem */
5815 gen_update_cc_op(s);
5816 gen_jmp_im(pc_start - s->cs_base);
5817 gen_helper_fldenv(cpu_env, cpu_A0, tcg_const_i32(dflag - 1));
5818 break;
5819 case 0x0d: /* fldcw mem */
5820 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
5821 s->mem_index, MO_LEUW);
5822 gen_helper_fldcw(cpu_env, cpu_tmp2_i32);
5823 break;
5824 case 0x0e: /* fnstenv mem */
5825 gen_update_cc_op(s);
5826 gen_jmp_im(pc_start - s->cs_base);
5827 gen_helper_fstenv(cpu_env, cpu_A0, tcg_const_i32(dflag - 1));
5828 break;
5829 case 0x0f: /* fnstcw mem */
5830 gen_helper_fnstcw(cpu_tmp2_i32, cpu_env);
5831 tcg_gen_qemu_st_i32(cpu_tmp2_i32, cpu_A0,
5832 s->mem_index, MO_LEUW);
5833 break;
5834 case 0x1d: /* fldt mem */
5835 gen_update_cc_op(s);
5836 gen_jmp_im(pc_start - s->cs_base);
5837 gen_helper_fldt_ST0(cpu_env, cpu_A0);
5838 break;
5839 case 0x1f: /* fstpt mem */
5840 gen_update_cc_op(s);
5841 gen_jmp_im(pc_start - s->cs_base);
5842 gen_helper_fstt_ST0(cpu_env, cpu_A0);
5843 gen_helper_fpop(cpu_env);
5844 break;
5845 case 0x2c: /* frstor mem */
5846 gen_update_cc_op(s);
5847 gen_jmp_im(pc_start - s->cs_base);
5848 gen_helper_frstor(cpu_env, cpu_A0, tcg_const_i32(dflag - 1));
5849 break;
5850 case 0x2e: /* fnsave mem */
5851 gen_update_cc_op(s);
5852 gen_jmp_im(pc_start - s->cs_base);
5853 gen_helper_fsave(cpu_env, cpu_A0, tcg_const_i32(dflag - 1));
5854 break;
5855 case 0x2f: /* fnstsw mem */
5856 gen_helper_fnstsw(cpu_tmp2_i32, cpu_env);
5857 tcg_gen_qemu_st_i32(cpu_tmp2_i32, cpu_A0,
5858 s->mem_index, MO_LEUW);
5859 break;
5860 case 0x3c: /* fbld */
5861 gen_update_cc_op(s);
5862 gen_jmp_im(pc_start - s->cs_base);
5863 gen_helper_fbld_ST0(cpu_env, cpu_A0);
5864 break;
5865 case 0x3e: /* fbstp */
5866 gen_update_cc_op(s);
5867 gen_jmp_im(pc_start - s->cs_base);
5868 gen_helper_fbst_ST0(cpu_env, cpu_A0);
5869 gen_helper_fpop(cpu_env);
5870 break;
5871 case 0x3d: /* fildll */
5872 tcg_gen_qemu_ld_i64(cpu_tmp1_i64, cpu_A0, s->mem_index, MO_LEQ);
5873 gen_helper_fildll_ST0(cpu_env, cpu_tmp1_i64);
5874 break;
5875 case 0x3f: /* fistpll */
5876 gen_helper_fistll_ST0(cpu_tmp1_i64, cpu_env);
5877 tcg_gen_qemu_st_i64(cpu_tmp1_i64, cpu_A0, s->mem_index, MO_LEQ);
5878 gen_helper_fpop(cpu_env);
5879 break;
5880 default:
5881 goto illegal_op;
5882 }
5883 } else {
5884 /* register float ops */
5885 opreg = rm;
5886
5887 switch(op) {
5888 case 0x08: /* fld sti */
5889 gen_helper_fpush(cpu_env);
5890 gen_helper_fmov_ST0_STN(cpu_env,
5891 tcg_const_i32((opreg + 1) & 7));
5892 break;
5893 case 0x09: /* fxchg sti */
5894 case 0x29: /* fxchg4 sti, undocumented op */
5895 case 0x39: /* fxchg7 sti, undocumented op */
5896 gen_helper_fxchg_ST0_STN(cpu_env, tcg_const_i32(opreg));
5897 break;
5898 case 0x0a: /* grp d9/2 */
5899 switch(rm) {
5900 case 0: /* fnop */
5901 /* check exceptions (FreeBSD FPU probe) */
5902 gen_update_cc_op(s);
5903 gen_jmp_im(pc_start - s->cs_base);
5904 gen_helper_fwait(cpu_env);
5905 break;
5906 default:
5907 goto illegal_op;
5908 }
5909 break;
5910 case 0x0c: /* grp d9/4 */
5911 switch(rm) {
5912 case 0: /* fchs */
5913 gen_helper_fchs_ST0(cpu_env);
5914 break;
5915 case 1: /* fabs */
5916 gen_helper_fabs_ST0(cpu_env);
5917 break;
5918 case 4: /* ftst */
5919 gen_helper_fldz_FT0(cpu_env);
5920 gen_helper_fcom_ST0_FT0(cpu_env);
5921 break;
5922 case 5: /* fxam */
5923 gen_helper_fxam_ST0(cpu_env);
5924 break;
5925 default:
5926 goto illegal_op;
5927 }
5928 break;
5929 case 0x0d: /* grp d9/5 */
5930 {
5931 switch(rm) {
5932 case 0:
5933 gen_helper_fpush(cpu_env);
5934 gen_helper_fld1_ST0(cpu_env);
5935 break;
5936 case 1:
5937 gen_helper_fpush(cpu_env);
5938 gen_helper_fldl2t_ST0(cpu_env);
5939 break;
5940 case 2:
5941 gen_helper_fpush(cpu_env);
5942 gen_helper_fldl2e_ST0(cpu_env);
5943 break;
5944 case 3:
5945 gen_helper_fpush(cpu_env);
5946 gen_helper_fldpi_ST0(cpu_env);
5947 break;
5948 case 4:
5949 gen_helper_fpush(cpu_env);
5950 gen_helper_fldlg2_ST0(cpu_env);
5951 break;
5952 case 5:
5953 gen_helper_fpush(cpu_env);
5954 gen_helper_fldln2_ST0(cpu_env);
5955 break;
5956 case 6:
5957 gen_helper_fpush(cpu_env);
5958 gen_helper_fldz_ST0(cpu_env);
5959 break;
5960 default:
5961 goto illegal_op;
5962 }
5963 }
5964 break;
5965 case 0x0e: /* grp d9/6 */
5966 switch(rm) {
5967 case 0: /* f2xm1 */
5968 gen_helper_f2xm1(cpu_env);
5969 break;
5970 case 1: /* fyl2x */
5971 gen_helper_fyl2x(cpu_env);
5972 break;
5973 case 2: /* fptan */
5974 gen_helper_fptan(cpu_env);
5975 break;
5976 case 3: /* fpatan */
5977 gen_helper_fpatan(cpu_env);
5978 break;
5979 case 4: /* fxtract */
5980 gen_helper_fxtract(cpu_env);
5981 break;
5982 case 5: /* fprem1 */
5983 gen_helper_fprem1(cpu_env);
5984 break;
5985 case 6: /* fdecstp */
5986 gen_helper_fdecstp(cpu_env);
5987 break;
5988 default:
5989 case 7: /* fincstp */
5990 gen_helper_fincstp(cpu_env);
5991 break;
5992 }
5993 break;
5994 case 0x0f: /* grp d9/7 */
5995 switch(rm) {
5996 case 0: /* fprem */
5997 gen_helper_fprem(cpu_env);
5998 break;
5999 case 1: /* fyl2xp1 */
6000 gen_helper_fyl2xp1(cpu_env);
6001 break;
6002 case 2: /* fsqrt */
6003 gen_helper_fsqrt(cpu_env);
6004 break;
6005 case 3: /* fsincos */
6006 gen_helper_fsincos(cpu_env);
6007 break;
6008 case 5: /* fscale */
6009 gen_helper_fscale(cpu_env);
6010 break;
6011 case 4: /* frndint */
6012 gen_helper_frndint(cpu_env);
6013 break;
6014 case 6: /* fsin */
6015 gen_helper_fsin(cpu_env);
6016 break;
6017 default:
6018 case 7: /* fcos */
6019 gen_helper_fcos(cpu_env);
6020 break;
6021 }
6022 break;
6023 case 0x00: case 0x01: case 0x04 ... 0x07: /* fxxx st, sti */
6024 case 0x20: case 0x21: case 0x24 ... 0x27: /* fxxx sti, st */
6025 case 0x30: case 0x31: case 0x34 ... 0x37: /* fxxxp sti, st */
6026 {
6027 int op1;
6028
6029 op1 = op & 7;
6030 if (op >= 0x20) {
6031 gen_helper_fp_arith_STN_ST0(op1, opreg);
6032 if (op >= 0x30)
6033 gen_helper_fpop(cpu_env);
6034 } else {
6035 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6036 gen_helper_fp_arith_ST0_FT0(op1);
6037 }
6038 }
6039 break;
6040 case 0x02: /* fcom */
6041 case 0x22: /* fcom2, undocumented op */
6042 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6043 gen_helper_fcom_ST0_FT0(cpu_env);
6044 break;
6045 case 0x03: /* fcomp */
6046 case 0x23: /* fcomp3, undocumented op */
6047 case 0x32: /* fcomp5, undocumented op */
6048 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6049 gen_helper_fcom_ST0_FT0(cpu_env);
6050 gen_helper_fpop(cpu_env);
6051 break;
6052 case 0x15: /* da/5 */
6053 switch(rm) {
6054 case 1: /* fucompp */
6055 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(1));
6056 gen_helper_fucom_ST0_FT0(cpu_env);
6057 gen_helper_fpop(cpu_env);
6058 gen_helper_fpop(cpu_env);
6059 break;
6060 default:
6061 goto illegal_op;
6062 }
6063 break;
6064 case 0x1c:
6065 switch(rm) {
6066 case 0: /* feni (287 only, just do nop here) */
6067 break;
6068 case 1: /* fdisi (287 only, just do nop here) */
6069 break;
6070 case 2: /* fclex */
6071 gen_helper_fclex(cpu_env);
6072 break;
6073 case 3: /* fninit */
6074 gen_helper_fninit(cpu_env);
6075 break;
6076 case 4: /* fsetpm (287 only, just do nop here) */
6077 break;
6078 default:
6079 goto illegal_op;
6080 }
6081 break;
6082 case 0x1d: /* fucomi */
6083 if (!(s->cpuid_features & CPUID_CMOV(1 << 15))) {
6084 goto illegal_op;
6085 }
6086 gen_update_cc_op(s);
6087 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6088 gen_helper_fucomi_ST0_FT0(cpu_env);
6089 set_cc_op(s, CC_OP_EFLAGS);
6090 break;
6091 case 0x1e: /* fcomi */
6092 if (!(s->cpuid_features & CPUID_CMOV(1 << 15))) {
6093 goto illegal_op;
6094 }
6095 gen_update_cc_op(s);
6096 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6097 gen_helper_fcomi_ST0_FT0(cpu_env);
6098 set_cc_op(s, CC_OP_EFLAGS);
6099 break;
6100 case 0x28: /* ffree sti */
6101 gen_helper_ffree_STN(cpu_env, tcg_const_i32(opreg));
6102 break;
6103 case 0x2a: /* fst sti */
6104 gen_helper_fmov_STN_ST0(cpu_env, tcg_const_i32(opreg));
6105 break;
6106 case 0x2b: /* fstp sti */
6107 case 0x0b: /* fstp1 sti, undocumented op */
6108 case 0x3a: /* fstp8 sti, undocumented op */
6109 case 0x3b: /* fstp9 sti, undocumented op */
6110 gen_helper_fmov_STN_ST0(cpu_env, tcg_const_i32(opreg));
6111 gen_helper_fpop(cpu_env);
6112 break;
6113 case 0x2c: /* fucom st(i) */
6114 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6115 gen_helper_fucom_ST0_FT0(cpu_env);
6116 break;
6117 case 0x2d: /* fucomp st(i) */
6118 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6119 gen_helper_fucom_ST0_FT0(cpu_env);
6120 gen_helper_fpop(cpu_env);
6121 break;
6122 case 0x33: /* de/3 */
6123 switch(rm) {
6124 case 1: /* fcompp */
6125 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(1));
6126 gen_helper_fcom_ST0_FT0(cpu_env);
6127 gen_helper_fpop(cpu_env);
6128 gen_helper_fpop(cpu_env);
6129 break;
6130 default:
6131 goto illegal_op;
6132 }
6133 break;
6134 case 0x38: /* ffreep sti, undocumented op */
6135 gen_helper_ffree_STN(cpu_env, tcg_const_i32(opreg));
6136 gen_helper_fpop(cpu_env);
6137 break;
6138 case 0x3c: /* df/4 */
6139 switch(rm) {
6140 case 0:
6141 gen_helper_fnstsw(cpu_tmp2_i32, cpu_env);
6142 tcg_gen_extu_i32_tltcg_gen_mov_i32(cpu_T[0], cpu_tmp2_i32);
6143 gen_op_mov_reg_v(MO_16, R_EAX0, cpu_T[0]);
6144 break;
6145 default:
6146 goto illegal_op;
6147 }
6148 break;
6149 case 0x3d: /* fucomip */
6150 if (!(s->cpuid_features & CPUID_CMOV(1 << 15))) {
6151 goto illegal_op;
6152 }
6153 gen_update_cc_op(s);
6154 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6155 gen_helper_fucomi_ST0_FT0(cpu_env);
6156 gen_helper_fpop(cpu_env);
6157 set_cc_op(s, CC_OP_EFLAGS);
6158 break;
6159 case 0x3e: /* fcomip */
6160 if (!(s->cpuid_features & CPUID_CMOV(1 << 15))) {
6161 goto illegal_op;
6162 }
6163 gen_update_cc_op(s);
6164 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6165 gen_helper_fcomi_ST0_FT0(cpu_env);
6166 gen_helper_fpop(cpu_env);
6167 set_cc_op(s, CC_OP_EFLAGS);
6168 break;
6169 case 0x10 ... 0x13: /* fcmovxx */
6170 case 0x18 ... 0x1b:
6171 {
6172 int op1, l1;
6173 static const uint8_t fcmov_cc[8] = {
6174 (JCC_B << 1),
6175 (JCC_Z << 1),
6176 (JCC_BE << 1),
6177 (JCC_P << 1),
6178 };
6179
6180 if (!(s->cpuid_features & CPUID_CMOV(1 << 15))) {
6181 goto illegal_op;
6182 }
6183 op1 = fcmov_cc[op & 3] | (((op >> 3) & 1) ^ 1);
6184 l1 = gen_new_label();
6185 gen_jcc1_noeob(s, op1, l1);
6186 gen_helper_fmov_ST0_STN(cpu_env, tcg_const_i32(opreg));
6187 gen_set_label(l1);
6188 }
6189 break;
6190 default:
6191 goto illegal_op;
6192 }
6193 }
6194 break;
6195 /************************/
6196 /* string ops */
6197
6198 case 0xa4: /* movsS */
6199 case 0xa5:
6200 ot = mo_b_d(b, dflag);
6201 if (prefixes & (PREFIX_REPZ0x01 | PREFIX_REPNZ0x02)) {
6202 gen_repz_movs(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6203 } else {
6204 gen_movs(s, ot);
6205 }
6206 break;
6207
6208 case 0xaa: /* stosS */
6209 case 0xab:
6210 ot = mo_b_d(b, dflag);
6211 if (prefixes & (PREFIX_REPZ0x01 | PREFIX_REPNZ0x02)) {
6212 gen_repz_stos(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6213 } else {
6214 gen_stos(s, ot);
6215 }
6216 break;
6217 case 0xac: /* lodsS */
6218 case 0xad:
6219 ot = mo_b_d(b, dflag);
6220 if (prefixes & (PREFIX_REPZ0x01 | PREFIX_REPNZ0x02)) {
6221 gen_repz_lods(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6222 } else {
6223 gen_lods(s, ot);
6224 }
6225 break;
6226 case 0xae: /* scasS */
6227 case 0xaf:
6228 ot = mo_b_d(b, dflag);
6229 if (prefixes & PREFIX_REPNZ0x02) {
6230 gen_repz_scas(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 1);
6231 } else if (prefixes & PREFIX_REPZ0x01) {
6232 gen_repz_scas(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 0);
6233 } else {
6234 gen_scas(s, ot);
6235 }
6236 break;
6237
6238 case 0xa6: /* cmpsS */
6239 case 0xa7:
6240 ot = mo_b_d(b, dflag);
6241 if (prefixes & PREFIX_REPNZ0x02) {
6242 gen_repz_cmps(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 1);
6243 } else if (prefixes & PREFIX_REPZ0x01) {
6244 gen_repz_cmps(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 0);
6245 } else {
6246 gen_cmps(s, ot);
6247 }
6248 break;
6249 case 0x6c: /* insS */
6250 case 0x6d:
6251 ot = mo_b_d32(b, dflag);
6252 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[0], cpu_regs[R_EDX2]);
6253 gen_check_io(s, ot, pc_start - s->cs_base,
6254 SVM_IOIO_TYPE_MASK1 | svm_is_rep(prefixes) | 4);
6255 if (prefixes & (PREFIX_REPZ0x01 | PREFIX_REPNZ0x02)) {
6256 gen_repz_ins(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6257 } else {
6258 gen_ins(s, ot);
6259 if (use_icount) {
6260 gen_jmp(s, s->pc - s->cs_base);
6261 }
6262 }
6263 break;
6264 case 0x6e: /* outsS */
6265 case 0x6f:
6266 ot = mo_b_d32(b, dflag);
6267 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[0], cpu_regs[R_EDX2]);
6268 gen_check_io(s, ot, pc_start - s->cs_base,
6269 svm_is_rep(prefixes) | 4);
6270 if (prefixes & (PREFIX_REPZ0x01 | PREFIX_REPNZ0x02)) {
6271 gen_repz_outs(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6272 } else {
6273 gen_outs(s, ot);
6274 if (use_icount) {
6275 gen_jmp(s, s->pc - s->cs_base);
6276 }
6277 }
6278 break;
6279
6280 /************************/
6281 /* port I/O */
6282
6283 case 0xe4:
6284 case 0xe5:
6285 ot = mo_b_d32(b, dflag);
6286 val = cpu_ldub_code(env, s->pc++);
6287 gen_check_io(s, ot, pc_start - s->cs_base,
6288 SVM_IOIO_TYPE_MASK1 | svm_is_rep(prefixes));
6289 if (use_icount)
6290 gen_io_start();
6291 tcg_gen_movi_i32(cpu_tmp2_i32, val);
6292 gen_helper_in_func(ot, cpu_T[1], cpu_tmp2_i32);
6293 gen_op_mov_reg_v(ot, R_EAX0, cpu_T[1]);
6294 if (use_icount) {
6295 gen_io_end();
6296 gen_jmp(s, s->pc - s->cs_base);
6297 }
6298 break;
6299 case 0xe6:
6300 case 0xe7:
6301 ot = mo_b_d32(b, dflag);
6302 val = cpu_ldub_code(env, s->pc++);
6303 gen_check_io(s, ot, pc_start - s->cs_base,
6304 svm_is_rep(prefixes));
6305 gen_op_mov_v_reg(ot, cpu_T[1], R_EAX0);
6306
6307 if (use_icount)
6308 gen_io_start();
6309 tcg_gen_movi_i32(cpu_tmp2_i32, val);
6310 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp3_i32, cpu_T[1]);
6311 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
6312 if (use_icount) {
6313 gen_io_end();
6314 gen_jmp(s, s->pc - s->cs_base);
6315 }
6316 break;
6317 case 0xec:
6318 case 0xed:
6319 ot = mo_b_d32(b, dflag);
6320 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[0], cpu_regs[R_EDX2]);
6321 gen_check_io(s, ot, pc_start - s->cs_base,
6322 SVM_IOIO_TYPE_MASK1 | svm_is_rep(prefixes));
6323 if (use_icount)
6324 gen_io_start();
6325 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
6326 gen_helper_in_func(ot, cpu_T[1], cpu_tmp2_i32);
6327 gen_op_mov_reg_v(ot, R_EAX0, cpu_T[1]);
6328 if (use_icount) {
6329 gen_io_end();
6330 gen_jmp(s, s->pc - s->cs_base);
6331 }
6332 break;
6333 case 0xee:
6334 case 0xef:
6335 ot = mo_b_d32(b, dflag);
6336 tcg_gen_ext16u_tltcg_gen_ext16u_i32(cpu_T[0], cpu_regs[R_EDX2]);
6337 gen_check_io(s, ot, pc_start - s->cs_base,
6338 svm_is_rep(prefixes));
6339 gen_op_mov_v_reg(ot, cpu_T[1], R_EAX0);
6340
6341 if (use_icount)
6342 gen_io_start();
6343 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
6344 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp3_i32, cpu_T[1]);
6345 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
6346 if (use_icount) {
6347 gen_io_end();
6348 gen_jmp(s, s->pc - s->cs_base);
6349 }
6350 break;
6351
6352 /************************/
6353 /* control */
6354 case 0xc2: /* ret im */
6355 val = cpu_ldsw_code(env, s->pc);
6356 s->pc += 2;
6357 ot = gen_pop_T0(s);
6358 gen_stack_update(s, val + (1 << ot));
6359 /* Note that gen_pop_T0 uses a zero-extending load. */
6360 gen_op_jmp_v(cpu_T[0]);
6361 gen_eob(s);
6362 break;
6363 case 0xc3: /* ret */
6364 ot = gen_pop_T0(s);
6365 gen_pop_update(s, ot);
6366 /* Note that gen_pop_T0 uses a zero-extending load. */
6367 gen_op_jmp_v(cpu_T[0]);
6368 gen_eob(s);
6369 break;
6370 case 0xca: /* lret im */
6371 val = cpu_ldsw_code(env, s->pc);
6372 s->pc += 2;
6373 do_lret:
6374 if (s->pe && !s->vm86) {
6375 gen_update_cc_op(s);
6376 gen_jmp_im(pc_start - s->cs_base);
6377 gen_helper_lret_protected(cpu_env, tcg_const_i32(dflag - 1),
6378 tcg_const_i32(val));
6379 } else {
6380 gen_stack_A0(s);
6381 /* pop offset */
6382 gen_op_ld_v(s, dflag, cpu_T[0], cpu_A0);
6383 /* NOTE: keeping EIP updated is not a problem in case of
6384 exception */
6385 gen_op_jmp_v(cpu_T[0]);
6386 /* pop selector */
6387 gen_op_addl_A0_im(1 << dflag);
6388 gen_op_ld_v(s, dflag, cpu_T[0], cpu_A0);
6389 gen_op_movl_seg_T0_vm(R_CS1);
6390 /* add stack offset */
6391 gen_stack_update(s, val + (2 << dflag));
6392 }
6393 gen_eob(s);
6394 break;
6395 case 0xcb: /* lret */
6396 val = 0;
6397 goto do_lret;
6398 case 0xcf: /* iret */
6399 gen_svm_check_intercept(s, pc_start, SVM_EXIT_IRET0x074);
6400 if (!s->pe) {
6401 /* real mode */
6402 gen_helper_iret_real(cpu_env, tcg_const_i32(dflag - 1));
6403 set_cc_op(s, CC_OP_EFLAGS);
6404 } else if (s->vm86) {
6405 if (s->iopl != 3) {
6406 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
6407 } else {
6408 gen_helper_iret_real(cpu_env, tcg_const_i32(dflag - 1));
6409 set_cc_op(s, CC_OP_EFLAGS);
6410 }
6411 } else {
6412 gen_update_cc_op(s);
6413 gen_jmp_im(pc_start - s->cs_base);
6414 gen_helper_iret_protected(cpu_env, tcg_const_i32(dflag - 1),
6415 tcg_const_i32(s->pc - s->cs_base));
6416 set_cc_op(s, CC_OP_EFLAGS);
6417 }
6418 gen_eob(s);
6419 break;
6420 case 0xe8: /* call im */
6421 {
6422 if (dflag != MO_16) {
6423 tval = (int32_t)insn_get(env, s, MO_32);
6424 } else {
6425 tval = (int16_t)insn_get(env, s, MO_16);
6426 }
6427 next_eip = s->pc - s->cs_base;
6428 tval += next_eip;
6429 if (dflag == MO_16) {
6430 tval &= 0xffff;
6431 } else if (!CODE64(s)0) {
6432 tval &= 0xffffffff;
6433 }
6434 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], next_eip);
6435 gen_push_v(s, cpu_T[0]);
6436 gen_jmp(s, tval);
6437 }
6438 break;
6439 case 0x9a: /* lcall im */
6440 {
6441 unsigned int selector, offset;
6442
6443 if (CODE64(s)0)
6444 goto illegal_op;
6445 ot = dflag;
6446 offset = insn_get(env, s, ot);
6447 selector = insn_get(env, s, MO_16);
6448
6449 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], selector);
6450 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], offset);
6451 }
6452 goto do_lcall;
6453 case 0xe9: /* jmp im */
6454 if (dflag != MO_16) {
6455 tval = (int32_t)insn_get(env, s, MO_32);
6456 } else {
6457 tval = (int16_t)insn_get(env, s, MO_16);
6458 }
6459 tval += s->pc - s->cs_base;
6460 if (dflag == MO_16) {
6461 tval &= 0xffff;
6462 } else if (!CODE64(s)0) {
6463 tval &= 0xffffffff;
6464 }
6465 gen_jmp(s, tval);
6466 break;
6467 case 0xea: /* ljmp im */
6468 {
6469 unsigned int selector, offset;
6470
6471 if (CODE64(s)0)
6472 goto illegal_op;
6473 ot = dflag;
6474 offset = insn_get(env, s, ot);
6475 selector = insn_get(env, s, MO_16);
6476
6477 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[0], selector);
6478 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], offset);
6479 }
6480 goto do_ljmp;
6481 case 0xeb: /* jmp Jb */
6482 tval = (int8_t)insn_get(env, s, MO_8);
6483 tval += s->pc - s->cs_base;
6484 if (dflag == MO_16) {
6485 tval &= 0xffff;
6486 }
6487 gen_jmp(s, tval);
6488 break;
6489 case 0x70 ... 0x7f: /* jcc Jb */
6490 tval = (int8_t)insn_get(env, s, MO_8);
6491 goto do_jcc;
6492 case 0x180 ... 0x18f: /* jcc Jv */
6493 if (dflag != MO_16) {
6494 tval = (int32_t)insn_get(env, s, MO_32);
6495 } else {
6496 tval = (int16_t)insn_get(env, s, MO_16);
6497 }
6498 do_jcc:
6499 next_eip = s->pc - s->cs_base;
6500 tval += next_eip;
6501 if (dflag == MO_16) {
6502 tval &= 0xffff;
6503 }
6504 gen_jcc(s, b, tval, next_eip);
6505 break;
6506
6507 case 0x190 ... 0x19f: /* setcc Gv */
6508 modrm = cpu_ldub_code(env, s->pc++);
6509 gen_setcc1(s, b, cpu_T[0]);
6510 gen_ldst_modrm(env, s, modrm, MO_8, OR_TMP0, 1);
6511 break;
6512 case 0x140 ... 0x14f: /* cmov Gv, Ev */
6513 if (!(s->cpuid_features & CPUID_CMOV(1 << 15))) {
6514 goto illegal_op;
6515 }
6516 ot = dflag;
6517 modrm = cpu_ldub_code(env, s->pc++);
6518 reg = ((modrm >> 3) & 7) | rex_r;
6519 gen_cmovcc1(env, s, ot, b, modrm, reg);
6520 break;
6521
6522 /************************/
6523 /* flags */
6524 case 0x9c: /* pushf */
6525 gen_svm_check_intercept(s, pc_start, SVM_EXIT_PUSHF0x070);
6526 if (s->vm86 && s->iopl != 3) {
6527 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
6528 } else {
6529 gen_update_cc_op(s);
6530 gen_helper_read_eflags(cpu_T[0], cpu_env);
6531 gen_push_v(s, cpu_T[0]);
6532 }
6533 break;
6534 case 0x9d: /* popf */
6535 gen_svm_check_intercept(s, pc_start, SVM_EXIT_POPF0x071);
6536 if (s->vm86 && s->iopl != 3) {
6537 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
6538 } else {
6539 ot = gen_pop_T0(s);
6540 if (s->cpl == 0) {
6541 if (dflag != MO_16) {
6542 gen_helper_write_eflags(cpu_env, cpu_T[0],
6543 tcg_const_i32((TF_MASK0x00000100 | AC_MASK0x00040000 |
6544 ID_MASK0x00200000 | NT_MASK0x00004000 |
6545 IF_MASK0x00000200 |
6546 IOPL_MASK0x00003000)));
6547 } else {
6548 gen_helper_write_eflags(cpu_env, cpu_T[0],
6549 tcg_const_i32((TF_MASK0x00000100 | AC_MASK0x00040000 |
6550 ID_MASK0x00200000 | NT_MASK0x00004000 |
6551 IF_MASK0x00000200 | IOPL_MASK0x00003000)
6552 & 0xffff));
6553 }
6554 } else {
6555 if (s->cpl <= s->iopl) {
6556 if (dflag != MO_16) {
6557 gen_helper_write_eflags(cpu_env, cpu_T[0],
6558 tcg_const_i32((TF_MASK0x00000100 |
6559 AC_MASK0x00040000 |
6560 ID_MASK0x00200000 |
6561 NT_MASK0x00004000 |
6562 IF_MASK0x00000200)));
6563 } else {
6564 gen_helper_write_eflags(cpu_env, cpu_T[0],
6565 tcg_const_i32((TF_MASK0x00000100 |
6566 AC_MASK0x00040000 |
6567 ID_MASK0x00200000 |
6568 NT_MASK0x00004000 |
6569 IF_MASK0x00000200)
6570 & 0xffff));
6571 }
6572 } else {
6573 if (dflag != MO_16) {
6574 gen_helper_write_eflags(cpu_env, cpu_T[0],
6575 tcg_const_i32((TF_MASK0x00000100 | AC_MASK0x00040000 |
6576 ID_MASK0x00200000 | NT_MASK0x00004000)));
6577 } else {
6578 gen_helper_write_eflags(cpu_env, cpu_T[0],
6579 tcg_const_i32((TF_MASK0x00000100 | AC_MASK0x00040000 |
6580 ID_MASK0x00200000 | NT_MASK0x00004000)
6581 & 0xffff));
6582 }
6583 }
6584 }
6585 gen_pop_update(s, ot);
6586 set_cc_op(s, CC_OP_EFLAGS);
6587 /* abort translation because TF/AC flag may change */
6588 gen_jmp_im(s->pc - s->cs_base);
6589 gen_eob(s);
6590 }
6591 break;
6592 case 0x9e: /* sahf */
6593 if (CODE64(s)0 && !(s->cpuid_ext3_features & CPUID_EXT3_LAHF_LM(1 << 0)))
6594 goto illegal_op;
6595 gen_op_mov_v_reg(MO_8, cpu_T[0], R_AH4);
6596 gen_compute_eflags(s);
6597 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_src, cpu_cc_src, CC_O0x0800);
6598 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[0], cpu_T[0], CC_S0x0080 | CC_Z0x0040 | CC_A0x0010 | CC_P0x0004 | CC_C0x0001);
6599 tcg_gen_or_tltcg_gen_or_i32(cpu_cc_src, cpu_cc_src, cpu_T[0]);
6600 break;
6601 case 0x9f: /* lahf */
6602 if (CODE64(s)0 && !(s->cpuid_ext3_features & CPUID_EXT3_LAHF_LM(1 << 0)))
6603 goto illegal_op;
6604 gen_compute_eflags(s);
6605 /* Note: gen_compute_eflags() only gives the condition codes */
6606 tcg_gen_ori_tltcg_gen_ori_i32(cpu_T[0], cpu_cc_src, 0x02);
6607 gen_op_mov_reg_v(MO_8, R_AH4, cpu_T[0]);
6608 break;
6609 case 0xf5: /* cmc */
6610 gen_compute_eflags(s);
6611 tcg_gen_xori_tltcg_gen_xori_i32(cpu_cc_src, cpu_cc_src, CC_C0x0001);
6612 break;
6613 case 0xf8: /* clc */
6614 gen_compute_eflags(s);
6615 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_src, cpu_cc_src, ~CC_C0x0001);
6616 break;
6617 case 0xf9: /* stc */
6618 gen_compute_eflags(s);
6619 tcg_gen_ori_tltcg_gen_ori_i32(cpu_cc_src, cpu_cc_src, CC_C0x0001);
6620 break;
6621 case 0xfc: /* cld */
6622 tcg_gen_movi_i32(cpu_tmp2_i32, 1);
6623 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, offsetof(CPUX86State, df)__builtin_offsetof(CPUX86State, df));
6624 break;
6625 case 0xfd: /* std */
6626 tcg_gen_movi_i32(cpu_tmp2_i32, -1);
6627 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, offsetof(CPUX86State, df)__builtin_offsetof(CPUX86State, df));
6628 break;
6629
6630 /************************/
6631 /* bit operations */
6632 case 0x1ba: /* bt/bts/btr/btc Gv, im */
6633 ot = dflag;
6634 modrm = cpu_ldub_code(env, s->pc++);
6635 op = (modrm >> 3) & 7;
6636 mod = (modrm >> 6) & 3;
6637 rm = (modrm & 7) | REX_B(s)0;
6638 if (mod != 3) {
6639 s->rip_offset = 1;
6640 gen_lea_modrm(env, s, modrm);
6641 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
6642 } else {
6643 gen_op_mov_v_reg(ot, cpu_T[0], rm);
6644 }
6645 /* load shift */
6646 val = cpu_ldub_code(env, s->pc++);
6647 tcg_gen_movi_tltcg_gen_movi_i32(cpu_T[1], val);
6648 if (op < 4)
6649 goto illegal_op;
6650 op -= 4;
6651 goto bt_op;
6652 case 0x1a3: /* bt Gv, Ev */
6653 op = 0;
6654 goto do_btx;
6655 case 0x1ab: /* bts */
6656 op = 1;
6657 goto do_btx;
6658 case 0x1b3: /* btr */
6659 op = 2;
6660 goto do_btx;
6661 case 0x1bb: /* btc */
6662 op = 3;
6663 do_btx:
6664 ot = dflag;
6665 modrm = cpu_ldub_code(env, s->pc++);
6666 reg = ((modrm >> 3) & 7) | rex_r;
6667 mod = (modrm >> 6) & 3;
6668 rm = (modrm & 7) | REX_B(s)0;
6669 gen_op_mov_v_reg(MO_32, cpu_T[1], reg);
6670 if (mod != 3) {
6671 gen_lea_modrm(env, s, modrm);
6672 /* specific case: we need to add a displacement */
6673 gen_exts(ot, cpu_T[1]);
6674 tcg_gen_sari_tltcg_gen_sari_i32(cpu_tmp0, cpu_T[1], 3 + ot);
6675 tcg_gen_shli_tltcg_gen_shli_i32(cpu_tmp0, cpu_tmp0, ot);
6676 tcg_gen_add_tltcg_gen_add_i32(cpu_A0, cpu_A0, cpu_tmp0);
6677 gen_op_ld_v(s, ot, cpu_T[0], cpu_A0);
6678 } else {
6679 gen_op_mov_v_reg(ot, cpu_T[0], rm);
6680 }
6681 bt_op:
6682 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[1], cpu_T[1], (1 << (3 + ot)) - 1);
6683 switch(op) {
6684 case 0:
6685 tcg_gen_shr_tltcg_gen_shr_i32(cpu_cc_src, cpu_T[0], cpu_T[1]);
6686 tcg_gen_movi_tltcg_gen_movi_i32(cpu_cc_dst, 0);
6687 break;
6688 case 1:
6689 tcg_gen_shr_tltcg_gen_shr_i32(cpu_tmp4, cpu_T[0], cpu_T[1]);
6690 tcg_gen_movi_tltcg_gen_movi_i32(cpu_tmp0, 1);
6691 tcg_gen_shl_tltcg_gen_shl_i32(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6692 tcg_gen_or_tltcg_gen_or_i32(cpu_T[0], cpu_T[0], cpu_tmp0);
6693 break;
6694 case 2:
6695 tcg_gen_shr_tltcg_gen_shr_i32(cpu_tmp4, cpu_T[0], cpu_T[1]);
6696 tcg_gen_movi_tltcg_gen_movi_i32(cpu_tmp0, 1);
6697 tcg_gen_shl_tltcg_gen_shl_i32(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6698 tcg_gen_not_tltcg_gen_not_i32(cpu_tmp0, cpu_tmp0);
6699 tcg_gen_and_tltcg_gen_and_i32(cpu_T[0], cpu_T[0], cpu_tmp0);
6700 break;
6701 default:
6702 case 3:
6703 tcg_gen_shr_tltcg_gen_shr_i32(cpu_tmp4, cpu_T[0], cpu_T[1]);
6704 tcg_gen_movi_tltcg_gen_movi_i32(cpu_tmp0, 1);
6705 tcg_gen_shl_tltcg_gen_shl_i32(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6706 tcg_gen_xor_tltcg_gen_xor_i32(cpu_T[0], cpu_T[0], cpu_tmp0);
6707 break;
6708 }
6709 set_cc_op(s, CC_OP_SARB + ot);
6710 if (op != 0) {
6711 if (mod != 3) {
6712 gen_op_st_v(s, ot, cpu_T[0], cpu_A0);
6713 } else {
6714 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
6715 }
6716 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_tmp4);
6717 tcg_gen_movi_tltcg_gen_movi_i32(cpu_cc_dst, 0);
6718 }
6719 break;
6720 case 0x1bc: /* bsf / tzcnt */
6721 case 0x1bd: /* bsr / lzcnt */
6722 ot = dflag;
6723 modrm = cpu_ldub_code(env, s->pc++);
6724 reg = ((modrm >> 3) & 7) | rex_r;
6725 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
6726 gen_extu(ot, cpu_T[0]);
6727
6728 /* Note that lzcnt and tzcnt are in different extensions. */
6729 if ((prefixes & PREFIX_REPZ0x01)
6730 && (b & 1
6731 ? s->cpuid_ext3_features & CPUID_EXT3_ABM(1 << 5)
6732 : s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_BMI1(1 << 3))) {
6733 int size = 8 << ot;
6734 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_src, cpu_T[0]);
6735 if (b & 1) {
6736 /* For lzcnt, reduce the target_ulong result by the
6737 number of zeros that we expect to find at the top. */
6738 gen_helper_clz(cpu_T[0], cpu_T[0]);
6739 tcg_gen_subi_tltcg_gen_subi_i32(cpu_T[0], cpu_T[0], TARGET_LONG_BITS32 - size);
6740 } else {
6741 /* For tzcnt, a zero input must return the operand size:
6742 force all bits outside the operand size to 1. */
6743 target_ulong mask = (target_ulong)-2 << (size - 1);
6744 tcg_gen_ori_tltcg_gen_ori_i32(cpu_T[0], cpu_T[0], mask);
6745 gen_helper_ctz(cpu_T[0], cpu_T[0]);
6746 }
6747 /* For lzcnt/tzcnt, C and Z bits are defined and are
6748 related to the result. */
6749 gen_op_update1_cc();
6750 set_cc_op(s, CC_OP_BMILGB + ot);
6751 } else {
6752 /* For bsr/bsf, only the Z bit is defined and it is related
6753 to the input and not the result. */
6754 tcg_gen_mov_tltcg_gen_mov_i32(cpu_cc_dst, cpu_T[0]);
6755 set_cc_op(s, CC_OP_LOGICB + ot);
6756 if (b & 1) {
6757 /* For bsr, return the bit index of the first 1 bit,
6758 not the count of leading zeros. */
6759 gen_helper_clz(cpu_T[0], cpu_T[0]);
6760 tcg_gen_xori_tltcg_gen_xori_i32(cpu_T[0], cpu_T[0], TARGET_LONG_BITS32 - 1);
6761 } else {
6762 gen_helper_ctz(cpu_T[0], cpu_T[0]);
6763 }
6764 /* ??? The manual says that the output is undefined when the
6765 input is zero, but real hardware leaves it unchanged, and
6766 real programs appear to depend on that. */
6767 tcg_gen_movi_tltcg_gen_movi_i32(cpu_tmp0, 0);
6768 tcg_gen_movcond_tltcg_gen_movcond_i32(TCG_COND_EQ, cpu_T[0], cpu_cc_dst, cpu_tmp0,
6769 cpu_regs[reg], cpu_T[0]);
6770 }
6771 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
6772 break;
6773 /************************/
6774 /* bcd */
6775 case 0x27: /* daa */
6776 if (CODE64(s)0)
6777 goto illegal_op;
6778 gen_update_cc_op(s);
6779 gen_helper_daa(cpu_env);
6780 set_cc_op(s, CC_OP_EFLAGS);
6781 break;
6782 case 0x2f: /* das */
6783 if (CODE64(s)0)
6784 goto illegal_op;
6785 gen_update_cc_op(s);
6786 gen_helper_das(cpu_env);
6787 set_cc_op(s, CC_OP_EFLAGS);
6788 break;
6789 case 0x37: /* aaa */
6790 if (CODE64(s)0)
6791 goto illegal_op;
6792 gen_update_cc_op(s);
6793 gen_helper_aaa(cpu_env);
6794 set_cc_op(s, CC_OP_EFLAGS);
6795 break;
6796 case 0x3f: /* aas */
6797 if (CODE64(s)0)
6798 goto illegal_op;
6799 gen_update_cc_op(s);
6800 gen_helper_aas(cpu_env);
6801 set_cc_op(s, CC_OP_EFLAGS);
6802 break;
6803 case 0xd4: /* aam */
6804 if (CODE64(s)0)
6805 goto illegal_op;
6806 val = cpu_ldub_code(env, s->pc++);
6807 if (val == 0) {
6808 gen_exception(s, EXCP00_DIVZ0, pc_start - s->cs_base);
6809 } else {
6810 gen_helper_aam(cpu_env, tcg_const_i32(val));
6811 set_cc_op(s, CC_OP_LOGICB);
6812 }
6813 break;
6814 case 0xd5: /* aad */
6815 if (CODE64(s)0)
6816 goto illegal_op;
6817 val = cpu_ldub_code(env, s->pc++);
6818 gen_helper_aad(cpu_env, tcg_const_i32(val));
6819 set_cc_op(s, CC_OP_LOGICB);
6820 break;
6821 /************************/
6822 /* misc */
6823 case 0x90: /* nop */
6824 /* XXX: correct lock test for all insn */
6825 if (prefixes & PREFIX_LOCK0x04) {
6826 goto illegal_op;
6827 }
6828 /* If REX_B is set, then this is xchg eax, r8d, not a nop. */
6829 if (REX_B(s)0) {
6830 goto do_xchg_reg_eax;
6831 }
6832 if (prefixes & PREFIX_REPZ0x01) {
6833 gen_update_cc_op(s);
6834 gen_jmp_im(pc_start - s->cs_base);
6835 gen_helper_pause(cpu_env, tcg_const_i32(s->pc - pc_start));
6836 s->is_jmp = DISAS_TB_JUMP3;
6837 }
6838 break;
6839 case 0x9b: /* fwait */
6840 if ((s->flags & (HF_MP_MASK(1 << 9) | HF_TS_MASK(1 << 11))) ==
6841 (HF_MP_MASK(1 << 9) | HF_TS_MASK(1 << 11))) {
6842 gen_exception(s, EXCP07_PREX7, pc_start - s->cs_base);
6843 } else {
6844 gen_update_cc_op(s);
6845 gen_jmp_im(pc_start - s->cs_base);
6846 gen_helper_fwait(cpu_env);
6847 }
6848 break;
6849 case 0xcc: /* int3 */
6850 gen_interrupt(s, EXCP03_INT33, pc_start - s->cs_base, s->pc - s->cs_base);
6851 break;
6852 case 0xcd: /* int N */
6853 val = cpu_ldub_code(env, s->pc++);
6854 if (s->vm86 && s->iopl != 3) {
6855 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
6856 } else {
6857 gen_interrupt(s, val, pc_start - s->cs_base, s->pc - s->cs_base);
6858 }
6859 break;
6860 case 0xce: /* into */
6861 if (CODE64(s)0)
6862 goto illegal_op;
6863 gen_update_cc_op(s);
6864 gen_jmp_im(pc_start - s->cs_base);
6865 gen_helper_into(cpu_env, tcg_const_i32(s->pc - pc_start));
6866 break;
6867#ifdef WANT_ICEBP
6868 case 0xf1: /* icebp (undocumented, exits to external debugger) */
6869 gen_svm_check_intercept(s, pc_start, SVM_EXIT_ICEBP0x088);
6870#if 1
6871 gen_debug(s, pc_start - s->cs_base);
6872#else
6873 /* start debug */
6874 tb_flush(env);
6875 qemu_set_log(CPU_LOG_INT(1 << 4) | CPU_LOG_TB_IN_ASM(1 << 1));
6876#endif
6877 break;
6878#endif
6879 case 0xfa: /* cli */
6880 if (!s->vm86) {
6881 if (s->cpl <= s->iopl) {
6882 gen_helper_cli(cpu_env);
6883 } else {
6884 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
6885 }
6886 } else {
6887 if (s->iopl == 3) {
6888 gen_helper_cli(cpu_env);
6889 } else {
6890 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
6891 }
6892 }
6893 break;
6894 case 0xfb: /* sti */
6895 if (!s->vm86) {
6896 if (s->cpl <= s->iopl) {
6897 gen_sti:
6898 gen_helper_sti(cpu_env);
6899 /* interruptions are enabled only the first insn after sti */
6900 /* If several instructions disable interrupts, only the
6901 _first_ does it */
6902 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK(1 << 3)))
6903 gen_helper_set_inhibit_irq(cpu_env);
6904 /* give a chance to handle pending irqs */
6905 gen_jmp_im(s->pc - s->cs_base);
6906 gen_eob(s);
6907 } else {
6908 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
6909 }
6910 } else {
6911 if (s->iopl == 3) {
6912 goto gen_sti;
6913 } else {
6914 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
6915 }
6916 }
6917 break;
6918 case 0x62: /* bound */
6919 if (CODE64(s)0)
6920 goto illegal_op;
6921 ot = dflag;
6922 modrm = cpu_ldub_code(env, s->pc++);
6923 reg = (modrm >> 3) & 7;
6924 mod = (modrm >> 6) & 3;
6925 if (mod == 3)
6926 goto illegal_op;
6927 gen_op_mov_v_reg(ot, cpu_T[0], reg);
6928 gen_lea_modrm(env, s, modrm);
6929 gen_jmp_im(pc_start - s->cs_base);
6930 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
6931 if (ot == MO_16) {
6932 gen_helper_boundw(cpu_env, cpu_A0, cpu_tmp2_i32);
6933 } else {
6934 gen_helper_boundl(cpu_env, cpu_A0, cpu_tmp2_i32);
6935 }
6936 break;
6937 case 0x1c8 ... 0x1cf: /* bswap reg */
6938 reg = (b & 7) | REX_B(s)0;
6939#ifdef TARGET_X86_64
6940 if (dflag == MO_64) {
6941 gen_op_mov_v_reg(MO_64, cpu_T[0], reg);
6942 tcg_gen_bswap64_i64(cpu_T[0], cpu_T[0]);
6943 gen_op_mov_reg_v(MO_64, reg, cpu_T[0]);
6944 } else
6945#endif
6946 {
6947 gen_op_mov_v_reg(MO_32, cpu_T[0], reg);
6948 tcg_gen_ext32u_tltcg_gen_mov_i32(cpu_T[0], cpu_T[0]);
6949 tcg_gen_bswap32_tltcg_gen_bswap32_i32(cpu_T[0], cpu_T[0]);
6950 gen_op_mov_reg_v(MO_32, reg, cpu_T[0]);
6951 }
6952 break;
6953 case 0xd6: /* salc */
6954 if (CODE64(s)0)
6955 goto illegal_op;
6956 gen_compute_eflags_c(s, cpu_T[0]);
6957 tcg_gen_neg_tltcg_gen_neg_i32(cpu_T[0], cpu_T[0]);
6958 gen_op_mov_reg_v(MO_8, R_EAX0, cpu_T[0]);
6959 break;
6960 case 0xe0: /* loopnz */
6961 case 0xe1: /* loopz */
6962 case 0xe2: /* loop */
6963 case 0xe3: /* jecxz */
6964 {
6965 int l1, l2, l3;
6966
6967 tval = (int8_t)insn_get(env, s, MO_8);
6968 next_eip = s->pc - s->cs_base;
6969 tval += next_eip;
6970 if (dflag == MO_16) {
6971 tval &= 0xffff;
6972 }
6973
6974 l1 = gen_new_label();
6975 l2 = gen_new_label();
6976 l3 = gen_new_label();
6977 b &= 3;
6978 switch(b) {
6979 case 0: /* loopnz */
6980 case 1: /* loopz */
6981 gen_op_add_reg_im(s->aflag, R_ECX1, -1);
6982 gen_op_jz_ecx(s->aflag, l3);
6983 gen_jcc1(s, (JCC_Z << 1) | (b ^ 1), l1);
6984 break;
6985 case 2: /* loop */
6986 gen_op_add_reg_im(s->aflag, R_ECX1, -1);
6987 gen_op_jnz_ecx(s->aflag, l1);
6988 break;
6989 default:
6990 case 3: /* jcxz */
6991 gen_op_jz_ecx(s->aflag, l1);
6992 break;
6993 }
6994
6995 gen_set_label(l3);
6996 gen_jmp_im(next_eip);
6997 tcg_gen_br(l2);
6998
6999 gen_set_label(l1);
7000 gen_jmp_im(tval);
7001 gen_set_label(l2);
7002 gen_eob(s);
7003 }
7004 break;
7005 case 0x130: /* wrmsr */
7006 case 0x132: /* rdmsr */
7007 if (s->cpl != 0) {
7008 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7009 } else {
7010 gen_update_cc_op(s);
7011 gen_jmp_im(pc_start - s->cs_base);
7012 if (b & 2) {
7013 gen_helper_rdmsr(cpu_env);
7014 } else {
7015 gen_helper_wrmsr(cpu_env);
7016 }
7017 }
7018 break;
7019 case 0x131: /* rdtsc */
7020 gen_update_cc_op(s);
7021 gen_jmp_im(pc_start - s->cs_base);
7022 if (use_icount)
7023 gen_io_start();
7024 gen_helper_rdtsc(cpu_env);
7025 if (use_icount) {
7026 gen_io_end();
7027 gen_jmp(s, s->pc - s->cs_base);
7028 }
7029 break;
7030 case 0x133: /* rdpmc */
7031 gen_update_cc_op(s);
7032 gen_jmp_im(pc_start - s->cs_base);
7033 gen_helper_rdpmc(cpu_env);
7034 break;
7035 case 0x134: /* sysenter */
7036 /* For Intel SYSENTER is valid on 64-bit */
7037 if (CODE64(s)0 && env->cpuid_vendor1 != CPUID_VENDOR_INTEL_10x756e6547)
7038 goto illegal_op;
7039 if (!s->pe) {
7040 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7041 } else {
7042 gen_update_cc_op(s);
7043 gen_jmp_im(pc_start - s->cs_base);
7044 gen_helper_sysenter(cpu_env);
7045 gen_eob(s);
7046 }
7047 break;
7048 case 0x135: /* sysexit */
7049 /* For Intel SYSEXIT is valid on 64-bit */
7050 if (CODE64(s)0 && env->cpuid_vendor1 != CPUID_VENDOR_INTEL_10x756e6547)
7051 goto illegal_op;
7052 if (!s->pe) {
7053 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7054 } else {
7055 gen_update_cc_op(s);
7056 gen_jmp_im(pc_start - s->cs_base);
7057 gen_helper_sysexit(cpu_env, tcg_const_i32(dflag - 1));
7058 gen_eob(s);
7059 }
7060 break;
7061#ifdef TARGET_X86_64
7062 case 0x105: /* syscall */
7063 /* XXX: is it usable in real mode ? */
7064 gen_update_cc_op(s);
7065 gen_jmp_im(pc_start - s->cs_base);
7066 gen_helper_syscall(cpu_env, tcg_const_i32(s->pc - pc_start));
7067 gen_eob(s);
7068 break;
7069 case 0x107: /* sysret */
7070 if (!s->pe) {
7071 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7072 } else {
7073 gen_update_cc_op(s);
7074 gen_jmp_im(pc_start - s->cs_base);
7075 gen_helper_sysret(cpu_env, tcg_const_i32(dflag - 1));
7076 /* condition codes are modified only in long mode */
7077 if (s->lma) {
7078 set_cc_op(s, CC_OP_EFLAGS);
7079 }
7080 gen_eob(s);
7081 }
7082 break;
7083#endif
7084 case 0x1a2: /* cpuid */
7085 gen_update_cc_op(s);
7086 gen_jmp_im(pc_start - s->cs_base);
7087 gen_helper_cpuid(cpu_env);
7088 break;
7089 case 0xf4: /* hlt */
7090 if (s->cpl != 0) {
7091 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7092 } else {
7093 gen_update_cc_op(s);
7094 gen_jmp_im(pc_start - s->cs_base);
7095 gen_helper_hlt(cpu_env, tcg_const_i32(s->pc - pc_start));
7096 s->is_jmp = DISAS_TB_JUMP3;
7097 }
7098 break;
7099 case 0x100:
7100 modrm = cpu_ldub_code(env, s->pc++);
7101 mod = (modrm >> 6) & 3;
7102 op = (modrm >> 3) & 7;
7103 switch(op) {
7104 case 0: /* sldt */
7105 if (!s->pe || s->vm86)
7106 goto illegal_op;
7107 gen_svm_check_intercept(s, pc_start, SVM_EXIT_LDTR_READ0x068);
7108 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,ldt.selector)__builtin_offsetof(CPUX86State, ldt.selector));
7109 ot = mod == 3 ? dflag : MO_16;
7110 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
7111 break;
7112 case 2: /* lldt */
7113 if (!s->pe || s->vm86)
7114 goto illegal_op;
7115 if (s->cpl != 0) {
7116 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7117 } else {
7118 gen_svm_check_intercept(s, pc_start, SVM_EXIT_LDTR_WRITE0x06c);
7119 gen_ldst_modrm(env, s, modrm, MO_16, OR_TMP0, 0);
7120 gen_jmp_im(pc_start - s->cs_base);
7121 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
7122 gen_helper_lldt(cpu_env, cpu_tmp2_i32);
7123 }
7124 break;
7125 case 1: /* str */
7126 if (!s->pe || s->vm86)
7127 goto illegal_op;
7128 gen_svm_check_intercept(s, pc_start, SVM_EXIT_TR_READ0x069);
7129 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,tr.selector)__builtin_offsetof(CPUX86State, tr.selector));
7130 ot = mod == 3 ? dflag : MO_16;
7131 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
7132 break;
7133 case 3: /* ltr */
7134 if (!s->pe || s->vm86)
7135 goto illegal_op;
7136 if (s->cpl != 0) {
7137 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7138 } else {
7139 gen_svm_check_intercept(s, pc_start, SVM_EXIT_TR_WRITE0x06d);
7140 gen_ldst_modrm(env, s, modrm, MO_16, OR_TMP0, 0);
7141 gen_jmp_im(pc_start - s->cs_base);
7142 tcg_gen_trunc_tl_i32tcg_gen_mov_i32(cpu_tmp2_i32, cpu_T[0]);
7143 gen_helper_ltr(cpu_env, cpu_tmp2_i32);
7144 }
7145 break;
7146 case 4: /* verr */
7147 case 5: /* verw */
7148 if (!s->pe || s->vm86)
7149 goto illegal_op;
7150 gen_ldst_modrm(env, s, modrm, MO_16, OR_TMP0, 0);
7151 gen_update_cc_op(s);
7152 if (op == 4) {
7153 gen_helper_verr(cpu_env, cpu_T[0]);
7154 } else {
7155 gen_helper_verw(cpu_env, cpu_T[0]);
7156 }
7157 set_cc_op(s, CC_OP_EFLAGS);
7158 break;
7159 default:
7160 goto illegal_op;
7161 }
7162 break;
7163 case 0x101:
7164 modrm = cpu_ldub_code(env, s->pc++);
7165 mod = (modrm >> 6) & 3;
7166 op = (modrm >> 3) & 7;
7167 rm = modrm & 7;
7168 switch(op) {
7169 case 0: /* sgdt */
7170 if (mod == 3)
7171 goto illegal_op;
7172 gen_svm_check_intercept(s, pc_start, SVM_EXIT_GDTR_READ0x067);
7173 gen_lea_modrm(env, s, modrm);
7174 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State, gdt.limit)__builtin_offsetof(CPUX86State, gdt.limit));
7175 gen_op_st_v(s, MO_16, cpu_T[0], cpu_A0);
7176 gen_add_A0_im(s, 2);
7177 tcg_gen_ld_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State, gdt.base)__builtin_offsetof(CPUX86State, gdt.base));
7178 if (dflag == MO_16) {
7179 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[0], cpu_T[0], 0xffffff);
7180 }
7181 gen_op_st_v(s, CODE64(s)0 + MO_32, cpu_T[0], cpu_A0);
7182 break;
7183 case 1:
7184 if (mod == 3) {
7185 switch (rm) {
7186 case 0: /* monitor */
7187 if (!(s->cpuid_ext_features & CPUID_EXT_MONITOR(1 << 3)) ||
7188 s->cpl != 0)
7189 goto illegal_op;
7190 gen_update_cc_op(s);
7191 gen_jmp_im(pc_start - s->cs_base);
7192 tcg_gen_mov_tltcg_gen_mov_i32(cpu_A0, cpu_regs[R_EAX0]);
7193 gen_extu(s->aflag, cpu_A0);
7194 gen_add_A0_ds_seg(s);
7195 gen_helper_monitor(cpu_env, cpu_A0);
7196 break;
7197 case 1: /* mwait */
7198 if (!(s->cpuid_ext_features & CPUID_EXT_MONITOR(1 << 3)) ||
7199 s->cpl != 0)
7200 goto illegal_op;
7201 gen_update_cc_op(s);
7202 gen_jmp_im(pc_start - s->cs_base);
7203 gen_helper_mwait(cpu_env, tcg_const_i32(s->pc - pc_start));
7204 gen_eob(s);
7205 break;
7206 case 2: /* clac */
7207 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_SMAP(1 << 20)) ||
7208 s->cpl != 0) {
7209 goto illegal_op;
7210 }
7211 gen_helper_clac(cpu_env);
7212 gen_jmp_im(s->pc - s->cs_base);
7213 gen_eob(s);
7214 break;
7215 case 3: /* stac */
7216 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_SMAP(1 << 20)) ||
7217 s->cpl != 0) {
7218 goto illegal_op;
7219 }
7220 gen_helper_stac(cpu_env);
7221 gen_jmp_im(s->pc - s->cs_base);
7222 gen_eob(s);
7223 break;
7224 default:
7225 goto illegal_op;
7226 }
7227 } else { /* sidt */
7228 gen_svm_check_intercept(s, pc_start, SVM_EXIT_IDTR_READ0x066);
7229 gen_lea_modrm(env, s, modrm);
7230 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State, idt.limit)__builtin_offsetof(CPUX86State, idt.limit));
7231 gen_op_st_v(s, MO_16, cpu_T[0], cpu_A0);
7232 gen_add_A0_im(s, 2);
7233 tcg_gen_ld_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State, idt.base)__builtin_offsetof(CPUX86State, idt.base));
7234 if (dflag == MO_16) {
7235 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[0], cpu_T[0], 0xffffff);
7236 }
7237 gen_op_st_v(s, CODE64(s)0 + MO_32, cpu_T[0], cpu_A0);
7238 }
7239 break;
7240 case 2: /* lgdt */
7241 case 3: /* lidt */
7242 if (mod == 3) {
7243 gen_update_cc_op(s);
7244 gen_jmp_im(pc_start - s->cs_base);
7245 switch(rm) {
7246 case 0: /* VMRUN */
7247 if (!(s->flags & HF_SVME_MASK(1 << 20)) || !s->pe)
7248 goto illegal_op;
7249 if (s->cpl != 0) {
7250 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7251 break;
7252 } else {
7253 gen_helper_vmrun(cpu_env, tcg_const_i32(s->aflag - 1),
7254 tcg_const_i32(s->pc - pc_start));
7255 tcg_gen_exit_tb(0);
7256 s->is_jmp = DISAS_TB_JUMP3;
7257 }
7258 break;
7259 case 1: /* VMMCALL */
7260 if (!(s->flags & HF_SVME_MASK(1 << 20)))
7261 goto illegal_op;
7262 gen_helper_vmmcall(cpu_env);
7263 break;
7264 case 2: /* VMLOAD */
7265 if (!(s->flags & HF_SVME_MASK(1 << 20)) || !s->pe)
7266 goto illegal_op;
7267 if (s->cpl != 0) {
7268 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7269 break;
7270 } else {
7271 gen_helper_vmload(cpu_env, tcg_const_i32(s->aflag - 1));
7272 }
7273 break;
7274 case 3: /* VMSAVE */
7275 if (!(s->flags & HF_SVME_MASK(1 << 20)) || !s->pe)
7276 goto illegal_op;
7277 if (s->cpl != 0) {
7278 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7279 break;
7280 } else {
7281 gen_helper_vmsave(cpu_env, tcg_const_i32(s->aflag - 1));
7282 }
7283 break;
7284 case 4: /* STGI */
7285 if ((!(s->flags & HF_SVME_MASK(1 << 20)) &&
7286 !(s->cpuid_ext3_features & CPUID_EXT3_SKINIT(1 << 12))) ||
7287 !s->pe)
7288 goto illegal_op;
7289 if (s->cpl != 0) {
7290 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7291 break;
7292 } else {
7293 gen_helper_stgi(cpu_env);
7294 }
7295 break;
7296 case 5: /* CLGI */
7297 if (!(s->flags & HF_SVME_MASK(1 << 20)) || !s->pe)
7298 goto illegal_op;
7299 if (s->cpl != 0) {
7300 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7301 break;
7302 } else {
7303 gen_helper_clgi(cpu_env);
7304 }
7305 break;
7306 case 6: /* SKINIT */
7307 if ((!(s->flags & HF_SVME_MASK(1 << 20)) &&
7308 !(s->cpuid_ext3_features & CPUID_EXT3_SKINIT(1 << 12))) ||
7309 !s->pe)
7310 goto illegal_op;
7311 gen_helper_skinit(cpu_env);
7312 break;
7313 case 7: /* INVLPGA */
7314 if (!(s->flags & HF_SVME_MASK(1 << 20)) || !s->pe)
7315 goto illegal_op;
7316 if (s->cpl != 0) {
7317 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7318 break;
7319 } else {
7320 gen_helper_invlpga(cpu_env,
7321 tcg_const_i32(s->aflag - 1));
7322 }
7323 break;
7324 default:
7325 goto illegal_op;
7326 }
7327 } else if (s->cpl != 0) {
7328 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7329 } else {
7330 gen_svm_check_intercept(s, pc_start,
7331 op==2 ? SVM_EXIT_GDTR_WRITE0x06b : SVM_EXIT_IDTR_WRITE0x06a);
7332 gen_lea_modrm(env, s, modrm);
7333 gen_op_ld_v(s, MO_16, cpu_T[1], cpu_A0);
7334 gen_add_A0_im(s, 2);
7335 gen_op_ld_v(s, CODE64(s)0 + MO_32, cpu_T[0], cpu_A0);
7336 if (dflag == MO_16) {
7337 tcg_gen_andi_tltcg_gen_andi_i32(cpu_T[0], cpu_T[0], 0xffffff);
7338 }
7339 if (op == 2) {
7340 tcg_gen_st_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,gdt.base)__builtin_offsetof(CPUX86State, gdt.base));
7341 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[1], cpu_env, offsetof(CPUX86State,gdt.limit)__builtin_offsetof(CPUX86State, gdt.limit));
7342 } else {
7343 tcg_gen_st_tltcg_gen_st_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,idt.base)__builtin_offsetof(CPUX86State, idt.base));
7344 tcg_gen_st32_tltcg_gen_st_i32(cpu_T[1], cpu_env, offsetof(CPUX86State,idt.limit)__builtin_offsetof(CPUX86State, idt.limit));
7345 }
7346 }
7347 break;
7348 case 4: /* smsw */
7349 gen_svm_check_intercept(s, pc_start, SVM_EXIT_READ_CR00x000);
7350#if defined TARGET_X86_64 && defined HOST_WORDS_BIGENDIAN
7351 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,cr[0])__builtin_offsetof(CPUX86State, cr[0]) + 4);
7352#else
7353 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,cr[0])__builtin_offsetof(CPUX86State, cr[0]));
7354#endif
7355 gen_ldst_modrm(env, s, modrm, MO_16, OR_TMP0, 1);
7356 break;
7357 case 6: /* lmsw */
7358 if (s->cpl != 0) {
7359 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7360 } else {
7361 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_CR00x010);
7362 gen_ldst_modrm(env, s, modrm, MO_16, OR_TMP0, 0);
7363 gen_helper_lmsw(cpu_env, cpu_T[0]);
7364 gen_jmp_im(s->pc - s->cs_base);
7365 gen_eob(s);
7366 }
7367 break;
7368 case 7:
7369 if (mod != 3) { /* invlpg */
7370 if (s->cpl != 0) {
7371 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7372 } else {
7373 gen_update_cc_op(s);
7374 gen_jmp_im(pc_start - s->cs_base);
7375 gen_lea_modrm(env, s, modrm);
7376 gen_helper_invlpg(cpu_env, cpu_A0);
7377 gen_jmp_im(s->pc - s->cs_base);
7378 gen_eob(s);
7379 }
7380 } else {
7381 switch (rm) {
7382 case 0: /* swapgs */
7383#ifdef TARGET_X86_64
7384 if (CODE64(s)0) {
7385 if (s->cpl != 0) {
7386 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7387 } else {
7388 tcg_gen_ld_tltcg_gen_ld_i32(cpu_T[0], cpu_env,
7389 offsetof(CPUX86State,segs[R_GS].base)__builtin_offsetof(CPUX86State, segs[5].base));
7390 tcg_gen_ld_tltcg_gen_ld_i32(cpu_T[1], cpu_env,
7391 offsetof(CPUX86State,kernelgsbase)__builtin_offsetof(CPUX86State, kernelgsbase));
7392 tcg_gen_st_tltcg_gen_st_i32(cpu_T[1], cpu_env,
7393 offsetof(CPUX86State,segs[R_GS].base)__builtin_offsetof(CPUX86State, segs[5].base));
7394 tcg_gen_st_tltcg_gen_st_i32(cpu_T[0], cpu_env,
7395 offsetof(CPUX86State,kernelgsbase)__builtin_offsetof(CPUX86State, kernelgsbase));
7396 }
7397 } else
7398#endif
7399 {
7400 goto illegal_op;
7401 }
7402 break;
7403 case 1: /* rdtscp */
7404 if (!(s->cpuid_ext2_features & CPUID_EXT2_RDTSCP(1 << 27)))
7405 goto illegal_op;
7406 gen_update_cc_op(s);
7407 gen_jmp_im(pc_start - s->cs_base);
7408 if (use_icount)
7409 gen_io_start();
7410 gen_helper_rdtscp(cpu_env);
7411 if (use_icount) {
7412 gen_io_end();
7413 gen_jmp(s, s->pc - s->cs_base);
7414 }
7415 break;
7416 default:
7417 goto illegal_op;
7418 }
7419 }
7420 break;
7421 default:
7422 goto illegal_op;
7423 }
7424 break;
7425 case 0x108: /* invd */
7426 case 0x109: /* wbinvd */
7427 if (s->cpl != 0) {
7428 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7429 } else {
7430 gen_svm_check_intercept(s, pc_start, (b & 2) ? SVM_EXIT_INVD0x076 : SVM_EXIT_WBINVD0x089);
7431 /* nothing to do */
7432 }
7433 break;
7434 case 0x63: /* arpl or movslS (x86_64) */
7435#ifdef TARGET_X86_64
7436 if (CODE64(s)0) {
7437 int d_ot;
7438 /* d_ot is the size of destination */
7439 d_ot = dflag;
7440
7441 modrm = cpu_ldub_code(env, s->pc++);
7442 reg = ((modrm >> 3) & 7) | rex_r;
7443 mod = (modrm >> 6) & 3;
7444 rm = (modrm & 7) | REX_B(s)0;
7445
7446 if (mod == 3) {
7447 gen_op_mov_v_reg(MO_32, cpu_T[0], rm);
7448 /* sign extend */
7449 if (d_ot == MO_64) {
7450 tcg_gen_ext32s_tltcg_gen_mov_i32(cpu_T[0], cpu_T[0]);
7451 }
7452 gen_op_mov_reg_v(d_ot, reg, cpu_T[0]);
7453 } else {
7454 gen_lea_modrm(env, s, modrm);
7455 gen_op_ld_v(s, MO_32 | MO_SIGN, cpu_T[0], cpu_A0);
7456 gen_op_mov_reg_v(d_ot, reg, cpu_T[0]);
7457 }
7458 } else
7459#endif
7460 {
7461 int label1;
7462 TCGvTCGv_i32 t0, t1, t2, a0;
7463
7464 if (!s->pe || s->vm86)
7465 goto illegal_op;
7466 t0 = tcg_temp_local_new()tcg_temp_local_new_i32();
7467 t1 = tcg_temp_local_new()tcg_temp_local_new_i32();
7468 t2 = tcg_temp_local_new()tcg_temp_local_new_i32();
7469 ot = MO_16;
7470 modrm = cpu_ldub_code(env, s->pc++);
7471 reg = (modrm >> 3) & 7;
7472 mod = (modrm >> 6) & 3;
7473 rm = modrm & 7;
7474 if (mod != 3) {
7475 gen_lea_modrm(env, s, modrm);
7476 gen_op_ld_v(s, ot, t0, cpu_A0);
7477 a0 = tcg_temp_local_new()tcg_temp_local_new_i32();
7478 tcg_gen_mov_tltcg_gen_mov_i32(a0, cpu_A0);
7479 } else {
7480 gen_op_mov_v_reg(ot, t0, rm);
7481 TCGV_UNUSED(a0)a0 = __extension__ ({ TCGv_i32 make_tcgv_tmp = {-1}; make_tcgv_tmp
;})
;
7482 }
7483 gen_op_mov_v_reg(ot, t1, reg);
7484 tcg_gen_andi_tltcg_gen_andi_i32(cpu_tmp0, t0, 3);
7485 tcg_gen_andi_tltcg_gen_andi_i32(t1, t1, 3);
7486 tcg_gen_movi_tltcg_gen_movi_i32(t2, 0);
7487 label1 = gen_new_label();
7488 tcg_gen_brcond_tltcg_gen_brcond_i32(TCG_COND_GE, cpu_tmp0, t1, label1);
7489 tcg_gen_andi_tltcg_gen_andi_i32(t0, t0, ~3);
7490 tcg_gen_or_tltcg_gen_or_i32(t0, t0, t1);
7491 tcg_gen_movi_tltcg_gen_movi_i32(t2, CC_Z0x0040);
7492 gen_set_label(label1);
7493 if (mod != 3) {
7494 gen_op_st_v(s, ot, t0, a0);
7495 tcg_temp_freetcg_temp_free_i32(a0);
7496 } else {
7497 gen_op_mov_reg_v(ot, rm, t0);
7498 }
7499 gen_compute_eflags(s);
7500 tcg_gen_andi_tltcg_gen_andi_i32(cpu_cc_src, cpu_cc_src, ~CC_Z0x0040);
7501 tcg_gen_or_tltcg_gen_or_i32(cpu_cc_src, cpu_cc_src, t2);
7502 tcg_temp_freetcg_temp_free_i32(t0);
7503 tcg_temp_freetcg_temp_free_i32(t1);
7504 tcg_temp_freetcg_temp_free_i32(t2);
7505 }
7506 break;
7507 case 0x102: /* lar */
7508 case 0x103: /* lsl */
7509 {
7510 int label1;
7511 TCGvTCGv_i32 t0;
7512 if (!s->pe || s->vm86)
7513 goto illegal_op;
7514 ot = dflag != MO_16 ? MO_32 : MO_16;
7515 modrm = cpu_ldub_code(env, s->pc++);
7516 reg = ((modrm >> 3) & 7) | rex_r;
7517 gen_ldst_modrm(env, s, modrm, MO_16, OR_TMP0, 0);
7518 t0 = tcg_temp_local_new()tcg_temp_local_new_i32();
7519 gen_update_cc_op(s);
7520 if (b == 0x102) {
7521 gen_helper_lar(t0, cpu_env, cpu_T[0]);
7522 } else {
7523 gen_helper_lsl(t0, cpu_env, cpu_T[0]);
7524 }
7525 tcg_gen_andi_tltcg_gen_andi_i32(cpu_tmp0, cpu_cc_src, CC_Z0x0040);
7526 label1 = gen_new_label();
7527 tcg_gen_brcondi_tltcg_gen_brcondi_i32(TCG_COND_EQ, cpu_tmp0, 0, label1);
7528 gen_op_mov_reg_v(ot, reg, t0);
7529 gen_set_label(label1);
7530 set_cc_op(s, CC_OP_EFLAGS);
7531 tcg_temp_freetcg_temp_free_i32(t0);
7532 }
7533 break;
7534 case 0x118:
7535 modrm = cpu_ldub_code(env, s->pc++);
7536 mod = (modrm >> 6) & 3;
7537 op = (modrm >> 3) & 7;
7538 switch(op) {
7539 case 0: /* prefetchnta */
7540 case 1: /* prefetchnt0 */
7541 case 2: /* prefetchnt0 */
7542 case 3: /* prefetchnt0 */
7543 if (mod == 3)
7544 goto illegal_op;
7545 gen_lea_modrm(env, s, modrm);
7546 /* nothing more to do */
7547 break;
7548 default: /* nop (multi byte) */
7549 gen_nop_modrm(env, s, modrm);
7550 break;
7551 }
7552 break;
7553 case 0x119 ... 0x11f: /* nop (multi byte) */
7554 modrm = cpu_ldub_code(env, s->pc++);
7555 gen_nop_modrm(env, s, modrm);
7556 break;
7557 case 0x120: /* mov reg, crN */
7558 case 0x122: /* mov crN, reg */
7559 if (s->cpl != 0) {
7560 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7561 } else {
7562 modrm = cpu_ldub_code(env, s->pc++);
7563 /* Ignore the mod bits (assume (modrm&0xc0)==0xc0).
7564 * AMD documentation (24594.pdf) and testing of
7565 * intel 386 and 486 processors all show that the mod bits
7566 * are assumed to be 1's, regardless of actual values.
7567 */
7568 rm = (modrm & 7) | REX_B(s)0;
7569 reg = ((modrm >> 3) & 7) | rex_r;
7570 if (CODE64(s)0)
7571 ot = MO_64;
7572 else
7573 ot = MO_32;
7574 if ((prefixes & PREFIX_LOCK0x04) && (reg == 0) &&
7575 (s->cpuid_ext3_features & CPUID_EXT3_CR8LEG(1 << 4))) {
7576 reg = 8;
7577 }
7578 switch(reg) {
7579 case 0:
7580 case 2:
7581 case 3:
7582 case 4:
7583 case 8:
7584 gen_update_cc_op(s);
7585 gen_jmp_im(pc_start - s->cs_base);
7586 if (b & 2) {
7587 gen_op_mov_v_reg(ot, cpu_T[0], rm);
7588 gen_helper_write_crN(cpu_env, tcg_const_i32(reg),
7589 cpu_T[0]);
7590 gen_jmp_im(s->pc - s->cs_base);
7591 gen_eob(s);
7592 } else {
7593 gen_helper_read_crN(cpu_T[0], cpu_env, tcg_const_i32(reg));
7594 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
7595 }
7596 break;
7597 default:
7598 goto illegal_op;
7599 }
7600 }
7601 break;
7602 case 0x121: /* mov reg, drN */
7603 case 0x123: /* mov drN, reg */
7604 if (s->cpl != 0) {
7605 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7606 } else {
7607 modrm = cpu_ldub_code(env, s->pc++);
7608 /* Ignore the mod bits (assume (modrm&0xc0)==0xc0).
7609 * AMD documentation (24594.pdf) and testing of
7610 * intel 386 and 486 processors all show that the mod bits
7611 * are assumed to be 1's, regardless of actual values.
7612 */
7613 rm = (modrm & 7) | REX_B(s)0;
7614 reg = ((modrm >> 3) & 7) | rex_r;
7615 if (CODE64(s)0)
7616 ot = MO_64;
7617 else
7618 ot = MO_32;
7619 /* XXX: do it dynamically with CR4.DE bit */
7620 if (reg == 4 || reg == 5 || reg >= 8)
7621 goto illegal_op;
7622 if (b & 2) {
7623 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_DR00x030 + reg);
7624 gen_op_mov_v_reg(ot, cpu_T[0], rm);
7625 gen_helper_movl_drN_T0(cpu_env, tcg_const_i32(reg), cpu_T[0]);
7626 gen_jmp_im(s->pc - s->cs_base);
7627 gen_eob(s);
7628 } else {
7629 gen_svm_check_intercept(s, pc_start, SVM_EXIT_READ_DR00x020 + reg);
7630 tcg_gen_ld_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State,dr[reg])__builtin_offsetof(CPUX86State, dr[reg]));
7631 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
7632 }
7633 }
7634 break;
7635 case 0x106: /* clts */
7636 if (s->cpl != 0) {
7637 gen_exception(s, EXCP0D_GPF13, pc_start - s->cs_base);
7638 } else {
7639 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_CR00x010);
7640 gen_helper_clts(cpu_env);
7641 /* abort block because static cpu state changed */
7642 gen_jmp_im(s->pc - s->cs_base);
7643 gen_eob(s);
7644 }
7645 break;
7646 /* MMX/3DNow!/SSE/SSE2/SSE3/SSSE3/SSE4 support */
7647 case 0x1c3: /* MOVNTI reg, mem */
7648 if (!(s->cpuid_features & CPUID_SSE2(1 << 26)))
7649 goto illegal_op;
7650 ot = mo_64_32(dflag);
7651 modrm = cpu_ldub_code(env, s->pc++);
7652 mod = (modrm >> 6) & 3;
7653 if (mod == 3)
7654 goto illegal_op;
7655 reg = ((modrm >> 3) & 7) | rex_r;
7656 /* generate a generic store */
7657 gen_ldst_modrm(env, s, modrm, ot, reg, 1);
7658 break;
7659 case 0x1ae:
7660 modrm = cpu_ldub_code(env, s->pc++);
7661 mod = (modrm >> 6) & 3;
7662 op = (modrm >> 3) & 7;
7663 switch(op) {
7664 case 0: /* fxsave */
7665 if (mod == 3 || !(s->cpuid_features & CPUID_FXSR(1 << 24)) ||
7666 (s->prefix & PREFIX_LOCK0x04))
7667 goto illegal_op;
7668 if ((s->flags & HF_EM_MASK(1 << 10)) || (s->flags & HF_TS_MASK(1 << 11))) {
7669 gen_exception(s, EXCP07_PREX7, pc_start - s->cs_base);
7670 break;
7671 }
7672 gen_lea_modrm(env, s, modrm);
7673 gen_update_cc_op(s);
7674 gen_jmp_im(pc_start - s->cs_base);
7675 gen_helper_fxsave(cpu_env, cpu_A0, tcg_const_i32(dflag == MO_64));
7676 break;
7677 case 1: /* fxrstor */
7678 if (mod == 3 || !(s->cpuid_features & CPUID_FXSR(1 << 24)) ||
7679 (s->prefix & PREFIX_LOCK0x04))
7680 goto illegal_op;
7681 if ((s->flags & HF_EM_MASK(1 << 10)) || (s->flags & HF_TS_MASK(1 << 11))) {
7682 gen_exception(s, EXCP07_PREX7, pc_start - s->cs_base);
7683 break;
7684 }
7685 gen_lea_modrm(env, s, modrm);
7686 gen_update_cc_op(s);
7687 gen_jmp_im(pc_start - s->cs_base);
7688 gen_helper_fxrstor(cpu_env, cpu_A0, tcg_const_i32(dflag == MO_64));
7689 break;
7690 case 2: /* ldmxcsr */
7691 case 3: /* stmxcsr */
7692 if (s->flags & HF_TS_MASK(1 << 11)) {
7693 gen_exception(s, EXCP07_PREX7, pc_start - s->cs_base);
7694 break;
7695 }
7696 if ((s->flags & HF_EM_MASK(1 << 10)) || !(s->flags & HF_OSFXSR_MASK(1 << 22)) ||
7697 mod == 3)
7698 goto illegal_op;
7699 gen_lea_modrm(env, s, modrm);
7700 if (op == 2) {
7701 tcg_gen_qemu_ld_i32(cpu_tmp2_i32, cpu_A0,
7702 s->mem_index, MO_LEUL);
7703 gen_helper_ldmxcsr(cpu_env, cpu_tmp2_i32);
7704 } else {
7705 tcg_gen_ld32u_tltcg_gen_ld_i32(cpu_T[0], cpu_env, offsetof(CPUX86State, mxcsr)__builtin_offsetof(CPUX86State, mxcsr));
7706 gen_op_st_v(s, MO_32, cpu_T[0], cpu_A0);
7707 }
7708 break;
7709 case 5: /* lfence */
7710 case 6: /* mfence */
7711 if ((modrm & 0xc7) != 0xc0 || !(s->cpuid_features & CPUID_SSE2(1 << 26)))
7712 goto illegal_op;
7713 break;
7714 case 7: /* sfence / clflush */
7715 if ((modrm & 0xc7) == 0xc0) {
7716 /* sfence */
7717 /* XXX: also check for cpuid_ext2_features & CPUID_EXT2_EMMX */
7718 if (!(s->cpuid_features & CPUID_SSE(1 << 25)))
7719 goto illegal_op;
7720 } else {
7721 /* clflush */
7722 if (!(s->cpuid_features & CPUID_CLFLUSH(1 << 19)))
7723 goto illegal_op;
7724 gen_lea_modrm(env, s, modrm);
7725 }
7726 break;
7727 default:
7728 goto illegal_op;
7729 }
7730 break;
7731 case 0x10d: /* 3DNow! prefetch(w) */
7732 modrm = cpu_ldub_code(env, s->pc++);
7733 mod = (modrm >> 6) & 3;
7734 if (mod == 3)
7735 goto illegal_op;
7736 gen_lea_modrm(env, s, modrm);
7737 /* ignore for now */
7738 break;
7739 case 0x1aa: /* rsm */
7740 gen_svm_check_intercept(s, pc_start, SVM_EXIT_RSM0x073);
7741 if (!(s->flags & HF_SMM_MASK(1 << 19)))
7742 goto illegal_op;
7743 gen_update_cc_op(s);
7744 gen_jmp_im(s->pc - s->cs_base);
7745 gen_helper_rsm(cpu_env);
7746 gen_eob(s);
7747 break;
7748 case 0x1b8: /* SSE4.2 popcnt */
7749 if ((prefixes & (PREFIX_REPZ0x01 | PREFIX_LOCK0x04 | PREFIX_REPNZ0x02)) !=
7750 PREFIX_REPZ0x01)
7751 goto illegal_op;
7752 if (!(s->cpuid_ext_features & CPUID_EXT_POPCNT(1 << 23)))
7753 goto illegal_op;
7754
7755 modrm = cpu_ldub_code(env, s->pc++);
7756 reg = ((modrm >> 3) & 7) | rex_r;
7757
7758 if (s->prefix & PREFIX_DATA0x08) {
7759 ot = MO_16;
7760 } else {
7761 ot = mo_64_32(dflag);
7762 }
7763
7764 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
7765 gen_helper_popcnt(cpu_T[0], cpu_env, cpu_T[0], tcg_const_i32(ot));
7766 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
7767
7768 set_cc_op(s, CC_OP_EFLAGS);
7769 break;
7770 case 0x10e ... 0x10f:
7771 /* 3DNow! instructions, ignore prefixes */
7772 s->prefix &= ~(PREFIX_REPZ0x01 | PREFIX_REPNZ0x02 | PREFIX_DATA0x08);
7773 case 0x110 ... 0x117:
7774 case 0x128 ... 0x12f:
7775 case 0x138 ... 0x13a:
7776 case 0x150 ... 0x179:
7777 case 0x17c ... 0x17f:
7778 case 0x1c2:
7779 case 0x1c4 ... 0x1c6:
7780 case 0x1d0 ... 0x1fe:
7781 gen_sse(env, s, b, pc_start, rex_r);
7782 break;
7783 default:
7784 goto illegal_op;
7785 }
7786 /* lock generation */
7787 if (s->prefix & PREFIX_LOCK0x04)
7788 gen_helper_unlock();
7789 return s->pc;
7790 illegal_op:
7791 if (s->prefix & PREFIX_LOCK0x04)
7792 gen_helper_unlock();
7793 /* XXX: ensure that no lock was generated */
7794 gen_exception(s, EXCP06_ILLOP6, pc_start - s->cs_base);
7795 return s->pc;
7796}
7797
7798void optimize_flags_init(void)
7799{
7800 static const char reg_names[CPU_NB_REGS8][4] = {
7801#ifdef TARGET_X86_64
7802 [R_EAX0] = "rax",
7803 [R_EBX3] = "rbx",
7804 [R_ECX1] = "rcx",
7805 [R_EDX2] = "rdx",
7806 [R_ESI6] = "rsi",
7807 [R_EDI7] = "rdi",
7808 [R_EBP5] = "rbp",
7809 [R_ESP4] = "rsp",
7810 [8] = "r8",
7811 [9] = "r9",
7812 [10] = "r10",
7813 [11] = "r11",
7814 [12] = "r12",
7815 [13] = "r13",
7816 [14] = "r14",
7817 [15] = "r15",
7818#else
7819 [R_EAX0] = "eax",
7820 [R_EBX3] = "ebx",
7821 [R_ECX1] = "ecx",
7822 [R_EDX2] = "edx",
7823 [R_ESI6] = "esi",
7824 [R_EDI7] = "edi",
7825 [R_EBP5] = "ebp",
7826 [R_ESP4] = "esp",
7827#endif
7828 };
7829 int i;
7830
7831 cpu_env = tcg_global_reg_new_ptr(TCG_AREG0, "env")__extension__ ({ TCGv_ptr make_tcgv_tmp = {((tcg_global_reg_new_i64
((TCG_REG_R14), ("env"))).i64)}; make_tcgv_tmp; })
;
7832 cpu_cc_op = tcg_global_mem_new_i32(TCG_AREG0TCG_REG_R14,
7833 offsetof(CPUX86State, cc_op)__builtin_offsetof(CPUX86State, cc_op), "cc_op");
7834 cpu_cc_dst = tcg_global_mem_newtcg_global_mem_new_i32(TCG_AREG0TCG_REG_R14, offsetof(CPUX86State, cc_dst)__builtin_offsetof(CPUX86State, cc_dst),
7835 "cc_dst");
7836 cpu_cc_src = tcg_global_mem_newtcg_global_mem_new_i32(TCG_AREG0TCG_REG_R14, offsetof(CPUX86State, cc_src)__builtin_offsetof(CPUX86State, cc_src),
7837 "cc_src");
7838 cpu_cc_src2 = tcg_global_mem_newtcg_global_mem_new_i32(TCG_AREG0TCG_REG_R14, offsetof(CPUX86State, cc_src2)__builtin_offsetof(CPUX86State, cc_src2),
7839 "cc_src2");
7840
7841 for (i = 0; i < CPU_NB_REGS8; ++i) {
7842 cpu_regs[i] = tcg_global_mem_newtcg_global_mem_new_i32(TCG_AREG0TCG_REG_R14,
7843 offsetof(CPUX86State, regs[i])__builtin_offsetof(CPUX86State, regs[i]),
7844 reg_names[i]);
7845 }
7846}
7847
7848/* generate intermediate code in gen_opc_buf and gen_opparam_buf for
7849 basic block 'tb'. If search_pc is TRUE, also generate PC
7850 information for each intermediate instruction. */
7851static inline void gen_intermediate_code_internal(X86CPU *cpu,
7852 TranslationBlock *tb,
7853 bool_Bool search_pc)
7854{
7855 CPUState *cs = CPU(cpu)((CPUState *)object_dynamic_cast_assert(((Object *)((cpu))), (
"cpu"), "/home/stefan/src/qemu/qemu.org/qemu/target-i386/translate.c"
, 7855, __func__))
;
7856 CPUX86State *env = &cpu->env;
7857 DisasContext dc1, *dc = &dc1;
7858 target_ulong pc_ptr;
7859 uint16_t *gen_opc_end;
7860 CPUBreakpoint *bp;
7861 int j, lj;
7862 uint64_t flags;
7863 target_ulong pc_start;
7864 target_ulong cs_base;
7865 int num_insns;
7866 int max_insns;
7867
7868 /* generate intermediate code */
7869 pc_start = tb->pc;
7870 cs_base = tb->cs_base;
7871 flags = tb->flags;
7872
7873 dc->pe = (flags >> HF_PE_SHIFT7) & 1;
7874 dc->code32 = (flags >> HF_CS32_SHIFT4) & 1;
7875 dc->ss32 = (flags >> HF_SS32_SHIFT5) & 1;
7876 dc->addseg = (flags >> HF_ADDSEG_SHIFT6) & 1;
7877 dc->f_st = 0;
7878 dc->vm86 = (flags >> VM_SHIFT17) & 1;
7879 dc->cpl = (flags >> HF_CPL_SHIFT0) & 3;
7880 dc->iopl = (flags >> IOPL_SHIFT12) & 3;
7881 dc->tf = (flags >> TF_SHIFT8) & 1;
7882 dc->singlestep_enabled = cs->singlestep_enabled;
7883 dc->cc_op = CC_OP_DYNAMIC;
7884 dc->cc_op_dirty = false0;
7885 dc->cs_base = cs_base;
7886 dc->tb = tb;
7887 dc->popl_esp_hack = 0;
7888 /* select memory access functions */
7889 dc->mem_index = 0;
7890 if (flags & HF_SOFTMMU_MASK(1 << 2)) {
7891 dc->mem_index = cpu_mmu_index(env);
7892 }
7893 dc->cpuid_features = env->features[FEAT_1_EDX];
7894 dc->cpuid_ext_features = env->features[FEAT_1_ECX];
7895 dc->cpuid_ext2_features = env->features[FEAT_8000_0001_EDX];
7896 dc->cpuid_ext3_features = env->features[FEAT_8000_0001_ECX];
7897 dc->cpuid_7_0_ebx_features = env->features[FEAT_7_0_EBX];
7898#ifdef TARGET_X86_64
7899 dc->lma = (flags >> HF_LMA_SHIFT14) & 1;
7900 dc->code64 = (flags >> HF_CS64_SHIFT15) & 1;
7901#endif
7902 dc->flags = flags;
7903 dc->jmp_opt = !(dc->tf || cs->singlestep_enabled ||
7904 (flags & HF_INHIBIT_IRQ_MASK(1 << 3))
7905#ifndef CONFIG_SOFTMMU1
7906 || (flags & HF_SOFTMMU_MASK(1 << 2))
7907#endif
7908 );
7909#if 0
7910 /* check addseg logic */
7911 if (!dc->addseg && (dc->vm86 || !dc->pe || !dc->code32))
7912 printf("ERROR addseg\n");
7913#endif
7914
7915 cpu_T[0] = tcg_temp_new()tcg_temp_new_i32();
7916 cpu_T[1] = tcg_temp_new()tcg_temp_new_i32();
7917 cpu_A0 = tcg_temp_new()tcg_temp_new_i32();
7918
7919 cpu_tmp0 = tcg_temp_new()tcg_temp_new_i32();
7920 cpu_tmp1_i64 = tcg_temp_new_i64();
7921 cpu_tmp2_i32 = tcg_temp_new_i32();
7922 cpu_tmp3_i32 = tcg_temp_new_i32();
7923 cpu_tmp4 = tcg_temp_new()tcg_temp_new_i32();
7924 cpu_ptr0 = tcg_temp_new_ptr()__extension__ ({ TCGv_ptr make_tcgv_tmp = {((tcg_temp_new_i64
()).i64)}; make_tcgv_tmp; })
;
7925 cpu_ptr1 = tcg_temp_new_ptr()__extension__ ({ TCGv_ptr make_tcgv_tmp = {((tcg_temp_new_i64
()).i64)}; make_tcgv_tmp; })
;
7926 cpu_cc_srcT = tcg_temp_local_new()tcg_temp_local_new_i32();
7927
7928 gen_opc_end = tcg_ctx.gen_opc_buf + OPC_MAX_SIZE(640 - 208);
7929
7930 dc->is_jmp = DISAS_NEXT0;
7931 pc_ptr = pc_start;
7932 lj = -1;
7933 num_insns = 0;
7934 max_insns = tb->cflags & CF_COUNT_MASK0x7fff;
7935 if (max_insns == 0)
7936 max_insns = CF_COUNT_MASK0x7fff;
7937
7938 gen_tb_start();
7939 for(;;) {
7940 if (unlikely(!QTAILQ_EMPTY(&env->breakpoints))__builtin_expect(!!(!((&env->breakpoints)->tqh_first
== ((void*)0))), 0)
) {
7941 QTAILQ_FOREACH(bp, &env->breakpoints, entry)for ((bp) = ((&env->breakpoints)->tqh_first); (bp);
(bp) = ((bp)->entry.tqe_next))
{
7942 if (bp->pc == pc_ptr &&
7943 !((bp->flags & BP_CPU0x20) && (tb->flags & HF_RF_MASK(1 << 16)))) {
7944 gen_debug(dc, pc_ptr - dc->cs_base);
7945 break;
7946 }
7947 }
7948 }
7949 if (search_pc) {
7950 j = tcg_ctx.gen_opc_ptr - tcg_ctx.gen_opc_buf;
7951 if (lj < j) {
7952 lj++;
7953 while (lj < j)
7954 tcg_ctx.gen_opc_instr_start[lj++] = 0;
7955 }
7956 tcg_ctx.gen_opc_pc[lj] = pc_ptr;
7957 gen_opc_cc_op[lj] = dc->cc_op;
7958 tcg_ctx.gen_opc_instr_start[lj] = 1;
7959 tcg_ctx.gen_opc_icount[lj] = num_insns;
7960 }
7961 if (num_insns + 1 == max_insns && (tb->cflags & CF_LAST_IO0x8000))
7962 gen_io_start();
7963
7964 pc_ptr = disas_insn(env, dc, pc_ptr);
7965 num_insns++;
7966 /* stop translation if indicated */
7967 if (dc->is_jmp)
7968 break;
7969 /* if single step mode, we generate only one instruction and
7970 generate an exception */
7971 /* if irq were inhibited with HF_INHIBIT_IRQ_MASK, we clear
7972 the flag and abort the translation to give the irqs a
7973 change to be happen */
7974 if (dc->tf || dc->singlestep_enabled ||
7975 (flags & HF_INHIBIT_IRQ_MASK(1 << 3))) {
7976 gen_jmp_im(pc_ptr - dc->cs_base);
7977 gen_eob(dc);
7978 break;
7979 }
7980 /* if too long translation, stop generation too */
7981 if (tcg_ctx.gen_opc_ptr >= gen_opc_end ||
7982 (pc_ptr - pc_start) >= (TARGET_PAGE_SIZE(1 << 12) - 32) ||
7983 num_insns >= max_insns) {
7984 gen_jmp_im(pc_ptr - dc->cs_base);
7985 gen_eob(dc);
7986 break;
7987 }
7988 if (singlestep) {
7989 gen_jmp_im(pc_ptr - dc->cs_base);
7990 gen_eob(dc);
7991 break;
7992 }
7993 }
7994 if (tb->cflags & CF_LAST_IO0x8000)
7995 gen_io_end();
7996 gen_tb_end(tb, num_insns);
7997 *tcg_ctx.gen_opc_ptr = INDEX_op_end;
7998 /* we don't forget to fill the last values */
7999 if (search_pc) {
8000 j = tcg_ctx.gen_opc_ptr - tcg_ctx.gen_opc_buf;
8001 lj++;
8002 while (lj <= j)
8003 tcg_ctx.gen_opc_instr_start[lj++] = 0;
8004 }
8005
8006#ifdef DEBUG_DISAS
8007 if (qemu_loglevel_mask(CPU_LOG_TB_IN_ASM(1 << 1))) {
8008 int disas_flags;
8009 qemu_log("----------------\n");
8010 qemu_log("IN: %s\n", lookup_symbol(pc_start));
8011#ifdef TARGET_X86_64
8012 if (dc->code64)
8013 disas_flags = 2;
8014 else
8015#endif
8016 disas_flags = !dc->code32;
8017 log_target_disas(env, pc_start, pc_ptr - pc_start, disas_flags);
8018 qemu_log("\n");
8019 }
8020#endif
8021
8022 if (!search_pc) {
8023 tb->size = pc_ptr - pc_start;
8024 tb->icount = num_insns;
8025 }
8026}
8027
8028void gen_intermediate_code(CPUX86State *env, TranslationBlock *tb)
8029{
8030 gen_intermediate_code_internal(x86_env_get_cpu(env), tb, false0);
8031}
8032
8033void gen_intermediate_code_pc(CPUX86State *env, TranslationBlock *tb)
8034{
8035 gen_intermediate_code_internal(x86_env_get_cpu(env), tb, true1);
8036}
8037
8038void restore_state_to_opc(CPUX86State *env, TranslationBlock *tb, int pc_pos)
8039{
8040 int cc_op;
8041#ifdef DEBUG_DISAS
8042 if (qemu_loglevel_mask(CPU_LOG_TB_OP(1 << 2))) {
8043 int i;
8044 qemu_log("RESTORE:\n");
8045 for(i = 0;i <= pc_pos; i++) {
8046 if (tcg_ctx.gen_opc_instr_start[i]) {
8047 qemu_log("0x%04x: " TARGET_FMT_lx"%08x" "\n", i,
8048 tcg_ctx.gen_opc_pc[i]);
8049 }
8050 }
8051 qemu_log("pc_pos=0x%x eip=" TARGET_FMT_lx"%08x" " cs_base=%x\n",
8052 pc_pos, tcg_ctx.gen_opc_pc[pc_pos] - tb->cs_base,
8053 (uint32_t)tb->cs_base);
8054 }
8055#endif
8056 env->eip = tcg_ctx.gen_opc_pc[pc_pos] - tb->cs_base;
8057 cc_op = gen_opc_cc_op[pc_pos];
8058 if (cc_op != CC_OP_DYNAMIC)
8059 env->cc_op = cc_op;
8060}