2 * i386 micro operations
4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 #include "exec-i386.h"
22 /* NOTE: data are not static to force relocation generation by GCC */
24 uint8_t parity_table[256] = {
25 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
26 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
27 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
28 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
29 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
30 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
31 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
32 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
33 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
34 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
35 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
36 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
37 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
38 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
39 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
40 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
41 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
42 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
43 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
44 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
45 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
46 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
47 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
48 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
49 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
50 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
51 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
52 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
53 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
54 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
55 CC_P, 0, 0, CC_P, 0, CC_P, CC_P, 0,
56 0, CC_P, CC_P, 0, CC_P, 0, 0, CC_P,
60 const uint8_t rclw_table[32] = {
61 0, 1, 2, 3, 4, 5, 6, 7,
62 8, 9,10,11,12,13,14,15,
63 16, 0, 1, 2, 3, 4, 5, 6,
64 7, 8, 9,10,11,12,13,14,
68 const uint8_t rclb_table[32] = {
69 0, 1, 2, 3, 4, 5, 6, 7,
70 8, 0, 1, 2, 3, 4, 5, 6,
71 7, 8, 0, 1, 2, 3, 4, 5,
72 6, 7, 8, 0, 1, 2, 3, 4,
76 /* an array of Intel 80-bit FP constants, to be loaded via integer ops */
77 typedef unsigned short f15ld[5];
80 /*0*/ {0x0000,0x0000,0x0000,0x0000,0x0000},
81 /*1*/ {0x0000,0x0000,0x0000,0x8000,0x3fff},
82 /*pi*/ {0xc235,0x2168,0xdaa2,0xc90f,0x4000},
83 /*lg2*/ {0xf799,0xfbcf,0x9a84,0x9a20,0x3ffd},
84 /*ln2*/ {0x79ac,0xd1cf,0x17f7,0xb172,0x3ffe},
85 /*l2e*/ {0xf0bc,0x5c17,0x3b29,0xb8aa,0x3fff},
86 /*l2t*/ {0x8afe,0xcd1b,0x784b,0xd49a,0x4000}
89 /* the same, 64-bit version */
90 typedef unsigned short f15ld[4];
93 #ifndef WORDS_BIGENDIAN
94 /*0*/ {0x0000,0x0000,0x0000,0x0000},
95 /*1*/ {0x0000,0x0000,0x0000,0x3ff0},
96 /*pi*/ {0x2d18,0x5444,0x21fb,0x4009},
97 /*lg2*/ {0x79ff,0x509f,0x4413,0x3fd3},
98 /*ln2*/ {0x39ef,0xfefa,0x2e42,0x3fe6},
99 /*l2e*/ {0x82fe,0x652b,0x1547,0x3ff7},
100 /*l2t*/ {0xa371,0x0979,0x934f,0x400a}
102 /*0*/ {0x0000,0x0000,0x0000,0x0000},
103 /*1*/ {0x3ff0,0x0000,0x0000,0x0000},
104 /*pi*/ {0x4009,0x21fb,0x5444,0x2d18},
105 /*lg2*/ {0x3fd3,0x4413,0x509f,0x79ff},
106 /*ln2*/ {0x3fe6,0x2e42,0xfefa,0x39ef},
107 /*l2e*/ {0x3ff7,0x1547,0x652b,0x82fe},
108 /*l2t*/ {0x400a,0x934f,0x0979,0xa371}
113 /* n must be a constant to be efficient */
114 static inline int lshift(int x, int n)
122 /* we define the various pieces of code used by the JIT */
126 #include "opreg_template.h"
132 #include "opreg_template.h"
138 #include "opreg_template.h"
144 #include "opreg_template.h"
150 #include "opreg_template.h"
156 #include "opreg_template.h"
162 #include "opreg_template.h"
168 #include "opreg_template.h"
172 /* operations with flags */
174 void OPPROTO op_addl_T0_T1_cc(void)
181 void OPPROTO op_orl_T0_T1_cc(void)
187 void OPPROTO op_andl_T0_T1_cc(void)
193 void OPPROTO op_subl_T0_T1_cc(void)
200 void OPPROTO op_xorl_T0_T1_cc(void)
206 void OPPROTO op_cmpl_T0_T1_cc(void)
212 void OPPROTO op_negl_T0_cc(void)
219 void OPPROTO op_incl_T0_cc(void)
221 CC_SRC = cc_table[CC_OP].compute_c();
226 void OPPROTO op_decl_T0_cc(void)
228 CC_SRC = cc_table[CC_OP].compute_c();
233 void OPPROTO op_testl_T0_T1_cc(void)
238 /* operations without flags */
240 void OPPROTO op_addl_T0_T1(void)
245 void OPPROTO op_orl_T0_T1(void)
250 void OPPROTO op_andl_T0_T1(void)
255 void OPPROTO op_subl_T0_T1(void)
260 void OPPROTO op_xorl_T0_T1(void)
265 void OPPROTO op_negl_T0(void)
270 void OPPROTO op_incl_T0(void)
275 void OPPROTO op_decl_T0(void)
280 void OPPROTO op_notl_T0(void)
285 void OPPROTO op_bswapl_T0(void)
290 /* multiply/divide */
291 void OPPROTO op_mulb_AL_T0(void)
294 res = (uint8_t)EAX * (uint8_t)T0;
295 EAX = (EAX & 0xffff0000) | res;
296 CC_SRC = (res & 0xff00);
299 void OPPROTO op_imulb_AL_T0(void)
302 res = (int8_t)EAX * (int8_t)T0;
303 EAX = (EAX & 0xffff0000) | (res & 0xffff);
304 CC_SRC = (res != (int8_t)res);
307 void OPPROTO op_mulw_AX_T0(void)
310 res = (uint16_t)EAX * (uint16_t)T0;
311 EAX = (EAX & 0xffff0000) | (res & 0xffff);
312 EDX = (EDX & 0xffff0000) | ((res >> 16) & 0xffff);
316 void OPPROTO op_imulw_AX_T0(void)
319 res = (int16_t)EAX * (int16_t)T0;
320 EAX = (EAX & 0xffff0000) | (res & 0xffff);
321 EDX = (EDX & 0xffff0000) | ((res >> 16) & 0xffff);
322 CC_SRC = (res != (int16_t)res);
325 void OPPROTO op_mull_EAX_T0(void)
328 res = (uint64_t)((uint32_t)EAX) * (uint64_t)((uint32_t)T0);
334 void OPPROTO op_imull_EAX_T0(void)
337 res = (int64_t)((int32_t)EAX) * (int64_t)((int32_t)T0);
340 CC_SRC = (res != (int32_t)res);
343 void OPPROTO op_imulw_T0_T1(void)
346 res = (int16_t)T0 * (int16_t)T1;
348 CC_SRC = (res != (int16_t)res);
351 void OPPROTO op_imull_T0_T1(void)
354 res = (int64_t)((int32_t)T0) * (int64_t)((int32_t)T1);
356 CC_SRC = (res != (int32_t)res);
359 /* division, flags are undefined */
360 /* XXX: add exceptions for overflow */
361 void OPPROTO op_divb_AL_T0(void)
363 unsigned int num, den, q, r;
365 num = (EAX & 0xffff);
368 raise_exception(EXCP00_DIVZ);
369 q = (num / den) & 0xff;
370 r = (num % den) & 0xff;
371 EAX = (EAX & 0xffff0000) | (r << 8) | q;
374 void OPPROTO op_idivb_AL_T0(void)
381 raise_exception(EXCP00_DIVZ);
382 q = (num / den) & 0xff;
383 r = (num % den) & 0xff;
384 EAX = (EAX & 0xffff0000) | (r << 8) | q;
387 void OPPROTO op_divw_AX_T0(void)
389 unsigned int num, den, q, r;
391 num = (EAX & 0xffff) | ((EDX & 0xffff) << 16);
394 raise_exception(EXCP00_DIVZ);
395 q = (num / den) & 0xffff;
396 r = (num % den) & 0xffff;
397 EAX = (EAX & 0xffff0000) | q;
398 EDX = (EDX & 0xffff0000) | r;
401 void OPPROTO op_idivw_AX_T0(void)
405 num = (EAX & 0xffff) | ((EDX & 0xffff) << 16);
408 raise_exception(EXCP00_DIVZ);
409 q = (num / den) & 0xffff;
410 r = (num % den) & 0xffff;
411 EAX = (EAX & 0xffff0000) | q;
412 EDX = (EDX & 0xffff0000) | r;
415 #ifdef BUGGY_GCC_DIV64
416 /* gcc 2.95.4 on PowerPC does not seem to like using __udivdi3, so we
417 call it from another function */
418 uint32_t div64(uint32_t *q_ptr, uint64_t num, uint32_t den)
424 int32_t idiv64(int32_t *q_ptr, int64_t num, int32_t den)
431 void OPPROTO op_divl_EAX_T0(void)
433 unsigned int den, q, r;
436 num = EAX | ((uint64_t)EDX << 32);
439 raise_exception(EXCP00_DIVZ);
440 #ifdef BUGGY_GCC_DIV64
441 r = div64(&q, num, den);
450 void OPPROTO op_idivl_EAX_T0(void)
455 num = EAX | ((uint64_t)EDX << 32);
458 raise_exception(EXCP00_DIVZ);
459 #ifdef BUGGY_GCC_DIV64
460 r = idiv64(&q, num, den);
469 /* constant load & misc op */
471 void OPPROTO op_movl_T0_im(void)
476 void OPPROTO op_addl_T0_im(void)
481 void OPPROTO op_andl_T0_ffff(void)
486 void OPPROTO op_movl_T0_T1(void)
491 void OPPROTO op_movl_T1_im(void)
496 void OPPROTO op_addl_T1_im(void)
501 void OPPROTO op_movl_T1_A0(void)
506 void OPPROTO op_movl_A0_im(void)
511 void OPPROTO op_addl_A0_im(void)
516 void OPPROTO op_addl_A0_AL(void)
521 void OPPROTO op_andl_A0_ffff(void)
528 void OPPROTO op_ldub_T0_A0(void)
530 T0 = ldub((uint8_t *)A0);
533 void OPPROTO op_ldsb_T0_A0(void)
535 T0 = ldsb((int8_t *)A0);
538 void OPPROTO op_lduw_T0_A0(void)
540 T0 = lduw((uint8_t *)A0);
543 void OPPROTO op_ldsw_T0_A0(void)
545 T0 = ldsw((int8_t *)A0);
548 void OPPROTO op_ldl_T0_A0(void)
550 T0 = ldl((uint8_t *)A0);
553 void OPPROTO op_ldub_T1_A0(void)
555 T1 = ldub((uint8_t *)A0);
558 void OPPROTO op_ldsb_T1_A0(void)
560 T1 = ldsb((int8_t *)A0);
563 void OPPROTO op_lduw_T1_A0(void)
565 T1 = lduw((uint8_t *)A0);
568 void OPPROTO op_ldsw_T1_A0(void)
570 T1 = ldsw((int8_t *)A0);
573 void OPPROTO op_ldl_T1_A0(void)
575 T1 = ldl((uint8_t *)A0);
578 void OPPROTO op_stb_T0_A0(void)
580 stb((uint8_t *)A0, T0);
583 void OPPROTO op_stw_T0_A0(void)
585 stw((uint8_t *)A0, T0);
588 void OPPROTO op_stl_T0_A0(void)
590 stl((uint8_t *)A0, T0);
593 /* used for bit operations */
595 void OPPROTO op_add_bitw_A0_T1(void)
597 A0 += ((int32_t)T1 >> 4) << 1;
600 void OPPROTO op_add_bitl_A0_T1(void)
602 A0 += ((int32_t)T1 >> 5) << 2;
607 void OPPROTO op_jmp_T0(void)
612 void OPPROTO op_jmp_im(void)
617 void OPPROTO op_int_im(void)
622 raise_exception_err(EXCP0D_GPF, intno * 8 + 2);
625 void OPPROTO op_int3(void)
628 raise_exception(EXCP03_INT3);
631 void OPPROTO op_into(void)
634 eflags = cc_table[CC_OP].compute_all();
636 raise_exception(EXCP04_INTO);
641 void OPPROTO op_gpf(void)
644 raise_exception(EXCP0D_GPF);
647 void OPPROTO op_cli(void)
649 env->eflags &= ~IF_MASK;
652 void OPPROTO op_sti(void)
654 env->eflags |= IF_MASK;
657 /* vm86plus instructions */
659 void OPPROTO op_cli_vm(void)
661 env->eflags &= ~VIF_MASK;
664 void OPPROTO op_sti_vm(void)
666 env->eflags |= VIF_MASK;
667 if (env->eflags & VIP_MASK) {
669 raise_exception(EXCP0D_GPF);
674 void OPPROTO op_boundw(void)
677 low = ldsw((uint8_t *)A0);
678 high = ldsw((uint8_t *)A0 + 2);
680 if (v < low || v > high)
681 raise_exception(EXCP05_BOUND);
685 void OPPROTO op_boundl(void)
688 low = ldl((uint8_t *)A0);
689 high = ldl((uint8_t *)A0 + 4);
691 if (v < low || v > high)
692 raise_exception(EXCP05_BOUND);
696 void OPPROTO op_cmpxchg8b(void)
701 eflags = cc_table[CC_OP].compute_all();
702 d = ldq((uint8_t *)A0);
703 if (d == (((uint64_t)EDX << 32) | EAX)) {
704 stq((uint8_t *)A0, ((uint64_t)ECX << 32) | EBX);
720 #include "ops_template.h"
724 #include "ops_template.h"
728 #include "ops_template.h"
733 void OPPROTO op_movsbl_T0_T0(void)
738 void OPPROTO op_movzbl_T0_T0(void)
743 void OPPROTO op_movswl_T0_T0(void)
748 void OPPROTO op_movzwl_T0_T0(void)
753 void OPPROTO op_movswl_EAX_AX(void)
758 void OPPROTO op_movsbw_AX_AL(void)
760 EAX = (EAX & 0xffff0000) | ((int8_t)EAX & 0xffff);
763 void OPPROTO op_movslq_EDX_EAX(void)
765 EDX = (int32_t)EAX >> 31;
768 void OPPROTO op_movswl_DX_AX(void)
770 EDX = (EDX & 0xffff0000) | (((int16_t)EAX >> 15) & 0xffff);
775 void op_pushl_T0(void)
779 stl((void *)offset, T0);
780 /* modify ESP after to handle exceptions correctly */
784 void op_pushw_T0(void)
788 stw((void *)offset, T0);
789 /* modify ESP after to handle exceptions correctly */
793 void op_pushl_ss32_T0(void)
797 stl(env->seg_cache[R_SS].base + offset, T0);
798 /* modify ESP after to handle exceptions correctly */
802 void op_pushw_ss32_T0(void)
806 stw(env->seg_cache[R_SS].base + offset, T0);
807 /* modify ESP after to handle exceptions correctly */
811 void op_pushl_ss16_T0(void)
814 offset = (ESP - 4) & 0xffff;
815 stl(env->seg_cache[R_SS].base + offset, T0);
816 /* modify ESP after to handle exceptions correctly */
817 ESP = (ESP & ~0xffff) | offset;
820 void op_pushw_ss16_T0(void)
823 offset = (ESP - 2) & 0xffff;
824 stw(env->seg_cache[R_SS].base + offset, T0);
825 /* modify ESP after to handle exceptions correctly */
826 ESP = (ESP & ~0xffff) | offset;
829 /* NOTE: ESP update is done after */
830 void op_popl_T0(void)
832 T0 = ldl((void *)ESP);
835 void op_popw_T0(void)
837 T0 = lduw((void *)ESP);
840 void op_popl_ss32_T0(void)
842 T0 = ldl(env->seg_cache[R_SS].base + ESP);
845 void op_popw_ss32_T0(void)
847 T0 = lduw(env->seg_cache[R_SS].base + ESP);
850 void op_popl_ss16_T0(void)
852 T0 = ldl(env->seg_cache[R_SS].base + (ESP & 0xffff));
855 void op_popw_ss16_T0(void)
857 T0 = lduw(env->seg_cache[R_SS].base + (ESP & 0xffff));
860 void op_addl_ESP_4(void)
865 void op_addl_ESP_2(void)
870 void op_addw_ESP_4(void)
872 ESP = (ESP & ~0xffff) | ((ESP + 4) & 0xffff);
875 void op_addw_ESP_2(void)
877 ESP = (ESP & ~0xffff) | ((ESP + 2) & 0xffff);
880 void op_addl_ESP_im(void)
885 void op_addw_ESP_im(void)
887 ESP = (ESP & ~0xffff) | ((ESP + PARAM1) & 0xffff);
895 void OPPROTO op_rdtsc(void)
899 asm("rdtsc" : "=A" (val));
901 /* better than nothing: the time increases */
908 /* We simulate a pre-MMX pentium as in valgrind */
909 #define CPUID_FP87 (1 << 0)
910 #define CPUID_VME (1 << 1)
911 #define CPUID_DE (1 << 2)
912 #define CPUID_PSE (1 << 3)
913 #define CPUID_TSC (1 << 4)
914 #define CPUID_MSR (1 << 5)
915 #define CPUID_PAE (1 << 6)
916 #define CPUID_MCE (1 << 7)
917 #define CPUID_CX8 (1 << 8)
918 #define CPUID_APIC (1 << 9)
919 #define CPUID_SEP (1 << 11) /* sysenter/sysexit */
920 #define CPUID_MTRR (1 << 12)
921 #define CPUID_PGE (1 << 13)
922 #define CPUID_MCA (1 << 14)
923 #define CPUID_CMOV (1 << 15)
925 #define CPUID_MMX (1 << 23)
926 #define CPUID_FXSR (1 << 24)
927 #define CPUID_SSE (1 << 25)
928 #define CPUID_SSE2 (1 << 26)
930 void helper_cpuid(void)
933 EAX = 1; /* max EAX index supported */
942 EDX = CPUID_FP87 | CPUID_VME | CPUID_DE | CPUID_PSE |
943 CPUID_TSC | CPUID_MSR | CPUID_MCE |
948 void OPPROTO op_cpuid(void)
956 void OPPROTO op_aam(void)
963 EAX = (EAX & ~0xffff) | al | (ah << 8);
967 void OPPROTO op_aad(void)
972 ah = (EAX >> 8) & 0xff;
973 al = ((ah * base) + al) & 0xff;
974 EAX = (EAX & ~0xffff) | al;
978 void OPPROTO op_aaa(void)
984 eflags = cc_table[CC_OP].compute_all();
987 ah = (EAX >> 8) & 0xff;
989 icarry = (al > 0xf9);
990 if (((al & 0x0f) > 9 ) || af) {
991 al = (al + 6) & 0x0f;
992 ah = (ah + 1 + icarry) & 0xff;
993 eflags |= CC_C | CC_A;
995 eflags &= ~(CC_C | CC_A);
998 EAX = (EAX & ~0xffff) | al | (ah << 8);
1002 void OPPROTO op_aas(void)
1008 eflags = cc_table[CC_OP].compute_all();
1011 ah = (EAX >> 8) & 0xff;
1014 if (((al & 0x0f) > 9 ) || af) {
1015 al = (al - 6) & 0x0f;
1016 ah = (ah - 1 - icarry) & 0xff;
1017 eflags |= CC_C | CC_A;
1019 eflags &= ~(CC_C | CC_A);
1022 EAX = (EAX & ~0xffff) | al | (ah << 8);
1026 void OPPROTO op_daa(void)
1031 eflags = cc_table[CC_OP].compute_all();
1037 if (((al & 0x0f) > 9 ) || af) {
1038 al = (al + 6) & 0xff;
1041 if ((al > 0x9f) || cf) {
1042 al = (al + 0x60) & 0xff;
1045 EAX = (EAX & ~0xff) | al;
1046 /* well, speed is not an issue here, so we compute the flags by hand */
1047 eflags |= (al == 0) << 6; /* zf */
1048 eflags |= parity_table[al]; /* pf */
1049 eflags |= (al & 0x80); /* sf */
1053 void OPPROTO op_das(void)
1055 int al, al1, af, cf;
1058 eflags = cc_table[CC_OP].compute_all();
1065 if (((al & 0x0f) > 9 ) || af) {
1069 al = (al - 6) & 0xff;
1071 if ((al1 > 0x99) || cf) {
1072 al = (al - 0x60) & 0xff;
1075 EAX = (EAX & ~0xff) | al;
1076 /* well, speed is not an issue here, so we compute the flags by hand */
1077 eflags |= (al == 0) << 6; /* zf */
1078 eflags |= parity_table[al]; /* pf */
1079 eflags |= (al & 0x80); /* sf */
1083 /* segment handling */
1085 /* XXX: use static VM86 information */
1086 void load_seg(int seg_reg, int selector)
1089 SegmentDescriptorTable *dt;
1094 env->segs[seg_reg] = selector;
1095 sc = &env->seg_cache[seg_reg];
1096 if (env->eflags & VM_MASK) {
1097 sc->base = (void *)(selector << 4);
1105 index = selector & ~7;
1106 if ((index + 7) > dt->limit)
1107 raise_exception_err(EXCP0D_GPF, selector);
1108 ptr = dt->base + index;
1111 sc->base = (void *)((e1 >> 16) | ((e2 & 0xff) << 16) | (e2 & 0xff000000));
1112 sc->limit = (e1 & 0xffff) | (e2 & 0x000f0000);
1114 sc->limit = (sc->limit << 12) | 0xfff;
1115 sc->seg_32bit = (e2 >> 22) & 1;
1117 fprintf(logfile, "load_seg: sel=0x%04x base=0x%08lx limit=0x%08lx seg_32bit=%d\n",
1118 selector, (unsigned long)sc->base, sc->limit, sc->seg_32bit);
1123 void OPPROTO op_movl_seg_T0(void)
1125 load_seg(PARAM1, T0 & 0xffff);
1128 void OPPROTO op_movl_T0_seg(void)
1130 T0 = env->segs[PARAM1];
1133 void OPPROTO op_movl_A0_seg(void)
1135 A0 = *(unsigned long *)((char *)env + PARAM1);
1138 void OPPROTO op_addl_A0_seg(void)
1140 A0 += *(unsigned long *)((char *)env + PARAM1);
1143 /* flags handling */
1145 /* slow jumps cases (compute x86 flags) */
1146 void OPPROTO op_jo_cc(void)
1149 eflags = cc_table[CC_OP].compute_all();
1157 void OPPROTO op_jb_cc(void)
1159 if (cc_table[CC_OP].compute_c())
1166 void OPPROTO op_jz_cc(void)
1169 eflags = cc_table[CC_OP].compute_all();
1177 void OPPROTO op_jbe_cc(void)
1180 eflags = cc_table[CC_OP].compute_all();
1181 if (eflags & (CC_Z | CC_C))
1188 void OPPROTO op_js_cc(void)
1191 eflags = cc_table[CC_OP].compute_all();
1199 void OPPROTO op_jp_cc(void)
1202 eflags = cc_table[CC_OP].compute_all();
1210 void OPPROTO op_jl_cc(void)
1213 eflags = cc_table[CC_OP].compute_all();
1214 if ((eflags ^ (eflags >> 4)) & 0x80)
1221 void OPPROTO op_jle_cc(void)
1224 eflags = cc_table[CC_OP].compute_all();
1225 if (((eflags ^ (eflags >> 4)) & 0x80) || (eflags & CC_Z))
1232 /* slow set cases (compute x86 flags) */
1233 void OPPROTO op_seto_T0_cc(void)
1236 eflags = cc_table[CC_OP].compute_all();
1237 T0 = (eflags >> 11) & 1;
1240 void OPPROTO op_setb_T0_cc(void)
1242 T0 = cc_table[CC_OP].compute_c();
1245 void OPPROTO op_setz_T0_cc(void)
1248 eflags = cc_table[CC_OP].compute_all();
1249 T0 = (eflags >> 6) & 1;
1252 void OPPROTO op_setbe_T0_cc(void)
1255 eflags = cc_table[CC_OP].compute_all();
1256 T0 = (eflags & (CC_Z | CC_C)) != 0;
1259 void OPPROTO op_sets_T0_cc(void)
1262 eflags = cc_table[CC_OP].compute_all();
1263 T0 = (eflags >> 7) & 1;
1266 void OPPROTO op_setp_T0_cc(void)
1269 eflags = cc_table[CC_OP].compute_all();
1270 T0 = (eflags >> 2) & 1;
1273 void OPPROTO op_setl_T0_cc(void)
1276 eflags = cc_table[CC_OP].compute_all();
1277 T0 = ((eflags ^ (eflags >> 4)) >> 7) & 1;
1280 void OPPROTO op_setle_T0_cc(void)
1283 eflags = cc_table[CC_OP].compute_all();
1284 T0 = (((eflags ^ (eflags >> 4)) & 0x80) || (eflags & CC_Z)) != 0;
1287 void OPPROTO op_xor_T0_1(void)
1292 void OPPROTO op_set_cc_op(void)
1297 #define FL_UPDATE_MASK32 (TF_MASK | AC_MASK | ID_MASK)
1298 #define FL_UPDATE_MASK16 (TF_MASK)
1300 void OPPROTO op_movl_eflags_T0(void)
1304 CC_SRC = eflags & (CC_O | CC_S | CC_Z | CC_A | CC_P | CC_C);
1305 DF = 1 - (2 * ((eflags >> 10) & 1));
1306 /* we also update some system flags as in user mode */
1307 env->eflags = (env->eflags & ~FL_UPDATE_MASK32) | (eflags & FL_UPDATE_MASK32);
1310 void OPPROTO op_movw_eflags_T0(void)
1314 CC_SRC = eflags & (CC_O | CC_S | CC_Z | CC_A | CC_P | CC_C);
1315 DF = 1 - (2 * ((eflags >> 10) & 1));
1316 /* we also update some system flags as in user mode */
1317 env->eflags = (env->eflags & ~FL_UPDATE_MASK16) | (eflags & FL_UPDATE_MASK16);
1321 void OPPROTO op_movw_eflags_T0_vm(void)
1325 CC_SRC = eflags & (CC_O | CC_S | CC_Z | CC_A | CC_P | CC_C);
1326 DF = 1 - (2 * ((eflags >> 10) & 1));
1327 /* we also update some system flags as in user mode */
1328 env->eflags = (env->eflags & ~(FL_UPDATE_MASK16 | VIF_MASK)) |
1329 (eflags & FL_UPDATE_MASK16);
1330 if (eflags & IF_MASK) {
1331 env->eflags |= VIF_MASK;
1332 if (env->eflags & VIP_MASK) {
1334 raise_exception(EXCP0D_GPF);
1340 void OPPROTO op_movl_eflags_T0_vm(void)
1344 CC_SRC = eflags & (CC_O | CC_S | CC_Z | CC_A | CC_P | CC_C);
1345 DF = 1 - (2 * ((eflags >> 10) & 1));
1346 /* we also update some system flags as in user mode */
1347 env->eflags = (env->eflags & ~(FL_UPDATE_MASK32 | VIF_MASK)) |
1348 (eflags & FL_UPDATE_MASK32);
1349 if (eflags & IF_MASK) {
1350 env->eflags |= VIF_MASK;
1351 if (env->eflags & VIP_MASK) {
1353 raise_exception(EXCP0D_GPF);
1359 /* XXX: compute only O flag */
1360 void OPPROTO op_movb_eflags_T0(void)
1363 of = cc_table[CC_OP].compute_all() & CC_O;
1364 CC_SRC = (T0 & (CC_S | CC_Z | CC_A | CC_P | CC_C)) | of;
1367 void OPPROTO op_movl_T0_eflags(void)
1370 eflags = cc_table[CC_OP].compute_all();
1371 eflags |= (DF & DF_MASK);
1372 eflags |= env->eflags & ~(VM_MASK | RF_MASK);
1377 void OPPROTO op_movl_T0_eflags_vm(void)
1380 eflags = cc_table[CC_OP].compute_all();
1381 eflags |= (DF & DF_MASK);
1382 eflags |= env->eflags & ~(VM_MASK | RF_MASK | IF_MASK);
1383 if (env->eflags & VIF_MASK)
1388 void OPPROTO op_cld(void)
1393 void OPPROTO op_std(void)
1398 void OPPROTO op_clc(void)
1401 eflags = cc_table[CC_OP].compute_all();
1406 void OPPROTO op_stc(void)
1409 eflags = cc_table[CC_OP].compute_all();
1414 void OPPROTO op_cmc(void)
1417 eflags = cc_table[CC_OP].compute_all();
1422 void OPPROTO op_salc(void)
1425 cf = cc_table[CC_OP].compute_c();
1426 EAX = (EAX & ~0xff) | ((-cf) & 0xff);
1429 static int compute_all_eflags(void)
1434 static int compute_c_eflags(void)
1436 return CC_SRC & CC_C;
1439 static int compute_c_mul(void)
1446 static int compute_all_mul(void)
1448 int cf, pf, af, zf, sf, of;
1450 pf = 0; /* undefined */
1451 af = 0; /* undefined */
1452 zf = 0; /* undefined */
1453 sf = 0; /* undefined */
1455 return cf | pf | af | zf | sf | of;
1458 CCTable cc_table[CC_OP_NB] = {
1459 [CC_OP_DYNAMIC] = { /* should never happen */ },
1461 [CC_OP_EFLAGS] = { compute_all_eflags, compute_c_eflags },
1463 [CC_OP_MUL] = { compute_all_mul, compute_c_mul },
1465 [CC_OP_ADDB] = { compute_all_addb, compute_c_addb },
1466 [CC_OP_ADDW] = { compute_all_addw, compute_c_addw },
1467 [CC_OP_ADDL] = { compute_all_addl, compute_c_addl },
1469 [CC_OP_ADCB] = { compute_all_adcb, compute_c_adcb },
1470 [CC_OP_ADCW] = { compute_all_adcw, compute_c_adcw },
1471 [CC_OP_ADCL] = { compute_all_adcl, compute_c_adcl },
1473 [CC_OP_SUBB] = { compute_all_subb, compute_c_subb },
1474 [CC_OP_SUBW] = { compute_all_subw, compute_c_subw },
1475 [CC_OP_SUBL] = { compute_all_subl, compute_c_subl },
1477 [CC_OP_SBBB] = { compute_all_sbbb, compute_c_sbbb },
1478 [CC_OP_SBBW] = { compute_all_sbbw, compute_c_sbbw },
1479 [CC_OP_SBBL] = { compute_all_sbbl, compute_c_sbbl },
1481 [CC_OP_LOGICB] = { compute_all_logicb, compute_c_logicb },
1482 [CC_OP_LOGICW] = { compute_all_logicw, compute_c_logicw },
1483 [CC_OP_LOGICL] = { compute_all_logicl, compute_c_logicl },
1485 [CC_OP_INCB] = { compute_all_incb, compute_c_incl },
1486 [CC_OP_INCW] = { compute_all_incw, compute_c_incl },
1487 [CC_OP_INCL] = { compute_all_incl, compute_c_incl },
1489 [CC_OP_DECB] = { compute_all_decb, compute_c_incl },
1490 [CC_OP_DECW] = { compute_all_decw, compute_c_incl },
1491 [CC_OP_DECL] = { compute_all_decl, compute_c_incl },
1493 [CC_OP_SHLB] = { compute_all_shlb, compute_c_shll },
1494 [CC_OP_SHLW] = { compute_all_shlw, compute_c_shll },
1495 [CC_OP_SHLL] = { compute_all_shll, compute_c_shll },
1497 [CC_OP_SARB] = { compute_all_sarb, compute_c_shll },
1498 [CC_OP_SARW] = { compute_all_sarw, compute_c_shll },
1499 [CC_OP_SARL] = { compute_all_sarl, compute_c_shll },
1502 /* floating point support. Some of the code for complicated x87
1503 functions comes from the LGPL'ed x86 emulator found in the Willows
1504 TWIN windows emulator. */
1506 #ifdef USE_X86LDOUBLE
1507 /* use long double functions */
1508 #define lrint lrintl
1509 #define llrint llrintl
1517 #define atan2 atan2l
1518 #define floor floorl
1523 extern int lrint(CPU86_LDouble x);
1524 extern int64_t llrint(CPU86_LDouble x);
1525 extern CPU86_LDouble fabs(CPU86_LDouble x);
1526 extern CPU86_LDouble sin(CPU86_LDouble x);
1527 extern CPU86_LDouble cos(CPU86_LDouble x);
1528 extern CPU86_LDouble sqrt(CPU86_LDouble x);
1529 extern CPU86_LDouble pow(CPU86_LDouble, CPU86_LDouble);
1530 extern CPU86_LDouble log(CPU86_LDouble x);
1531 extern CPU86_LDouble tan(CPU86_LDouble x);
1532 extern CPU86_LDouble atan2(CPU86_LDouble, CPU86_LDouble);
1533 extern CPU86_LDouble floor(CPU86_LDouble x);
1534 extern CPU86_LDouble ceil(CPU86_LDouble x);
1535 extern CPU86_LDouble rint(CPU86_LDouble x);
1537 #if defined(__powerpc__)
1538 extern CPU86_LDouble copysign(CPU86_LDouble, CPU86_LDouble);
1540 /* correct (but slow) PowerPC rint() (glibc version is incorrect) */
1541 double qemu_rint(double x)
1543 double y = 4503599627370496.0;
1554 #define rint qemu_rint
1557 #define RC_MASK 0xc00
1558 #define RC_NEAR 0x000
1559 #define RC_DOWN 0x400
1561 #define RC_CHOP 0xc00
1563 #define MAXTAN 9223372036854775808.0
1565 #ifdef USE_X86LDOUBLE
1571 unsigned long long lower;
1572 unsigned short upper;
1576 /* the following deal with x86 long double-precision numbers */
1577 #define MAXEXPD 0x7fff
1578 #define EXPBIAS 16383
1579 #define EXPD(fp) (fp.l.upper & 0x7fff)
1580 #define SIGND(fp) ((fp.l.upper) & 0x8000)
1581 #define MANTD(fp) (fp.l.lower)
1582 #define BIASEXPONENT(fp) fp.l.upper = (fp.l.upper & ~(0x7fff)) | EXPBIAS
1588 #ifndef WORDS_BIGENDIAN
1590 unsigned long lower;
1596 unsigned long lower;
1602 /* the following deal with IEEE double-precision numbers */
1603 #define MAXEXPD 0x7ff
1604 #define EXPBIAS 1023
1605 #define EXPD(fp) (((fp.l.upper) >> 20) & 0x7FF)
1606 #define SIGND(fp) ((fp.l.upper) & 0x80000000)
1607 #define MANTD(fp) (fp.ll & ((1LL << 52) - 1))
1608 #define BIASEXPONENT(fp) fp.l.upper = (fp.l.upper & ~(0x7ff << 20)) | (EXPBIAS << 20)
1613 void OPPROTO op_flds_FT0_A0(void)
1615 #ifdef USE_FP_CONVERT
1616 FP_CONVERT.i32 = ldl((void *)A0);
1619 FT0 = ldfl((void *)A0);
1623 void OPPROTO op_fldl_FT0_A0(void)
1625 #ifdef USE_FP_CONVERT
1626 FP_CONVERT.i64 = ldq((void *)A0);
1629 FT0 = ldfq((void *)A0);
1633 /* helpers are needed to avoid static constant reference. XXX: find a better way */
1634 #ifdef USE_INT_TO_FLOAT_HELPERS
1636 void helper_fild_FT0_A0(void)
1638 FT0 = (CPU86_LDouble)ldsw((void *)A0);
1641 void helper_fildl_FT0_A0(void)
1643 FT0 = (CPU86_LDouble)((int32_t)ldl((void *)A0));
1646 void helper_fildll_FT0_A0(void)
1648 FT0 = (CPU86_LDouble)((int64_t)ldq((void *)A0));
1651 void OPPROTO op_fild_FT0_A0(void)
1653 helper_fild_FT0_A0();
1656 void OPPROTO op_fildl_FT0_A0(void)
1658 helper_fildl_FT0_A0();
1661 void OPPROTO op_fildll_FT0_A0(void)
1663 helper_fildll_FT0_A0();
1668 void OPPROTO op_fild_FT0_A0(void)
1670 #ifdef USE_FP_CONVERT
1671 FP_CONVERT.i32 = ldsw((void *)A0);
1672 FT0 = (CPU86_LDouble)FP_CONVERT.i32;
1674 FT0 = (CPU86_LDouble)ldsw((void *)A0);
1678 void OPPROTO op_fildl_FT0_A0(void)
1680 #ifdef USE_FP_CONVERT
1681 FP_CONVERT.i32 = (int32_t) ldl((void *)A0);
1682 FT0 = (CPU86_LDouble)FP_CONVERT.i32;
1684 FT0 = (CPU86_LDouble)((int32_t)ldl((void *)A0));
1688 void OPPROTO op_fildll_FT0_A0(void)
1690 #ifdef USE_FP_CONVERT
1691 FP_CONVERT.i64 = (int64_t) ldq((void *)A0);
1692 FT0 = (CPU86_LDouble)FP_CONVERT.i64;
1694 FT0 = (CPU86_LDouble)((int64_t)ldq((void *)A0));
1701 void OPPROTO op_flds_ST0_A0(void)
1703 #ifdef USE_FP_CONVERT
1704 FP_CONVERT.i32 = ldl((void *)A0);
1707 ST0 = ldfl((void *)A0);
1711 void OPPROTO op_fldl_ST0_A0(void)
1713 #ifdef USE_FP_CONVERT
1714 FP_CONVERT.i64 = ldq((void *)A0);
1717 ST0 = ldfq((void *)A0);
1721 #ifdef USE_X86LDOUBLE
1722 void OPPROTO op_fldt_ST0_A0(void)
1724 ST0 = *(long double *)A0;
1727 void helper_fldt_ST0_A0(void)
1729 CPU86_LDoubleU temp;
1732 upper = lduw((uint8_t *)A0 + 8);
1733 /* XXX: handle overflow ? */
1734 e = (upper & 0x7fff) - 16383 + EXPBIAS; /* exponent */
1735 e |= (upper >> 4) & 0x800; /* sign */
1736 temp.ll = ((ldq((void *)A0) >> 11) & ((1LL << 52) - 1)) | ((uint64_t)e << 52);
1740 void OPPROTO op_fldt_ST0_A0(void)
1742 helper_fldt_ST0_A0();
1746 /* helpers are needed to avoid static constant reference. XXX: find a better way */
1747 #ifdef USE_INT_TO_FLOAT_HELPERS
1749 void helper_fild_ST0_A0(void)
1751 ST0 = (CPU86_LDouble)ldsw((void *)A0);
1754 void helper_fildl_ST0_A0(void)
1756 ST0 = (CPU86_LDouble)((int32_t)ldl((void *)A0));
1759 void helper_fildll_ST0_A0(void)
1761 ST0 = (CPU86_LDouble)((int64_t)ldq((void *)A0));
1764 void OPPROTO op_fild_ST0_A0(void)
1766 helper_fild_ST0_A0();
1769 void OPPROTO op_fildl_ST0_A0(void)
1771 helper_fildl_ST0_A0();
1774 void OPPROTO op_fildll_ST0_A0(void)
1776 helper_fildll_ST0_A0();
1781 void OPPROTO op_fild_ST0_A0(void)
1783 #ifdef USE_FP_CONVERT
1784 FP_CONVERT.i32 = ldsw((void *)A0);
1785 ST0 = (CPU86_LDouble)FP_CONVERT.i32;
1787 ST0 = (CPU86_LDouble)ldsw((void *)A0);
1791 void OPPROTO op_fildl_ST0_A0(void)
1793 #ifdef USE_FP_CONVERT
1794 FP_CONVERT.i32 = (int32_t) ldl((void *)A0);
1795 ST0 = (CPU86_LDouble)FP_CONVERT.i32;
1797 ST0 = (CPU86_LDouble)((int32_t)ldl((void *)A0));
1801 void OPPROTO op_fildll_ST0_A0(void)
1803 #ifdef USE_FP_CONVERT
1804 FP_CONVERT.i64 = (int64_t) ldq((void *)A0);
1805 ST0 = (CPU86_LDouble)FP_CONVERT.i64;
1807 ST0 = (CPU86_LDouble)((int64_t)ldq((void *)A0));
1815 void OPPROTO op_fsts_ST0_A0(void)
1817 #ifdef USE_FP_CONVERT
1819 stfl((void *)A0, FP_CONVERT.f);
1821 stfl((void *)A0, (float)ST0);
1825 void OPPROTO op_fstl_ST0_A0(void)
1827 stfq((void *)A0, (double)ST0);
1830 #ifdef USE_X86LDOUBLE
1831 void OPPROTO op_fstt_ST0_A0(void)
1833 *(long double *)A0 = ST0;
1836 void helper_fstt_ST0_A0(void)
1838 CPU86_LDoubleU temp;
1842 stq((void *)A0, (MANTD(temp) << 11) | (1LL << 63));
1843 /* exponent + sign */
1844 e = EXPD(temp) - EXPBIAS + 16383;
1845 e |= SIGND(temp) >> 16;
1846 stw((uint8_t *)A0 + 8, e);
1849 void OPPROTO op_fstt_ST0_A0(void)
1851 helper_fstt_ST0_A0();
1855 void OPPROTO op_fist_ST0_A0(void)
1857 #if defined(__sparc__) && !defined(__sparc_v9__)
1858 register CPU86_LDouble d asm("o0");
1866 stw((void *)A0, val);
1869 void OPPROTO op_fistl_ST0_A0(void)
1871 #if defined(__sparc__) && !defined(__sparc_v9__)
1872 register CPU86_LDouble d asm("o0");
1880 stl((void *)A0, val);
1883 void OPPROTO op_fistll_ST0_A0(void)
1885 #if defined(__sparc__) && !defined(__sparc_v9__)
1886 register CPU86_LDouble d asm("o0");
1894 stq((void *)A0, val);
1899 #define MUL10(iv) ( iv + iv + (iv << 3) )
1901 void helper_fbld_ST0_A0(void)
1904 CPU86_LDouble fpsrcop;
1908 /* in this code, seg/m32i will be used as temporary ptr/int */
1909 seg = (uint8_t *)A0 + 8;
1911 /* XXX: raise exception */
1915 /* XXX: raise exception */
1916 if ((v & 0xf0) != 0)
1918 m32i = v; /* <-- d14 */
1920 m32i = MUL10(m32i) + (v >> 4); /* <-- val * 10 + d13 */
1921 m32i = MUL10(m32i) + (v & 0xf); /* <-- val * 10 + d12 */
1923 m32i = MUL10(m32i) + (v >> 4); /* <-- val * 10 + d11 */
1924 m32i = MUL10(m32i) + (v & 0xf); /* <-- val * 10 + d10 */
1926 m32i = MUL10(m32i) + (v >> 4); /* <-- val * 10 + d9 */
1927 m32i = MUL10(m32i) + (v & 0xf); /* <-- val * 10 + d8 */
1928 fpsrcop = ((CPU86_LDouble)m32i) * 100000000.0;
1931 m32i = (v >> 4); /* <-- d7 */
1932 m32i = MUL10(m32i) + (v & 0xf); /* <-- val * 10 + d6 */
1934 m32i = MUL10(m32i) + (v >> 4); /* <-- val * 10 + d5 */
1935 m32i = MUL10(m32i) + (v & 0xf); /* <-- val * 10 + d4 */
1937 m32i = MUL10(m32i) + (v >> 4); /* <-- val * 10 + d3 */
1938 m32i = MUL10(m32i) + (v & 0xf); /* <-- val * 10 + d2 */
1940 m32i = MUL10(m32i) + (v >> 4); /* <-- val * 10 + d1 */
1941 m32i = MUL10(m32i) + (v & 0xf); /* <-- val * 10 + d0 */
1942 fpsrcop += ((CPU86_LDouble)m32i);
1943 if ( ldub(seg+9) & 0x80 )
1948 void OPPROTO op_fbld_ST0_A0(void)
1950 helper_fbld_ST0_A0();
1953 void helper_fbst_ST0_A0(void)
1955 CPU86_LDouble fptemp;
1956 CPU86_LDouble fpsrcop;
1958 uint8_t *mem_ref, *mem_end;
1960 fpsrcop = rint(ST0);
1961 mem_ref = (uint8_t *)A0;
1962 mem_end = mem_ref + 8;
1963 if ( fpsrcop < 0.0 ) {
1964 stw(mem_end, 0x8000);
1967 stw(mem_end, 0x0000);
1969 while (mem_ref < mem_end) {
1972 fptemp = floor(fpsrcop/10.0);
1973 v = ((int)(fpsrcop - fptemp*10.0));
1974 if (fptemp == 0.0) {
1979 fptemp = floor(fpsrcop/10.0);
1980 v |= (((int)(fpsrcop - fptemp*10.0)) << 4);
1984 while (mem_ref < mem_end) {
1989 void OPPROTO op_fbst_ST0_A0(void)
1991 helper_fbst_ST0_A0();
1996 static inline void fpush(void)
1998 env->fpstt = (env->fpstt - 1) & 7;
1999 env->fptags[env->fpstt] = 0; /* validate stack entry */
2002 static inline void fpop(void)
2004 env->fptags[env->fpstt] = 1; /* invvalidate stack entry */
2005 env->fpstt = (env->fpstt + 1) & 7;
2008 void OPPROTO op_fpush(void)
2013 void OPPROTO op_fpop(void)
2018 void OPPROTO op_fdecstp(void)
2020 env->fpstt = (env->fpstt - 1) & 7;
2021 env->fpus &= (~0x4700);
2024 void OPPROTO op_fincstp(void)
2026 env->fpstt = (env->fpstt + 1) & 7;
2027 env->fpus &= (~0x4700);
2030 void OPPROTO op_fmov_ST0_FT0(void)
2035 void OPPROTO op_fmov_FT0_STN(void)
2040 void OPPROTO op_fmov_ST0_STN(void)
2045 void OPPROTO op_fmov_STN_ST0(void)
2050 void OPPROTO op_fxchg_ST0_STN(void)
2058 /* FPU operations */
2060 /* XXX: handle nans */
2061 void OPPROTO op_fcom_ST0_FT0(void)
2063 env->fpus &= (~0x4500); /* (C3,C2,C0) <-- 000 */
2065 env->fpus |= 0x100; /* (C3,C2,C0) <-- 001 */
2066 else if (ST0 == FT0)
2067 env->fpus |= 0x4000; /* (C3,C2,C0) <-- 100 */
2071 /* XXX: handle nans */
2072 void OPPROTO op_fucom_ST0_FT0(void)
2074 env->fpus &= (~0x4500); /* (C3,C2,C0) <-- 000 */
2076 env->fpus |= 0x100; /* (C3,C2,C0) <-- 001 */
2077 else if (ST0 == FT0)
2078 env->fpus |= 0x4000; /* (C3,C2,C0) <-- 100 */
2082 void OPPROTO op_fadd_ST0_FT0(void)
2087 void OPPROTO op_fmul_ST0_FT0(void)
2092 void OPPROTO op_fsub_ST0_FT0(void)
2097 void OPPROTO op_fsubr_ST0_FT0(void)
2102 void OPPROTO op_fdiv_ST0_FT0(void)
2107 void OPPROTO op_fdivr_ST0_FT0(void)
2112 /* fp operations between STN and ST0 */
2114 void OPPROTO op_fadd_STN_ST0(void)
2119 void OPPROTO op_fmul_STN_ST0(void)
2124 void OPPROTO op_fsub_STN_ST0(void)
2129 void OPPROTO op_fsubr_STN_ST0(void)
2136 void OPPROTO op_fdiv_STN_ST0(void)
2141 void OPPROTO op_fdivr_STN_ST0(void)
2148 /* misc FPU operations */
2149 void OPPROTO op_fchs_ST0(void)
2154 void OPPROTO op_fabs_ST0(void)
2159 void helper_fxam_ST0(void)
2161 CPU86_LDoubleU temp;
2166 env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
2168 env->fpus |= 0x200; /* C1 <-- 1 */
2170 expdif = EXPD(temp);
2171 if (expdif == MAXEXPD) {
2172 if (MANTD(temp) == 0)
2173 env->fpus |= 0x500 /*Infinity*/;
2175 env->fpus |= 0x100 /*NaN*/;
2176 } else if (expdif == 0) {
2177 if (MANTD(temp) == 0)
2178 env->fpus |= 0x4000 /*Zero*/;
2180 env->fpus |= 0x4400 /*Denormal*/;
2186 void OPPROTO op_fxam_ST0(void)
2191 void OPPROTO op_fld1_ST0(void)
2193 ST0 = *(CPU86_LDouble *)&f15rk[1];
2196 void OPPROTO op_fldl2t_ST0(void)
2198 ST0 = *(CPU86_LDouble *)&f15rk[6];
2201 void OPPROTO op_fldl2e_ST0(void)
2203 ST0 = *(CPU86_LDouble *)&f15rk[5];
2206 void OPPROTO op_fldpi_ST0(void)
2208 ST0 = *(CPU86_LDouble *)&f15rk[2];
2211 void OPPROTO op_fldlg2_ST0(void)
2213 ST0 = *(CPU86_LDouble *)&f15rk[3];
2216 void OPPROTO op_fldln2_ST0(void)
2218 ST0 = *(CPU86_LDouble *)&f15rk[4];
2221 void OPPROTO op_fldz_ST0(void)
2223 ST0 = *(CPU86_LDouble *)&f15rk[0];
2226 void OPPROTO op_fldz_FT0(void)
2228 ST0 = *(CPU86_LDouble *)&f15rk[0];
2231 void helper_f2xm1(void)
2233 ST0 = pow(2.0,ST0) - 1.0;
2236 void helper_fyl2x(void)
2238 CPU86_LDouble fptemp;
2242 fptemp = log(fptemp)/log(2.0); /* log2(ST) */
2246 env->fpus &= (~0x4700);
2251 void helper_fptan(void)
2253 CPU86_LDouble fptemp;
2256 if((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
2262 env->fpus &= (~0x400); /* C2 <-- 0 */
2263 /* the above code is for |arg| < 2**52 only */
2267 void helper_fpatan(void)
2269 CPU86_LDouble fptemp, fpsrcop;
2273 ST1 = atan2(fpsrcop,fptemp);
2277 void helper_fxtract(void)
2279 CPU86_LDoubleU temp;
2280 unsigned int expdif;
2283 expdif = EXPD(temp) - EXPBIAS;
2284 /*DP exponent bias*/
2291 void helper_fprem1(void)
2293 CPU86_LDouble dblq, fpsrcop, fptemp;
2294 CPU86_LDoubleU fpsrcop1, fptemp1;
2300 fpsrcop1.d = fpsrcop;
2302 expdif = EXPD(fpsrcop1) - EXPD(fptemp1);
2304 dblq = fpsrcop / fptemp;
2305 dblq = (dblq < 0.0)? ceil(dblq): floor(dblq);
2306 ST0 = fpsrcop - fptemp*dblq;
2307 q = (int)dblq; /* cutting off top bits is assumed here */
2308 env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
2309 /* (C0,C1,C3) <-- (q2,q1,q0) */
2310 env->fpus |= (q&0x4) << 6; /* (C0) <-- q2 */
2311 env->fpus |= (q&0x2) << 8; /* (C1) <-- q1 */
2312 env->fpus |= (q&0x1) << 14; /* (C3) <-- q0 */
2314 env->fpus |= 0x400; /* C2 <-- 1 */
2315 fptemp = pow(2.0, expdif-50);
2316 fpsrcop = (ST0 / ST1) / fptemp;
2317 /* fpsrcop = integer obtained by rounding to the nearest */
2318 fpsrcop = (fpsrcop-floor(fpsrcop) < ceil(fpsrcop)-fpsrcop)?
2319 floor(fpsrcop): ceil(fpsrcop);
2320 ST0 -= (ST1 * fpsrcop * fptemp);
2324 void helper_fprem(void)
2326 CPU86_LDouble dblq, fpsrcop, fptemp;
2327 CPU86_LDoubleU fpsrcop1, fptemp1;
2333 fpsrcop1.d = fpsrcop;
2335 expdif = EXPD(fpsrcop1) - EXPD(fptemp1);
2336 if ( expdif < 53 ) {
2337 dblq = fpsrcop / fptemp;
2338 dblq = (dblq < 0.0)? ceil(dblq): floor(dblq);
2339 ST0 = fpsrcop - fptemp*dblq;
2340 q = (int)dblq; /* cutting off top bits is assumed here */
2341 env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
2342 /* (C0,C1,C3) <-- (q2,q1,q0) */
2343 env->fpus |= (q&0x4) << 6; /* (C0) <-- q2 */
2344 env->fpus |= (q&0x2) << 8; /* (C1) <-- q1 */
2345 env->fpus |= (q&0x1) << 14; /* (C3) <-- q0 */
2347 env->fpus |= 0x400; /* C2 <-- 1 */
2348 fptemp = pow(2.0, expdif-50);
2349 fpsrcop = (ST0 / ST1) / fptemp;
2350 /* fpsrcop = integer obtained by chopping */
2351 fpsrcop = (fpsrcop < 0.0)?
2352 -(floor(fabs(fpsrcop))): floor(fpsrcop);
2353 ST0 -= (ST1 * fpsrcop * fptemp);
2357 void helper_fyl2xp1(void)
2359 CPU86_LDouble fptemp;
2362 if ((fptemp+1.0)>0.0) {
2363 fptemp = log(fptemp+1.0) / log(2.0); /* log2(ST+1.0) */
2367 env->fpus &= (~0x4700);
2372 void helper_fsqrt(void)
2374 CPU86_LDouble fptemp;
2378 env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
2384 void helper_fsincos(void)
2386 CPU86_LDouble fptemp;
2389 if ((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
2395 env->fpus &= (~0x400); /* C2 <-- 0 */
2396 /* the above code is for |arg| < 2**63 only */
2400 void helper_frndint(void)
2405 void helper_fscale(void)
2407 CPU86_LDouble fpsrcop, fptemp;
2410 fptemp = pow(fpsrcop,ST1);
2414 void helper_fsin(void)
2416 CPU86_LDouble fptemp;
2419 if ((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
2423 env->fpus &= (~0x400); /* C2 <-- 0 */
2424 /* the above code is for |arg| < 2**53 only */
2428 void helper_fcos(void)
2430 CPU86_LDouble fptemp;
2433 if((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
2437 env->fpus &= (~0x400); /* C2 <-- 0 */
2438 /* the above code is for |arg5 < 2**63 only */
2442 /* associated heplers to reduce generated code length and to simplify
2443 relocation (FP constants are usually stored in .rodata section) */
2445 void OPPROTO op_f2xm1(void)
2450 void OPPROTO op_fyl2x(void)
2455 void OPPROTO op_fptan(void)
2460 void OPPROTO op_fpatan(void)
2465 void OPPROTO op_fxtract(void)
2470 void OPPROTO op_fprem1(void)
2476 void OPPROTO op_fprem(void)
2481 void OPPROTO op_fyl2xp1(void)
2486 void OPPROTO op_fsqrt(void)
2491 void OPPROTO op_fsincos(void)
2496 void OPPROTO op_frndint(void)
2501 void OPPROTO op_fscale(void)
2506 void OPPROTO op_fsin(void)
2511 void OPPROTO op_fcos(void)
2516 void OPPROTO op_fnstsw_A0(void)
2519 fpus = (env->fpus & ~0x3800) | (env->fpstt & 0x7) << 11;
2520 stw((void *)A0, fpus);
2523 void OPPROTO op_fnstsw_EAX(void)
2526 fpus = (env->fpus & ~0x3800) | (env->fpstt & 0x7) << 11;
2527 EAX = (EAX & 0xffff0000) | fpus;
2530 void OPPROTO op_fnstcw_A0(void)
2532 stw((void *)A0, env->fpuc);
2535 void OPPROTO op_fldcw_A0(void)
2538 env->fpuc = lduw((void *)A0);
2539 /* set rounding mode */
2540 switch(env->fpuc & RC_MASK) {
2543 rnd_type = FE_TONEAREST;
2546 rnd_type = FE_DOWNWARD;
2549 rnd_type = FE_UPWARD;
2552 rnd_type = FE_TOWARDZERO;
2555 fesetround(rnd_type);
2558 void OPPROTO op_fclex(void)
2560 env->fpus &= 0x7f00;
2563 void OPPROTO op_fninit(void)
2578 /* threading support */
2579 void OPPROTO op_lock(void)
2584 void OPPROTO op_unlock(void)