2 * i386 micro operations
4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
24 /* n must be a constant to be efficient */
25 static inline target_long lshift(target_long x, int n)
33 /* we define the various pieces of code used by the JIT */
37 #include "opreg_template.h"
43 #include "opreg_template.h"
49 #include "opreg_template.h"
55 #include "opreg_template.h"
61 #include "opreg_template.h"
67 #include "opreg_template.h"
73 #include "opreg_template.h"
79 #include "opreg_template.h"
85 #define REG (env->regs[8])
87 #include "opreg_template.h"
91 #define REG (env->regs[9])
93 #include "opreg_template.h"
97 #define REG (env->regs[10])
99 #include "opreg_template.h"
103 #define REG (env->regs[11])
105 #include "opreg_template.h"
109 #define REG (env->regs[12])
111 #include "opreg_template.h"
115 #define REG (env->regs[13])
117 #include "opreg_template.h"
121 #define REG (env->regs[14])
123 #include "opreg_template.h"
127 #define REG (env->regs[15])
129 #include "opreg_template.h"
135 /* operations with flags */
137 /* update flags with T0 and T1 (add/sub case) */
138 void OPPROTO op_update2_cc(void)
144 /* update flags with T0 (logic operation case) */
145 void OPPROTO op_update1_cc(void)
150 void OPPROTO op_update_neg_cc(void)
156 void OPPROTO op_cmpl_T0_T1_cc(void)
162 void OPPROTO op_update_inc_cc(void)
164 CC_SRC = cc_table[CC_OP].compute_c();
168 void OPPROTO op_testl_T0_T1_cc(void)
173 /* operations without flags */
175 void OPPROTO op_addl_T0_T1(void)
180 void OPPROTO op_orl_T0_T1(void)
185 void OPPROTO op_andl_T0_T1(void)
190 void OPPROTO op_subl_T0_T1(void)
195 void OPPROTO op_xorl_T0_T1(void)
200 void OPPROTO op_negl_T0(void)
205 void OPPROTO op_incl_T0(void)
210 void OPPROTO op_decl_T0(void)
215 void OPPROTO op_notl_T0(void)
220 void OPPROTO op_bswapl_T0(void)
226 void OPPROTO op_bswapq_T0(void)
232 /* multiply/divide */
234 /* XXX: add eflags optimizations */
235 /* XXX: add non P4 style flags */
237 void OPPROTO op_mulb_AL_T0(void)
240 res = (uint8_t)EAX * (uint8_t)T0;
241 EAX = (EAX & ~0xffff) | res;
243 CC_SRC = (res & 0xff00);
246 void OPPROTO op_imulb_AL_T0(void)
249 res = (int8_t)EAX * (int8_t)T0;
250 EAX = (EAX & ~0xffff) | (res & 0xffff);
252 CC_SRC = (res != (int8_t)res);
255 void OPPROTO op_mulw_AX_T0(void)
258 res = (uint16_t)EAX * (uint16_t)T0;
259 EAX = (EAX & ~0xffff) | (res & 0xffff);
260 EDX = (EDX & ~0xffff) | ((res >> 16) & 0xffff);
265 void OPPROTO op_imulw_AX_T0(void)
268 res = (int16_t)EAX * (int16_t)T0;
269 EAX = (EAX & ~0xffff) | (res & 0xffff);
270 EDX = (EDX & ~0xffff) | ((res >> 16) & 0xffff);
272 CC_SRC = (res != (int16_t)res);
275 void OPPROTO op_mull_EAX_T0(void)
278 res = (uint64_t)((uint32_t)EAX) * (uint64_t)((uint32_t)T0);
280 EDX = (uint32_t)(res >> 32);
281 CC_DST = (uint32_t)res;
282 CC_SRC = (uint32_t)(res >> 32);
285 void OPPROTO op_imull_EAX_T0(void)
288 res = (int64_t)((int32_t)EAX) * (int64_t)((int32_t)T0);
289 EAX = (uint32_t)(res);
290 EDX = (uint32_t)(res >> 32);
292 CC_SRC = (res != (int32_t)res);
295 void OPPROTO op_imulw_T0_T1(void)
298 res = (int16_t)T0 * (int16_t)T1;
301 CC_SRC = (res != (int16_t)res);
304 void OPPROTO op_imull_T0_T1(void)
307 res = (int64_t)((int32_t)T0) * (int64_t)((int32_t)T1);
310 CC_SRC = (res != (int32_t)res);
314 void OPPROTO op_mulq_EAX_T0(void)
316 helper_mulq_EAX_T0();
319 void OPPROTO op_imulq_EAX_T0(void)
321 helper_imulq_EAX_T0();
324 void OPPROTO op_imulq_T0_T1(void)
326 helper_imulq_T0_T1();
330 /* division, flags are undefined */
332 void OPPROTO op_divb_AL_T0(void)
334 unsigned int num, den, q, r;
336 num = (EAX & 0xffff);
339 raise_exception(EXCP00_DIVZ);
343 raise_exception(EXCP00_DIVZ);
345 r = (num % den) & 0xff;
346 EAX = (EAX & ~0xffff) | (r << 8) | q;
349 void OPPROTO op_idivb_AL_T0(void)
356 raise_exception(EXCP00_DIVZ);
360 raise_exception(EXCP00_DIVZ);
362 r = (num % den) & 0xff;
363 EAX = (EAX & ~0xffff) | (r << 8) | q;
366 void OPPROTO op_divw_AX_T0(void)
368 unsigned int num, den, q, r;
370 num = (EAX & 0xffff) | ((EDX & 0xffff) << 16);
373 raise_exception(EXCP00_DIVZ);
377 raise_exception(EXCP00_DIVZ);
379 r = (num % den) & 0xffff;
380 EAX = (EAX & ~0xffff) | q;
381 EDX = (EDX & ~0xffff) | r;
384 void OPPROTO op_idivw_AX_T0(void)
388 num = (EAX & 0xffff) | ((EDX & 0xffff) << 16);
391 raise_exception(EXCP00_DIVZ);
395 raise_exception(EXCP00_DIVZ);
397 r = (num % den) & 0xffff;
398 EAX = (EAX & ~0xffff) | q;
399 EDX = (EDX & ~0xffff) | r;
402 void OPPROTO op_divl_EAX_T0(void)
404 helper_divl_EAX_T0();
407 void OPPROTO op_idivl_EAX_T0(void)
409 helper_idivl_EAX_T0();
413 void OPPROTO op_divq_EAX_T0(void)
415 helper_divq_EAX_T0();
418 void OPPROTO op_idivq_EAX_T0(void)
420 helper_idivq_EAX_T0();
424 /* constant load & misc op */
426 /* XXX: consistent names */
427 void OPPROTO op_movl_T0_imu(void)
429 T0 = (uint32_t)PARAM1;
432 void OPPROTO op_movl_T0_im(void)
434 T0 = (int32_t)PARAM1;
437 void OPPROTO op_addl_T0_im(void)
442 void OPPROTO op_andl_T0_ffff(void)
447 void OPPROTO op_andl_T0_im(void)
452 void OPPROTO op_movl_T0_T1(void)
457 void OPPROTO op_movl_T1_imu(void)
459 T1 = (uint32_t)PARAM1;
462 void OPPROTO op_movl_T1_im(void)
464 T1 = (int32_t)PARAM1;
467 void OPPROTO op_addl_T1_im(void)
472 void OPPROTO op_movl_T1_A0(void)
477 void OPPROTO op_movl_A0_im(void)
479 A0 = (uint32_t)PARAM1;
482 void OPPROTO op_addl_A0_im(void)
484 A0 = (uint32_t)(A0 + PARAM1);
487 void OPPROTO op_movl_A0_seg(void)
489 A0 = (uint32_t)*(target_ulong *)((char *)env + PARAM1);
492 void OPPROTO op_addl_A0_seg(void)
494 A0 = (uint32_t)(A0 + *(target_ulong *)((char *)env + PARAM1));
497 void OPPROTO op_addl_A0_AL(void)
499 A0 = (uint32_t)(A0 + (EAX & 0xff));
502 #ifdef WORDS_BIGENDIAN
503 typedef union UREG64 {
504 struct { uint16_t v3, v2, v1, v0; } w;
505 struct { uint32_t v1, v0; } l;
509 typedef union UREG64 {
510 struct { uint16_t v0, v1, v2, v3; } w;
511 struct { uint32_t v0, v1; } l;
526 void OPPROTO op_movq_T0_im64(void)
531 void OPPROTO op_movq_T1_im64(void)
536 void OPPROTO op_movq_A0_im(void)
538 A0 = (int32_t)PARAM1;
541 void OPPROTO op_movq_A0_im64(void)
546 void OPPROTO op_addq_A0_im(void)
548 A0 = (A0 + (int32_t)PARAM1);
551 void OPPROTO op_addq_A0_im64(void)
556 void OPPROTO op_movq_A0_seg(void)
558 A0 = *(target_ulong *)((char *)env + PARAM1);
561 void OPPROTO op_addq_A0_seg(void)
563 A0 += *(target_ulong *)((char *)env + PARAM1);
566 void OPPROTO op_addq_A0_AL(void)
568 A0 = (A0 + (EAX & 0xff));
573 void OPPROTO op_andl_A0_ffff(void)
580 #define MEMSUFFIX _raw
583 #if !defined(CONFIG_USER_ONLY)
584 #define MEMSUFFIX _kernel
587 #define MEMSUFFIX _user
593 void OPPROTO op_jmp_T0(void)
598 void OPPROTO op_movl_eip_im(void)
600 EIP = (uint32_t)PARAM1;
604 void OPPROTO op_movq_eip_im(void)
606 EIP = (int32_t)PARAM1;
609 void OPPROTO op_movq_eip_im64(void)
615 void OPPROTO op_hlt(void)
620 void OPPROTO op_monitor(void)
625 void OPPROTO op_mwait(void)
630 void OPPROTO op_debug(void)
632 env->exception_index = EXCP_DEBUG;
636 void OPPROTO op_raise_interrupt(void)
638 int intno, next_eip_addend;
640 next_eip_addend = PARAM2;
641 raise_interrupt(intno, 1, 0, next_eip_addend);
644 void OPPROTO op_raise_exception(void)
647 exception_index = PARAM1;
648 raise_exception(exception_index);
651 void OPPROTO op_into(void)
654 eflags = cc_table[CC_OP].compute_all();
656 raise_interrupt(EXCP04_INTO, 1, 0, PARAM1);
661 void OPPROTO op_cli(void)
663 env->eflags &= ~IF_MASK;
666 void OPPROTO op_sti(void)
668 env->eflags |= IF_MASK;
671 void OPPROTO op_set_inhibit_irq(void)
673 env->hflags |= HF_INHIBIT_IRQ_MASK;
676 void OPPROTO op_reset_inhibit_irq(void)
678 env->hflags &= ~HF_INHIBIT_IRQ_MASK;
681 void OPPROTO op_rsm(void)
687 /* vm86plus instructions */
688 void OPPROTO op_cli_vm(void)
690 env->eflags &= ~VIF_MASK;
693 void OPPROTO op_sti_vm(void)
695 env->eflags |= VIF_MASK;
696 if (env->eflags & VIP_MASK) {
698 raise_exception(EXCP0D_GPF);
704 void OPPROTO op_boundw(void)
710 if (v < low || v > high) {
711 raise_exception(EXCP05_BOUND);
716 void OPPROTO op_boundl(void)
722 if (v < low || v > high) {
723 raise_exception(EXCP05_BOUND);
728 void OPPROTO op_cmpxchg8b(void)
733 void OPPROTO op_movl_T0_0(void)
738 void OPPROTO op_exit_tb(void)
743 /* multiple size ops */
748 #include "ops_template.h"
752 #include "ops_template.h"
756 #include "ops_template.h"
762 #include "ops_template.h"
769 void OPPROTO op_movsbl_T0_T0(void)
774 void OPPROTO op_movzbl_T0_T0(void)
779 void OPPROTO op_movswl_T0_T0(void)
784 void OPPROTO op_movzwl_T0_T0(void)
789 void OPPROTO op_movswl_EAX_AX(void)
791 EAX = (uint32_t)((int16_t)EAX);
795 void OPPROTO op_movslq_T0_T0(void)
800 void OPPROTO op_movslq_RAX_EAX(void)
806 void OPPROTO op_movsbw_AX_AL(void)
808 EAX = (EAX & ~0xffff) | ((int8_t)EAX & 0xffff);
811 void OPPROTO op_movslq_EDX_EAX(void)
813 EDX = (uint32_t)((int32_t)EAX >> 31);
816 void OPPROTO op_movswl_DX_AX(void)
818 EDX = (EDX & ~0xffff) | (((int16_t)EAX >> 15) & 0xffff);
822 void OPPROTO op_movsqo_RDX_RAX(void)
824 EDX = (int64_t)EAX >> 63;
828 /* string ops helpers */
830 void OPPROTO op_addl_ESI_T0(void)
832 ESI = (uint32_t)(ESI + T0);
835 void OPPROTO op_addw_ESI_T0(void)
837 ESI = (ESI & ~0xffff) | ((ESI + T0) & 0xffff);
840 void OPPROTO op_addl_EDI_T0(void)
842 EDI = (uint32_t)(EDI + T0);
845 void OPPROTO op_addw_EDI_T0(void)
847 EDI = (EDI & ~0xffff) | ((EDI + T0) & 0xffff);
850 void OPPROTO op_decl_ECX(void)
852 ECX = (uint32_t)(ECX - 1);
855 void OPPROTO op_decw_ECX(void)
857 ECX = (ECX & ~0xffff) | ((ECX - 1) & 0xffff);
861 void OPPROTO op_addq_ESI_T0(void)
866 void OPPROTO op_addq_EDI_T0(void)
871 void OPPROTO op_decq_ECX(void)
879 void op_addl_A0_SS(void)
881 A0 = (uint32_t)(A0 + env->segs[R_SS].base);
884 void op_subl_A0_2(void)
886 A0 = (uint32_t)(A0 - 2);
889 void op_subl_A0_4(void)
891 A0 = (uint32_t)(A0 - 4);
894 void op_addl_ESP_4(void)
896 ESP = (uint32_t)(ESP + 4);
899 void op_addl_ESP_2(void)
901 ESP = (uint32_t)(ESP + 2);
904 void op_addw_ESP_4(void)
906 ESP = (ESP & ~0xffff) | ((ESP + 4) & 0xffff);
909 void op_addw_ESP_2(void)
911 ESP = (ESP & ~0xffff) | ((ESP + 2) & 0xffff);
914 void op_addl_ESP_im(void)
916 ESP = (uint32_t)(ESP + PARAM1);
919 void op_addw_ESP_im(void)
921 ESP = (ESP & ~0xffff) | ((ESP + PARAM1) & 0xffff);
925 void op_subq_A0_2(void)
930 void op_subq_A0_8(void)
935 void op_addq_ESP_8(void)
940 void op_addq_ESP_im(void)
946 void OPPROTO op_rdtsc(void)
951 void OPPROTO op_cpuid(void)
956 void OPPROTO op_enter_level(void)
958 helper_enter_level(PARAM1, PARAM2);
962 void OPPROTO op_enter64_level(void)
964 helper_enter64_level(PARAM1, PARAM2);
968 void OPPROTO op_sysenter(void)
973 void OPPROTO op_sysexit(void)
979 void OPPROTO op_syscall(void)
981 helper_syscall(PARAM1);
984 void OPPROTO op_sysret(void)
986 helper_sysret(PARAM1);
990 void OPPROTO op_rdmsr(void)
995 void OPPROTO op_wrmsr(void)
1002 /* XXX: exception */
1003 void OPPROTO op_aam(void)
1010 EAX = (EAX & ~0xffff) | al | (ah << 8);
1014 void OPPROTO op_aad(void)
1019 ah = (EAX >> 8) & 0xff;
1020 al = ((ah * base) + al) & 0xff;
1021 EAX = (EAX & ~0xffff) | al;
1025 void OPPROTO op_aaa(void)
1031 eflags = cc_table[CC_OP].compute_all();
1034 ah = (EAX >> 8) & 0xff;
1036 icarry = (al > 0xf9);
1037 if (((al & 0x0f) > 9 ) || af) {
1038 al = (al + 6) & 0x0f;
1039 ah = (ah + 1 + icarry) & 0xff;
1040 eflags |= CC_C | CC_A;
1042 eflags &= ~(CC_C | CC_A);
1045 EAX = (EAX & ~0xffff) | al | (ah << 8);
1050 void OPPROTO op_aas(void)
1056 eflags = cc_table[CC_OP].compute_all();
1059 ah = (EAX >> 8) & 0xff;
1062 if (((al & 0x0f) > 9 ) || af) {
1063 al = (al - 6) & 0x0f;
1064 ah = (ah - 1 - icarry) & 0xff;
1065 eflags |= CC_C | CC_A;
1067 eflags &= ~(CC_C | CC_A);
1070 EAX = (EAX & ~0xffff) | al | (ah << 8);
1075 void OPPROTO op_daa(void)
1080 eflags = cc_table[CC_OP].compute_all();
1086 if (((al & 0x0f) > 9 ) || af) {
1087 al = (al + 6) & 0xff;
1090 if ((al > 0x9f) || cf) {
1091 al = (al + 0x60) & 0xff;
1094 EAX = (EAX & ~0xff) | al;
1095 /* well, speed is not an issue here, so we compute the flags by hand */
1096 eflags |= (al == 0) << 6; /* zf */
1097 eflags |= parity_table[al]; /* pf */
1098 eflags |= (al & 0x80); /* sf */
1103 void OPPROTO op_das(void)
1105 int al, al1, af, cf;
1108 eflags = cc_table[CC_OP].compute_all();
1115 if (((al & 0x0f) > 9 ) || af) {
1119 al = (al - 6) & 0xff;
1121 if ((al1 > 0x99) || cf) {
1122 al = (al - 0x60) & 0xff;
1125 EAX = (EAX & ~0xff) | al;
1126 /* well, speed is not an issue here, so we compute the flags by hand */
1127 eflags |= (al == 0) << 6; /* zf */
1128 eflags |= parity_table[al]; /* pf */
1129 eflags |= (al & 0x80); /* sf */
1134 /* segment handling */
1136 /* never use it with R_CS */
1137 void OPPROTO op_movl_seg_T0(void)
1139 load_seg(PARAM1, T0);
1142 /* faster VM86 version */
1143 void OPPROTO op_movl_seg_T0_vm(void)
1148 selector = T0 & 0xffff;
1149 /* env->segs[] access */
1150 sc = (SegmentCache *)((char *)env + PARAM1);
1151 sc->selector = selector;
1152 sc->base = (selector << 4);
1155 void OPPROTO op_movl_T0_seg(void)
1157 T0 = env->segs[PARAM1].selector;
1160 void OPPROTO op_lsl(void)
1165 void OPPROTO op_lar(void)
1170 void OPPROTO op_verr(void)
1175 void OPPROTO op_verw(void)
1180 void OPPROTO op_arpl(void)
1182 if ((T0 & 3) < (T1 & 3)) {
1183 /* XXX: emulate bug or 0xff3f0000 oring as in bochs ? */
1184 T0 = (T0 & ~3) | (T1 & 3);
1192 void OPPROTO op_arpl_update(void)
1195 eflags = cc_table[CC_OP].compute_all();
1196 CC_SRC = (eflags & ~CC_Z) | T1;
1199 /* T0: segment, T1:eip */
1200 void OPPROTO op_ljmp_protected_T0_T1(void)
1202 helper_ljmp_protected_T0_T1(PARAM1);
1205 void OPPROTO op_lcall_real_T0_T1(void)
1207 helper_lcall_real_T0_T1(PARAM1, PARAM2);
1210 void OPPROTO op_lcall_protected_T0_T1(void)
1212 helper_lcall_protected_T0_T1(PARAM1, PARAM2);
1215 void OPPROTO op_iret_real(void)
1217 helper_iret_real(PARAM1);
1220 void OPPROTO op_iret_protected(void)
1222 helper_iret_protected(PARAM1, PARAM2);
1225 void OPPROTO op_lret_protected(void)
1227 helper_lret_protected(PARAM1, PARAM2);
1230 void OPPROTO op_lldt_T0(void)
1235 void OPPROTO op_ltr_T0(void)
1240 /* CR registers access */
1241 void OPPROTO op_movl_crN_T0(void)
1243 helper_movl_crN_T0(PARAM1);
1246 #if !defined(CONFIG_USER_ONLY)
1247 void OPPROTO op_movtl_T0_cr8(void)
1249 T0 = cpu_get_apic_tpr(env);
1253 /* DR registers access */
1254 void OPPROTO op_movl_drN_T0(void)
1256 helper_movl_drN_T0(PARAM1);
1259 void OPPROTO op_lmsw_T0(void)
1261 /* only 4 lower bits of CR0 are modified. PE cannot be set to zero
1262 if already set to one. */
1263 T0 = (env->cr[0] & ~0xe) | (T0 & 0xf);
1264 helper_movl_crN_T0(0);
1267 void OPPROTO op_invlpg_A0(void)
1272 void OPPROTO op_movl_T0_env(void)
1274 T0 = *(uint32_t *)((char *)env + PARAM1);
1277 void OPPROTO op_movl_env_T0(void)
1279 *(uint32_t *)((char *)env + PARAM1) = T0;
1282 void OPPROTO op_movl_env_T1(void)
1284 *(uint32_t *)((char *)env + PARAM1) = T1;
1287 void OPPROTO op_movtl_T0_env(void)
1289 T0 = *(target_ulong *)((char *)env + PARAM1);
1292 void OPPROTO op_movtl_env_T0(void)
1294 *(target_ulong *)((char *)env + PARAM1) = T0;
1297 void OPPROTO op_movtl_T1_env(void)
1299 T1 = *(target_ulong *)((char *)env + PARAM1);
1302 void OPPROTO op_movtl_env_T1(void)
1304 *(target_ulong *)((char *)env + PARAM1) = T1;
1307 void OPPROTO op_clts(void)
1309 env->cr[0] &= ~CR0_TS_MASK;
1310 env->hflags &= ~HF_TS_MASK;
1313 /* flags handling */
1315 void OPPROTO op_goto_tb0(void)
1317 GOTO_TB(op_goto_tb0, PARAM1, 0);
1320 void OPPROTO op_goto_tb1(void)
1322 GOTO_TB(op_goto_tb1, PARAM1, 1);
1325 void OPPROTO op_jmp_label(void)
1327 GOTO_LABEL_PARAM(1);
1330 void OPPROTO op_jnz_T0_label(void)
1333 GOTO_LABEL_PARAM(1);
1337 void OPPROTO op_jz_T0_label(void)
1340 GOTO_LABEL_PARAM(1);
1344 /* slow set cases (compute x86 flags) */
1345 void OPPROTO op_seto_T0_cc(void)
1348 eflags = cc_table[CC_OP].compute_all();
1349 T0 = (eflags >> 11) & 1;
1352 void OPPROTO op_setb_T0_cc(void)
1354 T0 = cc_table[CC_OP].compute_c();
1357 void OPPROTO op_setz_T0_cc(void)
1360 eflags = cc_table[CC_OP].compute_all();
1361 T0 = (eflags >> 6) & 1;
1364 void OPPROTO op_setbe_T0_cc(void)
1367 eflags = cc_table[CC_OP].compute_all();
1368 T0 = (eflags & (CC_Z | CC_C)) != 0;
1371 void OPPROTO op_sets_T0_cc(void)
1374 eflags = cc_table[CC_OP].compute_all();
1375 T0 = (eflags >> 7) & 1;
1378 void OPPROTO op_setp_T0_cc(void)
1381 eflags = cc_table[CC_OP].compute_all();
1382 T0 = (eflags >> 2) & 1;
1385 void OPPROTO op_setl_T0_cc(void)
1388 eflags = cc_table[CC_OP].compute_all();
1389 T0 = ((eflags ^ (eflags >> 4)) >> 7) & 1;
1392 void OPPROTO op_setle_T0_cc(void)
1395 eflags = cc_table[CC_OP].compute_all();
1396 T0 = (((eflags ^ (eflags >> 4)) & 0x80) || (eflags & CC_Z)) != 0;
1399 void OPPROTO op_xor_T0_1(void)
1404 void OPPROTO op_set_cc_op(void)
1409 void OPPROTO op_mov_T0_cc(void)
1411 T0 = cc_table[CC_OP].compute_all();
1414 /* XXX: clear VIF/VIP in all ops ? */
1416 void OPPROTO op_movl_eflags_T0(void)
1418 load_eflags(T0, (TF_MASK | AC_MASK | ID_MASK | NT_MASK));
1421 void OPPROTO op_movw_eflags_T0(void)
1423 load_eflags(T0, (TF_MASK | AC_MASK | ID_MASK | NT_MASK) & 0xffff);
1426 void OPPROTO op_movl_eflags_T0_io(void)
1428 load_eflags(T0, (TF_MASK | AC_MASK | ID_MASK | NT_MASK | IF_MASK));
1431 void OPPROTO op_movw_eflags_T0_io(void)
1433 load_eflags(T0, (TF_MASK | AC_MASK | ID_MASK | NT_MASK | IF_MASK) & 0xffff);
1436 void OPPROTO op_movl_eflags_T0_cpl0(void)
1438 load_eflags(T0, (TF_MASK | AC_MASK | ID_MASK | NT_MASK | IF_MASK | IOPL_MASK));
1441 void OPPROTO op_movw_eflags_T0_cpl0(void)
1443 load_eflags(T0, (TF_MASK | AC_MASK | ID_MASK | NT_MASK | IF_MASK | IOPL_MASK) & 0xffff);
1447 /* vm86plus version */
1448 void OPPROTO op_movw_eflags_T0_vm(void)
1452 CC_SRC = eflags & (CC_O | CC_S | CC_Z | CC_A | CC_P | CC_C);
1453 DF = 1 - (2 * ((eflags >> 10) & 1));
1454 /* we also update some system flags as in user mode */
1455 env->eflags = (env->eflags & ~(FL_UPDATE_MASK16 | VIF_MASK)) |
1456 (eflags & FL_UPDATE_MASK16);
1457 if (eflags & IF_MASK) {
1458 env->eflags |= VIF_MASK;
1459 if (env->eflags & VIP_MASK) {
1461 raise_exception(EXCP0D_GPF);
1467 void OPPROTO op_movl_eflags_T0_vm(void)
1471 CC_SRC = eflags & (CC_O | CC_S | CC_Z | CC_A | CC_P | CC_C);
1472 DF = 1 - (2 * ((eflags >> 10) & 1));
1473 /* we also update some system flags as in user mode */
1474 env->eflags = (env->eflags & ~(FL_UPDATE_MASK32 | VIF_MASK)) |
1475 (eflags & FL_UPDATE_MASK32);
1476 if (eflags & IF_MASK) {
1477 env->eflags |= VIF_MASK;
1478 if (env->eflags & VIP_MASK) {
1480 raise_exception(EXCP0D_GPF);
1487 /* XXX: compute only O flag */
1488 void OPPROTO op_movb_eflags_T0(void)
1491 of = cc_table[CC_OP].compute_all() & CC_O;
1492 CC_SRC = (T0 & (CC_S | CC_Z | CC_A | CC_P | CC_C)) | of;
1495 void OPPROTO op_movl_T0_eflags(void)
1498 eflags = cc_table[CC_OP].compute_all();
1499 eflags |= (DF & DF_MASK);
1500 eflags |= env->eflags & ~(VM_MASK | RF_MASK);
1504 /* vm86plus version */
1506 void OPPROTO op_movl_T0_eflags_vm(void)
1509 eflags = cc_table[CC_OP].compute_all();
1510 eflags |= (DF & DF_MASK);
1511 eflags |= env->eflags & ~(VM_MASK | RF_MASK | IF_MASK);
1512 if (env->eflags & VIF_MASK)
1518 void OPPROTO op_cld(void)
1523 void OPPROTO op_std(void)
1528 void OPPROTO op_clc(void)
1531 eflags = cc_table[CC_OP].compute_all();
1536 void OPPROTO op_stc(void)
1539 eflags = cc_table[CC_OP].compute_all();
1544 void OPPROTO op_cmc(void)
1547 eflags = cc_table[CC_OP].compute_all();
1552 void OPPROTO op_salc(void)
1555 cf = cc_table[CC_OP].compute_c();
1556 EAX = (EAX & ~0xff) | ((-cf) & 0xff);
1559 static int compute_all_eflags(void)
1564 static int compute_c_eflags(void)
1566 return CC_SRC & CC_C;
1569 CCTable cc_table[CC_OP_NB] = {
1570 [CC_OP_DYNAMIC] = { /* should never happen */ },
1572 [CC_OP_EFLAGS] = { compute_all_eflags, compute_c_eflags },
1574 [CC_OP_MULB] = { compute_all_mulb, compute_c_mull },
1575 [CC_OP_MULW] = { compute_all_mulw, compute_c_mull },
1576 [CC_OP_MULL] = { compute_all_mull, compute_c_mull },
1578 [CC_OP_ADDB] = { compute_all_addb, compute_c_addb },
1579 [CC_OP_ADDW] = { compute_all_addw, compute_c_addw },
1580 [CC_OP_ADDL] = { compute_all_addl, compute_c_addl },
1582 [CC_OP_ADCB] = { compute_all_adcb, compute_c_adcb },
1583 [CC_OP_ADCW] = { compute_all_adcw, compute_c_adcw },
1584 [CC_OP_ADCL] = { compute_all_adcl, compute_c_adcl },
1586 [CC_OP_SUBB] = { compute_all_subb, compute_c_subb },
1587 [CC_OP_SUBW] = { compute_all_subw, compute_c_subw },
1588 [CC_OP_SUBL] = { compute_all_subl, compute_c_subl },
1590 [CC_OP_SBBB] = { compute_all_sbbb, compute_c_sbbb },
1591 [CC_OP_SBBW] = { compute_all_sbbw, compute_c_sbbw },
1592 [CC_OP_SBBL] = { compute_all_sbbl, compute_c_sbbl },
1594 [CC_OP_LOGICB] = { compute_all_logicb, compute_c_logicb },
1595 [CC_OP_LOGICW] = { compute_all_logicw, compute_c_logicw },
1596 [CC_OP_LOGICL] = { compute_all_logicl, compute_c_logicl },
1598 [CC_OP_INCB] = { compute_all_incb, compute_c_incl },
1599 [CC_OP_INCW] = { compute_all_incw, compute_c_incl },
1600 [CC_OP_INCL] = { compute_all_incl, compute_c_incl },
1602 [CC_OP_DECB] = { compute_all_decb, compute_c_incl },
1603 [CC_OP_DECW] = { compute_all_decw, compute_c_incl },
1604 [CC_OP_DECL] = { compute_all_decl, compute_c_incl },
1606 [CC_OP_SHLB] = { compute_all_shlb, compute_c_shlb },
1607 [CC_OP_SHLW] = { compute_all_shlw, compute_c_shlw },
1608 [CC_OP_SHLL] = { compute_all_shll, compute_c_shll },
1610 [CC_OP_SARB] = { compute_all_sarb, compute_c_sarl },
1611 [CC_OP_SARW] = { compute_all_sarw, compute_c_sarl },
1612 [CC_OP_SARL] = { compute_all_sarl, compute_c_sarl },
1614 #ifdef TARGET_X86_64
1615 [CC_OP_MULQ] = { compute_all_mulq, compute_c_mull },
1617 [CC_OP_ADDQ] = { compute_all_addq, compute_c_addq },
1619 [CC_OP_ADCQ] = { compute_all_adcq, compute_c_adcq },
1621 [CC_OP_SUBQ] = { compute_all_subq, compute_c_subq },
1623 [CC_OP_SBBQ] = { compute_all_sbbq, compute_c_sbbq },
1625 [CC_OP_LOGICQ] = { compute_all_logicq, compute_c_logicq },
1627 [CC_OP_INCQ] = { compute_all_incq, compute_c_incl },
1629 [CC_OP_DECQ] = { compute_all_decq, compute_c_incl },
1631 [CC_OP_SHLQ] = { compute_all_shlq, compute_c_shlq },
1633 [CC_OP_SARQ] = { compute_all_sarq, compute_c_sarl },
1637 /* floating point support. Some of the code for complicated x87
1638 functions comes from the LGPL'ed x86 emulator found in the Willows
1639 TWIN windows emulator. */
1643 void OPPROTO op_flds_FT0_A0(void)
1645 #ifdef USE_FP_CONVERT
1646 FP_CONVERT.i32 = ldl(A0);
1653 void OPPROTO op_fldl_FT0_A0(void)
1655 #ifdef USE_FP_CONVERT
1656 FP_CONVERT.i64 = ldq(A0);
1663 /* helpers are needed to avoid static constant reference. XXX: find a better way */
1664 #ifdef USE_INT_TO_FLOAT_HELPERS
1666 void helper_fild_FT0_A0(void)
1668 FT0 = (CPU86_LDouble)ldsw(A0);
1671 void helper_fildl_FT0_A0(void)
1673 FT0 = (CPU86_LDouble)((int32_t)ldl(A0));
1676 void helper_fildll_FT0_A0(void)
1678 FT0 = (CPU86_LDouble)((int64_t)ldq(A0));
1681 void OPPROTO op_fild_FT0_A0(void)
1683 helper_fild_FT0_A0();
1686 void OPPROTO op_fildl_FT0_A0(void)
1688 helper_fildl_FT0_A0();
1691 void OPPROTO op_fildll_FT0_A0(void)
1693 helper_fildll_FT0_A0();
1698 void OPPROTO op_fild_FT0_A0(void)
1700 #ifdef USE_FP_CONVERT
1701 FP_CONVERT.i32 = ldsw(A0);
1702 FT0 = (CPU86_LDouble)FP_CONVERT.i32;
1704 FT0 = (CPU86_LDouble)ldsw(A0);
1708 void OPPROTO op_fildl_FT0_A0(void)
1710 #ifdef USE_FP_CONVERT
1711 FP_CONVERT.i32 = (int32_t) ldl(A0);
1712 FT0 = (CPU86_LDouble)FP_CONVERT.i32;
1714 FT0 = (CPU86_LDouble)((int32_t)ldl(A0));
1718 void OPPROTO op_fildll_FT0_A0(void)
1720 #ifdef USE_FP_CONVERT
1721 FP_CONVERT.i64 = (int64_t) ldq(A0);
1722 FT0 = (CPU86_LDouble)FP_CONVERT.i64;
1724 FT0 = (CPU86_LDouble)((int64_t)ldq(A0));
1731 void OPPROTO op_flds_ST0_A0(void)
1734 new_fpstt = (env->fpstt - 1) & 7;
1735 #ifdef USE_FP_CONVERT
1736 FP_CONVERT.i32 = ldl(A0);
1737 env->fpregs[new_fpstt].d = FP_CONVERT.f;
1739 env->fpregs[new_fpstt].d = ldfl(A0);
1741 env->fpstt = new_fpstt;
1742 env->fptags[new_fpstt] = 0; /* validate stack entry */
1745 void OPPROTO op_fldl_ST0_A0(void)
1748 new_fpstt = (env->fpstt - 1) & 7;
1749 #ifdef USE_FP_CONVERT
1750 FP_CONVERT.i64 = ldq(A0);
1751 env->fpregs[new_fpstt].d = FP_CONVERT.d;
1753 env->fpregs[new_fpstt].d = ldfq(A0);
1755 env->fpstt = new_fpstt;
1756 env->fptags[new_fpstt] = 0; /* validate stack entry */
1759 void OPPROTO op_fldt_ST0_A0(void)
1761 helper_fldt_ST0_A0();
1764 /* helpers are needed to avoid static constant reference. XXX: find a better way */
1765 #ifdef USE_INT_TO_FLOAT_HELPERS
1767 void helper_fild_ST0_A0(void)
1770 new_fpstt = (env->fpstt - 1) & 7;
1771 env->fpregs[new_fpstt].d = (CPU86_LDouble)ldsw(A0);
1772 env->fpstt = new_fpstt;
1773 env->fptags[new_fpstt] = 0; /* validate stack entry */
1776 void helper_fildl_ST0_A0(void)
1779 new_fpstt = (env->fpstt - 1) & 7;
1780 env->fpregs[new_fpstt].d = (CPU86_LDouble)((int32_t)ldl(A0));
1781 env->fpstt = new_fpstt;
1782 env->fptags[new_fpstt] = 0; /* validate stack entry */
1785 void helper_fildll_ST0_A0(void)
1788 new_fpstt = (env->fpstt - 1) & 7;
1789 env->fpregs[new_fpstt].d = (CPU86_LDouble)((int64_t)ldq(A0));
1790 env->fpstt = new_fpstt;
1791 env->fptags[new_fpstt] = 0; /* validate stack entry */
1794 void OPPROTO op_fild_ST0_A0(void)
1796 helper_fild_ST0_A0();
1799 void OPPROTO op_fildl_ST0_A0(void)
1801 helper_fildl_ST0_A0();
1804 void OPPROTO op_fildll_ST0_A0(void)
1806 helper_fildll_ST0_A0();
1811 void OPPROTO op_fild_ST0_A0(void)
1814 new_fpstt = (env->fpstt - 1) & 7;
1815 #ifdef USE_FP_CONVERT
1816 FP_CONVERT.i32 = ldsw(A0);
1817 env->fpregs[new_fpstt].d = (CPU86_LDouble)FP_CONVERT.i32;
1819 env->fpregs[new_fpstt].d = (CPU86_LDouble)ldsw(A0);
1821 env->fpstt = new_fpstt;
1822 env->fptags[new_fpstt] = 0; /* validate stack entry */
1825 void OPPROTO op_fildl_ST0_A0(void)
1828 new_fpstt = (env->fpstt - 1) & 7;
1829 #ifdef USE_FP_CONVERT
1830 FP_CONVERT.i32 = (int32_t) ldl(A0);
1831 env->fpregs[new_fpstt].d = (CPU86_LDouble)FP_CONVERT.i32;
1833 env->fpregs[new_fpstt].d = (CPU86_LDouble)((int32_t)ldl(A0));
1835 env->fpstt = new_fpstt;
1836 env->fptags[new_fpstt] = 0; /* validate stack entry */
1839 void OPPROTO op_fildll_ST0_A0(void)
1842 new_fpstt = (env->fpstt - 1) & 7;
1843 #ifdef USE_FP_CONVERT
1844 FP_CONVERT.i64 = (int64_t) ldq(A0);
1845 env->fpregs[new_fpstt].d = (CPU86_LDouble)FP_CONVERT.i64;
1847 env->fpregs[new_fpstt].d = (CPU86_LDouble)((int64_t)ldq(A0));
1849 env->fpstt = new_fpstt;
1850 env->fptags[new_fpstt] = 0; /* validate stack entry */
1857 void OPPROTO op_fsts_ST0_A0(void)
1859 #ifdef USE_FP_CONVERT
1860 FP_CONVERT.f = (float)ST0;
1861 stfl(A0, FP_CONVERT.f);
1863 stfl(A0, (float)ST0);
1868 void OPPROTO op_fstl_ST0_A0(void)
1870 stfq(A0, (double)ST0);
1874 void OPPROTO op_fstt_ST0_A0(void)
1876 helper_fstt_ST0_A0();
1879 void OPPROTO op_fist_ST0_A0(void)
1881 #if defined(__sparc__) && !defined(__sparc_v9__)
1882 register CPU86_LDouble d asm("o0");
1889 val = floatx_to_int32(d, &env->fp_status);
1890 if (val != (int16_t)val)
1896 void OPPROTO op_fistl_ST0_A0(void)
1898 #if defined(__sparc__) && !defined(__sparc_v9__)
1899 register CPU86_LDouble d asm("o0");
1906 val = floatx_to_int32(d, &env->fp_status);
1911 void OPPROTO op_fistll_ST0_A0(void)
1913 #if defined(__sparc__) && !defined(__sparc_v9__)
1914 register CPU86_LDouble d asm("o0");
1921 val = floatx_to_int64(d, &env->fp_status);
1926 void OPPROTO op_fistt_ST0_A0(void)
1928 #if defined(__sparc__) && !defined(__sparc_v9__)
1929 register CPU86_LDouble d asm("o0");
1936 val = floatx_to_int32_round_to_zero(d, &env->fp_status);
1937 if (val != (int16_t)val)
1943 void OPPROTO op_fisttl_ST0_A0(void)
1945 #if defined(__sparc__) && !defined(__sparc_v9__)
1946 register CPU86_LDouble d asm("o0");
1953 val = floatx_to_int32_round_to_zero(d, &env->fp_status);
1958 void OPPROTO op_fisttll_ST0_A0(void)
1960 #if defined(__sparc__) && !defined(__sparc_v9__)
1961 register CPU86_LDouble d asm("o0");
1968 val = floatx_to_int64_round_to_zero(d, &env->fp_status);
1973 void OPPROTO op_fbld_ST0_A0(void)
1975 helper_fbld_ST0_A0();
1978 void OPPROTO op_fbst_ST0_A0(void)
1980 helper_fbst_ST0_A0();
1985 void OPPROTO op_fpush(void)
1990 void OPPROTO op_fpop(void)
1995 void OPPROTO op_fdecstp(void)
1997 env->fpstt = (env->fpstt - 1) & 7;
1998 env->fpus &= (~0x4700);
2001 void OPPROTO op_fincstp(void)
2003 env->fpstt = (env->fpstt + 1) & 7;
2004 env->fpus &= (~0x4700);
2007 void OPPROTO op_ffree_STN(void)
2009 env->fptags[(env->fpstt + PARAM1) & 7] = 1;
2012 void OPPROTO op_fmov_ST0_FT0(void)
2017 void OPPROTO op_fmov_FT0_STN(void)
2022 void OPPROTO op_fmov_ST0_STN(void)
2027 void OPPROTO op_fmov_STN_ST0(void)
2032 void OPPROTO op_fxchg_ST0_STN(void)
2040 /* FPU operations */
/* FPU status word bits selected by an fcom/fucom comparison.
   op_fcom_ST0_FT0 and op_fucom_ST0_FT0 index this table with the
   floatx_compare()/floatx_compare_quiet() result plus one, and OR the
   entry into env->fpus after clearing the 0x4500 bits.
   NOTE(review): the entry order presumably matches the softfloat
   relation codes (less, equal, greater, unordered) -- confirm. */
2042 const int fcom_ccval[4] = {0x0100, 0x4000, 0x0000, 0x4500};
2044 void OPPROTO op_fcom_ST0_FT0(void)
2048 ret = floatx_compare(ST0, FT0, &env->fp_status);
2049 env->fpus = (env->fpus & ~0x4500) | fcom_ccval[ret + 1];
2053 void OPPROTO op_fucom_ST0_FT0(void)
2057 ret = floatx_compare_quiet(ST0, FT0, &env->fp_status);
2058 env->fpus = (env->fpus & ~0x4500) | fcom_ccval[ret+ 1];
/* EFLAGS bits selected by an fcomi/fucomi comparison.
   op_fcomi_ST0_FT0 and op_fucomi_ST0_FT0 index this table with the
   floatx_compare()/floatx_compare_quiet() result plus one; the entry
   replaces the CC_Z, CC_P and CC_C bits of the computed eflags.
   NOTE(review): the entry order presumably matches the softfloat
   relation codes (less, equal, greater, unordered) -- confirm. */
2062 const int fcomi_ccval[4] = {CC_C, CC_Z, 0, CC_Z | CC_P | CC_C};
2064 void OPPROTO op_fcomi_ST0_FT0(void)
2069 ret = floatx_compare(ST0, FT0, &env->fp_status);
2070 eflags = cc_table[CC_OP].compute_all();
2071 eflags = (eflags & ~(CC_Z | CC_P | CC_C)) | fcomi_ccval[ret + 1];
2076 void OPPROTO op_fucomi_ST0_FT0(void)
2081 ret = floatx_compare_quiet(ST0, FT0, &env->fp_status);
2082 eflags = cc_table[CC_OP].compute_all();
2083 eflags = (eflags & ~(CC_Z | CC_P | CC_C)) | fcomi_ccval[ret + 1];
2088 void OPPROTO op_fcmov_ST0_STN_T0(void)
2096 void OPPROTO op_fadd_ST0_FT0(void)
2101 void OPPROTO op_fmul_ST0_FT0(void)
2106 void OPPROTO op_fsub_ST0_FT0(void)
2111 void OPPROTO op_fsubr_ST0_FT0(void)
2116 void OPPROTO op_fdiv_ST0_FT0(void)
2118 ST0 = helper_fdiv(ST0, FT0);
2121 void OPPROTO op_fdivr_ST0_FT0(void)
2123 ST0 = helper_fdiv(FT0, ST0);
2126 /* fp operations between STN and ST0 */
2128 void OPPROTO op_fadd_STN_ST0(void)
2133 void OPPROTO op_fmul_STN_ST0(void)
2138 void OPPROTO op_fsub_STN_ST0(void)
2143 void OPPROTO op_fsubr_STN_ST0(void)
2150 void OPPROTO op_fdiv_STN_ST0(void)
2154 *p = helper_fdiv(*p, ST0);
2157 void OPPROTO op_fdivr_STN_ST0(void)
2161 *p = helper_fdiv(ST0, *p);
2164 /* misc FPU operations */
2165 void OPPROTO op_fchs_ST0(void)
2167 ST0 = floatx_chs(ST0);
2170 void OPPROTO op_fabs_ST0(void)
2172 ST0 = floatx_abs(ST0);
2175 void OPPROTO op_fxam_ST0(void)
2180 void OPPROTO op_fld1_ST0(void)
2185 void OPPROTO op_fldl2t_ST0(void)
2190 void OPPROTO op_fldl2e_ST0(void)
2195 void OPPROTO op_fldpi_ST0(void)
2200 void OPPROTO op_fldlg2_ST0(void)
2205 void OPPROTO op_fldln2_ST0(void)
2210 void OPPROTO op_fldz_ST0(void)
2215 void OPPROTO op_fldz_FT0(void)
2220 /* associated helpers to reduce generated code length and to simplify
2221 relocation (FP constants are usually stored in .rodata section) */
2223 void OPPROTO op_f2xm1(void)
2228 void OPPROTO op_fyl2x(void)
2233 void OPPROTO op_fptan(void)
2238 void OPPROTO op_fpatan(void)
2243 void OPPROTO op_fxtract(void)
2248 void OPPROTO op_fprem1(void)
2254 void OPPROTO op_fprem(void)
2259 void OPPROTO op_fyl2xp1(void)
2264 void OPPROTO op_fsqrt(void)
2269 void OPPROTO op_fsincos(void)
2274 void OPPROTO op_frndint(void)
2279 void OPPROTO op_fscale(void)
2284 void OPPROTO op_fsin(void)
2289 void OPPROTO op_fcos(void)
2294 void OPPROTO op_fnstsw_A0(void)
2297 fpus = (env->fpus & ~0x3800) | (env->fpstt & 0x7) << 11;
2302 void OPPROTO op_fnstsw_EAX(void)
2305 fpus = (env->fpus & ~0x3800) | (env->fpstt & 0x7) << 11;
2306 EAX = (EAX & ~0xffff) | fpus;
2309 void OPPROTO op_fnstcw_A0(void)
2315 void OPPROTO op_fldcw_A0(void)
2317 env->fpuc = lduw(A0);
2321 void OPPROTO op_fclex(void)
2323 env->fpus &= 0x7f00;
2326 void OPPROTO op_fwait(void)
2328 if (env->fpus & FPUS_SE)
2329 fpu_raise_exception();
2333 void OPPROTO op_fninit(void)
2348 void OPPROTO op_fnstenv_A0(void)
2350 helper_fstenv(A0, PARAM1);
2353 void OPPROTO op_fldenv_A0(void)
2355 helper_fldenv(A0, PARAM1);
2358 void OPPROTO op_fnsave_A0(void)
2360 helper_fsave(A0, PARAM1);
2363 void OPPROTO op_frstor_A0(void)
2365 helper_frstor(A0, PARAM1);
2368 /* threading support */
2369 void OPPROTO op_lock(void)
2374 void OPPROTO op_unlock(void)
2380 static inline void memcpy16(void *d, void *s)
2382 ((uint32_t *)d)[0] = ((uint32_t *)s)[0];
2383 ((uint32_t *)d)[1] = ((uint32_t *)s)[1];
2384 ((uint32_t *)d)[2] = ((uint32_t *)s)[2];
2385 ((uint32_t *)d)[3] = ((uint32_t *)s)[3];
2388 void OPPROTO op_movo(void)
2390 /* XXX: badly generated code */
2392 d = (XMMReg *)((char *)env + PARAM1);
2393 s = (XMMReg *)((char *)env + PARAM2);
2397 void OPPROTO op_movq(void)
2400 d = (uint64_t *)((char *)env + PARAM1);
2401 s = (uint64_t *)((char *)env + PARAM2);
2405 void OPPROTO op_movl(void)
2408 d = (uint32_t *)((char *)env + PARAM1);
2409 s = (uint32_t *)((char *)env + PARAM2);
2413 void OPPROTO op_movq_env_0(void)
2416 d = (uint64_t *)((char *)env + PARAM1);
2420 void OPPROTO op_fxsave_A0(void)
2422 helper_fxsave(A0, PARAM1);
2425 void OPPROTO op_fxrstor_A0(void)
2427 helper_fxrstor(A0, PARAM1);
2430 /* XXX: optimize by storing fpstt and fptags in the static cpu state */
2431 void OPPROTO op_enter_mmx(void)
2434 *(uint32_t *)(env->fptags) = 0;
2435 *(uint32_t *)(env->fptags + 4) = 0;
2438 void OPPROTO op_emms(void)
2440 /* set to empty state */
2441 *(uint32_t *)(env->fptags) = 0x01010101;
2442 *(uint32_t *)(env->fptags + 4) = 0x01010101;
2446 #include "ops_sse.h"
2449 #include "ops_sse.h"