// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright Novell Inc 2010
 *
 * Authors: Alexander Graf <agraf@suse.de>
 */

#include <asm/kvm.h>
#include <asm/kvm_ppc.h>
#include <asm/disassemble.h>
#include <asm/kvm_book3s.h>
#include <asm/kvm_fpu.h>
#include <asm/reg.h>
#include <asm/cacheflush.h>
#include <asm/switch_to.h>
#include <linux/vmalloc.h>

/* #define DEBUG */

#ifdef DEBUG
#define dprintk printk
#else
#define dprintk(...) do { } while(0)
#endif

#define OP_LFS 48
#define OP_LFSU 49
#define OP_LFD 50
#define OP_LFDU 51
#define OP_STFS 52
#define OP_STFSU 53
#define OP_STFD 54
#define OP_STFDU 55
#define OP_PSQ_L 56
#define OP_PSQ_LU 57
#define OP_PSQ_ST 60
#define OP_PSQ_STU 61

#define OP_31_LFSX 535
#define OP_31_LFSUX 567
#define OP_31_LFDX 599
#define OP_31_LFDUX 631
#define OP_31_STFSX 663
#define OP_31_STFSUX 695
#define OP_31_STFX 727
#define OP_31_STFUX 759
#define OP_31_LWIZX 887
#define OP_31_STFIWX 983

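/*
 * Extended opcodes: the OP_31_ values live in instruction bits 21-30
 * under primary opcode 31; the OP_59_, OP_63_ and OP_4 groups below are
 * decoded the same way for primary opcodes 59, 63 and 4.
 */
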
#define OP_59_FADDS 21
#define OP_59_FSUBS 20
#define OP_59_FSQRTS 22
#define OP_59_FDIVS 18
#define OP_59_FRES 24
#define OP_59_FMULS 25
#define OP_59_FRSQRTES 26
#define OP_59_FMSUBS 28
#define OP_59_FMADDS 29
#define OP_59_FNMSUBS 30
#define OP_59_FNMADDS 31

#define OP_63_FCMPU 0
#define OP_63_FCPSGN 8
#define OP_63_FRSP 12
#define OP_63_FCTIW 14
#define OP_63_FCTIWZ 15
#define OP_63_FDIV 18
#define OP_63_FADD 21
#define OP_63_FSQRT 22
#define OP_63_FSEL 23
#define OP_63_FRE 24
#define OP_63_FMUL 25
#define OP_63_FRSQRTE 26
#define OP_63_FMSUB 28
#define OP_63_FMADD 29
#define OP_63_FNMSUB 30
#define OP_63_FNMADD 31
#define OP_63_FCMPO 32
#define OP_63_MTFSB1 38 // XXX
#define OP_63_FSUB 20
#define OP_63_FNEG 40
#define OP_63_MCRFS 64
#define OP_63_MTFSB0 70
#define OP_63_FMR 72
#define OP_63_MTFSFI 134
#define OP_63_FABS 264
#define OP_63_MFFS 583
#define OP_63_MTFSF 711

#define OP_4X_PS_CMPU0 0
#define OP_4X_PSQ_LX 6
#define OP_4XW_PSQ_STX 7
#define OP_4A_PS_SUM0 10
#define OP_4A_PS_SUM1 11
#define OP_4A_PS_MULS0 12
#define OP_4A_PS_MULS1 13
#define OP_4A_PS_MADDS0 14
#define OP_4A_PS_MADDS1 15
#define OP_4A_PS_DIV 18
#define OP_4A_PS_SUB 20
#define OP_4A_PS_ADD 21
#define OP_4A_PS_SEL 23
#define OP_4A_PS_RES 24
#define OP_4A_PS_MUL 25
#define OP_4A_PS_RSQRTE 26
#define OP_4A_PS_MSUB 28
#define OP_4A_PS_MADD 29
#define OP_4A_PS_NMSUB 30
#define OP_4A_PS_NMADD 31
#define OP_4X_PS_CMPO0 32
#define OP_4X_PSQ_LUX 38
#define OP_4XW_PSQ_STUX 39
#define OP_4X_PS_NEG 40
#define OP_4X_PS_CMPU1 64
#define OP_4X_PS_MR 72
#define OP_4X_PS_CMPO1 96
#define OP_4X_PS_NABS 136
#define OP_4X_PS_ABS 264
#define OP_4X_PS_MERGE00 528
#define OP_4X_PS_MERGE01 560
#define OP_4X_PS_MERGE10 592
#define OP_4X_PS_MERGE11 624

#define SCALAR_NONE 0
#define SCALAR_HIGH (1 << 0)
#define SCALAR_LOW (1 << 1)
#define SCALAR_NO_PS0 (1 << 2)
#define SCALAR_NO_PS1 (1 << 3)

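/*
 * Lane-selection flags for the kvmppc_ps_* helpers below: SCALAR_HIGH
 * and SCALAR_LOW feed the ps0 or ps1 half of the second operand into
 * the other lane (used by ps_muls0/1 and ps_sum0/1), while
 * SCALAR_NO_PS0 and SCALAR_NO_PS1 suppress writeback of one result lane.
 */
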
#define GQR_ST_TYPE_MASK 0x00000007
#define GQR_ST_TYPE_SHIFT 0
#define GQR_ST_SCALE_MASK 0x00003f00
#define GQR_ST_SCALE_SHIFT 8
#define GQR_LD_TYPE_MASK 0x00070000
#define GQR_LD_TYPE_SHIFT 16
#define GQR_LD_SCALE_MASK 0x3f000000
#define GQR_LD_SCALE_SHIFT 24

#define GQR_QUANTIZE_FLOAT 0
#define GQR_QUANTIZE_U8 4
#define GQR_QUANTIZE_U16 5
#define GQR_QUANTIZE_S8 6
#define GQR_QUANTIZE_S16 7

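/*
 * A graphics quantization register (GQR) holds separate load and store
 * type/scale fields, extracted with the masks above. The type selects a
 * GQR_QUANTIZE_* format; on real hardware the value is also scaled by a
 * power of two taken from the scale field. Note that the psq emulation
 * below is handed the GQR index but only implements the plain float
 * format.
 */
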
#define FPU_LS_SINGLE 0
#define FPU_LS_DOUBLE 1
#define FPU_LS_SINGLE_LOW 2

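/*
 * A paired-single register is emulated as a split pair: ps0 lives in
 * the regular FPR array as a double, ps1 in vcpu->arch.qpr[] as a raw
 * 32-bit single. kvm_cvt_fd/kvm_cvt_df convert between the two views,
 * and kvmppc_sync_qpr below mirrors an FPR result into its QPR half.
 */
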
static inline void kvmppc_sync_qpr(struct kvm_vcpu *vcpu, int rt)
{
	kvm_cvt_df(&VCPU_FPR(vcpu, rt), &vcpu->arch.qpr[rt]);
}

static void kvmppc_inject_pf(struct kvm_vcpu *vcpu, ulong eaddr, bool is_store)
{
	u32 dsisr;
	u64 msr = kvmppc_get_msr(vcpu);

	msr = kvmppc_set_field(msr, 33, 36, 0);
	msr = kvmppc_set_field(msr, 42, 47, 0);
	kvmppc_set_msr(vcpu, msr);
	kvmppc_set_dar(vcpu, eaddr);
	/* Page Fault */
	dsisr = kvmppc_set_field(0, 33, 33, 1);
	if (is_store)
		dsisr = kvmppc_set_field(dsisr, 38, 38, 1);
	kvmppc_set_dsisr(vcpu, dsisr);
	kvmppc_book3s_queue_irqprio(vcpu, BOOK3S_INTERRUPT_DATA_STORAGE);
}

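/*
 * The load/store emulation below goes through the guest MMU via
 * kvmppc_ld/kvmppc_st: a negative return means the access faulted and a
 * data storage interrupt is injected, EMULATE_DO_MMIO defers to the
 * MMIO path, and anything else completes the access right here.
 */
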
static int kvmppc_emulate_fpr_load(struct kvm_vcpu *vcpu,
				   int rs, ulong addr, int ls_type)
{
	int emulated = EMULATE_FAIL;
	int r;
	char tmp[8];
	int len = sizeof(u32);

	if (ls_type == FPU_LS_DOUBLE)
		len = sizeof(u64);

	/* read from memory */
	r = kvmppc_ld(vcpu, &addr, len, tmp, true);
	vcpu->arch.paddr_accessed = addr;

	if (r < 0) {
		kvmppc_inject_pf(vcpu, addr, false);
		goto done_load;
	} else if (r == EMULATE_DO_MMIO) {
		emulated = kvmppc_handle_load(vcpu, KVM_MMIO_REG_FPR | rs,
					      len, 1);
		goto done_load;
	}

	emulated = EMULATE_DONE;

	/* put in registers */
	switch (ls_type) {
	case FPU_LS_SINGLE:
		kvm_cvt_fd((u32*)tmp, &VCPU_FPR(vcpu, rs));
		vcpu->arch.qpr[rs] = *((u32*)tmp);
		break;
	case FPU_LS_DOUBLE:
		VCPU_FPR(vcpu, rs) = *((u64*)tmp);
		break;
	}

	dprintk(KERN_INFO "KVM: FPR_LD [0x%llx] at 0x%lx (%d)\n", *(u64*)tmp,
			  addr, len);

done_load:
	return emulated;
}

static int kvmppc_emulate_fpr_store(struct kvm_vcpu *vcpu,
				    int rs, ulong addr, int ls_type)
{
	int emulated = EMULATE_FAIL;
	int r;
	char tmp[8];
	u64 val;
	int len;

	switch (ls_type) {
	case FPU_LS_SINGLE:
		kvm_cvt_df(&VCPU_FPR(vcpu, rs), (u32*)tmp);
		val = *((u32*)tmp);
		len = sizeof(u32);
		break;
	case FPU_LS_SINGLE_LOW:
		*((u32*)tmp) = VCPU_FPR(vcpu, rs);
		val = VCPU_FPR(vcpu, rs) & 0xffffffff;
		len = sizeof(u32);
		break;
	case FPU_LS_DOUBLE:
		*((u64*)tmp) = VCPU_FPR(vcpu, rs);
		val = VCPU_FPR(vcpu, rs);
		len = sizeof(u64);
		break;
	default:
		val = 0;
		len = 0;
		break;
	}

	r = kvmppc_st(vcpu, &addr, len, tmp, true);
	vcpu->arch.paddr_accessed = addr;
	if (r < 0) {
		kvmppc_inject_pf(vcpu, addr, true);
	} else if (r == EMULATE_DO_MMIO) {
		emulated = kvmppc_handle_store(vcpu, val, len, 1);
	} else {
		emulated = EMULATE_DONE;
	}

	dprintk(KERN_INFO "KVM: FPR_ST [0x%llx] at 0x%lx (%d)\n",
			  val, addr, len);

	return emulated;
}

static int kvmppc_emulate_psq_load(struct kvm_vcpu *vcpu,
				   int rs, ulong addr, bool w, int i)
{
	int emulated = EMULATE_FAIL;
	int r;
	float one = 1.0;
	u32 tmp[2];

	/* read from memory */
	if (w) {
		r = kvmppc_ld(vcpu, &addr, sizeof(u32), tmp, true);
		memcpy(&tmp[1], &one, sizeof(u32));
	} else {
		r = kvmppc_ld(vcpu, &addr, sizeof(u32) * 2, tmp, true);
	}
	vcpu->arch.paddr_accessed = addr;
	if (r < 0) {
		kvmppc_inject_pf(vcpu, addr, false);
		goto done_load;
	} else if ((r == EMULATE_DO_MMIO) && w) {
		emulated = kvmppc_handle_load(vcpu, KVM_MMIO_REG_FPR | rs,
					      4, 1);
		vcpu->arch.qpr[rs] = tmp[1];
		goto done_load;
	} else if (r == EMULATE_DO_MMIO) {
		emulated = kvmppc_handle_load(vcpu, KVM_MMIO_REG_FQPR | rs,
					      8, 1);
		goto done_load;
	}

	emulated = EMULATE_DONE;

	/* put in registers */
	kvm_cvt_fd(&tmp[0], &VCPU_FPR(vcpu, rs));
	vcpu->arch.qpr[rs] = tmp[1];

	dprintk(KERN_INFO "KVM: PSQ_LD [0x%x, 0x%x] at 0x%lx (%d)\n", tmp[0],
			  tmp[1], addr, w ? 4 : 8);

done_load:
	return emulated;
}

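/*
 * Note the w=1 (single word) semantics above: only ps0 is read from
 * memory and ps1 is architecturally set to 1.0f, which is why the
 * single-word path patches tmp[1] with the constant before the
 * registers are updated.
 */
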
static int kvmppc_emulate_psq_store(struct kvm_vcpu *vcpu,
				    int rs, ulong addr, bool w, int i)
{
	int emulated = EMULATE_FAIL;
	int r;
	u32 tmp[2];
	int len = w ? sizeof(u32) : sizeof(u64);

	kvm_cvt_df(&VCPU_FPR(vcpu, rs), &tmp[0]);
	tmp[1] = vcpu->arch.qpr[rs];

	r = kvmppc_st(vcpu, &addr, len, tmp, true);
	vcpu->arch.paddr_accessed = addr;
	if (r < 0) {
		kvmppc_inject_pf(vcpu, addr, true);
	} else if ((r == EMULATE_DO_MMIO) && w) {
		emulated = kvmppc_handle_store(vcpu, tmp[0], 4, 1);
	} else if (r == EMULATE_DO_MMIO) {
		u64 val = ((u64)tmp[0] << 32) | tmp[1];

		emulated = kvmppc_handle_store(vcpu, val, 8, 1);
	} else {
		emulated = EMULATE_DONE;
	}

	dprintk(KERN_INFO "KVM: PSQ_ST [0x%x, 0x%x] at 0x%lx (%d)\n",
			  tmp[0], tmp[1], addr, len);

	return emulated;
}

/*
 * Cuts out inst bits with ordering according to spec.
 * That means the leftmost bit is zero. All given bits are included.
 */
static inline u32 inst_get_field(u32 inst, int msb, int lsb)
{
	return kvmppc_get_field(inst, msb + 32, lsb + 32);
}

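/*
 * Example, using IBM big-endian bit numbering of the 32-bit instruction
 * word: inst_get_field(inst, 6, 10) extracts the 5-bit RT/FRT field and
 * inst_get_field(inst, 21, 30) the 10-bit extended opcode, as used by
 * the decode logic below.
 */
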
static bool kvmppc_inst_is_paired_single(struct kvm_vcpu *vcpu, u32 inst)
{
	if (!(vcpu->arch.hflags & BOOK3S_HFLAG_PAIRED_SINGLE))
		return false;

	switch (get_op(inst)) {
	case OP_PSQ_L:
	case OP_PSQ_LU:
	case OP_PSQ_ST:
	case OP_PSQ_STU:
	case OP_LFS:
	case OP_LFSU:
	case OP_LFD:
	case OP_LFDU:
	case OP_STFS:
	case OP_STFSU:
	case OP_STFD:
	case OP_STFDU:
		return true;
	case 4:
		/* X form */
		switch (inst_get_field(inst, 21, 30)) {
		case OP_4X_PS_CMPU0:
		case OP_4X_PSQ_LX:
		case OP_4X_PS_CMPO0:
		case OP_4X_PSQ_LUX:
		case OP_4X_PS_NEG:
		case OP_4X_PS_CMPU1:
		case OP_4X_PS_MR:
		case OP_4X_PS_CMPO1:
		case OP_4X_PS_NABS:
		case OP_4X_PS_ABS:
		case OP_4X_PS_MERGE00:
		case OP_4X_PS_MERGE01:
		case OP_4X_PS_MERGE10:
		case OP_4X_PS_MERGE11:
			return true;
		}
		/* XW form */
		switch (inst_get_field(inst, 25, 30)) {
		case OP_4XW_PSQ_STX:
		case OP_4XW_PSQ_STUX:
			return true;
		}
		/* A form */
		switch (inst_get_field(inst, 26, 30)) {
		case OP_4A_PS_SUM1:
		case OP_4A_PS_SUM0:
		case OP_4A_PS_MULS0:
		case OP_4A_PS_MULS1:
		case OP_4A_PS_MADDS0:
		case OP_4A_PS_MADDS1:
		case OP_4A_PS_DIV:
		case OP_4A_PS_SUB:
		case OP_4A_PS_ADD:
		case OP_4A_PS_SEL:
		case OP_4A_PS_RES:
		case OP_4A_PS_MUL:
		case OP_4A_PS_RSQRTE:
		case OP_4A_PS_MSUB:
		case OP_4A_PS_MADD:
		case OP_4A_PS_NMSUB:
		case OP_4A_PS_NMADD:
			return true;
		}
		break;
	case 59:
		switch (inst_get_field(inst, 21, 30)) {
		case OP_59_FADDS:
		case OP_59_FSUBS:
		case OP_59_FDIVS:
		case OP_59_FRES:
		case OP_59_FRSQRTES:
			return true;
		}
		switch (inst_get_field(inst, 26, 30)) {
		case OP_59_FMULS:
		case OP_59_FMSUBS:
		case OP_59_FMADDS:
		case OP_59_FNMSUBS:
		case OP_59_FNMADDS:
			return true;
		}
		break;
	case 63:
		switch (inst_get_field(inst, 21, 30)) {
		case OP_63_MTFSB0:
		case OP_63_MTFSB1:
		case OP_63_MCRFS:
		case OP_63_MTFSFI:
		case OP_63_MFFS:
		case OP_63_MTFSF:
		case OP_63_FCMPU:
		case OP_63_FCMPO:
		case OP_63_FNEG:
		case OP_63_FMR:
		case OP_63_FABS:
		case OP_63_FRSP:
		case OP_63_FDIV:
		case OP_63_FADD:
		case OP_63_FSUB:
		case OP_63_FCTIW:
		case OP_63_FCTIWZ:
		case OP_63_FRSQRTE:
		case OP_63_FCPSGN:
			return true;
		}
		switch (inst_get_field(inst, 26, 30)) {
		case OP_63_FMUL:
		case OP_63_FSEL:
		case OP_63_FMSUB:
		case OP_63_FMADD:
		case OP_63_FNMSUB:
		case OP_63_FNMADD:
			return true;
		}
		break;
	case 31:
		switch (inst_get_field(inst, 21, 30)) {
		case OP_31_LFSX:
		case OP_31_LFSUX:
		case OP_31_LFDX:
		case OP_31_LFDUX:
		case OP_31_STFSX:
		case OP_31_STFSUX:
		case OP_31_STFX:
		case OP_31_STFUX:
		case OP_31_STFIWX:
			return true;
		}
		break;
	}

	return false;
}

static int get_d_signext(u32 inst)
{
	int d = inst & 0x8ff;

	if (d & 0x800)
		return -(d & 0x7ff);

	return (d & 0x7ff);
}

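/*
 * The kvmppc_ps_* helpers run one fps_* soft-FPU operation per lane of
 * a paired single: ps0 is converted out of the double held in the FPR,
 * ps1 is taken straight from qpr[], and the SCALAR_* flags tweak which
 * lane of the second operand is used and which results are written back.
 */
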
static int kvmppc_ps_three_in(struct kvm_vcpu *vcpu, bool rc,
			      int reg_out, int reg_in1, int reg_in2,
			      int reg_in3, int scalar,
			      void (*func)(u64 *fpscr,
					   u32 *dst, u32 *src1,
					   u32 *src2, u32 *src3))
{
	u32 *qpr = vcpu->arch.qpr;
	u32 ps0_out;
	u32 ps0_in1, ps0_in2, ps0_in3;
	u32 ps1_in1, ps1_in2, ps1_in3;

	/* RC */
	WARN_ON(rc);

	/* PS0 */
	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in1), &ps0_in1);
	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in2), &ps0_in2);
	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in3), &ps0_in3);

	if (scalar & SCALAR_LOW)
		ps0_in2 = qpr[reg_in2];

	func(&vcpu->arch.fp.fpscr, &ps0_out, &ps0_in1, &ps0_in2, &ps0_in3);

	dprintk(KERN_INFO "PS3 ps0 -> f(0x%x, 0x%x, 0x%x) = 0x%x\n",
			  ps0_in1, ps0_in2, ps0_in3, ps0_out);

	if (!(scalar & SCALAR_NO_PS0))
		kvm_cvt_fd(&ps0_out, &VCPU_FPR(vcpu, reg_out));

	/* PS1 */
	ps1_in1 = qpr[reg_in1];
	ps1_in2 = qpr[reg_in2];
	ps1_in3 = qpr[reg_in3];

	if (scalar & SCALAR_HIGH)
		ps1_in2 = ps0_in2;

	if (!(scalar & SCALAR_NO_PS1))
		func(&vcpu->arch.fp.fpscr, &qpr[reg_out], &ps1_in1, &ps1_in2, &ps1_in3);

	dprintk(KERN_INFO "PS3 ps1 -> f(0x%x, 0x%x, 0x%x) = 0x%x\n",
			  ps1_in1, ps1_in2, ps1_in3, qpr[reg_out]);

	return EMULATE_DONE;
}

static int kvmppc_ps_two_in(struct kvm_vcpu *vcpu, bool rc,
			    int reg_out, int reg_in1, int reg_in2,
			    int scalar,
			    void (*func)(u64 *fpscr,
					 u32 *dst, u32 *src1,
					 u32 *src2))
{
	u32 *qpr = vcpu->arch.qpr;
	u32 ps0_out;
	u32 ps0_in1, ps0_in2;
	u32 ps1_out;
	u32 ps1_in1, ps1_in2;

	/* RC */
	WARN_ON(rc);

	/* PS0 */
	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in1), &ps0_in1);

	if (scalar & SCALAR_LOW)
		ps0_in2 = qpr[reg_in2];
	else
		kvm_cvt_df(&VCPU_FPR(vcpu, reg_in2), &ps0_in2);

	func(&vcpu->arch.fp.fpscr, &ps0_out, &ps0_in1, &ps0_in2);

	if (!(scalar & SCALAR_NO_PS0)) {
		dprintk(KERN_INFO "PS2 ps0 -> f(0x%x, 0x%x) = 0x%x\n",
				  ps0_in1, ps0_in2, ps0_out);

		kvm_cvt_fd(&ps0_out, &VCPU_FPR(vcpu, reg_out));
	}

	/* PS1 */
	ps1_in1 = qpr[reg_in1];
	ps1_in2 = qpr[reg_in2];

	if (scalar & SCALAR_HIGH)
		ps1_in2 = ps0_in2;

	func(&vcpu->arch.fp.fpscr, &ps1_out, &ps1_in1, &ps1_in2);

	if (!(scalar & SCALAR_NO_PS1)) {
		qpr[reg_out] = ps1_out;

		dprintk(KERN_INFO "PS2 ps1 -> f(0x%x, 0x%x) = 0x%x\n",
				  ps1_in1, ps1_in2, qpr[reg_out]);
	}

	return EMULATE_DONE;
}

static int kvmppc_ps_one_in(struct kvm_vcpu *vcpu, bool rc,
			    int reg_out, int reg_in,
			    void (*func)(u64 *fpscr,
					 u32 *dst, u32 *src1))
{
	u32 *qpr = vcpu->arch.qpr;
	u32 ps0_out, ps0_in;
	u32 ps1_in;

	/* RC */
	WARN_ON(rc);

	/* PS0 */
	kvm_cvt_df(&VCPU_FPR(vcpu, reg_in), &ps0_in);
	func(&vcpu->arch.fp.fpscr, &ps0_out, &ps0_in);

	dprintk(KERN_INFO "PS1 ps0 -> f(0x%x) = 0x%x\n",
			  ps0_in, ps0_out);

	kvm_cvt_fd(&ps0_out, &VCPU_FPR(vcpu, reg_out));

	/* PS1 */
	ps1_in = qpr[reg_in];
	func(&vcpu->arch.fp.fpscr, &qpr[reg_out], &ps1_in);

	dprintk(KERN_INFO "PS1 ps1 -> f(0x%x) = 0x%x\n",
			  ps1_in, qpr[reg_out]);

	return EMULATE_DONE;
}

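/*
 * Main entry point: fetch and decode the last guest instruction, bail
 * out unless it is a paired-single op and the guest owns the FPU, then
 * dispatch on the primary opcode. The arithmetic itself runs on the
 * host FPU through the fpd_ and fps_ wrappers, so kernel FP is enabled
 * for the duration of the switch.
 */
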
int kvmppc_emulate_paired_single(struct kvm_vcpu *vcpu)
{
	u32 inst;
	ppc_inst_t pinst;
	enum emulation_result emulated = EMULATE_DONE;
	int ax_rd, ax_ra, ax_rb, ax_rc;
	short full_d;
	u64 *fpr_d, *fpr_a, *fpr_b, *fpr_c;

	bool rcomp;
	u32 cr;
#ifdef DEBUG
	int i;
#endif

	emulated = kvmppc_get_last_inst(vcpu, INST_GENERIC, &pinst);
	inst = ppc_inst_val(pinst);
	if (emulated != EMULATE_DONE)
		return emulated;

	ax_rd = inst_get_field(inst, 6, 10);
	ax_ra = inst_get_field(inst, 11, 15);
	ax_rb = inst_get_field(inst, 16, 20);
	ax_rc = inst_get_field(inst, 21, 25);
	full_d = inst_get_field(inst, 16, 31);

	fpr_d = &VCPU_FPR(vcpu, ax_rd);
	fpr_a = &VCPU_FPR(vcpu, ax_ra);
	fpr_b = &VCPU_FPR(vcpu, ax_rb);
	fpr_c = &VCPU_FPR(vcpu, ax_rc);

	rcomp = (inst & 1) ? true : false;
	cr = kvmppc_get_cr(vcpu);

	if (!kvmppc_inst_is_paired_single(vcpu, inst))
		return EMULATE_FAIL;

	if (!(kvmppc_get_msr(vcpu) & MSR_FP)) {
		kvmppc_book3s_queue_irqprio(vcpu, BOOK3S_INTERRUPT_FP_UNAVAIL);
		return EMULATE_AGAIN;
	}

	kvmppc_giveup_ext(vcpu, MSR_FP);
	preempt_disable();
	enable_kernel_fp();
	/* Do we need to clear FE0 / FE1 here? Don't think so. */

#ifdef DEBUG
	for (i = 0; i < ARRAY_SIZE(vcpu->arch.fp.fpr); i++) {
		u32 f;
		kvm_cvt_df(&VCPU_FPR(vcpu, i), &f);
		dprintk(KERN_INFO "FPR[%d] = 0x%x / 0x%llx QPR[%d] = 0x%x\n",
			i, f, VCPU_FPR(vcpu, i), i, vcpu->arch.qpr[i]);
	}
#endif

	switch (get_op(inst)) {
	case OP_PSQ_L:
	{
		ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
		bool w = inst_get_field(inst, 16, 16) ? true : false;
		int i = inst_get_field(inst, 17, 19);

		addr += get_d_signext(inst);
		emulated = kvmppc_emulate_psq_load(vcpu, ax_rd, addr, w, i);
		break;
	}
	case OP_PSQ_LU:
	{
		ulong addr = kvmppc_get_gpr(vcpu, ax_ra);
		bool w = inst_get_field(inst, 16, 16) ? true : false;
		int i = inst_get_field(inst, 17, 19);

		addr += get_d_signext(inst);
		emulated = kvmppc_emulate_psq_load(vcpu, ax_rd, addr, w, i);

		if (emulated == EMULATE_DONE)
			kvmppc_set_gpr(vcpu, ax_ra, addr);
		break;
	}
	case OP_PSQ_ST:
	{
		ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
		bool w = inst_get_field(inst, 16, 16) ? true : false;
		int i = inst_get_field(inst, 17, 19);

		addr += get_d_signext(inst);
		emulated = kvmppc_emulate_psq_store(vcpu, ax_rd, addr, w, i);
		break;
	}
	case OP_PSQ_STU:
	{
		ulong addr = kvmppc_get_gpr(vcpu, ax_ra);
		bool w = inst_get_field(inst, 16, 16) ? true : false;
		int i = inst_get_field(inst, 17, 19);

		addr += get_d_signext(inst);
		emulated = kvmppc_emulate_psq_store(vcpu, ax_rd, addr, w, i);

		if (emulated == EMULATE_DONE)
			kvmppc_set_gpr(vcpu, ax_ra, addr);
		break;
	}
	case 4:
		/* X form */
		switch (inst_get_field(inst, 21, 30)) {
		case OP_4X_PS_CMPU0:
			/* XXX */
			emulated = EMULATE_FAIL;
			break;
		case OP_4X_PSQ_LX:
		{
			ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
			bool w = inst_get_field(inst, 21, 21) ? true : false;
			int i = inst_get_field(inst, 22, 24);

			addr += kvmppc_get_gpr(vcpu, ax_rb);
			emulated = kvmppc_emulate_psq_load(vcpu, ax_rd, addr, w, i);
			break;
		}
		case OP_4X_PS_CMPO0:
			/* XXX */
			emulated = EMULATE_FAIL;
			break;
		case OP_4X_PSQ_LUX:
		{
			ulong addr = kvmppc_get_gpr(vcpu, ax_ra);
			bool w = inst_get_field(inst, 21, 21) ? true : false;
			int i = inst_get_field(inst, 22, 24);

			addr += kvmppc_get_gpr(vcpu, ax_rb);
			emulated = kvmppc_emulate_psq_load(vcpu, ax_rd, addr, w, i);

			if (emulated == EMULATE_DONE)
				kvmppc_set_gpr(vcpu, ax_ra, addr);
			break;
		}
		case OP_4X_PS_NEG:
			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rb);
			VCPU_FPR(vcpu, ax_rd) ^= 0x8000000000000000ULL;
			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
			vcpu->arch.qpr[ax_rd] ^= 0x80000000;
			break;
		case OP_4X_PS_CMPU1:
			/* XXX */
			emulated = EMULATE_FAIL;
			break;
		case OP_4X_PS_MR:
			WARN_ON(rcomp);
			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rb);
			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
			break;
		case OP_4X_PS_CMPO1:
			/* XXX */
			emulated = EMULATE_FAIL;
			break;
		case OP_4X_PS_NABS:
			WARN_ON(rcomp);
			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rb);
			VCPU_FPR(vcpu, ax_rd) |= 0x8000000000000000ULL;
			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
			vcpu->arch.qpr[ax_rd] |= 0x80000000;
			break;
		case OP_4X_PS_ABS:
			WARN_ON(rcomp);
			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rb);
			VCPU_FPR(vcpu, ax_rd) &= ~0x8000000000000000ULL;
			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
			vcpu->arch.qpr[ax_rd] &= ~0x80000000;
			break;
		case OP_4X_PS_MERGE00:
			WARN_ON(rcomp);
			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_ra);
			/* vcpu->arch.qpr[ax_rd] = VCPU_FPR(vcpu, ax_rb); */
			kvm_cvt_df(&VCPU_FPR(vcpu, ax_rb),
				   &vcpu->arch.qpr[ax_rd]);
			break;
		case OP_4X_PS_MERGE01:
			WARN_ON(rcomp);
			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_ra);
			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
			break;
		case OP_4X_PS_MERGE10:
			WARN_ON(rcomp);
			/* VCPU_FPR(vcpu, ax_rd) = vcpu->arch.qpr[ax_ra]; */
			kvm_cvt_fd(&vcpu->arch.qpr[ax_ra],
				   &VCPU_FPR(vcpu, ax_rd));
			/* vcpu->arch.qpr[ax_rd] = VCPU_FPR(vcpu, ax_rb); */
			kvm_cvt_df(&VCPU_FPR(vcpu, ax_rb),
				   &vcpu->arch.qpr[ax_rd]);
			break;
		case OP_4X_PS_MERGE11:
			WARN_ON(rcomp);
			/* VCPU_FPR(vcpu, ax_rd) = vcpu->arch.qpr[ax_ra]; */
			kvm_cvt_fd(&vcpu->arch.qpr[ax_ra],
				   &VCPU_FPR(vcpu, ax_rd));
			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rb];
			break;
		}
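		/*
		 * The ps_merge variants above assemble (ps0, ps1) from the
		 * halves of ra and rb: merge00 takes ra.ps0/rb.ps0, merge01
		 * ra.ps0/rb.ps1, merge10 ra.ps1/rb.ps0, merge11 ra.ps1/rb.ps1.
		 * The commented-out assignments document the intent; the
		 * kvm_cvt_fd/df calls do the actual format conversion.
		 */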
		/* XW form */
		switch (inst_get_field(inst, 25, 30)) {
		case OP_4XW_PSQ_STX:
		{
			ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;
			bool w = inst_get_field(inst, 21, 21) ? true : false;
			int i = inst_get_field(inst, 22, 24);

			addr += kvmppc_get_gpr(vcpu, ax_rb);
			emulated = kvmppc_emulate_psq_store(vcpu, ax_rd, addr, w, i);
			break;
		}
		case OP_4XW_PSQ_STUX:
		{
			ulong addr = kvmppc_get_gpr(vcpu, ax_ra);
			bool w = inst_get_field(inst, 21, 21) ? true : false;
			int i = inst_get_field(inst, 22, 24);

			addr += kvmppc_get_gpr(vcpu, ax_rb);
			emulated = kvmppc_emulate_psq_store(vcpu, ax_rd, addr, w, i);

			if (emulated == EMULATE_DONE)
				kvmppc_set_gpr(vcpu, ax_ra, addr);
			break;
		}
		}
		/* A form */
		switch (inst_get_field(inst, 26, 30)) {
		case OP_4A_PS_SUM1:
			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
					ax_rb, ax_ra, SCALAR_NO_PS0 | SCALAR_HIGH, fps_fadds);
			VCPU_FPR(vcpu, ax_rd) = VCPU_FPR(vcpu, ax_rc);
			break;
		case OP_4A_PS_SUM0:
			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rb, SCALAR_NO_PS1 | SCALAR_LOW, fps_fadds);
			vcpu->arch.qpr[ax_rd] = vcpu->arch.qpr[ax_rc];
			break;
		case OP_4A_PS_MULS0:
			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, SCALAR_HIGH, fps_fmuls);
			break;
		case OP_4A_PS_MULS1:
			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, SCALAR_LOW, fps_fmuls);
			break;
		case OP_4A_PS_MADDS0:
			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, ax_rb, SCALAR_HIGH, fps_fmadds);
			break;
		case OP_4A_PS_MADDS1:
			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, ax_rb, SCALAR_LOW, fps_fmadds);
			break;
		case OP_4A_PS_DIV:
			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rb, SCALAR_NONE, fps_fdivs);
			break;
		case OP_4A_PS_SUB:
			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rb, SCALAR_NONE, fps_fsubs);
			break;
		case OP_4A_PS_ADD:
			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rb, SCALAR_NONE, fps_fadds);
			break;
		case OP_4A_PS_SEL:
			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fsel);
			break;
		case OP_4A_PS_RES:
			emulated = kvmppc_ps_one_in(vcpu, rcomp, ax_rd,
					ax_rb, fps_fres);
			break;
		case OP_4A_PS_MUL:
			emulated = kvmppc_ps_two_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, SCALAR_NONE, fps_fmuls);
			break;
		case OP_4A_PS_RSQRTE:
			emulated = kvmppc_ps_one_in(vcpu, rcomp, ax_rd,
					ax_rb, fps_frsqrte);
			break;
		case OP_4A_PS_MSUB:
			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fmsubs);
			break;
		case OP_4A_PS_MADD:
			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fmadds);
			break;
		case OP_4A_PS_NMSUB:
			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fnmsubs);
			break;
		case OP_4A_PS_NMADD:
			emulated = kvmppc_ps_three_in(vcpu, rcomp, ax_rd,
					ax_ra, ax_rc, ax_rb, SCALAR_NONE, fps_fnmadds);
			break;
		}
		break;
	/* Real FPU operations */

	case OP_LFS:
	{
		ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) + full_d;

		emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd, addr,
						   FPU_LS_SINGLE);
		break;
	}
	case OP_LFSU:
	{
		ulong addr = kvmppc_get_gpr(vcpu, ax_ra) + full_d;

		emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd, addr,
						   FPU_LS_SINGLE);

		if (emulated == EMULATE_DONE)
			kvmppc_set_gpr(vcpu, ax_ra, addr);
		break;
	}
	case OP_LFD:
	{
		ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) + full_d;

		emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd, addr,
						   FPU_LS_DOUBLE);
		break;
	}
	case OP_LFDU:
	{
		ulong addr = kvmppc_get_gpr(vcpu, ax_ra) + full_d;

		emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd, addr,
						   FPU_LS_DOUBLE);

		if (emulated == EMULATE_DONE)
			kvmppc_set_gpr(vcpu, ax_ra, addr);
		break;
	}
	case OP_STFS:
	{
		ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) + full_d;

		emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd, addr,
						    FPU_LS_SINGLE);
		break;
	}
	case OP_STFSU:
	{
		ulong addr = kvmppc_get_gpr(vcpu, ax_ra) + full_d;

		emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd, addr,
						    FPU_LS_SINGLE);

		if (emulated == EMULATE_DONE)
			kvmppc_set_gpr(vcpu, ax_ra, addr);
		break;
	}
	case OP_STFD:
	{
		ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) + full_d;

		emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd, addr,
						    FPU_LS_DOUBLE);
		break;
	}
	case OP_STFDU:
	{
		ulong addr = kvmppc_get_gpr(vcpu, ax_ra) + full_d;

		emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd, addr,
						    FPU_LS_DOUBLE);

		if (emulated == EMULATE_DONE)
			kvmppc_set_gpr(vcpu, ax_ra, addr);
		break;
	}
	case 31:
		switch (inst_get_field(inst, 21, 30)) {
		case OP_31_LFSX:
		{
			ulong addr = ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0;

			addr += kvmppc_get_gpr(vcpu, ax_rb);
			emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd,
							   addr, FPU_LS_SINGLE);
			break;
		}
		case OP_31_LFSUX:
		{
			ulong addr = kvmppc_get_gpr(vcpu, ax_ra) +
				     kvmppc_get_gpr(vcpu, ax_rb);

			emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd,
							   addr, FPU_LS_SINGLE);

			if (emulated == EMULATE_DONE)
				kvmppc_set_gpr(vcpu, ax_ra, addr);
			break;
		}
		case OP_31_LFDX:
		{
			ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) +
				     kvmppc_get_gpr(vcpu, ax_rb);

			emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd,
							   addr, FPU_LS_DOUBLE);
			break;
		}
		case OP_31_LFDUX:
		{
			ulong addr = kvmppc_get_gpr(vcpu, ax_ra) +
				     kvmppc_get_gpr(vcpu, ax_rb);

			emulated = kvmppc_emulate_fpr_load(vcpu, ax_rd,
							   addr, FPU_LS_DOUBLE);

			if (emulated == EMULATE_DONE)
				kvmppc_set_gpr(vcpu, ax_ra, addr);
			break;
		}
		case OP_31_STFSX:
		{
			ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) +
				     kvmppc_get_gpr(vcpu, ax_rb);

			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
							    addr, FPU_LS_SINGLE);
			break;
		}
		case OP_31_STFSUX:
		{
			ulong addr = kvmppc_get_gpr(vcpu, ax_ra) +
				     kvmppc_get_gpr(vcpu, ax_rb);

			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
							    addr, FPU_LS_SINGLE);

			if (emulated == EMULATE_DONE)
				kvmppc_set_gpr(vcpu, ax_ra, addr);
			break;
		}
		case OP_31_STFX:
		{
			ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) +
				     kvmppc_get_gpr(vcpu, ax_rb);

			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
							    addr, FPU_LS_DOUBLE);
			break;
		}
		case OP_31_STFUX:
		{
			ulong addr = kvmppc_get_gpr(vcpu, ax_ra) +
				     kvmppc_get_gpr(vcpu, ax_rb);

			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
							    addr, FPU_LS_DOUBLE);

			if (emulated == EMULATE_DONE)
				kvmppc_set_gpr(vcpu, ax_ra, addr);
			break;
		}
		case OP_31_STFIWX:
		{
			ulong addr = (ax_ra ? kvmppc_get_gpr(vcpu, ax_ra) : 0) +
				     kvmppc_get_gpr(vcpu, ax_rb);

			emulated = kvmppc_emulate_fpr_store(vcpu, ax_rd,
							    addr,
							    FPU_LS_SINGLE_LOW);
			break;
		}
		}
		break;
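	/*
	 * Primary opcodes 59 and 63 below are regular (non-paired) FPU
	 * arithmetic, executed on the host FPU through the fpd_ wrappers.
	 * The single-precision forms mirror ps0 into the QPR half via
	 * kvmppc_sync_qpr so the paired-single view stays consistent.
	 */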
	case 59:
		switch (inst_get_field(inst, 21, 30)) {
		case OP_59_FADDS:
			fpd_fadds(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_59_FSUBS:
			fpd_fsubs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_59_FDIVS:
			fpd_fdivs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_59_FRES:
			fpd_fres(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_59_FRSQRTES:
			fpd_frsqrtes(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		}
		switch (inst_get_field(inst, 26, 30)) {
		case OP_59_FMULS:
			fpd_fmuls(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_59_FMSUBS:
			fpd_fmsubs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_59_FMADDS:
			fpd_fmadds(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_59_FNMSUBS:
			fpd_fnmsubs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_59_FNMADDS:
			fpd_fnmadds(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		}
		break;
	case 63:
		switch (inst_get_field(inst, 21, 30)) {
		case OP_63_MTFSB0:
		case OP_63_MTFSB1:
		case OP_63_MCRFS:
		case OP_63_MTFSFI:
			/* XXX need to implement */
			break;
		case OP_63_MFFS:
			/* XXX missing CR */
			*fpr_d = vcpu->arch.fp.fpscr;
			break;
		case OP_63_MTFSF:
			/* XXX missing fm bits */
			/* XXX missing CR */
			vcpu->arch.fp.fpscr = *fpr_b;
			break;
		case OP_63_FCMPU:
		{
			u32 tmp_cr;
			u32 cr0_mask = 0xf0000000;
			u32 cr_shift = inst_get_field(inst, 6, 8) * 4;

			fpd_fcmpu(&vcpu->arch.fp.fpscr, &tmp_cr, fpr_a, fpr_b);
			cr &= ~(cr0_mask >> cr_shift);
			cr |= (tmp_cr & cr0_mask) >> cr_shift;
			break;
		}
		case OP_63_FCMPO:
		{
			u32 tmp_cr;
			u32 cr0_mask = 0xf0000000;
			u32 cr_shift = inst_get_field(inst, 6, 8) * 4;

			fpd_fcmpo(&vcpu->arch.fp.fpscr, &tmp_cr, fpr_a, fpr_b);
			cr &= ~(cr0_mask >> cr_shift);
			cr |= (tmp_cr & cr0_mask) >> cr_shift;
			break;
		}
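		/*
		 * For the two compares above, tmp_cr comes back with the
		 * result flags in the CR0 position (top nibble); shifting by
		 * 4 * crfD, taken from instruction bits 6-8, moves them into
		 * the target CR field.
		 */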
		case OP_63_FNEG:
			fpd_fneg(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
			break;
		case OP_63_FMR:
			*fpr_d = *fpr_b;
			break;
		case OP_63_FABS:
			fpd_fabs(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
			break;
		case OP_63_FCPSGN:
			fpd_fcpsgn(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
			break;
		case OP_63_FDIV:
			fpd_fdiv(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
			break;
		case OP_63_FADD:
			fpd_fadd(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
			break;
		case OP_63_FSUB:
			fpd_fsub(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_b);
			break;
		case OP_63_FCTIW:
			fpd_fctiw(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
			break;
		case OP_63_FCTIWZ:
			fpd_fctiwz(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
			break;
		case OP_63_FRSP:
			fpd_frsp(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
			kvmppc_sync_qpr(vcpu, ax_rd);
			break;
		case OP_63_FRSQRTE:
		{
			double one = 1.0f;

			/* fD = sqrt(fB) */
			fpd_fsqrt(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_b);
			/* fD = 1.0f / fD */
			fpd_fdiv(&vcpu->arch.fp.fpscr, &cr, fpr_d, (u64*)&one, fpr_d);
			break;
		}
		}
		switch (inst_get_field(inst, 26, 30)) {
		case OP_63_FMUL:
			fpd_fmul(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c);
			break;
		case OP_63_FSEL:
			fpd_fsel(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			break;
		case OP_63_FMSUB:
			fpd_fmsub(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			break;
		case OP_63_FMADD:
			fpd_fmadd(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			break;
		case OP_63_FNMSUB:
			fpd_fnmsub(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			break;
		case OP_63_FNMADD:
			fpd_fnmadd(&vcpu->arch.fp.fpscr, &cr, fpr_d, fpr_a, fpr_c, fpr_b);
			break;
		}
		break;
	}

#ifdef DEBUG
	for (i = 0; i < ARRAY_SIZE(vcpu->arch.fp.fpr); i++) {
		u32 f;
		kvm_cvt_df(&VCPU_FPR(vcpu, i), &f);
		dprintk(KERN_INFO "FPR[%d] = 0x%x\n", i, f);
	}
#endif

	if (rcomp)
		kvmppc_set_cr(vcpu, cr);

	disable_kernel_fp();
	preempt_enable();

	return emulated;
}