// SPDX-License-Identifier: GPL-2.0
/*
 * handling privileged instructions
 *
 * Copyright IBM Corp. 2008, 2013
 */

#include <linux/kvm.h>
#include <linux/gfp.h>
#include <linux/errno.h>
#include <linux/compat.h>
#include <linux/mm_types.h>

#include <asm/asm-offsets.h>
#include <asm/facility.h>
#include <asm/current.h>
#include <asm/debug.h>
#include <asm/ebcdic.h>
#include <asm/sysinfo.h>
#include <asm/pgtable.h>
#include <asm/page-states.h>
#include <asm/pgalloc.h>
#include <asm/gmap.h>
#include <asm/io.h>
#include <asm/ptrace.h>
#include <asm/compat.h>
#include <asm/sclp.h>
#include "gaccess.h"
#include "kvm-s390.h"
#include "trace.h"

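/*
 * RUNTIME INSTRUMENTATION instructions are not emulated; instead, the
 * first use enables interpretive execution of RI in the SIE block
 * (ECB3_RI) and retries the instruction, so all further RI instructions
 * are handled by SIE without intercepts ("lazy" enablement).
 */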
static int handle_ri(struct kvm_vcpu *vcpu)
{
	if (test_kvm_facility(vcpu->kvm, 64)) {
		VCPU_EVENT(vcpu, 3, "%s", "ENABLE: RI (lazy)");
		vcpu->arch.sie_block->ecb3 |= ECB3_RI;
		kvm_s390_retry_instr(vcpu);
		return 0;
	} else
		return kvm_s390_inject_program_int(vcpu, PGM_OPERATION);
}

int kvm_s390_handle_aa(struct kvm_vcpu *vcpu)
{
	if ((vcpu->arch.sie_block->ipa & 0xf) <= 4)
		return handle_ri(vcpu);
	else
		return -EOPNOTSUPP;
}

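/*
 * Guarded storage is enabled lazily as well: on first use, load the
 * guest's GS control block on this host CPU, turn on interpretive
 * execution in the SIE block, and retry the intercepted instruction.
 */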
static int handle_gs(struct kvm_vcpu *vcpu)
{
	if (test_kvm_facility(vcpu->kvm, 133)) {
		VCPU_EVENT(vcpu, 3, "%s", "ENABLE: GS (lazy)");
		preempt_disable();
		__ctl_set_bit(2, 4);
		current->thread.gs_cb = (struct gs_cb *)&vcpu->run->s.regs.gscb;
		restore_gs_cb(current->thread.gs_cb);
		preempt_enable();
		vcpu->arch.sie_block->ecb |= ECB_GS;
		vcpu->arch.sie_block->ecd |= ECD_HOSTREGMGMT;
		vcpu->arch.gs_enabled = 1;
		kvm_s390_retry_instr(vcpu);
		return 0;
	} else
		return kvm_s390_inject_program_int(vcpu, PGM_OPERATION);
}

int kvm_s390_handle_e3(struct kvm_vcpu *vcpu)
{
	int code = vcpu->arch.sie_block->ipb & 0xff;

	if (code == 0x49 || code == 0x4d)
		return handle_gs(vcpu);
	else
		return -EOPNOTSUPP;
}

/* Handle SCK (SET CLOCK) interception */
static int handle_set_clock(struct kvm_vcpu *vcpu)
{
	int rc;
	u8 ar;
	u64 op2, val;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	op2 = kvm_s390_get_base_disp_s(vcpu, &ar);
	if (op2 & 7)	/* Operand must be on a doubleword boundary */
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);
	rc = read_guest(vcpu, op2, ar, &val, sizeof(val));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);

	VCPU_EVENT(vcpu, 3, "SCK: setting guest TOD to 0x%llx", val);
	kvm_s390_set_tod_clock(vcpu->kvm, val);

	kvm_s390_set_psw_cc(vcpu, 0);
	return 0;
}

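/*
 * SET PREFIX relocates the vcpu's 8k prefix area. The new prefix
 * origin is read from the second operand and must reference
 * accessible guest memory.
 */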
static int handle_set_prefix(struct kvm_vcpu *vcpu)
{
	u64 operand2;
	u32 address;
	int rc;
	u8 ar;

	vcpu->stat.instruction_spx++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	operand2 = kvm_s390_get_base_disp_s(vcpu, &ar);

	/* must be word boundary */
	if (operand2 & 3)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	/* get the value */
	rc = read_guest(vcpu, operand2, ar, &address, sizeof(address));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);

	address &= 0x7fffe000u;

	/*
	 * Make sure the new value is valid memory. We only need to check the
	 * first page, since address is 8k aligned and memory pieces are always
	 * at least 1MB aligned and have at least a size of 1MB.
	 */
	if (kvm_is_error_gpa(vcpu->kvm, address))
		return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);

	kvm_s390_set_prefix(vcpu, address);
	trace_kvm_s390_handle_prefix(vcpu, 1, address);
	return 0;
}

static int handle_store_prefix(struct kvm_vcpu *vcpu)
{
	u64 operand2;
	u32 address;
	int rc;
	u8 ar;

	vcpu->stat.instruction_stpx++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	operand2 = kvm_s390_get_base_disp_s(vcpu, &ar);

	/* must be word boundary */
	if (operand2 & 3)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	address = kvm_s390_get_prefix(vcpu);

	/* get the value */
	rc = write_guest(vcpu, operand2, ar, &address, sizeof(address));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);

	VCPU_EVENT(vcpu, 3, "STPX: storing prefix 0x%x into 0x%llx", address, operand2);
	trace_kvm_s390_handle_prefix(vcpu, 0, address);
	return 0;
}

static int handle_store_cpu_address(struct kvm_vcpu *vcpu)
{
	u16 vcpu_id = vcpu->vcpu_id;
	u64 ga;
	int rc;
	u8 ar;

	vcpu->stat.instruction_stap++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	ga = kvm_s390_get_base_disp_s(vcpu, &ar);

	if (ga & 1)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	rc = write_guest(vcpu, ga, ar, &vcpu_id, sizeof(vcpu_id));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);

	VCPU_EVENT(vcpu, 3, "STAP: storing cpu address (%u) to 0x%llx", vcpu_id, ga);
	trace_kvm_s390_handle_stap(vcpu, ga);
	return 0;
}

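/*
 * Storage keys are virtualized lazily: on the first key-related
 * instruction, convert the guest to use real storage keys and remove
 * the key-related interception controls (or the KSS cpuflag), so
 * subsequent key instructions can be interpreted by SIE.
 */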
int kvm_s390_skey_check_enable(struct kvm_vcpu *vcpu)
{
	int rc = 0;
	struct kvm_s390_sie_block *sie_block = vcpu->arch.sie_block;

	trace_kvm_s390_skey_related_inst(vcpu);
	if (!(sie_block->ictl & (ICTL_ISKE | ICTL_SSKE | ICTL_RRBE)) &&
	    !(atomic_read(&sie_block->cpuflags) & CPUSTAT_KSS))
		return rc;

	rc = s390_enable_skey();
	VCPU_EVENT(vcpu, 3, "enabling storage keys for guest: %d", rc);
	if (!rc) {
		if (atomic_read(&sie_block->cpuflags) & CPUSTAT_KSS)
			atomic_andnot(CPUSTAT_KSS, &sie_block->cpuflags);
		else
			sie_block->ictl &= ~(ICTL_ISKE | ICTL_SSKE |
					     ICTL_RRBE);
	}
	return rc;
}

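/*
 * Returns -EAGAIN if the instruction was rearmed for interpretation by
 * SIE, a negative error code on failure, or 0 if the key operation
 * must be emulated here.
 */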
static int try_handle_skey(struct kvm_vcpu *vcpu)
{
	int rc;

	vcpu->stat.instruction_storage_key++;
	rc = kvm_s390_skey_check_enable(vcpu);
	if (rc)
		return rc;
	if (sclp.has_skey) {
		/* with storage-key facility, SIE interprets it for us */
		kvm_s390_retry_instr(vcpu);
		VCPU_EVENT(vcpu, 4, "%s", "retrying storage key operation");
		return -EAGAIN;
	}
	return 0;
}

static int handle_iske(struct kvm_vcpu *vcpu)
{
	unsigned long addr;
	unsigned char key;
	int reg1, reg2;
	int rc;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	rc = try_handle_skey(vcpu);
	if (rc)
		return rc != -EAGAIN ? rc : 0;

	kvm_s390_get_regs_rre(vcpu, &reg1, &reg2);

	addr = vcpu->run->s.regs.gprs[reg2] & PAGE_MASK;
	addr = kvm_s390_logical_to_effective(vcpu, addr);
	addr = kvm_s390_real_to_abs(vcpu, addr);
	addr = gfn_to_hva(vcpu->kvm, gpa_to_gfn(addr));
	if (kvm_is_error_hva(addr))
		return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);

	down_read(&current->mm->mmap_sem);
	rc = get_guest_storage_key(current->mm, addr, &key);
	up_read(&current->mm->mmap_sem);
	if (rc)
		return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);
	vcpu->run->s.regs.gprs[reg1] &= ~0xff;
	vcpu->run->s.regs.gprs[reg1] |= key;
	return 0;
}

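/*
 * RESET REFERENCE BIT EXTENDED: the resulting condition code encodes
 * the previous state of the reference and change bits.
 */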
static int handle_rrbe(struct kvm_vcpu *vcpu)
{
	unsigned long addr;
	int reg1, reg2;
	int rc;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	rc = try_handle_skey(vcpu);
	if (rc)
		return rc != -EAGAIN ? rc : 0;

	kvm_s390_get_regs_rre(vcpu, &reg1, &reg2);

	addr = vcpu->run->s.regs.gprs[reg2] & PAGE_MASK;
	addr = kvm_s390_logical_to_effective(vcpu, addr);
	addr = kvm_s390_real_to_abs(vcpu, addr);
	addr = gfn_to_hva(vcpu->kvm, gpa_to_gfn(addr));
	if (kvm_is_error_hva(addr))
		return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);

	down_read(&current->mm->mmap_sem);
	rc = reset_guest_reference_bit(current->mm, addr);
	up_read(&current->mm->mmap_sem);
	if (rc < 0)
		return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);

	kvm_s390_set_psw_cc(vcpu, rc);
	return 0;
}

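/*
 * SSKE m3 bits: MB operates on multiple blocks at once, MR/MC make the
 * key update conditional on the reference/change bits, and NQ performs
 * the update without quiescing. Bits whose facilities are not enabled
 * for the guest are ignored below.
 */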
#define SSKE_NQ 0x8
#define SSKE_MR 0x4
#define SSKE_MC 0x2
#define SSKE_MB 0x1
static int handle_sske(struct kvm_vcpu *vcpu)
{
	unsigned char m3 = vcpu->arch.sie_block->ipb >> 28;
	unsigned long start, end;
	unsigned char key, oldkey;
	int reg1, reg2;
	int rc;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	rc = try_handle_skey(vcpu);
	if (rc)
		return rc != -EAGAIN ? rc : 0;

	if (!test_kvm_facility(vcpu->kvm, 8))
		m3 &= ~SSKE_MB;
	if (!test_kvm_facility(vcpu->kvm, 10))
		m3 &= ~(SSKE_MC | SSKE_MR);
	if (!test_kvm_facility(vcpu->kvm, 14))
		m3 &= ~SSKE_NQ;

	kvm_s390_get_regs_rre(vcpu, &reg1, &reg2);

	key = vcpu->run->s.regs.gprs[reg1] & 0xfe;
	start = vcpu->run->s.regs.gprs[reg2] & PAGE_MASK;
	start = kvm_s390_logical_to_effective(vcpu, start);
	if (m3 & SSKE_MB) {
		/* start already designates an absolute address */
		end = (start + _SEGMENT_SIZE) & ~(_SEGMENT_SIZE - 1);
	} else {
		start = kvm_s390_real_to_abs(vcpu, start);
		end = start + PAGE_SIZE;
	}

	while (start != end) {
		unsigned long addr = gfn_to_hva(vcpu->kvm, gpa_to_gfn(start));

		if (kvm_is_error_hva(addr))
			return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);

		down_read(&current->mm->mmap_sem);
		rc = cond_set_guest_storage_key(current->mm, addr, key, &oldkey,
						m3 & SSKE_NQ, m3 & SSKE_MR,
						m3 & SSKE_MC);
		up_read(&current->mm->mmap_sem);
		if (rc < 0)
			return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);
		start += PAGE_SIZE;
	}

	if (m3 & (SSKE_MC | SSKE_MR)) {
		if (m3 & SSKE_MB) {
			/* skey in reg1 is unpredictable */
			kvm_s390_set_psw_cc(vcpu, 3);
		} else {
			kvm_s390_set_psw_cc(vcpu, rc);
			vcpu->run->s.regs.gprs[reg1] &= ~0xff00UL;
			vcpu->run->s.regs.gprs[reg1] |= (u64) oldkey << 8;
		}
	}
	if (m3 & SSKE_MB) {
		if (psw_bits(vcpu->arch.sie_block->gpsw).eaba == PSW_BITS_AMODE_64BIT)
			vcpu->run->s.regs.gprs[reg2] &= ~PAGE_MASK;
		else
			vcpu->run->s.regs.gprs[reg2] &= ~0xfffff000UL;
		end = kvm_s390_logical_to_effective(vcpu, end);
		vcpu->run->s.regs.gprs[reg2] |= end;
	}
	return 0;
}

static int handle_ipte_interlock(struct kvm_vcpu *vcpu)
{
	vcpu->stat.instruction_ipte_interlock++;
	if (psw_bits(vcpu->arch.sie_block->gpsw).pstate)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);
	wait_event(vcpu->kvm->arch.ipte_wq, !ipte_lock_held(vcpu));
	kvm_s390_retry_instr(vcpu);
	VCPU_EVENT(vcpu, 4, "%s", "retrying ipte interlock operation");
	return 0;
}

static int handle_test_block(struct kvm_vcpu *vcpu)
{
	gpa_t addr;
	int reg2;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	kvm_s390_get_regs_rre(vcpu, NULL, &reg2);
	addr = vcpu->run->s.regs.gprs[reg2] & PAGE_MASK;
	addr = kvm_s390_logical_to_effective(vcpu, addr);
	if (kvm_s390_check_low_addr_prot_real(vcpu, addr))
		return kvm_s390_inject_prog_irq(vcpu, &vcpu->arch.pgm);
	addr = kvm_s390_real_to_abs(vcpu, addr);

	if (kvm_is_error_gpa(vcpu->kvm, addr))
		return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);
	/*
	 * We don't expect errors on modern systems, and do not care
	 * about storage keys (yet), so let's just clear the page.
	 */
	if (kvm_clear_guest(vcpu->kvm, addr, PAGE_SIZE))
		return -EFAULT;
	kvm_s390_set_psw_cc(vcpu, 0);
	vcpu->run->s.regs.gprs[0] = 0;
	return 0;
}

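/*
 * TEST PENDING INTERRUPTION: dequeue a pending I/O interrupt matching
 * the isc mask in CR6 and store the interruption code either at the
 * operand address (two words) or in the lowcore (three words).
 */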
static int handle_tpi(struct kvm_vcpu *vcpu)
{
	struct kvm_s390_interrupt_info *inti;
	unsigned long len;
	u32 tpi_data[3];
	int rc;
	u64 addr;
	u8 ar;

	addr = kvm_s390_get_base_disp_s(vcpu, &ar);
	if (addr & 3)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	inti = kvm_s390_get_io_int(vcpu->kvm, vcpu->arch.sie_block->gcr[6], 0);
	if (!inti) {
		kvm_s390_set_psw_cc(vcpu, 0);
		return 0;
	}

	tpi_data[0] = inti->io.subchannel_id << 16 | inti->io.subchannel_nr;
	tpi_data[1] = inti->io.io_int_parm;
	tpi_data[2] = inti->io.io_int_word;
	if (addr) {
		/*
		 * Store the two-word I/O interruption code into the
		 * provided area.
		 */
		len = sizeof(tpi_data) - 4;
		rc = write_guest(vcpu, addr, ar, &tpi_data, len);
		if (rc) {
			rc = kvm_s390_inject_prog_cond(vcpu, rc);
			goto reinject_interrupt;
		}
	} else {
		/*
		 * Store the three-word I/O interruption code into
		 * the appropriate lowcore area.
		 */
		len = sizeof(tpi_data);
		if (write_guest_lc(vcpu, __LC_SUBCHANNEL_ID, &tpi_data, len)) {
			/* failed writes to the low core are not recoverable */
			rc = -EFAULT;
			goto reinject_interrupt;
		}
	}

	/* irq was successfully handed to the guest */
	kfree(inti);
	kvm_s390_set_psw_cc(vcpu, 1);
	return 0;
reinject_interrupt:
	/*
	 * If we encounter a problem storing the interruption code, the
	 * instruction is suppressed from the guest's view: reinject the
	 * interrupt.
	 */
	if (kvm_s390_reinject_io_int(vcpu->kvm, inti)) {
		kfree(inti);
		rc = -EFAULT;
	}
	/* don't set the cc, a pgm irq was injected or we drop to user space */
	return rc ? -EFAULT : 0;
}

static int handle_tsch(struct kvm_vcpu *vcpu)
{
	struct kvm_s390_interrupt_info *inti = NULL;
	const u64 isc_mask = 0xffUL << 24; /* all iscs set */

	/* a valid schid has at least one bit set */
	if (vcpu->run->s.regs.gprs[1])
		inti = kvm_s390_get_io_int(vcpu->kvm, isc_mask,
					   vcpu->run->s.regs.gprs[1]);

	/*
	 * Prepare exit to userspace.
	 * We indicate whether we dequeued a pending I/O interrupt
	 * so that userspace can re-inject it if the instruction gets
	 * a program check. While this may re-order the pending I/O
	 * interrupts, this is no problem since the priority is kept
	 * intact.
	 */
	vcpu->run->exit_reason = KVM_EXIT_S390_TSCH;
	vcpu->run->s390_tsch.dequeued = !!inti;
	if (inti) {
		vcpu->run->s390_tsch.subchannel_id = inti->io.subchannel_id;
		vcpu->run->s390_tsch.subchannel_nr = inti->io.subchannel_nr;
		vcpu->run->s390_tsch.io_int_parm = inti->io.io_int_parm;
		vcpu->run->s390_tsch.io_int_word = inti->io.io_int_word;
	}
	vcpu->run->s390_tsch.ipb = vcpu->arch.sie_block->ipb;
	kfree(inti);
	return -EREMOTE;
}

static int handle_io_inst(struct kvm_vcpu *vcpu)
{
	VCPU_EVENT(vcpu, 4, "%s", "I/O instruction");

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	if (vcpu->kvm->arch.css_support) {
		/*
		 * Most I/O instructions will be handled by userspace.
		 * Exceptions are tpi and the interrupt portion of tsch.
		 */
		if (vcpu->arch.sie_block->ipa == 0xb236)
			return handle_tpi(vcpu);
		if (vcpu->arch.sie_block->ipa == 0xb235)
			return handle_tsch(vcpu);
		/* Handle in userspace. */
		return -EOPNOTSUPP;
	} else {
		/*
		 * Set condition code 3 to stop the guest from issuing channel
		 * I/O instructions.
		 */
		kvm_s390_set_psw_cc(vcpu, 3);
		return 0;
	}
}

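/*
 * STORE FACILITY LIST stores only the first four bytes of the facility
 * list into the lowcore, i.e. facility bits 0-31.
 */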
static int handle_stfl(struct kvm_vcpu *vcpu)
{
	int rc;
	unsigned int fac;

	vcpu->stat.instruction_stfl++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	/*
	 * We need to shift the lower 32 facility bits (bit 0-31) from a u64
	 * into a u32 memory representation. They will remain bits 0-31.
	 */
	fac = *vcpu->kvm->arch.model.fac_list >> 32;
	rc = write_guest_lc(vcpu, offsetof(struct lowcore, stfl_fac_list),
			    &fac, sizeof(fac));
	if (rc)
		return rc;
	VCPU_EVENT(vcpu, 3, "STFL: store facility list 0x%x", fac);
	trace_kvm_s390_handle_stfl(vcpu, fac);
	return 0;
}

#define PSW_MASK_ADDR_MODE (PSW_MASK_EA | PSW_MASK_BA)
#define PSW_MASK_UNASSIGNED 0xb80800fe7fffffffUL
#define PSW_ADDR_24 0x0000000000ffffffUL
#define PSW_ADDR_31 0x000000007fffffffUL

int is_valid_psw(psw_t *psw)
{
	if (psw->mask & PSW_MASK_UNASSIGNED)
		return 0;
	if ((psw->mask & PSW_MASK_ADDR_MODE) == PSW_MASK_BA) {
		if (psw->addr & ~PSW_ADDR_31)
			return 0;
	}
	if (!(psw->mask & PSW_MASK_ADDR_MODE) && (psw->addr & ~PSW_ADDR_24))
		return 0;
	if ((psw->mask & PSW_MASK_ADDR_MODE) == PSW_MASK_EA)
		return 0;
	if (psw->addr & 1)
		return 0;
	return 1;
}

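/*
 * LOAD PSW: the 8-byte ESA/390-format PSW is expanded into the
 * 16-byte z/Architecture PSW before being validated.
 */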
int kvm_s390_handle_lpsw(struct kvm_vcpu *vcpu)
{
	psw_t *gpsw = &vcpu->arch.sie_block->gpsw;
	psw_compat_t new_psw;
	u64 addr;
	int rc;
	u8 ar;

	if (gpsw->mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	addr = kvm_s390_get_base_disp_s(vcpu, &ar);
	if (addr & 7)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	rc = read_guest(vcpu, addr, ar, &new_psw, sizeof(new_psw));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);
	if (!(new_psw.mask & PSW32_MASK_BASE))
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);
	gpsw->mask = (new_psw.mask & ~PSW32_MASK_BASE) << 32;
	gpsw->mask |= new_psw.addr & PSW32_ADDR_AMODE;
	gpsw->addr = new_psw.addr & ~PSW32_ADDR_AMODE;
	if (!is_valid_psw(gpsw))
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);
	return 0;
}

static int handle_lpswe(struct kvm_vcpu *vcpu)
{
	psw_t new_psw;
	u64 addr;
	int rc;
	u8 ar;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	addr = kvm_s390_get_base_disp_s(vcpu, &ar);
	if (addr & 7)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);
	rc = read_guest(vcpu, addr, ar, &new_psw, sizeof(new_psw));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);
	vcpu->arch.sie_block->gpsw = new_psw;
	if (!is_valid_psw(&vcpu->arch.sie_block->gpsw))
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);
	return 0;
}

static int handle_stidp(struct kvm_vcpu *vcpu)
{
	u64 stidp_data = vcpu->kvm->arch.model.cpuid;
	u64 operand2;
	int rc;
	u8 ar;

	vcpu->stat.instruction_stidp++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	operand2 = kvm_s390_get_base_disp_s(vcpu, &ar);

	if (operand2 & 7)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	rc = write_guest(vcpu, operand2, ar, &stidp_data, sizeof(stidp_data));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);

	VCPU_EVENT(vcpu, 3, "STIDP: store cpu id 0x%llx", stidp_data);
	return 0;
}

static void handle_stsi_3_2_2(struct kvm_vcpu *vcpu, struct sysinfo_3_2_2 *mem)
{
	int cpus = 0;
	int n;

	cpus = atomic_read(&vcpu->kvm->online_vcpus);

	/* deal with other level 3 hypervisors */
	if (stsi(mem, 3, 2, 2))
		mem->count = 0;
	if (mem->count < 8)
		mem->count++;
	for (n = mem->count - 1; n > 0; n--)
		memcpy(&mem->vm[n], &mem->vm[n - 1], sizeof(mem->vm[0]));

	memset(&mem->vm[0], 0, sizeof(mem->vm[0]));
	mem->vm[0].cpus_total = cpus;
	mem->vm[0].cpus_configured = cpus;
	mem->vm[0].cpus_standby = 0;
	mem->vm[0].cpus_reserved = 0;
	mem->vm[0].caf = 1000;
	memcpy(mem->vm[0].name, "KVMguest", 8);
	ASCEBC(mem->vm[0].name, 8);
	memcpy(mem->vm[0].cpi, "KVM/Linux       ", 16);
	ASCEBC(mem->vm[0].cpi, 16);
}

static void insert_stsi_usr_data(struct kvm_vcpu *vcpu, u64 addr, u8 ar,
				 u8 fc, u8 sel1, u16 sel2)
{
	vcpu->run->exit_reason = KVM_EXIT_S390_STSI;
	vcpu->run->s390_stsi.addr = addr;
	vcpu->run->s390_stsi.ar = ar;
	vcpu->run->s390_stsi.fc = fc;
	vcpu->run->s390_stsi.sel1 = sel1;
	vcpu->run->s390_stsi.sel2 = sel2;
}

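/*
 * STORE SYSTEM INFORMATION: fc 1 and 2 are answered with the host's
 * stsi data, while fc 3.2.2 is rewritten to present this KVM as the
 * top-level level-3 hypervisor. With user_stsi set, the result is
 * additionally handed to userspace for post-processing.
 */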
static int handle_stsi(struct kvm_vcpu *vcpu)
{
	int fc = (vcpu->run->s.regs.gprs[0] & 0xf0000000) >> 28;
	int sel1 = vcpu->run->s.regs.gprs[0] & 0xff;
	int sel2 = vcpu->run->s.regs.gprs[1] & 0xffff;
	unsigned long mem = 0;
	u64 operand2;
	int rc = 0;
	u8 ar;

	vcpu->stat.instruction_stsi++;
	VCPU_EVENT(vcpu, 3, "STSI: fc: %u sel1: %u sel2: %u", fc, sel1, sel2);

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	if (fc > 3) {
		kvm_s390_set_psw_cc(vcpu, 3);
		return 0;
	}

	if (vcpu->run->s.regs.gprs[0] & 0x0fffff00
	    || vcpu->run->s.regs.gprs[1] & 0xffff0000)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	if (fc == 0) {
		vcpu->run->s.regs.gprs[0] = 3 << 28;
		kvm_s390_set_psw_cc(vcpu, 0);
		return 0;
	}

	operand2 = kvm_s390_get_base_disp_s(vcpu, &ar);

	if (operand2 & 0xfff)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	switch (fc) {
	case 1: /* same handling for 1 and 2 */
	case 2:
		mem = get_zeroed_page(GFP_KERNEL);
		if (!mem)
			goto out_no_data;
		if (stsi((void *) mem, fc, sel1, sel2))
			goto out_no_data;
		break;
	case 3:
		if (sel1 != 2 || sel2 != 2)
			goto out_no_data;
		mem = get_zeroed_page(GFP_KERNEL);
		if (!mem)
			goto out_no_data;
		handle_stsi_3_2_2(vcpu, (void *) mem);
		break;
	}

	rc = write_guest(vcpu, operand2, ar, (void *)mem, PAGE_SIZE);
	if (rc) {
		rc = kvm_s390_inject_prog_cond(vcpu, rc);
		goto out;
	}
	if (vcpu->kvm->arch.user_stsi) {
		insert_stsi_usr_data(vcpu, operand2, ar, fc, sel1, sel2);
		rc = -EREMOTE;
	}
	trace_kvm_s390_handle_stsi(vcpu, fc, sel1, sel2, operand2);
	free_page(mem);
	kvm_s390_set_psw_cc(vcpu, 0);
	vcpu->run->s.regs.gprs[0] = 0;
	return rc;
out_no_data:
	kvm_s390_set_psw_cc(vcpu, 3);
out:
	free_page(mem);
	return rc;
}

static const intercept_handler_t b2_handlers[256] = {
	[0x02] = handle_stidp,
	[0x04] = handle_set_clock,
	[0x10] = handle_set_prefix,
	[0x11] = handle_store_prefix,
	[0x12] = handle_store_cpu_address,
	[0x14] = kvm_s390_handle_vsie,
	[0x21] = handle_ipte_interlock,
	[0x29] = handle_iske,
	[0x2a] = handle_rrbe,
	[0x2b] = handle_sske,
	[0x2c] = handle_test_block,
	[0x30] = handle_io_inst,
	[0x31] = handle_io_inst,
	[0x32] = handle_io_inst,
	[0x33] = handle_io_inst,
	[0x34] = handle_io_inst,
	[0x35] = handle_io_inst,
	[0x36] = handle_io_inst,
	[0x37] = handle_io_inst,
	[0x38] = handle_io_inst,
	[0x39] = handle_io_inst,
	[0x3a] = handle_io_inst,
	[0x3b] = handle_io_inst,
	[0x3c] = handle_io_inst,
	[0x50] = handle_ipte_interlock,
	[0x56] = handle_sthyi,
	[0x5f] = handle_io_inst,
	[0x74] = handle_io_inst,
	[0x76] = handle_io_inst,
	[0x7d] = handle_stsi,
	[0xb1] = handle_stfl,
	[0xb2] = handle_lpswe,
};

int kvm_s390_handle_b2(struct kvm_vcpu *vcpu)
{
	intercept_handler_t handler;

	/*
	 * A lot of B2 instructions are privileged. Here we check for
	 * the privileged ones, that we can handle in the kernel.
	 * Anything else goes to userspace.
	 */
	handler = b2_handlers[vcpu->arch.sie_block->ipa & 0x00ff];
	if (handler)
		return handler(vcpu);

	return -EOPNOTSUPP;
}

static int handle_epsw(struct kvm_vcpu *vcpu)
{
	int reg1, reg2;

	kvm_s390_get_regs_rre(vcpu, &reg1, &reg2);

	/* This basically extracts the mask half of the psw. */
	vcpu->run->s.regs.gprs[reg1] &= 0xffffffff00000000UL;
	vcpu->run->s.regs.gprs[reg1] |= vcpu->arch.sie_block->gpsw.mask >> 32;
	if (reg2) {
		vcpu->run->s.regs.gprs[reg2] &= 0xffffffff00000000UL;
		vcpu->run->s.regs.gprs[reg2] |=
			vcpu->arch.sie_block->gpsw.mask & 0x00000000ffffffffUL;
	}
	return 0;
}

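/* PFMF register-1 field layout: SSKE-style controls, key and frame-size code. */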
#define PFMF_RESERVED 0xfffc0101UL
#define PFMF_SK 0x00020000UL
#define PFMF_CF 0x00010000UL
#define PFMF_UI 0x00008000UL
#define PFMF_FSC 0x00007000UL
#define PFMF_NQ 0x00000800UL
#define PFMF_MR 0x00000400UL
#define PFMF_MC 0x00000200UL
#define PFMF_KEY 0x000000feUL

static int handle_pfmf(struct kvm_vcpu *vcpu)
{
	bool mr = false, mc = false, nq;
	int reg1, reg2;
	unsigned long start, end;
	unsigned char key;

	vcpu->stat.instruction_pfmf++;

	kvm_s390_get_regs_rre(vcpu, &reg1, &reg2);

	if (!test_kvm_facility(vcpu->kvm, 8))
		return kvm_s390_inject_program_int(vcpu, PGM_OPERATION);

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	if (vcpu->run->s.regs.gprs[reg1] & PFMF_RESERVED)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	/* Only provide non-quiescing support if enabled for the guest */
	if (vcpu->run->s.regs.gprs[reg1] & PFMF_NQ &&
	    !test_kvm_facility(vcpu->kvm, 14))
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	/* Only provide conditional-SSKE support if enabled for the guest */
	if (vcpu->run->s.regs.gprs[reg1] & PFMF_SK &&
	    test_kvm_facility(vcpu->kvm, 10)) {
		mr = vcpu->run->s.regs.gprs[reg1] & PFMF_MR;
		mc = vcpu->run->s.regs.gprs[reg1] & PFMF_MC;
	}

	nq = vcpu->run->s.regs.gprs[reg1] & PFMF_NQ;
	key = vcpu->run->s.regs.gprs[reg1] & PFMF_KEY;
	start = vcpu->run->s.regs.gprs[reg2] & PAGE_MASK;
	start = kvm_s390_logical_to_effective(vcpu, start);

	if (vcpu->run->s.regs.gprs[reg1] & PFMF_CF) {
		if (kvm_s390_check_low_addr_prot_real(vcpu, start))
			return kvm_s390_inject_prog_irq(vcpu, &vcpu->arch.pgm);
	}

	switch (vcpu->run->s.regs.gprs[reg1] & PFMF_FSC) {
	case 0x00000000:
		/* only 4k frames specify a real address */
		start = kvm_s390_real_to_abs(vcpu, start);
		end = (start + PAGE_SIZE) & ~(PAGE_SIZE - 1);
		break;
	case 0x00001000:
		end = (start + _SEGMENT_SIZE) & ~(_SEGMENT_SIZE - 1);
		break;
	case 0x00002000:
		/* only support 2G frame size if EDAT2 is available and we are
		   not in 24-bit addressing mode */
		if (!test_kvm_facility(vcpu->kvm, 78) ||
		    psw_bits(vcpu->arch.sie_block->gpsw).eaba == PSW_BITS_AMODE_24BIT)
			return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);
		end = (start + _REGION3_SIZE) & ~(_REGION3_SIZE - 1);
		break;
	default:
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);
	}

	while (start != end) {
		unsigned long useraddr;

		/* Translate guest address to host address */
		useraddr = gfn_to_hva(vcpu->kvm, gpa_to_gfn(start));
		if (kvm_is_error_hva(useraddr))
			return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);

		if (vcpu->run->s.regs.gprs[reg1] & PFMF_CF) {
			if (clear_user((void __user *)useraddr, PAGE_SIZE))
				return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);
		}

		if (vcpu->run->s.regs.gprs[reg1] & PFMF_SK) {
			int rc = kvm_s390_skey_check_enable(vcpu);

			if (rc)
				return rc;
			down_read(&current->mm->mmap_sem);
			rc = cond_set_guest_storage_key(current->mm, useraddr,
							key, NULL, nq, mr, mc);
			up_read(&current->mm->mmap_sem);
			if (rc < 0)
				return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);
		}

		start += PAGE_SIZE;
	}
	if (vcpu->run->s.regs.gprs[reg1] & PFMF_FSC) {
		if (psw_bits(vcpu->arch.sie_block->gpsw).eaba == PSW_BITS_AMODE_64BIT) {
			vcpu->run->s.regs.gprs[reg2] = end;
		} else {
			vcpu->run->s.regs.gprs[reg2] &= ~0xffffffffUL;
			end = kvm_s390_logical_to_effective(vcpu, end);
			vcpu->run->s.regs.gprs[reg2] |= end;
		}
	}
	return 0;
}

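/*
 * Perform the pgste/CMMA update for one page of an intercepted ESSA and
 * append the gfn to the CBRL area so the caller can discard the backing
 * pages; during migration, the CMMA state is also tracked in the
 * per-kvm dirty bitmap.
 */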
static inline int do_essa(struct kvm_vcpu *vcpu, const int orc)
{
	struct kvm_s390_migration_state *ms = vcpu->kvm->arch.migration_state;
	int r1, r2, nappended, entries;
	unsigned long gfn, hva, res, pgstev, ptev;
	unsigned long *cbrlo;

	/*
	 * We don't need to set SD.FPF.SK to 1 here, because if we have a
	 * machine check here we either handle it or crash
	 */

	kvm_s390_get_regs_rre(vcpu, &r1, &r2);
	gfn = vcpu->run->s.regs.gprs[r2] >> PAGE_SHIFT;
	hva = gfn_to_hva(vcpu->kvm, gfn);
	entries = (vcpu->arch.sie_block->cbrlo & ~PAGE_MASK) >> 3;

	if (kvm_is_error_hva(hva))
		return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);

	nappended = pgste_perform_essa(vcpu->kvm->mm, hva, orc, &ptev, &pgstev);
	if (nappended < 0) {
		res = orc ? 0x10 : 0;
		vcpu->run->s.regs.gprs[r1] = res; /* Exception Indication */
		goto out;
	}
	res = (pgstev & _PGSTE_GPS_USAGE_MASK) >> 22;
	/*
	 * Set the block-content state part of the result. 0 means resident, so
	 * nothing to do if the page is valid. 2 is for preserved pages
	 * (non-present and non-zero), and 3 for zero pages (non-present and
	 * zero).
	 */
	if (ptev & _PAGE_INVALID) {
		res |= 2;
		if (pgstev & _PGSTE_GPS_ZERO)
			res |= 1;
	}
	if (pgstev & _PGSTE_GPS_NODAT)
		res |= 0x20;
	vcpu->run->s.regs.gprs[r1] = res;
	/*
	 * It is possible that all the normal 511 slots were full, in which case
	 * we will now write in the 512th slot, which is reserved for host use.
	 * In both cases we let the normal essa handling code process all the
	 * slots, including the reserved one, if needed.
	 */
	if (nappended > 0) {
		cbrlo = phys_to_virt(vcpu->arch.sie_block->cbrlo & PAGE_MASK);
		cbrlo[entries] = gfn << PAGE_SHIFT;
	}

	if (orc && gfn < ms->bitmap_size) {
		/* increment only if we are really flipping the bit to 1 */
		if (!test_and_set_bit(gfn, ms->pgste_bitmap))
			atomic64_inc(&ms->dirty_pages);
	}

out:
	return nappended;
}

static int handle_essa(struct kvm_vcpu *vcpu)
{
	/* entries expected to be 1FF */
	int entries = (vcpu->arch.sie_block->cbrlo & ~PAGE_MASK) >> 3;
	unsigned long *cbrlo;
	struct gmap *gmap;
	int i, orc;

	VCPU_EVENT(vcpu, 4, "ESSA: release %d pages", entries);
	gmap = vcpu->arch.gmap;
	vcpu->stat.instruction_essa++;
	if (!vcpu->kvm->arch.use_cmma)
		return kvm_s390_inject_program_int(vcpu, PGM_OPERATION);

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);
	/* Check for invalid operation request code */
	orc = (vcpu->arch.sie_block->ipb & 0xf0000000) >> 28;
	/* ORCs 0-6 are always valid */
	if (orc > (test_kvm_facility(vcpu->kvm, 147) ? ESSA_SET_STABLE_NODAT
						: ESSA_SET_STABLE_IF_RESIDENT))
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	if (likely(!vcpu->kvm->arch.migration_state)) {
		/*
		 * CMMA is enabled in the KVM settings, but is disabled in
		 * the SIE block and in the mm_context, and we are not doing
		 * a migration. Enable CMMA in the mm_context.
		 * Since we need to take a write lock to write to the context
		 * to avoid races with storage keys handling, we check if the
		 * value really needs to be written to; if the value is
		 * already correct, we do nothing and avoid the lock.
		 */
		if (vcpu->kvm->mm->context.use_cmma == 0) {
			down_write(&vcpu->kvm->mm->mmap_sem);
			vcpu->kvm->mm->context.use_cmma = 1;
			up_write(&vcpu->kvm->mm->mmap_sem);
		}
		/*
		 * If we are here, we are supposed to have CMMA enabled in
		 * the SIE block. Enabling CMMA works on a per-CPU basis,
		 * while the context use_cmma flag is per process.
		 * It's possible that the context flag is enabled and the
		 * SIE flag is not, so we set the flag always; if it was
		 * already set, nothing changes, otherwise we enable it
		 * on this CPU too.
		 */
		vcpu->arch.sie_block->ecb2 |= ECB2_CMMA;
		/* Retry the ESSA instruction */
		kvm_s390_retry_instr(vcpu);
	} else {
		/* Account for the possible extra cbrl entry */
		i = do_essa(vcpu, orc);
		if (i < 0)
			return i;
		entries += i;
	}
	vcpu->arch.sie_block->cbrlo &= PAGE_MASK;	/* reset nceo */
	cbrlo = phys_to_virt(vcpu->arch.sie_block->cbrlo);
	down_read(&gmap->mm->mmap_sem);
	for (i = 0; i < entries; ++i)
		__gmap_zap(gmap, cbrlo[i]);
	up_read(&gmap->mm->mmap_sem);
	return 0;
}

static const intercept_handler_t b9_handlers[256] = {
	[0x8a] = handle_ipte_interlock,
	[0x8d] = handle_epsw,
	[0x8e] = handle_ipte_interlock,
	[0x8f] = handle_ipte_interlock,
	[0xab] = handle_essa,
	[0xaf] = handle_pfmf,
};

int kvm_s390_handle_b9(struct kvm_vcpu *vcpu)
{
	intercept_handler_t handler;

	/* This is handled just as for the B2 instructions. */
	handler = b9_handlers[vcpu->arch.sie_block->ipa & 0x00ff];
	if (handler)
		return handler(vcpu);

	return -EOPNOTSUPP;
}

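/*
 * LOAD CONTROL (32-bit): the control registers are shadowed in the SIE
 * block, so the load only needs a guest memory read followed by a TLB
 * flush request for this vcpu.
 */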
int kvm_s390_handle_lctl(struct kvm_vcpu *vcpu)
{
	int reg1 = (vcpu->arch.sie_block->ipa & 0x00f0) >> 4;
	int reg3 = vcpu->arch.sie_block->ipa & 0x000f;
	int reg, rc, nr_regs;
	u32 ctl_array[16];
	u64 ga;
	u8 ar;

	vcpu->stat.instruction_lctl++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	ga = kvm_s390_get_base_disp_rs(vcpu, &ar);

	if (ga & 3)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	VCPU_EVENT(vcpu, 4, "LCTL: r1:%d, r3:%d, addr: 0x%llx", reg1, reg3, ga);
	trace_kvm_s390_handle_lctl(vcpu, 0, reg1, reg3, ga);

	nr_regs = ((reg3 - reg1) & 0xf) + 1;
	rc = read_guest(vcpu, ga, ar, ctl_array, nr_regs * sizeof(u32));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);
	reg = reg1;
	nr_regs = 0;
	do {
		vcpu->arch.sie_block->gcr[reg] &= 0xffffffff00000000ul;
		vcpu->arch.sie_block->gcr[reg] |= ctl_array[nr_regs++];
		if (reg == reg3)
			break;
		reg = (reg + 1) % 16;
	} while (1);
	kvm_make_request(KVM_REQ_TLB_FLUSH, vcpu);
	return 0;
}

int kvm_s390_handle_stctl(struct kvm_vcpu *vcpu)
{
	int reg1 = (vcpu->arch.sie_block->ipa & 0x00f0) >> 4;
	int reg3 = vcpu->arch.sie_block->ipa & 0x000f;
	int reg, rc, nr_regs;
	u32 ctl_array[16];
	u64 ga;
	u8 ar;

	vcpu->stat.instruction_stctl++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	ga = kvm_s390_get_base_disp_rs(vcpu, &ar);

	if (ga & 3)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	VCPU_EVENT(vcpu, 4, "STCTL r1:%d, r3:%d, addr: 0x%llx", reg1, reg3, ga);
	trace_kvm_s390_handle_stctl(vcpu, 0, reg1, reg3, ga);

	reg = reg1;
	nr_regs = 0;
	do {
		ctl_array[nr_regs++] = vcpu->arch.sie_block->gcr[reg];
		if (reg == reg3)
			break;
		reg = (reg + 1) % 16;
	} while (1);
	rc = write_guest(vcpu, ga, ar, ctl_array, nr_regs * sizeof(u32));
	return rc ? kvm_s390_inject_prog_cond(vcpu, rc) : 0;
}

static int handle_lctlg(struct kvm_vcpu *vcpu)
{
	int reg1 = (vcpu->arch.sie_block->ipa & 0x00f0) >> 4;
	int reg3 = vcpu->arch.sie_block->ipa & 0x000f;
	int reg, rc, nr_regs;
	u64 ctl_array[16];
	u64 ga;
	u8 ar;

	vcpu->stat.instruction_lctlg++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	ga = kvm_s390_get_base_disp_rsy(vcpu, &ar);

	if (ga & 7)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	VCPU_EVENT(vcpu, 4, "LCTLG: r1:%d, r3:%d, addr: 0x%llx", reg1, reg3, ga);
	trace_kvm_s390_handle_lctl(vcpu, 1, reg1, reg3, ga);

	nr_regs = ((reg3 - reg1) & 0xf) + 1;
	rc = read_guest(vcpu, ga, ar, ctl_array, nr_regs * sizeof(u64));
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);
	reg = reg1;
	nr_regs = 0;
	do {
		vcpu->arch.sie_block->gcr[reg] = ctl_array[nr_regs++];
		if (reg == reg3)
			break;
		reg = (reg + 1) % 16;
	} while (1);
	kvm_make_request(KVM_REQ_TLB_FLUSH, vcpu);
	return 0;
}

static int handle_stctg(struct kvm_vcpu *vcpu)
{
	int reg1 = (vcpu->arch.sie_block->ipa & 0x00f0) >> 4;
	int reg3 = vcpu->arch.sie_block->ipa & 0x000f;
	int reg, rc, nr_regs;
	u64 ctl_array[16];
	u64 ga;
	u8 ar;

	vcpu->stat.instruction_stctg++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	ga = kvm_s390_get_base_disp_rsy(vcpu, &ar);

	if (ga & 7)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	VCPU_EVENT(vcpu, 4, "STCTG r1:%d, r3:%d, addr: 0x%llx", reg1, reg3, ga);
	trace_kvm_s390_handle_stctl(vcpu, 1, reg1, reg3, ga);

	reg = reg1;
	nr_regs = 0;
	do {
		ctl_array[nr_regs++] = vcpu->arch.sie_block->gcr[reg];
		if (reg == reg3)
			break;
		reg = (reg + 1) % 16;
	} while (1);
	rc = write_guest(vcpu, ga, ar, ctl_array, nr_regs * sizeof(u64));
	return rc ? kvm_s390_inject_prog_cond(vcpu, rc) : 0;
}

static const intercept_handler_t eb_handlers[256] = {
	[0x2f] = handle_lctlg,
	[0x25] = handle_stctg,
	[0x60] = handle_ri,
	[0x61] = handle_ri,
	[0x62] = handle_ri,
};

int kvm_s390_handle_eb(struct kvm_vcpu *vcpu)
{
	intercept_handler_t handler;

	handler = eb_handlers[vcpu->arch.sie_block->ipb & 0xff];
	if (handler)
		return handler(vcpu);
	return -EOPNOTSUPP;
}

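/*
 * TEST PROTECTION: only the access-key-0 case used by Linux memory
 * detection is handled here; the condition code is derived from the
 * DAT translation result and the writability of the host mapping.
 */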
static int handle_tprot(struct kvm_vcpu *vcpu)
{
	u64 address1, address2;
	unsigned long hva, gpa;
	int ret = 0, cc = 0;
	bool writable;
	u8 ar;

	vcpu->stat.instruction_tprot++;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	kvm_s390_get_base_disp_sse(vcpu, &address1, &address2, &ar, NULL);

	/* we only handle the Linux memory detection case:
	 * access key == 0
	 * everything else goes to userspace. */
	if (address2 & 0xf0)
		return -EOPNOTSUPP;
	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_DAT)
		ipte_lock(vcpu);
	ret = guest_translate_address(vcpu, address1, ar, &gpa, GACC_STORE);
	if (ret == PGM_PROTECTION) {
		/* Write protected? Try again with read-only... */
		cc = 1;
		ret = guest_translate_address(vcpu, address1, ar, &gpa,
					      GACC_FETCH);
	}
	if (ret) {
		if (ret == PGM_ADDRESSING || ret == PGM_TRANSLATION_SPEC) {
			ret = kvm_s390_inject_program_int(vcpu, ret);
		} else if (ret > 0) {
			/* Translation not available */
			kvm_s390_set_psw_cc(vcpu, 3);
			ret = 0;
		}
		goto out_unlock;
	}

	hva = gfn_to_hva_prot(vcpu->kvm, gpa_to_gfn(gpa), &writable);
	if (kvm_is_error_hva(hva)) {
		ret = kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);
	} else {
		if (!writable)
			cc = 1;		/* Write not permitted ==> read-only */
		kvm_s390_set_psw_cc(vcpu, cc);
		/* Note: CC2 only occurs for storage keys (not supported yet) */
	}
out_unlock:
	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_DAT)
		ipte_unlock(vcpu);
	return ret;
}

int kvm_s390_handle_e5(struct kvm_vcpu *vcpu)
{
	/* For e5xx... instructions we only handle TPROT */
	if ((vcpu->arch.sie_block->ipa & 0x00ff) == 0x01)
		return handle_tprot(vcpu);
	return -EOPNOTSUPP;
}

static int handle_sckpf(struct kvm_vcpu *vcpu)
{
	u32 value;

	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

	if (vcpu->run->s.regs.gprs[0] & 0x00000000ffff0000)
		return kvm_s390_inject_program_int(vcpu,
						   PGM_SPECIFICATION);

	value = vcpu->run->s.regs.gprs[0] & 0x000000000000ffff;
	vcpu->arch.sie_block->todpr = value;

	return 0;
}

static int handle_ptff(struct kvm_vcpu *vcpu)
{
	/* we don't emulate any control instructions yet */
	kvm_s390_set_psw_cc(vcpu, 3);
	return 0;
}

static const intercept_handler_t x01_handlers[256] = {
	[0x04] = handle_ptff,
	[0x07] = handle_sckpf,
};

int kvm_s390_handle_01(struct kvm_vcpu *vcpu)
{
	intercept_handler_t handler;

	handler = x01_handlers[vcpu->arch.sie_block->ipa & 0x00ff];
	if (handler)
		return handler(vcpu);
	return -EOPNOTSUPP;
}