2 * This program is free software; you can redistribute it and/or modify
3 * it under the terms of the GNU General Public License, version 2, as
4 * published by the Free Software Foundation.
6 * This program is distributed in the hope that it will be useful,
7 * but WITHOUT ANY WARRANTY; without even the implied warranty of
8 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
9 * GNU General Public License for more details.
11 * You should have received a copy of the GNU General Public License
12 * along with this program; if not, write to the Free Software
13 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
15 * Copyright IBM Corp. 2007
17 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
18 * Christian Ehrhardt <ehrhardt@linux.vnet.ibm.com>
21 #include <linux/errno.h>
22 #include <linux/err.h>
23 #include <linux/kvm_host.h>
24 #include <linux/module.h>
25 #include <linux/vmalloc.h>
26 #include <linux/hrtimer.h>
28 #include <linux/slab.h>
29 #include <asm/cputable.h>
30 #include <asm/uaccess.h>
31 #include <asm/kvm_ppc.h>
32 #include <asm/tlbflush.h>
34 #include "../mm/mmu_decl.h"
36 #define CREATE_TRACE_POINTS
/*
 * Report whether a vcpu may run.
 *
 * Returns non-zero when the guest MSR (read through v->arch.shared) does
 * not have MSR_WE set, or when any bit is set in
 * v->arch.pending_exceptions; returns 0 otherwise.
 */
39 int kvm_arch_vcpu_runnable(struct kvm_vcpu *v)
41 return !(v->arch.shared->msr & MSR_WE) ||
42 !!(v->arch.pending_exceptions);
/*
 * Service a KVM paravirtual request issued by the guest.
 *
 * The request number is read from guest GPR 11 and up to four arguments
 * from guest GPRs 3-6.  A secondary result (r2) is written back to guest
 * GPR 4.  The visible request codes are
 * HC_VENDOR_KVM | KVM_HC_PPC_MAP_MAGIC_PAGE and
 * HC_VENDOR_KVM | KVM_HC_FEATURES; HC_EV_UNIMPLEMENTED is used as a
 * result on at least one path.
 * NOTE(review): the dispatch statement, the body of the MSR_SF check,
 * the declarations of r/r2 and the return statement are not visible
 * here -- confirm against the full function.
 */
45 int kvmppc_kvm_pv(struct kvm_vcpu *vcpu)
47 int nr = kvmppc_get_gpr(vcpu, 11);
/* Arguments are marked __maybe_unused because not every request reads them. */
49 unsigned long __maybe_unused param1 = kvmppc_get_gpr(vcpu, 3);
50 unsigned long __maybe_unused param2 = kvmppc_get_gpr(vcpu, 4);
51 unsigned long __maybe_unused param3 = kvmppc_get_gpr(vcpu, 5);
52 unsigned long __maybe_unused param4 = kvmppc_get_gpr(vcpu, 6);
/* Taken when the guest MSR does not have MSR_SF set. */
55 if (!(vcpu->arch.shared->msr & MSR_SF)) {
64 case HC_VENDOR_KVM | KVM_HC_PPC_MAP_MAGIC_PAGE:
/* Record the first two arguments as the magic page's pa and ea. */
66 vcpu->arch.magic_page_pa = param1;
67 vcpu->arch.magic_page_ea = param2;
69 r2 = KVM_MAGIC_FEAT_SR;
74 case HC_VENDOR_KVM | KVM_HC_FEATURES:
76 #if defined(CONFIG_PPC_BOOK3S) /* XXX Missing magic page on BookE */
/* Advertise the magic page feature bit in the secondary result. */
77 r2 |= (1 << KVM_FEATURE_MAGIC_PAGE);
80 /* Second return value is in r4 */
83 r = HC_EV_UNIMPLEMENTED;
/* Hand the secondary result back to the guest in GPR 4. */
87 kvmppc_set_gpr(vcpu, 4, r2);
/*
 * Run kvmppc_emulate_instruction() for this vcpu and act on its result.
 *
 * Visible outcomes: for EMULATE_DO_MMIO, run->exit_reason is set to
 * KVM_EXIT_MMIO; one path logs "emulation failed" at KERN_EMERG together
 * with the value returned by kvmppc_get_last_inst().
 * NOTE(review): the remaining result cases and every return statement
 * are not visible here -- confirm against the full function.
 */
92 int kvmppc_emulate_mmio(struct kvm_run *run, struct kvm_vcpu *vcpu)
94 enum emulation_result er;
97 er = kvmppc_emulate_instruction(run, vcpu);
100 /* Future optimization: only reload non-volatiles if they were
101 * actually modified. */
104 case EMULATE_DO_MMIO:
/* Tell the caller that this exit is an MMIO exit. */
105 run->exit_reason = KVM_EXIT_MMIO;
106 /* We must reload nonvolatiles because "update" load/store
107 * instructions modify register state. */
108 /* Future optimization: only reload non-volatiles if they were
109 * actually modified. */
113 /* XXX Deliver Program interrupt to guest. */
114 printk(KERN_EMERG "%s: emulation failed (%08x)\n", __func__,
115 kvmppc_get_last_inst(vcpu));
125 int kvm_arch_hardware_enable(void *garbage)
130 void kvm_arch_hardware_disable(void *garbage)
134 int kvm_arch_hardware_setup(void)
139 void kvm_arch_hardware_unsetup(void)
/*
 * Store the result of kvmppc_core_check_processor_compat() into the int
 * that rtn points to.  rtn is passed as void * and cast to int * here.
 */
143 void kvm_arch_check_processor_compat(void *rtn)
145 *(int *)rtn = kvmppc_core_check_processor_compat();
148 int kvm_arch_init_vm(struct kvm *kvm)
/*
 * Tear down the vcpus of a VM.
 *
 * Every vcpu yielded by kvm_for_each_vcpu() is released with
 * kvm_arch_vcpu_free().  Then, with kvm->lock held, the first
 * online_vcpus entries of kvm->vcpus[] are set to NULL and
 * kvm->online_vcpus is reset to 0.
 */
153 void kvm_arch_destroy_vm(struct kvm *kvm)
156 struct kvm_vcpu *vcpu;
158 kvm_for_each_vcpu(i, vcpu, kvm)
159 kvm_arch_vcpu_free(vcpu);
/* Clear the now-stale vcpu pointers and the counter under the VM lock. */
161 mutex_lock(&kvm->lock);
162 for (i = 0; i < atomic_read(&kvm->online_vcpus); i++)
163 kvm->vcpus[i] = NULL;
165 atomic_set(&kvm->online_vcpus, 0);
166 mutex_unlock(&kvm->lock);
169 void kvm_arch_sync_events(struct kvm *kvm)
/*
 * Answer a capability query for extension number ext.
 *
 * The capabilities listed together below share one result.
 * KVM_CAP_COALESCED_MMIO reports KVM_COALESCED_MMIO_PAGE_OFFSET.
 * NOTE(review): the value assigned for the grouped capabilities, the
 * default case and the return statement are not visible here.
 */
173 int kvm_dev_ioctl_check_extension(long ext)
178 case KVM_CAP_PPC_SEGSTATE:
179 case KVM_CAP_PPC_PAIRED_SINGLES:
180 case KVM_CAP_PPC_UNSET_IRQ:
181 case KVM_CAP_PPC_IRQ_LEVEL:
182 case KVM_CAP_ENABLE_CAP:
183 case KVM_CAP_PPC_OSI:
184 case KVM_CAP_PPC_GET_PVINFO:
187 case KVM_CAP_COALESCED_MMIO:
188 r = KVM_COALESCED_MMIO_PAGE_OFFSET;
198 long kvm_arch_dev_ioctl(struct file *filp,
199 unsigned int ioctl, unsigned long arg)
204 int kvm_arch_prepare_memory_region(struct kvm *kvm,
205 struct kvm_memory_slot *memslot,
206 struct kvm_memory_slot old,
207 struct kvm_userspace_memory_region *mem,
213 void kvm_arch_commit_memory_region(struct kvm *kvm,
214 struct kvm_userspace_memory_region *mem,
215 struct kvm_memory_slot old,
222 void kvm_arch_flush_shadow(struct kvm *kvm)
/*
 * Create vcpu number id for this VM through kvmppc_core_vcpu_create()
 * and register its debugfs entries with kvmppc_create_vcpu_debugfs().
 * NOTE(review): any check of the creation result between the two calls,
 * and the return statement, are not visible here.
 */
226 struct kvm_vcpu *kvm_arch_vcpu_create(struct kvm *kvm, unsigned int id)
228 struct kvm_vcpu *vcpu;
229 vcpu = kvmppc_core_vcpu_create(kvm, id);
231 kvmppc_create_vcpu_debugfs(vcpu, id);
/*
 * Release a vcpu.
 *
 * The decrementer hrtimer is cancelled and the tasklet killed first, so
 * neither can still touch the vcpu; the debugfs entries are then removed
 * and the vcpu is handed to kvmppc_core_vcpu_free().
 */
235 void kvm_arch_vcpu_free(struct kvm_vcpu *vcpu)
237 /* Make sure we're not using the vcpu anymore */
238 hrtimer_cancel(&vcpu->arch.dec_timer);
239 tasklet_kill(&vcpu->arch.tasklet);
241 kvmppc_remove_vcpu_debugfs(vcpu);
242 kvmppc_core_vcpu_free(vcpu);
/* Destroy a vcpu; this simply forwards to kvm_arch_vcpu_free(). */
245 void kvm_arch_vcpu_destroy(struct kvm_vcpu *vcpu)
247 kvm_arch_vcpu_free(vcpu);
/*
 * Report whether the vcpu has a timer event pending; the answer is
 * whatever kvmppc_core_pending_dec() returns for it.
 */
250 int kvm_cpu_has_pending_timer(struct kvm_vcpu *vcpu)
252 return kvmppc_core_pending_dec(vcpu);
/*
 * Tasklet body for the decrementer (registered by kvm_arch_vcpu_init()).
 *
 * data is the owning vcpu pointer cast to unsigned long.  A decrementer
 * event is queued with kvmppc_core_queue_dec(); if anything is waiting
 * on vcpu->wq it is woken and the halt_wakeup statistic is incremented.
 */
255 static void kvmppc_decrementer_func(unsigned long data)
257 struct kvm_vcpu *vcpu = (struct kvm_vcpu *)data;
259 kvmppc_core_queue_dec(vcpu);
/* Only wake (and count a wakeup) when there is a waiter. */
261 if (waitqueue_active(&vcpu->wq)) {
262 wake_up_interruptible(&vcpu->wq);
263 vcpu->stat.halt_wakeup++;
268 * low level hrtimer wake routine. Because this runs in hardirq context
269 * we schedule a tasklet to do the real work.
/*
 * timer is the dec_timer embedded in a vcpu's arch state; the owning
 * vcpu is recovered with container_of() and its tasklet is scheduled.
 * Returns HRTIMER_NORESTART, so the timer is not re-armed from here.
 */
271 enum hrtimer_restart kvmppc_decrementer_wakeup(struct hrtimer *timer)
273 struct kvm_vcpu *vcpu;
275 vcpu = container_of(timer, struct kvm_vcpu, arch.dec_timer);
276 tasklet_schedule(&vcpu->arch.tasklet);
278 return HRTIMER_NORESTART;
/*
 * Set up the per-vcpu decrementer machinery.
 *
 * The hrtimer is initialised on CLOCK_REALTIME in absolute mode with
 * kvmppc_decrementer_wakeup() as its callback, and the tasklet is bound
 * to kvmppc_decrementer_func() with the vcpu pointer as its argument.
 * NOTE(review): the return statement is not visible here.
 */
281 int kvm_arch_vcpu_init(struct kvm_vcpu *vcpu)
283 hrtimer_init(&vcpu->arch.dec_timer, CLOCK_REALTIME, HRTIMER_MODE_ABS);
284 tasklet_init(&vcpu->arch.tasklet, kvmppc_decrementer_func, (ulong)vcpu);
285 vcpu->arch.dec_timer.function = kvmppc_decrementer_wakeup;
/* Undo per-vcpu setup; the visible work is a call to kvmppc_mmu_destroy(). */
290 void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu)
292 kvmppc_mmu_destroy(vcpu);
/* Forward the vcpu and cpu number to kvmppc_core_vcpu_load(). */
295 void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu)
297 kvmppc_core_vcpu_load(vcpu, cpu);
/* Counterpart of kvm_arch_vcpu_load(); forwards to kvmppc_core_vcpu_put(). */
300 void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu)
302 kvmppc_core_vcpu_put(vcpu);
305 int kvm_arch_vcpu_ioctl_set_guest_debug(struct kvm_vcpu *vcpu,
306 struct kvm_guest_debug *dbg)
/*
 * Complete a DCR load: write run->dcr.data into the guest register
 * recorded in vcpu->arch.io_gpr.
 * NOTE(review): the second parameter line (declaring run) is not visible
 * here.
 */
311 static void kvmppc_complete_dcr_load(struct kvm_vcpu *vcpu,
314 kvmppc_set_gpr(vcpu, vcpu->arch.io_gpr, run->dcr.data);
/*
 * Complete an MMIO load: take the bytes found in run->mmio.data and
 * deliver them to the register recorded in vcpu->arch.io_gpr.
 *
 * Lengths larger than a u64 are reported with an error message.  The
 * value is read with the width given by run->mmio.len, either directly
 * (mmio_is_bigendian set) or through ld_le32()/ld_le16(), and is
 * post-processed when vcpu->arch.mmio_sign_extend is set.  The
 * destination is then chosen from the bits of io_gpr selected by
 * KVM_REG_EXT_MASK: a GPR, fpr[], qpr[], or both fpr[] and qpr[].
 * NOTE(review): the second parameter line, the sign-extension cases and
 * the switch labels are not visible here -- confirm against the full
 * function.
 */
317 static void kvmppc_complete_mmio_load(struct kvm_vcpu *vcpu,
320 u64 uninitialized_var(gpr);
/* Lengths that cannot fit in gpr are reported as an error. */
322 if (run->mmio.len > sizeof(gpr)) {
323 printk(KERN_ERR "bad MMIO length: %d\n", run->mmio.len);
327 if (vcpu->arch.mmio_is_bigendian) {
/* Read the value directly at the requested width. */
328 switch (run->mmio.len) {
329 case 8: gpr = *(u64 *)run->mmio.data; break;
330 case 4: gpr = *(u32 *)run->mmio.data; break;
331 case 2: gpr = *(u16 *)run->mmio.data; break;
332 case 1: gpr = *(u8 *)run->mmio.data; break;
335 /* Convert BE data from userland back to LE. */
/*
 * NOTE(review): no 8-byte case is visible on this path, so gpr appears
 * to stay unset for an 8-byte little-endian load -- confirm.
 */
336 switch (run->mmio.len) {
337 case 4: gpr = ld_le32((u32 *)run->mmio.data); break;
338 case 2: gpr = ld_le16((u16 *)run->mmio.data); break;
339 case 1: gpr = *(u8 *)run->mmio.data; break;
343 if (vcpu->arch.mmio_sign_extend) {
344 switch (run->mmio.len) {
/*
 * NOTE(review): this call passes io_gpr unmasked and is repeated by the
 * first arm of the switch below, while the other arms mask io_gpr with
 * KVM_REG_MASK before indexing -- confirm that the unconditional call is
 * intended when io_gpr carries KVM_REG_EXT_MASK bits.
 */
359 kvmppc_set_gpr(vcpu, vcpu->arch.io_gpr, gpr);
/* Route the value according to the KVM_REG_EXT_MASK bits of io_gpr. */
361 switch (vcpu->arch.io_gpr & KVM_REG_EXT_MASK) {
363 kvmppc_set_gpr(vcpu, vcpu->arch.io_gpr, gpr);
366 vcpu->arch.fpr[vcpu->arch.io_gpr & KVM_REG_MASK] = gpr;
368 #ifdef CONFIG_PPC_BOOK3S
370 vcpu->arch.qpr[vcpu->arch.io_gpr & KVM_REG_MASK] = gpr;
/* This arm writes the same value to both the fpr and the qpr slot. */
373 vcpu->arch.fpr[vcpu->arch.io_gpr & KVM_REG_MASK] = gpr;
374 vcpu->arch.qpr[vcpu->arch.io_gpr & KVM_REG_MASK] = gpr;
/*
 * Describe an MMIO load in run->mmio so it can be completed later.
 *
 * rt is the destination register number, bytes the access width and
 * is_bigendian the byte order to apply on completion.  Widths larger
 * than run->mmio.data are reported with an error message.  The access
 * address is taken from vcpu->arch.paddr_accessed, and the vcpu is
 * marked as having an MMIO read pending without sign extension.
 * Returns EMULATE_DO_MMIO.
 * NOTE(review): the tail of the error branch is not visible here.
 */
382 int kvmppc_handle_load(struct kvm_run *run, struct kvm_vcpu *vcpu,
383 unsigned int rt, unsigned int bytes, int is_bigendian)
385 if (bytes > sizeof(run->mmio.data)) {
386 printk(KERN_ERR "%s: bad MMIO length: %d\n", __func__,
/* Fill in the MMIO request description. */
390 run->mmio.phys_addr = vcpu->arch.paddr_accessed;
391 run->mmio.len = bytes;
392 run->mmio.is_write = 0;
/* Remember where and how the loaded value must be delivered. */
394 vcpu->arch.io_gpr = rt;
395 vcpu->arch.mmio_is_bigendian = is_bigendian;
396 vcpu->mmio_needed = 1;
397 vcpu->mmio_is_write = 0;
398 vcpu->arch.mmio_sign_extend = 0;
400 return EMULATE_DO_MMIO;
403 /* Same as above, but sign extends */
/*
 * Delegates to kvmppc_handle_load() with the same arguments, then sets
 * vcpu->arch.mmio_sign_extend to 1 (the delegate had cleared it).
 * NOTE(review): the declaration of r and the return statement are not
 * visible here.
 */
404 int kvmppc_handle_loads(struct kvm_run *run, struct kvm_vcpu *vcpu,
405 unsigned int rt, unsigned int bytes, int is_bigendian)
409 r = kvmppc_handle_load(run, vcpu, rt, bytes, is_bigendian);
410 vcpu->arch.mmio_sign_extend = 1;
/*
 * Describe an MMIO store in run->mmio and place the value to be written
 * into run->mmio.data.
 *
 * val is the value, bytes the access width and is_bigendian the byte
 * order.  Widths larger than run->mmio.data are reported with an error
 * message.  The value is stored either directly at the requested width
 * or through st_le32()/st_le16().  Returns EMULATE_DO_MMIO.
 * NOTE(review): the tail of the error branch and the statements that
 * select between the two store paths are not visible here; no 8-byte
 * case is visible on the st_le path.
 */
415 int kvmppc_handle_store(struct kvm_run *run, struct kvm_vcpu *vcpu,
416 u64 val, unsigned int bytes, int is_bigendian)
418 void *data = run->mmio.data;
420 if (bytes > sizeof(run->mmio.data)) {
421 printk(KERN_ERR "%s: bad MMIO length: %d\n", __func__,
/* Fill in the MMIO request description and mark a write as pending. */
425 run->mmio.phys_addr = vcpu->arch.paddr_accessed;
426 run->mmio.len = bytes;
427 run->mmio.is_write = 1;
428 vcpu->mmio_needed = 1;
429 vcpu->mmio_is_write = 1;
431 /* Store the value at the lowest bytes in 'data'. */
434 case 8: *(u64 *)data = val; break;
435 case 4: *(u32 *)data = val; break;
436 case 2: *(u16 *)data = val; break;
437 case 1: *(u8 *)data = val; break;
440 /* Store LE value into 'data'. */
442 case 4: st_le32(data, val); break;
443 case 2: st_le16(data, val); break;
444 case 1: *(u8 *)data = val; break;
448 return EMULATE_DO_MMIO;
/*
 * Run a vcpu.
 *
 * Any operation flagged as pending (mmio_needed, dcr_needed or
 * osi_needed) is completed first, then interrupts are delivered with
 * kvmppc_core_deliver_interrupts() and __kvmppc_vcpu_run() is called.
 * When vcpu->sigset_active is set, the vcpu's signal mask is installed
 * for the duration and the previous mask is restored afterwards.
 * NOTE(review): local declarations, the statements surrounding the
 * __kvmppc_vcpu_run() call and the return statement are not visible
 * here.
 */
451 int kvm_arch_vcpu_ioctl_run(struct kvm_vcpu *vcpu, struct kvm_run *run)
/* Install the vcpu's signal mask, saving the current one in sigsaved. */
456 if (vcpu->sigset_active)
457 sigprocmask(SIG_SETMASK, &vcpu->sigset, &sigsaved);
/* Only loads need completing; a pending write just clears its flag. */
459 if (vcpu->mmio_needed) {
460 if (!vcpu->mmio_is_write)
461 kvmppc_complete_mmio_load(vcpu, run);
462 vcpu->mmio_needed = 0;
463 } else if (vcpu->arch.dcr_needed) {
464 if (!vcpu->arch.dcr_is_write)
465 kvmppc_complete_dcr_load(vcpu, run);
466 vcpu->arch.dcr_needed = 0;
467 } else if (vcpu->arch.osi_needed) {
/* Copy all 32 values from run->osi.gprs into the guest GPRs. */
468 u64 *gprs = run->osi.gprs;
471 for (i = 0; i < 32; i++)
472 kvmppc_set_gpr(vcpu, i, gprs[i]);
473 vcpu->arch.osi_needed = 0;
476 kvmppc_core_deliver_interrupts(vcpu);
480 r = __kvmppc_vcpu_run(run, vcpu);
/* Put back the signal mask that was saved on entry. */
484 if (vcpu->sigset_active)
485 sigprocmask(SIG_SETMASK, &sigsaved, NULL);
/*
 * Apply an external-interrupt request to a vcpu.
 *
 * irq->irq == KVM_INTERRUPT_UNSET dequeues the external interrupt with
 * kvmppc_core_dequeue_external(); kvmppc_core_queue_external() queues
 * it.  If anything is waiting on vcpu->wq it is woken and the
 * halt_wakeup statistic is incremented.
 * NOTE(review): the line between the two calls is not visible here
 * (presumably an else), nor is the return statement.
 */
490 int kvm_vcpu_ioctl_interrupt(struct kvm_vcpu *vcpu, struct kvm_interrupt *irq)
492 if (irq->irq == KVM_INTERRUPT_UNSET)
493 kvmppc_core_dequeue_external(vcpu, irq);
495 kvmppc_core_queue_external(vcpu, irq);
497 if (waitqueue_active(&vcpu->wq)) {
498 wake_up_interruptible(&vcpu->wq);
499 vcpu->stat.halt_wakeup++;
/*
 * Enable an optional capability on a vcpu.
 *
 * The only visible case is KVM_CAP_PPC_OSI, which sets
 * vcpu->arch.osi_enabled to true.
 * NOTE(review): argument validation, the dispatch statement, the default
 * case and the return value are not visible here.
 */
505 static int kvm_vcpu_ioctl_enable_cap(struct kvm_vcpu *vcpu,
506 struct kvm_enable_cap *cap)
514 case KVM_CAP_PPC_OSI:
516 vcpu->arch.osi_enabled = true;
526 int kvm_arch_vcpu_ioctl_get_mpstate(struct kvm_vcpu *vcpu,
527 struct kvm_mp_state *mp_state)
532 int kvm_arch_vcpu_ioctl_set_mpstate(struct kvm_vcpu *vcpu,
533 struct kvm_mp_state *mp_state)
/*
 * Arch-specific vcpu ioctl dispatcher.
 *
 * The vcpu comes from filp->private_data and arg is treated as a user
 * pointer.  KVM_INTERRUPT copies a struct kvm_interrupt from user space
 * and passes it to kvm_vcpu_ioctl_interrupt(); a second case copies a
 * struct kvm_enable_cap and passes it to kvm_vcpu_ioctl_enable_cap().
 * NOTE(review): the label of the second case, the copy-failure handling
 * and the return statement are not visible here.
 */
538 long kvm_arch_vcpu_ioctl(struct file *filp,
539 unsigned int ioctl, unsigned long arg)
541 struct kvm_vcpu *vcpu = filp->private_data;
542 void __user *argp = (void __user *)arg;
546 case KVM_INTERRUPT: {
547 struct kvm_interrupt irq;
549 if (copy_from_user(&irq, argp, sizeof(irq)))
551 r = kvm_vcpu_ioctl_interrupt(vcpu, &irq);
557 struct kvm_enable_cap cap;
559 if (copy_from_user(&cap, argp, sizeof(cap)))
561 r = kvm_vcpu_ioctl_enable_cap(vcpu, &cap);
/*
 * Fill pvinfo->hcall[] with the four 32-bit instruction words of the
 * guest's hypercall sequence: a lis and an ori carrying the upper and
 * lower 16 bits of KVM_SC_MAGIC_R0, followed by sc and nop.
 * NOTE(review): the return statement is not visible here.
 */
572 static int kvm_vm_ioctl_get_pvinfo(struct kvm_ppc_pvinfo *pvinfo)
/* Opcode templates; the immediate is OR-ed into the low 16 bits. */
574 u32 inst_lis = 0x3c000000;
575 u32 inst_ori = 0x60000000;
576 u32 inst_nop = 0x60000000;
577 u32 inst_sc = 0x44000002;
578 u32 inst_imm_mask = 0xffff;
/*
 * NOTE(review): the listing below shows three operands for lis and two
 * for ori, which looks swapped.  The templates above leave all register
 * fields zero, so the emitted words presumably correspond to
 * "lis r0, KVM_SC_MAGIC_R0@h" and "ori r0, r0, KVM_SC_MAGIC_R0@l" --
 * confirm against the Power ISA.
 */
581 * The hypercall to get into KVM from within guest context is as
584 * lis r0, r0, KVM_SC_MAGIC_R0@h
585 * ori r0, KVM_SC_MAGIC_R0@l
589 pvinfo->hcall[0] = inst_lis | ((KVM_SC_MAGIC_R0 >> 16) & inst_imm_mask);
590 pvinfo->hcall[1] = inst_ori | (KVM_SC_MAGIC_R0 & inst_imm_mask);
591 pvinfo->hcall[2] = inst_sc;
592 pvinfo->hcall[3] = inst_nop;
/*
 * Arch-specific VM ioctl dispatcher.
 *
 * The only visible case is KVM_PPC_GET_PVINFO: a zeroed struct
 * kvm_ppc_pvinfo is filled by kvm_vm_ioctl_get_pvinfo() and copied to
 * the user pointer derived from arg.
 * NOTE(review): the copy to user space directly follows the fill call,
 * with no visible check of r in between.  The copy-failure handling,
 * the default case and the return statement are not visible here.
 */
597 long kvm_arch_vm_ioctl(struct file *filp,
598 unsigned int ioctl, unsigned long arg)
600 void __user *argp = (void __user *)arg;
604 case KVM_PPC_GET_PVINFO: {
605 struct kvm_ppc_pvinfo pvinfo;
/* Zero first so no uninitialised stack bytes can reach user space. */
606 memset(&pvinfo, 0, sizeof(pvinfo));
607 r = kvm_vm_ioctl_get_pvinfo(&pvinfo);
608 if (copy_to_user(argp, &pvinfo, sizeof(pvinfo))) {
623 int kvm_arch_init(void *opaque)
628 void kvm_arch_exit(void)