161491cf4SDavid Woodhouse /* 261491cf4SDavid Woodhouse * Xen HVM emulation support in KVM 361491cf4SDavid Woodhouse * 461491cf4SDavid Woodhouse * Copyright © 2019 Oracle and/or its affiliates. All rights reserved. 561491cf4SDavid Woodhouse * Copyright © 2022 Amazon.com, Inc. or its affiliates. All Rights Reserved. 661491cf4SDavid Woodhouse * 761491cf4SDavid Woodhouse * This work is licensed under the terms of the GNU GPL, version 2 or later. 861491cf4SDavid Woodhouse * See the COPYING file in the top-level directory. 961491cf4SDavid Woodhouse * 1061491cf4SDavid Woodhouse */ 1161491cf4SDavid Woodhouse 1261491cf4SDavid Woodhouse #include "qemu/osdep.h" 1355a3f666SJoao Martins #include "qemu/log.h" 1479b7067dSJoao Martins #include "qemu/main-loop.h" 15fb0fd2ceSJoao Martins #include "hw/xen/xen.h" 1661491cf4SDavid Woodhouse #include "sysemu/kvm_int.h" 1761491cf4SDavid Woodhouse #include "sysemu/kvm_xen.h" 1861491cf4SDavid Woodhouse #include "kvm/kvm_i386.h" 19bedcc139SJoao Martins #include "exec/address-spaces.h" 2061491cf4SDavid Woodhouse #include "xen-emu.h" 2155a3f666SJoao Martins #include "trace.h" 2279b7067dSJoao Martins #include "sysemu/runstate.h" 2361491cf4SDavid Woodhouse 24110a0ea5SDavid Woodhouse #include "hw/i386/kvm/xen_overlay.h" 25110a0ea5SDavid Woodhouse 26bedcc139SJoao Martins #include "hw/xen/interface/version.h" 2779b7067dSJoao Martins #include "hw/xen/interface/sched.h" 28fb0fd2ceSJoao Martins #include "hw/xen/interface/memory.h" 29fb0fd2ceSJoao Martins 30fb0fd2ceSJoao Martins #include "xen-compat.h" 31fb0fd2ceSJoao Martins 32fb0fd2ceSJoao Martins #ifdef TARGET_X86_64 33fb0fd2ceSJoao Martins #define hypercall_compat32(longmode) (!(longmode)) 34fb0fd2ceSJoao Martins #else 35fb0fd2ceSJoao Martins #define hypercall_compat32(longmode) (false) 36fb0fd2ceSJoao Martins #endif 37bedcc139SJoao Martins 38bedcc139SJoao Martins static int kvm_gva_rw(CPUState *cs, uint64_t gva, void *_buf, size_t sz, 39bedcc139SJoao Martins bool is_write) 40bedcc139SJoao Martins { 41bedcc139SJoao Martins uint8_t *buf = (uint8_t *)_buf; 42bedcc139SJoao Martins int ret; 43bedcc139SJoao Martins 44bedcc139SJoao Martins while (sz) { 45bedcc139SJoao Martins struct kvm_translation tr = { 46bedcc139SJoao Martins .linear_address = gva, 47bedcc139SJoao Martins }; 48bedcc139SJoao Martins 49bedcc139SJoao Martins size_t len = TARGET_PAGE_SIZE - (tr.linear_address & ~TARGET_PAGE_MASK); 50bedcc139SJoao Martins if (len > sz) { 51bedcc139SJoao Martins len = sz; 52bedcc139SJoao Martins } 53bedcc139SJoao Martins 54bedcc139SJoao Martins ret = kvm_vcpu_ioctl(cs, KVM_TRANSLATE, &tr); 55bedcc139SJoao Martins if (ret || !tr.valid || (is_write && !tr.writeable)) { 56bedcc139SJoao Martins return -EFAULT; 57bedcc139SJoao Martins } 58bedcc139SJoao Martins 59bedcc139SJoao Martins cpu_physical_memory_rw(tr.physical_address, buf, len, is_write); 60bedcc139SJoao Martins 61bedcc139SJoao Martins buf += len; 62bedcc139SJoao Martins sz -= len; 63bedcc139SJoao Martins gva += len; 64bedcc139SJoao Martins } 65bedcc139SJoao Martins 66bedcc139SJoao Martins return 0; 67bedcc139SJoao Martins } 68bedcc139SJoao Martins 69bedcc139SJoao Martins static inline int kvm_copy_from_gva(CPUState *cs, uint64_t gva, void *buf, 70bedcc139SJoao Martins size_t sz) 71bedcc139SJoao Martins { 72bedcc139SJoao Martins return kvm_gva_rw(cs, gva, buf, sz, false); 73bedcc139SJoao Martins } 74bedcc139SJoao Martins 75bedcc139SJoao Martins static inline int kvm_copy_to_gva(CPUState *cs, uint64_t gva, void *buf, 76bedcc139SJoao Martins size_t sz) 77bedcc139SJoao Martins { 78bedcc139SJoao Martins return kvm_gva_rw(cs, gva, buf, sz, true); 79bedcc139SJoao Martins } 80bedcc139SJoao Martins 81f66b8a83SJoao Martins int kvm_xen_init(KVMState *s, uint32_t hypercall_msr) 8261491cf4SDavid Woodhouse { 8361491cf4SDavid Woodhouse const int required_caps = KVM_XEN_HVM_CONFIG_HYPERCALL_MSR | 8461491cf4SDavid Woodhouse KVM_XEN_HVM_CONFIG_INTERCEPT_HCALL | KVM_XEN_HVM_CONFIG_SHARED_INFO; 8561491cf4SDavid Woodhouse struct kvm_xen_hvm_config cfg = { 86f66b8a83SJoao Martins .msr = hypercall_msr, 8761491cf4SDavid Woodhouse .flags = KVM_XEN_HVM_CONFIG_INTERCEPT_HCALL, 8861491cf4SDavid Woodhouse }; 8961491cf4SDavid Woodhouse int xen_caps, ret; 9061491cf4SDavid Woodhouse 9161491cf4SDavid Woodhouse xen_caps = kvm_check_extension(s, KVM_CAP_XEN_HVM); 9261491cf4SDavid Woodhouse if (required_caps & ~xen_caps) { 9361491cf4SDavid Woodhouse error_report("kvm: Xen HVM guest support not present or insufficient"); 9461491cf4SDavid Woodhouse return -ENOSYS; 9561491cf4SDavid Woodhouse } 9661491cf4SDavid Woodhouse 9761491cf4SDavid Woodhouse if (xen_caps & KVM_XEN_HVM_CONFIG_EVTCHN_SEND) { 9861491cf4SDavid Woodhouse struct kvm_xen_hvm_attr ha = { 9961491cf4SDavid Woodhouse .type = KVM_XEN_ATTR_TYPE_XEN_VERSION, 10061491cf4SDavid Woodhouse .u.xen_version = s->xen_version, 10161491cf4SDavid Woodhouse }; 10261491cf4SDavid Woodhouse (void)kvm_vm_ioctl(s, KVM_XEN_HVM_SET_ATTR, &ha); 10361491cf4SDavid Woodhouse 10461491cf4SDavid Woodhouse cfg.flags |= KVM_XEN_HVM_CONFIG_EVTCHN_SEND; 10561491cf4SDavid Woodhouse } 10661491cf4SDavid Woodhouse 10761491cf4SDavid Woodhouse ret = kvm_vm_ioctl(s, KVM_XEN_HVM_CONFIG, &cfg); 10861491cf4SDavid Woodhouse if (ret < 0) { 10961491cf4SDavid Woodhouse error_report("kvm: Failed to enable Xen HVM support: %s", 11061491cf4SDavid Woodhouse strerror(-ret)); 11161491cf4SDavid Woodhouse return ret; 11261491cf4SDavid Woodhouse } 11361491cf4SDavid Woodhouse 11461491cf4SDavid Woodhouse s->xen_caps = xen_caps; 11561491cf4SDavid Woodhouse return 0; 11661491cf4SDavid Woodhouse } 11761491cf4SDavid Woodhouse 1185e691a95SDavid Woodhouse int kvm_xen_init_vcpu(CPUState *cs) 1195e691a95SDavid Woodhouse { 1205e691a95SDavid Woodhouse int err; 1215e691a95SDavid Woodhouse 1225e691a95SDavid Woodhouse /* 1235e691a95SDavid Woodhouse * The kernel needs to know the Xen/ACPI vCPU ID because that's 1245e691a95SDavid Woodhouse * what the guest uses in hypercalls such as timers. It doesn't 1255e691a95SDavid Woodhouse * match the APIC ID which is generally used for talking to the 1265e691a95SDavid Woodhouse * kernel about vCPUs. And if vCPU threads race with creating 1275e691a95SDavid Woodhouse * their KVM vCPUs out of order, it doesn't necessarily match 1285e691a95SDavid Woodhouse * with the kernel's internal vCPU indices either. 1295e691a95SDavid Woodhouse */ 1305e691a95SDavid Woodhouse if (kvm_xen_has_cap(EVTCHN_SEND)) { 1315e691a95SDavid Woodhouse struct kvm_xen_vcpu_attr va = { 1325e691a95SDavid Woodhouse .type = KVM_XEN_VCPU_ATTR_TYPE_VCPU_ID, 1335e691a95SDavid Woodhouse .u.vcpu_id = cs->cpu_index, 1345e691a95SDavid Woodhouse }; 1355e691a95SDavid Woodhouse err = kvm_vcpu_ioctl(cs, KVM_XEN_VCPU_SET_ATTR, &va); 1365e691a95SDavid Woodhouse if (err) { 1375e691a95SDavid Woodhouse error_report("kvm: Failed to set Xen vCPU ID attribute: %s", 1385e691a95SDavid Woodhouse strerror(-err)); 1395e691a95SDavid Woodhouse return err; 1405e691a95SDavid Woodhouse } 1415e691a95SDavid Woodhouse } 1425e691a95SDavid Woodhouse 1435e691a95SDavid Woodhouse return 0; 1445e691a95SDavid Woodhouse } 1455e691a95SDavid Woodhouse 14661491cf4SDavid Woodhouse uint32_t kvm_xen_get_caps(void) 14761491cf4SDavid Woodhouse { 14861491cf4SDavid Woodhouse return kvm_state->xen_caps; 14961491cf4SDavid Woodhouse } 15055a3f666SJoao Martins 151bedcc139SJoao Martins static bool kvm_xen_hcall_xen_version(struct kvm_xen_exit *exit, X86CPU *cpu, 152bedcc139SJoao Martins int cmd, uint64_t arg) 153bedcc139SJoao Martins { 154bedcc139SJoao Martins int err = 0; 155bedcc139SJoao Martins 156bedcc139SJoao Martins switch (cmd) { 157bedcc139SJoao Martins case XENVER_get_features: { 158bedcc139SJoao Martins struct xen_feature_info fi; 159bedcc139SJoao Martins 160bedcc139SJoao Martins /* No need for 32/64 compat handling */ 161bedcc139SJoao Martins qemu_build_assert(sizeof(fi) == 8); 162bedcc139SJoao Martins 163bedcc139SJoao Martins err = kvm_copy_from_gva(CPU(cpu), arg, &fi, sizeof(fi)); 164bedcc139SJoao Martins if (err) { 165bedcc139SJoao Martins break; 166bedcc139SJoao Martins } 167bedcc139SJoao Martins 168bedcc139SJoao Martins fi.submap = 0; 169bedcc139SJoao Martins if (fi.submap_idx == 0) { 170bedcc139SJoao Martins fi.submap |= 1 << XENFEAT_writable_page_tables | 171bedcc139SJoao Martins 1 << XENFEAT_writable_descriptor_tables | 172bedcc139SJoao Martins 1 << XENFEAT_auto_translated_physmap | 173bedcc139SJoao Martins 1 << XENFEAT_supervisor_mode_kernel; 174bedcc139SJoao Martins } 175bedcc139SJoao Martins 176bedcc139SJoao Martins err = kvm_copy_to_gva(CPU(cpu), arg, &fi, sizeof(fi)); 177bedcc139SJoao Martins break; 178bedcc139SJoao Martins } 179bedcc139SJoao Martins 180bedcc139SJoao Martins default: 181bedcc139SJoao Martins return false; 182bedcc139SJoao Martins } 183bedcc139SJoao Martins 184bedcc139SJoao Martins exit->u.hcall.result = err; 185bedcc139SJoao Martins return true; 186bedcc139SJoao Martins } 187bedcc139SJoao Martins 188fb0fd2ceSJoao Martins static int xen_set_shared_info(uint64_t gfn) 189fb0fd2ceSJoao Martins { 190fb0fd2ceSJoao Martins uint64_t gpa = gfn << TARGET_PAGE_BITS; 191fb0fd2ceSJoao Martins int err; 192fb0fd2ceSJoao Martins 193fb0fd2ceSJoao Martins QEMU_IOTHREAD_LOCK_GUARD(); 194fb0fd2ceSJoao Martins 195fb0fd2ceSJoao Martins /* 196fb0fd2ceSJoao Martins * The xen_overlay device tells KVM about it too, since it had to 197fb0fd2ceSJoao Martins * do that on migration load anyway (unless we're going to jump 198fb0fd2ceSJoao Martins * through lots of hoops to maintain the fiction that this isn't 199fb0fd2ceSJoao Martins * KVM-specific. 200fb0fd2ceSJoao Martins */ 201fb0fd2ceSJoao Martins err = xen_overlay_map_shinfo_page(gpa); 202fb0fd2ceSJoao Martins if (err) { 203fb0fd2ceSJoao Martins return err; 204fb0fd2ceSJoao Martins } 205fb0fd2ceSJoao Martins 206fb0fd2ceSJoao Martins trace_kvm_xen_set_shared_info(gfn); 207fb0fd2ceSJoao Martins 208fb0fd2ceSJoao Martins return err; 209fb0fd2ceSJoao Martins } 210fb0fd2ceSJoao Martins 211fb0fd2ceSJoao Martins static int add_to_physmap_one(uint32_t space, uint64_t idx, uint64_t gfn) 212fb0fd2ceSJoao Martins { 213fb0fd2ceSJoao Martins switch (space) { 214fb0fd2ceSJoao Martins case XENMAPSPACE_shared_info: 215fb0fd2ceSJoao Martins if (idx > 0) { 216fb0fd2ceSJoao Martins return -EINVAL; 217fb0fd2ceSJoao Martins } 218fb0fd2ceSJoao Martins return xen_set_shared_info(gfn); 219fb0fd2ceSJoao Martins 220fb0fd2ceSJoao Martins case XENMAPSPACE_grant_table: 221fb0fd2ceSJoao Martins case XENMAPSPACE_gmfn: 222fb0fd2ceSJoao Martins case XENMAPSPACE_gmfn_range: 223fb0fd2ceSJoao Martins return -ENOTSUP; 224fb0fd2ceSJoao Martins 225fb0fd2ceSJoao Martins case XENMAPSPACE_gmfn_foreign: 226fb0fd2ceSJoao Martins case XENMAPSPACE_dev_mmio: 227fb0fd2ceSJoao Martins return -EPERM; 228fb0fd2ceSJoao Martins 229fb0fd2ceSJoao Martins default: 230fb0fd2ceSJoao Martins return -EINVAL; 231fb0fd2ceSJoao Martins } 232fb0fd2ceSJoao Martins } 233fb0fd2ceSJoao Martins 234fb0fd2ceSJoao Martins static int do_add_to_physmap(struct kvm_xen_exit *exit, X86CPU *cpu, 235fb0fd2ceSJoao Martins uint64_t arg) 236fb0fd2ceSJoao Martins { 237fb0fd2ceSJoao Martins struct xen_add_to_physmap xatp; 238fb0fd2ceSJoao Martins CPUState *cs = CPU(cpu); 239fb0fd2ceSJoao Martins 240fb0fd2ceSJoao Martins if (hypercall_compat32(exit->u.hcall.longmode)) { 241fb0fd2ceSJoao Martins struct compat_xen_add_to_physmap xatp32; 242fb0fd2ceSJoao Martins 243fb0fd2ceSJoao Martins qemu_build_assert(sizeof(struct compat_xen_add_to_physmap) == 16); 244fb0fd2ceSJoao Martins if (kvm_copy_from_gva(cs, arg, &xatp32, sizeof(xatp32))) { 245fb0fd2ceSJoao Martins return -EFAULT; 246fb0fd2ceSJoao Martins } 247fb0fd2ceSJoao Martins xatp.domid = xatp32.domid; 248fb0fd2ceSJoao Martins xatp.size = xatp32.size; 249fb0fd2ceSJoao Martins xatp.space = xatp32.space; 250fb0fd2ceSJoao Martins xatp.idx = xatp32.idx; 251fb0fd2ceSJoao Martins xatp.gpfn = xatp32.gpfn; 252fb0fd2ceSJoao Martins } else { 253fb0fd2ceSJoao Martins if (kvm_copy_from_gva(cs, arg, &xatp, sizeof(xatp))) { 254fb0fd2ceSJoao Martins return -EFAULT; 255fb0fd2ceSJoao Martins } 256fb0fd2ceSJoao Martins } 257fb0fd2ceSJoao Martins 258fb0fd2ceSJoao Martins if (xatp.domid != DOMID_SELF && xatp.domid != xen_domid) { 259fb0fd2ceSJoao Martins return -ESRCH; 260fb0fd2ceSJoao Martins } 261fb0fd2ceSJoao Martins 262fb0fd2ceSJoao Martins return add_to_physmap_one(xatp.space, xatp.idx, xatp.gpfn); 263fb0fd2ceSJoao Martins } 264fb0fd2ceSJoao Martins 265*782a7960SDavid Woodhouse static int do_add_to_physmap_batch(struct kvm_xen_exit *exit, X86CPU *cpu, 266*782a7960SDavid Woodhouse uint64_t arg) 267*782a7960SDavid Woodhouse { 268*782a7960SDavid Woodhouse struct xen_add_to_physmap_batch xatpb; 269*782a7960SDavid Woodhouse unsigned long idxs_gva, gpfns_gva, errs_gva; 270*782a7960SDavid Woodhouse CPUState *cs = CPU(cpu); 271*782a7960SDavid Woodhouse size_t op_sz; 272*782a7960SDavid Woodhouse 273*782a7960SDavid Woodhouse if (hypercall_compat32(exit->u.hcall.longmode)) { 274*782a7960SDavid Woodhouse struct compat_xen_add_to_physmap_batch xatpb32; 275*782a7960SDavid Woodhouse 276*782a7960SDavid Woodhouse qemu_build_assert(sizeof(struct compat_xen_add_to_physmap_batch) == 20); 277*782a7960SDavid Woodhouse if (kvm_copy_from_gva(cs, arg, &xatpb32, sizeof(xatpb32))) { 278*782a7960SDavid Woodhouse return -EFAULT; 279*782a7960SDavid Woodhouse } 280*782a7960SDavid Woodhouse xatpb.domid = xatpb32.domid; 281*782a7960SDavid Woodhouse xatpb.space = xatpb32.space; 282*782a7960SDavid Woodhouse xatpb.size = xatpb32.size; 283*782a7960SDavid Woodhouse 284*782a7960SDavid Woodhouse idxs_gva = xatpb32.idxs.c; 285*782a7960SDavid Woodhouse gpfns_gva = xatpb32.gpfns.c; 286*782a7960SDavid Woodhouse errs_gva = xatpb32.errs.c; 287*782a7960SDavid Woodhouse op_sz = sizeof(uint32_t); 288*782a7960SDavid Woodhouse } else { 289*782a7960SDavid Woodhouse if (kvm_copy_from_gva(cs, arg, &xatpb, sizeof(xatpb))) { 290*782a7960SDavid Woodhouse return -EFAULT; 291*782a7960SDavid Woodhouse } 292*782a7960SDavid Woodhouse op_sz = sizeof(unsigned long); 293*782a7960SDavid Woodhouse idxs_gva = (unsigned long)xatpb.idxs.p; 294*782a7960SDavid Woodhouse gpfns_gva = (unsigned long)xatpb.gpfns.p; 295*782a7960SDavid Woodhouse errs_gva = (unsigned long)xatpb.errs.p; 296*782a7960SDavid Woodhouse } 297*782a7960SDavid Woodhouse 298*782a7960SDavid Woodhouse if (xatpb.domid != DOMID_SELF && xatpb.domid != xen_domid) { 299*782a7960SDavid Woodhouse return -ESRCH; 300*782a7960SDavid Woodhouse } 301*782a7960SDavid Woodhouse 302*782a7960SDavid Woodhouse /* Explicitly invalid for the batch op. Not that we implement it anyway. */ 303*782a7960SDavid Woodhouse if (xatpb.space == XENMAPSPACE_gmfn_range) { 304*782a7960SDavid Woodhouse return -EINVAL; 305*782a7960SDavid Woodhouse } 306*782a7960SDavid Woodhouse 307*782a7960SDavid Woodhouse while (xatpb.size--) { 308*782a7960SDavid Woodhouse unsigned long idx = 0; 309*782a7960SDavid Woodhouse unsigned long gpfn = 0; 310*782a7960SDavid Woodhouse int err; 311*782a7960SDavid Woodhouse 312*782a7960SDavid Woodhouse /* For 32-bit compat this only copies the low 32 bits of each */ 313*782a7960SDavid Woodhouse if (kvm_copy_from_gva(cs, idxs_gva, &idx, op_sz) || 314*782a7960SDavid Woodhouse kvm_copy_from_gva(cs, gpfns_gva, &gpfn, op_sz)) { 315*782a7960SDavid Woodhouse return -EFAULT; 316*782a7960SDavid Woodhouse } 317*782a7960SDavid Woodhouse idxs_gva += op_sz; 318*782a7960SDavid Woodhouse gpfns_gva += op_sz; 319*782a7960SDavid Woodhouse 320*782a7960SDavid Woodhouse err = add_to_physmap_one(xatpb.space, idx, gpfn); 321*782a7960SDavid Woodhouse 322*782a7960SDavid Woodhouse if (kvm_copy_to_gva(cs, errs_gva, &err, sizeof(err))) { 323*782a7960SDavid Woodhouse return -EFAULT; 324*782a7960SDavid Woodhouse } 325*782a7960SDavid Woodhouse errs_gva += sizeof(err); 326*782a7960SDavid Woodhouse } 327*782a7960SDavid Woodhouse return 0; 328*782a7960SDavid Woodhouse } 329*782a7960SDavid Woodhouse 330fb0fd2ceSJoao Martins static bool kvm_xen_hcall_memory_op(struct kvm_xen_exit *exit, X86CPU *cpu, 331fb0fd2ceSJoao Martins int cmd, uint64_t arg) 332fb0fd2ceSJoao Martins { 333fb0fd2ceSJoao Martins int err; 334fb0fd2ceSJoao Martins 335fb0fd2ceSJoao Martins switch (cmd) { 336fb0fd2ceSJoao Martins case XENMEM_add_to_physmap: 337fb0fd2ceSJoao Martins err = do_add_to_physmap(exit, cpu, arg); 338fb0fd2ceSJoao Martins break; 339fb0fd2ceSJoao Martins 340*782a7960SDavid Woodhouse case XENMEM_add_to_physmap_batch: 341*782a7960SDavid Woodhouse err = do_add_to_physmap_batch(exit, cpu, arg); 342*782a7960SDavid Woodhouse break; 343*782a7960SDavid Woodhouse 344fb0fd2ceSJoao Martins default: 345fb0fd2ceSJoao Martins return false; 346fb0fd2ceSJoao Martins } 347fb0fd2ceSJoao Martins 348fb0fd2ceSJoao Martins exit->u.hcall.result = err; 349fb0fd2ceSJoao Martins return true; 350fb0fd2ceSJoao Martins } 351fb0fd2ceSJoao Martins 35279b7067dSJoao Martins int kvm_xen_soft_reset(void) 35379b7067dSJoao Martins { 354fb0fd2ceSJoao Martins int err; 355fb0fd2ceSJoao Martins 35679b7067dSJoao Martins assert(qemu_mutex_iothread_locked()); 35779b7067dSJoao Martins 35879b7067dSJoao Martins trace_kvm_xen_soft_reset(); 35979b7067dSJoao Martins 360fb0fd2ceSJoao Martins err = xen_overlay_map_shinfo_page(INVALID_GFN); 361fb0fd2ceSJoao Martins if (err) { 362fb0fd2ceSJoao Martins return err; 363fb0fd2ceSJoao Martins } 364fb0fd2ceSJoao Martins 36579b7067dSJoao Martins return 0; 36679b7067dSJoao Martins } 36779b7067dSJoao Martins 36879b7067dSJoao Martins static int schedop_shutdown(CPUState *cs, uint64_t arg) 36979b7067dSJoao Martins { 37079b7067dSJoao Martins struct sched_shutdown shutdown; 37179b7067dSJoao Martins int ret = 0; 37279b7067dSJoao Martins 37379b7067dSJoao Martins /* No need for 32/64 compat handling */ 37479b7067dSJoao Martins qemu_build_assert(sizeof(shutdown) == 4); 37579b7067dSJoao Martins 37679b7067dSJoao Martins if (kvm_copy_from_gva(cs, arg, &shutdown, sizeof(shutdown))) { 37779b7067dSJoao Martins return -EFAULT; 37879b7067dSJoao Martins } 37979b7067dSJoao Martins 38079b7067dSJoao Martins switch (shutdown.reason) { 38179b7067dSJoao Martins case SHUTDOWN_crash: 38279b7067dSJoao Martins cpu_dump_state(cs, stderr, CPU_DUMP_CODE); 38379b7067dSJoao Martins qemu_system_guest_panicked(NULL); 38479b7067dSJoao Martins break; 38579b7067dSJoao Martins 38679b7067dSJoao Martins case SHUTDOWN_reboot: 38779b7067dSJoao Martins qemu_system_reset_request(SHUTDOWN_CAUSE_GUEST_RESET); 38879b7067dSJoao Martins break; 38979b7067dSJoao Martins 39079b7067dSJoao Martins case SHUTDOWN_poweroff: 39179b7067dSJoao Martins qemu_system_shutdown_request(SHUTDOWN_CAUSE_GUEST_SHUTDOWN); 39279b7067dSJoao Martins break; 39379b7067dSJoao Martins 39479b7067dSJoao Martins case SHUTDOWN_soft_reset: 39579b7067dSJoao Martins qemu_mutex_lock_iothread(); 39679b7067dSJoao Martins ret = kvm_xen_soft_reset(); 39779b7067dSJoao Martins qemu_mutex_unlock_iothread(); 39879b7067dSJoao Martins break; 39979b7067dSJoao Martins 40079b7067dSJoao Martins default: 40179b7067dSJoao Martins ret = -EINVAL; 40279b7067dSJoao Martins break; 40379b7067dSJoao Martins } 40479b7067dSJoao Martins 40579b7067dSJoao Martins return ret; 40679b7067dSJoao Martins } 40779b7067dSJoao Martins 40879b7067dSJoao Martins static bool kvm_xen_hcall_sched_op(struct kvm_xen_exit *exit, X86CPU *cpu, 40979b7067dSJoao Martins int cmd, uint64_t arg) 41079b7067dSJoao Martins { 41179b7067dSJoao Martins CPUState *cs = CPU(cpu); 41279b7067dSJoao Martins int err = -ENOSYS; 41379b7067dSJoao Martins 41479b7067dSJoao Martins switch (cmd) { 41579b7067dSJoao Martins case SCHEDOP_shutdown: 41679b7067dSJoao Martins err = schedop_shutdown(cs, arg); 41779b7067dSJoao Martins break; 41879b7067dSJoao Martins 419c789b9efSDavid Woodhouse case SCHEDOP_poll: 420c789b9efSDavid Woodhouse /* 421c789b9efSDavid Woodhouse * Linux will panic if this doesn't work. Just yield; it's not 422c789b9efSDavid Woodhouse * worth overthinking it because with event channel handling 423c789b9efSDavid Woodhouse * in KVM, the kernel will intercept this and it will never 424c789b9efSDavid Woodhouse * reach QEMU anyway. The semantics of the hypercall explicltly 425c789b9efSDavid Woodhouse * permit spurious wakeups. 426c789b9efSDavid Woodhouse */ 427c789b9efSDavid Woodhouse case SCHEDOP_yield: 428c789b9efSDavid Woodhouse sched_yield(); 429c789b9efSDavid Woodhouse err = 0; 430c789b9efSDavid Woodhouse break; 431c789b9efSDavid Woodhouse 43279b7067dSJoao Martins default: 43379b7067dSJoao Martins return false; 43479b7067dSJoao Martins } 43579b7067dSJoao Martins 43679b7067dSJoao Martins exit->u.hcall.result = err; 43779b7067dSJoao Martins return true; 43879b7067dSJoao Martins } 43979b7067dSJoao Martins 44055a3f666SJoao Martins static bool do_kvm_xen_handle_exit(X86CPU *cpu, struct kvm_xen_exit *exit) 44155a3f666SJoao Martins { 44255a3f666SJoao Martins uint16_t code = exit->u.hcall.input; 44355a3f666SJoao Martins 44455a3f666SJoao Martins if (exit->u.hcall.cpl > 0) { 44555a3f666SJoao Martins exit->u.hcall.result = -EPERM; 44655a3f666SJoao Martins return true; 44755a3f666SJoao Martins } 44855a3f666SJoao Martins 44955a3f666SJoao Martins switch (code) { 45079b7067dSJoao Martins case __HYPERVISOR_sched_op: 45179b7067dSJoao Martins return kvm_xen_hcall_sched_op(exit, cpu, exit->u.hcall.params[0], 45279b7067dSJoao Martins exit->u.hcall.params[1]); 453fb0fd2ceSJoao Martins case __HYPERVISOR_memory_op: 454fb0fd2ceSJoao Martins return kvm_xen_hcall_memory_op(exit, cpu, exit->u.hcall.params[0], 455fb0fd2ceSJoao Martins exit->u.hcall.params[1]); 456bedcc139SJoao Martins case __HYPERVISOR_xen_version: 457bedcc139SJoao Martins return kvm_xen_hcall_xen_version(exit, cpu, exit->u.hcall.params[0], 458bedcc139SJoao Martins exit->u.hcall.params[1]); 45955a3f666SJoao Martins default: 46055a3f666SJoao Martins return false; 46155a3f666SJoao Martins } 46255a3f666SJoao Martins } 46355a3f666SJoao Martins 46455a3f666SJoao Martins int kvm_xen_handle_exit(X86CPU *cpu, struct kvm_xen_exit *exit) 46555a3f666SJoao Martins { 46655a3f666SJoao Martins if (exit->type != KVM_EXIT_XEN_HCALL) { 46755a3f666SJoao Martins return -1; 46855a3f666SJoao Martins } 46955a3f666SJoao Martins 470110a0ea5SDavid Woodhouse /* 471110a0ea5SDavid Woodhouse * The kernel latches the guest 32/64 mode when the MSR is used to fill 472110a0ea5SDavid Woodhouse * the hypercall page. So if we see a hypercall in a mode that doesn't 473110a0ea5SDavid Woodhouse * match our own idea of the guest mode, fetch the kernel's idea of the 474110a0ea5SDavid Woodhouse * "long mode" to remain in sync. 475110a0ea5SDavid Woodhouse */ 476110a0ea5SDavid Woodhouse if (exit->u.hcall.longmode != xen_is_long_mode()) { 477110a0ea5SDavid Woodhouse xen_sync_long_mode(); 478110a0ea5SDavid Woodhouse } 479110a0ea5SDavid Woodhouse 48055a3f666SJoao Martins if (!do_kvm_xen_handle_exit(cpu, exit)) { 48155a3f666SJoao Martins /* 48255a3f666SJoao Martins * Some hypercalls will be deliberately "implemented" by returning 48355a3f666SJoao Martins * -ENOSYS. This case is for hypercalls which are unexpected. 48455a3f666SJoao Martins */ 48555a3f666SJoao Martins exit->u.hcall.result = -ENOSYS; 48655a3f666SJoao Martins qemu_log_mask(LOG_UNIMP, "Unimplemented Xen hypercall %" 48755a3f666SJoao Martins PRId64 " (0x%" PRIx64 " 0x%" PRIx64 " 0x%" PRIx64 ")\n", 48855a3f666SJoao Martins (uint64_t)exit->u.hcall.input, 48955a3f666SJoao Martins (uint64_t)exit->u.hcall.params[0], 49055a3f666SJoao Martins (uint64_t)exit->u.hcall.params[1], 49155a3f666SJoao Martins (uint64_t)exit->u.hcall.params[2]); 49255a3f666SJoao Martins } 49355a3f666SJoao Martins 49455a3f666SJoao Martins trace_kvm_xen_hypercall(CPU(cpu)->cpu_index, exit->u.hcall.cpl, 49555a3f666SJoao Martins exit->u.hcall.input, exit->u.hcall.params[0], 49655a3f666SJoao Martins exit->u.hcall.params[1], exit->u.hcall.params[2], 49755a3f666SJoao Martins exit->u.hcall.result); 49855a3f666SJoao Martins return 0; 49955a3f666SJoao Martins } 500