111ad93f6SDavid Gibson /* 211ad93f6SDavid Gibson * QEMU PowerPC pSeries Logical Partition (aka sPAPR) hardware System Emulator 311ad93f6SDavid Gibson * 411ad93f6SDavid Gibson * PAPR Virtualized Interrupt System, aka ICS/ICP aka xics, in-kernel emulation 511ad93f6SDavid Gibson * 611ad93f6SDavid Gibson * Copyright (c) 2013 David Gibson, IBM Corporation. 711ad93f6SDavid Gibson * 811ad93f6SDavid Gibson * Permission is hereby granted, free of charge, to any person obtaining a copy 911ad93f6SDavid Gibson * of this software and associated documentation files (the "Software"), to deal 1011ad93f6SDavid Gibson * in the Software without restriction, including without limitation the rights 1111ad93f6SDavid Gibson * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 1211ad93f6SDavid Gibson * copies of the Software, and to permit persons to whom the Software is 1311ad93f6SDavid Gibson * furnished to do so, subject to the following conditions: 1411ad93f6SDavid Gibson * 1511ad93f6SDavid Gibson * The above copyright notice and this permission notice shall be included in 1611ad93f6SDavid Gibson * all copies or substantial portions of the Software. 1711ad93f6SDavid Gibson * 1811ad93f6SDavid Gibson * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 1911ad93f6SDavid Gibson * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 2011ad93f6SDavid Gibson * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 2111ad93f6SDavid Gibson * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 2211ad93f6SDavid Gibson * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 2311ad93f6SDavid Gibson * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 2411ad93f6SDavid Gibson * THE SOFTWARE. 2511ad93f6SDavid Gibson * 2611ad93f6SDavid Gibson */ 2711ad93f6SDavid Gibson 280d75590dSPeter Maydell #include "qemu/osdep.h" 29da34e65cSMarkus Armbruster #include "qapi/error.h" 304771d756SPaolo Bonzini #include "qemu-common.h" 314771d756SPaolo Bonzini #include "cpu.h" 3211ad93f6SDavid Gibson #include "trace.h" 3377ac58ddSPaolo Bonzini #include "sysemu/kvm.h" 3411ad93f6SDavid Gibson #include "hw/ppc/spapr.h" 353f777abcSCédric Le Goater #include "hw/ppc/spapr_cpu_core.h" 3611ad93f6SDavid Gibson #include "hw/ppc/xics.h" 37a51d5afcSThomas Huth #include "hw/ppc/xics_spapr.h" 3811ad93f6SDavid Gibson #include "kvm_ppc.h" 3911ad93f6SDavid Gibson #include "qemu/config-file.h" 4011ad93f6SDavid Gibson #include "qemu/error-report.h" 4111ad93f6SDavid Gibson 4211ad93f6SDavid Gibson #include <sys/ioctl.h> 4311ad93f6SDavid Gibson 44729f8a4fSCédric Le Goater static int kernel_xics_fd = -1; 45729f8a4fSCédric Le Goater 46de86ecccSGreg Kurz typedef struct KVMEnabledICP { 47de86ecccSGreg Kurz unsigned long vcpu_id; 48de86ecccSGreg Kurz QLIST_ENTRY(KVMEnabledICP) node; 49de86ecccSGreg Kurz } KVMEnabledICP; 50de86ecccSGreg Kurz 51de86ecccSGreg Kurz static QLIST_HEAD(, KVMEnabledICP) 52de86ecccSGreg Kurz kvm_enabled_icps = QLIST_HEAD_INITIALIZER(&kvm_enabled_icps); 53de86ecccSGreg Kurz 5456b11587SCédric Le Goater static void kvm_disable_icps(void) 5556b11587SCédric Le Goater { 5656b11587SCédric Le Goater KVMEnabledICP *enabled_icp, *next; 5756b11587SCédric Le Goater 5856b11587SCédric Le Goater QLIST_FOREACH_SAFE(enabled_icp, &kvm_enabled_icps, node, next) { 5956b11587SCédric Le Goater QLIST_REMOVE(enabled_icp, node); 6056b11587SCédric Le Goater g_free(enabled_icp); 6156b11587SCédric Le Goater } 6256b11587SCédric Le Goater } 6356b11587SCédric Le Goater 6411ad93f6SDavid Gibson /* 6511ad93f6SDavid Gibson * ICP-KVM 6611ad93f6SDavid Gibson */ 670e5c7fadSGreg Kurz void icp_get_kvm_state(ICPState *icp) 6811ad93f6SDavid Gibson { 6911ad93f6SDavid Gibson uint64_t state; 7011ad93f6SDavid Gibson int ret; 7111ad93f6SDavid Gibson 723bf84e99SCédric Le Goater /* The KVM XICS device is not in use */ 733bf84e99SCédric Le Goater if (kernel_xics_fd == -1) { 743bf84e99SCédric Le Goater return; 753bf84e99SCédric Le Goater } 763bf84e99SCédric Le Goater 7711ad93f6SDavid Gibson /* ICP for this CPU thread is not in use, exiting */ 788e4fba20SCédric Le Goater if (!icp->cs) { 7911ad93f6SDavid Gibson return; 8011ad93f6SDavid Gibson } 8111ad93f6SDavid Gibson 82bf358b54SCédric Le Goater ret = kvm_get_one_reg(icp->cs, KVM_REG_PPC_ICP_STATE, &state); 8311ad93f6SDavid Gibson if (ret != 0) { 8411ad93f6SDavid Gibson error_report("Unable to retrieve KVM interrupt controller state" 858e4fba20SCédric Le Goater " for CPU %ld: %s", kvm_arch_vcpu_id(icp->cs), strerror(errno)); 8611ad93f6SDavid Gibson exit(1); 8711ad93f6SDavid Gibson } 8811ad93f6SDavid Gibson 898e4fba20SCédric Le Goater icp->xirr = state >> KVM_REG_PPC_ICP_XISR_SHIFT; 908e4fba20SCédric Le Goater icp->mfrr = (state >> KVM_REG_PPC_ICP_MFRR_SHIFT) 9111ad93f6SDavid Gibson & KVM_REG_PPC_ICP_MFRR_MASK; 928e4fba20SCédric Le Goater icp->pending_priority = (state >> KVM_REG_PPC_ICP_PPRI_SHIFT) 9311ad93f6SDavid Gibson & KVM_REG_PPC_ICP_PPRI_MASK; 9411ad93f6SDavid Gibson } 9511ad93f6SDavid Gibson 96dcb556fcSGreg Kurz static void do_icp_synchronize_state(CPUState *cpu, run_on_cpu_data arg) 97dcb556fcSGreg Kurz { 98dcb556fcSGreg Kurz icp_get_kvm_state(arg.host_ptr); 99dcb556fcSGreg Kurz } 100dcb556fcSGreg Kurz 1010e5c7fadSGreg Kurz void icp_synchronize_state(ICPState *icp) 102dcb556fcSGreg Kurz { 103dcb556fcSGreg Kurz if (icp->cs) { 104dcb556fcSGreg Kurz run_on_cpu(icp->cs, do_icp_synchronize_state, RUN_ON_CPU_HOST_PTR(icp)); 105dcb556fcSGreg Kurz } 106dcb556fcSGreg Kurz } 107dcb556fcSGreg Kurz 108330a21e3SGreg Kurz int icp_set_kvm_state(ICPState *icp, Error **errp) 10911ad93f6SDavid Gibson { 11011ad93f6SDavid Gibson uint64_t state; 11111ad93f6SDavid Gibson int ret; 11211ad93f6SDavid Gibson 1133bf84e99SCédric Le Goater /* The KVM XICS device is not in use */ 1143bf84e99SCédric Le Goater if (kernel_xics_fd == -1) { 1153bf84e99SCédric Le Goater return 0; 1163bf84e99SCédric Le Goater } 1173bf84e99SCédric Le Goater 11811ad93f6SDavid Gibson /* ICP for this CPU thread is not in use, exiting */ 1198e4fba20SCédric Le Goater if (!icp->cs) { 12011ad93f6SDavid Gibson return 0; 12111ad93f6SDavid Gibson } 12211ad93f6SDavid Gibson 1238e4fba20SCédric Le Goater state = ((uint64_t)icp->xirr << KVM_REG_PPC_ICP_XISR_SHIFT) 1248e4fba20SCédric Le Goater | ((uint64_t)icp->mfrr << KVM_REG_PPC_ICP_MFRR_SHIFT) 1258e4fba20SCédric Le Goater | ((uint64_t)icp->pending_priority << KVM_REG_PPC_ICP_PPRI_SHIFT); 12611ad93f6SDavid Gibson 127bf358b54SCédric Le Goater ret = kvm_set_one_reg(icp->cs, KVM_REG_PPC_ICP_STATE, &state); 128330a21e3SGreg Kurz if (ret < 0) { 129330a21e3SGreg Kurz error_setg_errno(errp, -ret, 130330a21e3SGreg Kurz "Unable to restore KVM interrupt controller state (0x%" 131330a21e3SGreg Kurz PRIx64 ") for CPU %ld", state, 132330a21e3SGreg Kurz kvm_arch_vcpu_id(icp->cs)); 13311ad93f6SDavid Gibson return ret; 13411ad93f6SDavid Gibson } 13511ad93f6SDavid Gibson 13611ad93f6SDavid Gibson return 0; 13711ad93f6SDavid Gibson } 13811ad93f6SDavid Gibson 1398e6e6efeSGreg Kurz void icp_kvm_realize(DeviceState *dev, Error **errp) 140f0232434SCédric Le Goater { 141a028dd42SCédric Le Goater ICPState *icp = ICP(dev); 142a028dd42SCédric Le Goater CPUState *cs; 143de86ecccSGreg Kurz KVMEnabledICP *enabled_icp; 144a028dd42SCédric Le Goater unsigned long vcpu_id; 145f0232434SCédric Le Goater int ret; 146f0232434SCédric Le Goater 1473bf84e99SCédric Le Goater /* The KVM XICS device is not in use */ 148f0232434SCédric Le Goater if (kernel_xics_fd == -1) { 1493bf84e99SCédric Le Goater return; 150f0232434SCédric Le Goater } 151f0232434SCédric Le Goater 152a028dd42SCédric Le Goater cs = icp->cs; 153a028dd42SCédric Le Goater vcpu_id = kvm_arch_vcpu_id(cs); 154a028dd42SCédric Le Goater 155f0232434SCédric Le Goater /* 156f0232434SCédric Le Goater * If we are reusing a parked vCPU fd corresponding to the CPU 157f0232434SCédric Le Goater * which was hot-removed earlier we don't have to renable 158f0232434SCédric Le Goater * KVM_CAP_IRQ_XICS capability again. 159f0232434SCédric Le Goater */ 160de86ecccSGreg Kurz QLIST_FOREACH(enabled_icp, &kvm_enabled_icps, node) { 161de86ecccSGreg Kurz if (enabled_icp->vcpu_id == vcpu_id) { 162f0232434SCédric Le Goater return; 163f0232434SCédric Le Goater } 164de86ecccSGreg Kurz } 165f0232434SCédric Le Goater 166de86ecccSGreg Kurz ret = kvm_vcpu_enable_cap(cs, KVM_CAP_IRQ_XICS, 0, kernel_xics_fd, vcpu_id); 167f0232434SCédric Le Goater if (ret < 0) { 168*894ea3ecSGreg Kurz Error *local_err = NULL; 169*894ea3ecSGreg Kurz 170*894ea3ecSGreg Kurz error_setg(&local_err, "Unable to connect CPU%ld to kernel XICS: %s", 171*894ea3ecSGreg Kurz vcpu_id, strerror(errno)); 172*894ea3ecSGreg Kurz if (errno == ENOSPC) { 173*894ea3ecSGreg Kurz error_append_hint(&local_err, "Try -smp maxcpus=N with N < %u\n", 174*894ea3ecSGreg Kurz MACHINE(qdev_get_machine())->smp.max_cpus); 175*894ea3ecSGreg Kurz } 176*894ea3ecSGreg Kurz error_propagate(errp, local_err); 177b1fd36c3SGreg Kurz return; 178f0232434SCédric Le Goater } 179de86ecccSGreg Kurz enabled_icp = g_malloc(sizeof(*enabled_icp)); 180de86ecccSGreg Kurz enabled_icp->vcpu_id = vcpu_id; 181de86ecccSGreg Kurz QLIST_INSERT_HEAD(&kvm_enabled_icps, enabled_icp, node); 182f0232434SCédric Le Goater } 183f0232434SCédric Le Goater 18411ad93f6SDavid Gibson /* 18511ad93f6SDavid Gibson * ICS-KVM 18611ad93f6SDavid Gibson */ 187d80b2ccfSGreg Kurz void ics_get_kvm_state(ICSState *ics) 18811ad93f6SDavid Gibson { 18911ad93f6SDavid Gibson uint64_t state; 19011ad93f6SDavid Gibson int i; 19111ad93f6SDavid Gibson 1923bf84e99SCédric Le Goater /* The KVM XICS device is not in use */ 1933bf84e99SCédric Le Goater if (kernel_xics_fd == -1) { 1943bf84e99SCédric Le Goater return; 1953bf84e99SCédric Le Goater } 1963bf84e99SCédric Le Goater 19711ad93f6SDavid Gibson for (i = 0; i < ics->nr_irqs; i++) { 19811ad93f6SDavid Gibson ICSIRQState *irq = &ics->irqs[i]; 19911ad93f6SDavid Gibson 2004c3539d4SCédric Le Goater if (ics_irq_free(ics, i)) { 2014c3539d4SCédric Le Goater continue; 2024c3539d4SCédric Le Goater } 2034c3539d4SCédric Le Goater 204bf358b54SCédric Le Goater kvm_device_access(kernel_xics_fd, KVM_DEV_XICS_GRP_SOURCES, 20550beeb68SMarkus Armbruster i + ics->offset, &state, false, &error_fatal); 20611ad93f6SDavid Gibson 20711ad93f6SDavid Gibson irq->server = state & KVM_XICS_DESTINATION_MASK; 20811ad93f6SDavid Gibson irq->saved_priority = (state >> KVM_XICS_PRIORITY_SHIFT) 20911ad93f6SDavid Gibson & KVM_XICS_PRIORITY_MASK; 21011ad93f6SDavid Gibson /* 21111ad93f6SDavid Gibson * To be consistent with the software emulation in xics.c, we 21211ad93f6SDavid Gibson * split out the masked state + priority that we get from the 21311ad93f6SDavid Gibson * kernel into 'current priority' (0xff if masked) and 21411ad93f6SDavid Gibson * 'saved priority' (if masked, this is the priority the 21511ad93f6SDavid Gibson * interrupt had before it was masked). Masking and unmasking 21611ad93f6SDavid Gibson * are done with the ibm,int-off and ibm,int-on RTAS calls. 21711ad93f6SDavid Gibson */ 21811ad93f6SDavid Gibson if (state & KVM_XICS_MASKED) { 21911ad93f6SDavid Gibson irq->priority = 0xff; 22011ad93f6SDavid Gibson } else { 22111ad93f6SDavid Gibson irq->priority = irq->saved_priority; 22211ad93f6SDavid Gibson } 22311ad93f6SDavid Gibson 224063cb7cbSSam Bobroff irq->status = 0; 22511ad93f6SDavid Gibson if (state & KVM_XICS_PENDING) { 22611ad93f6SDavid Gibson if (state & KVM_XICS_LEVEL_SENSITIVE) { 22711ad93f6SDavid Gibson irq->status |= XICS_STATUS_ASSERTED; 22811ad93f6SDavid Gibson } else { 22911ad93f6SDavid Gibson /* 23011ad93f6SDavid Gibson * A pending edge-triggered interrupt (or MSI) 23111ad93f6SDavid Gibson * must have been rejected previously when we 23211ad93f6SDavid Gibson * first detected it and tried to deliver it, 23311ad93f6SDavid Gibson * so mark it as pending and previously rejected 23411ad93f6SDavid Gibson * for consistency with how xics.c works. 23511ad93f6SDavid Gibson */ 23611ad93f6SDavid Gibson irq->status |= XICS_STATUS_MASKED_PENDING 23711ad93f6SDavid Gibson | XICS_STATUS_REJECTED; 23811ad93f6SDavid Gibson } 23911ad93f6SDavid Gibson } 240229e16fdSSam Bobroff if (state & KVM_XICS_PRESENTED) { 241229e16fdSSam Bobroff irq->status |= XICS_STATUS_PRESENTED; 242229e16fdSSam Bobroff } 243229e16fdSSam Bobroff if (state & KVM_XICS_QUEUED) { 244229e16fdSSam Bobroff irq->status |= XICS_STATUS_QUEUED; 245229e16fdSSam Bobroff } 24611ad93f6SDavid Gibson } 24711ad93f6SDavid Gibson } 24811ad93f6SDavid Gibson 249d80b2ccfSGreg Kurz void ics_synchronize_state(ICSState *ics) 250dcb556fcSGreg Kurz { 251dcb556fcSGreg Kurz ics_get_kvm_state(ics); 252dcb556fcSGreg Kurz } 253dcb556fcSGreg Kurz 254330a21e3SGreg Kurz int ics_set_kvm_state_one(ICSState *ics, int srcno, Error **errp) 25511ad93f6SDavid Gibson { 25611ad93f6SDavid Gibson uint64_t state; 2576cead90cSGreg Kurz ICSIRQState *irq = &ics->irqs[srcno]; 25811ad93f6SDavid Gibson int ret; 25911ad93f6SDavid Gibson 2603bf84e99SCédric Le Goater /* The KVM XICS device is not in use */ 2613bf84e99SCédric Le Goater if (kernel_xics_fd == -1) { 2623bf84e99SCédric Le Goater return 0; 2633bf84e99SCédric Le Goater } 2643bf84e99SCédric Le Goater 26511ad93f6SDavid Gibson state = irq->server; 26611ad93f6SDavid Gibson state |= (uint64_t)(irq->saved_priority & KVM_XICS_PRIORITY_MASK) 26711ad93f6SDavid Gibson << KVM_XICS_PRIORITY_SHIFT; 26811ad93f6SDavid Gibson if (irq->priority != irq->saved_priority) { 26911ad93f6SDavid Gibson assert(irq->priority == 0xff); 27038298611SGreg Kurz } 27138298611SGreg Kurz 27238298611SGreg Kurz if (irq->priority == 0xff) { 27311ad93f6SDavid Gibson state |= KVM_XICS_MASKED; 27411ad93f6SDavid Gibson } 27511ad93f6SDavid Gibson 2766cead90cSGreg Kurz if (irq->flags & XICS_FLAGS_IRQ_LSI) { 27711ad93f6SDavid Gibson state |= KVM_XICS_LEVEL_SENSITIVE; 27811ad93f6SDavid Gibson if (irq->status & XICS_STATUS_ASSERTED) { 27911ad93f6SDavid Gibson state |= KVM_XICS_PENDING; 28011ad93f6SDavid Gibson } 28111ad93f6SDavid Gibson } else { 28211ad93f6SDavid Gibson if (irq->status & XICS_STATUS_MASKED_PENDING) { 28311ad93f6SDavid Gibson state |= KVM_XICS_PENDING; 28411ad93f6SDavid Gibson } 28511ad93f6SDavid Gibson } 286229e16fdSSam Bobroff if (irq->status & XICS_STATUS_PRESENTED) { 287229e16fdSSam Bobroff state |= KVM_XICS_PRESENTED; 288229e16fdSSam Bobroff } 289229e16fdSSam Bobroff if (irq->status & XICS_STATUS_QUEUED) { 290229e16fdSSam Bobroff state |= KVM_XICS_QUEUED; 291229e16fdSSam Bobroff } 29211ad93f6SDavid Gibson 29352b43881SCédric Le Goater ret = kvm_device_access(kernel_xics_fd, KVM_DEV_XICS_GRP_SOURCES, 294330a21e3SGreg Kurz srcno + ics->offset, &state, true, errp); 295330a21e3SGreg Kurz if (ret < 0) { 29611ad93f6SDavid Gibson return ret; 29711ad93f6SDavid Gibson } 2986cead90cSGreg Kurz 2996cead90cSGreg Kurz return 0; 3006cead90cSGreg Kurz } 3016cead90cSGreg Kurz 302330a21e3SGreg Kurz int ics_set_kvm_state(ICSState *ics, Error **errp) 3036cead90cSGreg Kurz { 3046cead90cSGreg Kurz int i; 3056cead90cSGreg Kurz 3063bf84e99SCédric Le Goater /* The KVM XICS device is not in use */ 3073bf84e99SCédric Le Goater if (kernel_xics_fd == -1) { 3083bf84e99SCédric Le Goater return 0; 3093bf84e99SCédric Le Goater } 3103bf84e99SCédric Le Goater 3116cead90cSGreg Kurz for (i = 0; i < ics->nr_irqs; i++) { 312330a21e3SGreg Kurz Error *local_err = NULL; 3136cead90cSGreg Kurz int ret; 3146cead90cSGreg Kurz 3154c3539d4SCédric Le Goater if (ics_irq_free(ics, i)) { 3164c3539d4SCédric Le Goater continue; 3174c3539d4SCédric Le Goater } 3184c3539d4SCédric Le Goater 319330a21e3SGreg Kurz ret = ics_set_kvm_state_one(ics, i, &local_err); 320330a21e3SGreg Kurz if (ret < 0) { 321330a21e3SGreg Kurz error_propagate(errp, local_err); 3226cead90cSGreg Kurz return ret; 3236cead90cSGreg Kurz } 32411ad93f6SDavid Gibson } 32511ad93f6SDavid Gibson 32611ad93f6SDavid Gibson return 0; 32711ad93f6SDavid Gibson } 32811ad93f6SDavid Gibson 329557b4567SGreg Kurz void ics_kvm_set_irq(ICSState *ics, int srcno, int val) 33011ad93f6SDavid Gibson { 33111ad93f6SDavid Gibson struct kvm_irq_level args; 33211ad93f6SDavid Gibson int rc; 33311ad93f6SDavid Gibson 3343bf84e99SCédric Le Goater /* The KVM XICS device should be in use */ 3353bf84e99SCédric Le Goater assert(kernel_xics_fd != -1); 3363bf84e99SCédric Le Goater 33711ad93f6SDavid Gibson args.irq = srcno + ics->offset; 3384af88944SAlexey Kardashevskiy if (ics->irqs[srcno].flags & XICS_FLAGS_IRQ_MSI) { 33911ad93f6SDavid Gibson if (!val) { 34011ad93f6SDavid Gibson return; 34111ad93f6SDavid Gibson } 34211ad93f6SDavid Gibson args.level = KVM_INTERRUPT_SET; 34311ad93f6SDavid Gibson } else { 34411ad93f6SDavid Gibson args.level = val ? KVM_INTERRUPT_SET_LEVEL : KVM_INTERRUPT_UNSET; 34511ad93f6SDavid Gibson } 34611ad93f6SDavid Gibson rc = kvm_vm_ioctl(kvm_state, KVM_IRQ_LINE, &args); 34711ad93f6SDavid Gibson if (rc < 0) { 34811ad93f6SDavid Gibson perror("kvm_irq_line"); 34911ad93f6SDavid Gibson } 35011ad93f6SDavid Gibson } 35111ad93f6SDavid Gibson 3524ffb7496SGreg Kurz int xics_kvm_connect(SpaprInterruptController *intc, uint32_t nr_servers, 3534ffb7496SGreg Kurz Error **errp) 35411ad93f6SDavid Gibson { 35598a39a79SDavid Gibson ICSState *ics = ICS_SPAPR(intc); 356817bb6a4SCédric Le Goater int rc; 3573f777abcSCédric Le Goater CPUState *cs; 3583f777abcSCédric Le Goater Error *local_err = NULL; 3593f777abcSCédric Le Goater 3603f777abcSCédric Le Goater /* 3613f777abcSCédric Le Goater * The KVM XICS device already in use. This is the case when 3623f777abcSCédric Le Goater * rebooting under the XICS-only interrupt mode. 3633f777abcSCédric Le Goater */ 3643f777abcSCédric Le Goater if (kernel_xics_fd != -1) { 3653f777abcSCédric Le Goater return 0; 3663f777abcSCédric Le Goater } 36711ad93f6SDavid Gibson 36811ad93f6SDavid Gibson if (!kvm_enabled() || !kvm_check_extension(kvm_state, KVM_CAP_IRQ_XICS)) { 36911ad93f6SDavid Gibson error_setg(errp, 37011ad93f6SDavid Gibson "KVM and IRQ_XICS capability must be present for in-kernel XICS"); 37164fb9621SGreg Kurz return -1; 37211ad93f6SDavid Gibson } 37311ad93f6SDavid Gibson 3743a3b8502SAlexey Kardashevskiy rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_SET_XIVE, "ibm,set-xive"); 37511ad93f6SDavid Gibson if (rc < 0) { 376ab3d15faSGreg Kurz error_setg_errno(&local_err, -rc, 377ab3d15faSGreg Kurz "kvmppc_define_rtas_kernel_token: ibm,set-xive"); 37811ad93f6SDavid Gibson goto fail; 37911ad93f6SDavid Gibson } 38011ad93f6SDavid Gibson 3813a3b8502SAlexey Kardashevskiy rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_GET_XIVE, "ibm,get-xive"); 38211ad93f6SDavid Gibson if (rc < 0) { 383ab3d15faSGreg Kurz error_setg_errno(&local_err, -rc, 384ab3d15faSGreg Kurz "kvmppc_define_rtas_kernel_token: ibm,get-xive"); 38511ad93f6SDavid Gibson goto fail; 38611ad93f6SDavid Gibson } 38711ad93f6SDavid Gibson 3883a3b8502SAlexey Kardashevskiy rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_INT_ON, "ibm,int-on"); 38911ad93f6SDavid Gibson if (rc < 0) { 390ab3d15faSGreg Kurz error_setg_errno(&local_err, -rc, 391ab3d15faSGreg Kurz "kvmppc_define_rtas_kernel_token: ibm,int-on"); 39211ad93f6SDavid Gibson goto fail; 39311ad93f6SDavid Gibson } 39411ad93f6SDavid Gibson 3953a3b8502SAlexey Kardashevskiy rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_INT_OFF, "ibm,int-off"); 39611ad93f6SDavid Gibson if (rc < 0) { 397ab3d15faSGreg Kurz error_setg_errno(&local_err, -rc, 398ab3d15faSGreg Kurz "kvmppc_define_rtas_kernel_token: ibm,int-off"); 39911ad93f6SDavid Gibson goto fail; 40011ad93f6SDavid Gibson } 40111ad93f6SDavid Gibson 402bf358b54SCédric Le Goater /* Create the KVM XICS device */ 403bf358b54SCédric Le Goater rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false); 40411ad93f6SDavid Gibson if (rc < 0) { 405ab3d15faSGreg Kurz error_setg_errno(&local_err, -rc, "Error on KVM_CREATE_DEVICE for XICS"); 40611ad93f6SDavid Gibson goto fail; 40711ad93f6SDavid Gibson } 40811ad93f6SDavid Gibson 409*894ea3ecSGreg Kurz /* Tell KVM about the # of VCPUs we may have (POWER9 and newer only) */ 410*894ea3ecSGreg Kurz if (kvm_device_check_attr(rc, KVM_DEV_XICS_GRP_CTRL, 411*894ea3ecSGreg Kurz KVM_DEV_XICS_NR_SERVERS)) { 412*894ea3ecSGreg Kurz if (kvm_device_access(rc, KVM_DEV_XICS_GRP_CTRL, 413*894ea3ecSGreg Kurz KVM_DEV_XICS_NR_SERVERS, &nr_servers, true, 414*894ea3ecSGreg Kurz &local_err)) { 415*894ea3ecSGreg Kurz goto fail; 416*894ea3ecSGreg Kurz } 417*894ea3ecSGreg Kurz } 418*894ea3ecSGreg Kurz 419bf358b54SCédric Le Goater kernel_xics_fd = rc; 4209554233cSAlexey Kardashevskiy kvm_kernel_irqchip = true; 4219554233cSAlexey Kardashevskiy kvm_msi_via_irqfd_allowed = true; 4229554233cSAlexey Kardashevskiy kvm_gsi_direct_mapping = true; 4239554233cSAlexey Kardashevskiy 4243f777abcSCédric Le Goater /* Create the presenters */ 4253f777abcSCédric Le Goater CPU_FOREACH(cs) { 4263f777abcSCédric Le Goater PowerPCCPU *cpu = POWERPC_CPU(cs); 4273f777abcSCédric Le Goater 4283f777abcSCédric Le Goater icp_kvm_realize(DEVICE(spapr_cpu_state(cpu)->icp), &local_err); 4293f777abcSCédric Le Goater if (local_err) { 4303f777abcSCédric Le Goater goto fail; 4313f777abcSCédric Le Goater } 4323f777abcSCédric Le Goater } 4333f777abcSCédric Le Goater 4343f777abcSCédric Le Goater /* Update the KVM sources */ 43598a39a79SDavid Gibson ics_set_kvm_state(ics, &local_err); 436330a21e3SGreg Kurz if (local_err) { 437330a21e3SGreg Kurz goto fail; 438330a21e3SGreg Kurz } 4393f777abcSCédric Le Goater 4403f777abcSCédric Le Goater /* Connect the presenters to the initial VCPUs of the machine */ 4413f777abcSCédric Le Goater CPU_FOREACH(cs) { 4423f777abcSCédric Le Goater PowerPCCPU *cpu = POWERPC_CPU(cs); 443330a21e3SGreg Kurz icp_set_kvm_state(spapr_cpu_state(cpu)->icp, &local_err); 444330a21e3SGreg Kurz if (local_err) { 445330a21e3SGreg Kurz goto fail; 446330a21e3SGreg Kurz } 4473f777abcSCédric Le Goater } 4483f777abcSCédric Le Goater 449bf358b54SCédric Le Goater return 0; 45011ad93f6SDavid Gibson 45111ad93f6SDavid Gibson fail: 452ab3d15faSGreg Kurz error_propagate(errp, local_err); 45398a39a79SDavid Gibson xics_kvm_disconnect(intc); 4542192a930SCédric Le Goater return -1; 45511ad93f6SDavid Gibson } 45656b11587SCédric Le Goater 45798a39a79SDavid Gibson void xics_kvm_disconnect(SpaprInterruptController *intc) 45856b11587SCédric Le Goater { 45956b11587SCédric Le Goater /* 46056b11587SCédric Le Goater * Only on P9 using the XICS-on XIVE KVM device: 46156b11587SCédric Le Goater * 46256b11587SCédric Le Goater * When the KVM device fd is closed, the device is destroyed and 46356b11587SCédric Le Goater * removed from the list of devices of the VM. The VCPU presenters 46456b11587SCédric Le Goater * are also detached from the device. 46556b11587SCédric Le Goater */ 4664812f261SGreg Kurz if (kernel_xics_fd != -1) { 46756b11587SCédric Le Goater close(kernel_xics_fd); 46856b11587SCédric Le Goater kernel_xics_fd = -1; 4694812f261SGreg Kurz } 47056b11587SCédric Le Goater 47156b11587SCédric Le Goater kvmppc_define_rtas_kernel_token(0, "ibm,set-xive"); 47256b11587SCédric Le Goater kvmppc_define_rtas_kernel_token(0, "ibm,get-xive"); 47356b11587SCédric Le Goater kvmppc_define_rtas_kernel_token(0, "ibm,int-on"); 47456b11587SCédric Le Goater kvmppc_define_rtas_kernel_token(0, "ibm,int-off"); 47556b11587SCédric Le Goater 47656b11587SCédric Le Goater kvm_kernel_irqchip = false; 47756b11587SCédric Le Goater kvm_msi_via_irqfd_allowed = false; 47856b11587SCédric Le Goater kvm_gsi_direct_mapping = false; 47956b11587SCédric Le Goater 48056b11587SCédric Le Goater /* Clear the presenter from the VCPUs */ 48156b11587SCédric Le Goater kvm_disable_icps(); 48256b11587SCédric Le Goater } 4837abc0c6dSGreg Kurz 4847abc0c6dSGreg Kurz /* 4857abc0c6dSGreg Kurz * This is a heuristic to detect older KVMs on POWER9 hosts that don't 4867abc0c6dSGreg Kurz * support destruction of a KVM XICS device while the VM is running. 4877abc0c6dSGreg Kurz * Required to start a spapr machine with ic-mode=dual,kernel-irqchip=on. 4887abc0c6dSGreg Kurz */ 4897abc0c6dSGreg Kurz bool xics_kvm_has_broken_disconnect(SpaprMachineState *spapr) 4907abc0c6dSGreg Kurz { 4917abc0c6dSGreg Kurz int rc; 4927abc0c6dSGreg Kurz 4937abc0c6dSGreg Kurz rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false); 4947abc0c6dSGreg Kurz if (rc < 0) { 4957abc0c6dSGreg Kurz /* 4967abc0c6dSGreg Kurz * The error is ignored on purpose. The KVM XICS setup code 4977abc0c6dSGreg Kurz * will catch it again anyway. The goal here is to see if 4987abc0c6dSGreg Kurz * close() actually destroys the device or not. 4997abc0c6dSGreg Kurz */ 5007abc0c6dSGreg Kurz return false; 5017abc0c6dSGreg Kurz } 5027abc0c6dSGreg Kurz 5037abc0c6dSGreg Kurz close(rc); 5047abc0c6dSGreg Kurz 5057abc0c6dSGreg Kurz rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false); 5067abc0c6dSGreg Kurz if (rc >= 0) { 5077abc0c6dSGreg Kurz close(rc); 5087abc0c6dSGreg Kurz return false; 5097abc0c6dSGreg Kurz } 5107abc0c6dSGreg Kurz 5117abc0c6dSGreg Kurz return errno == EEXIST; 5127abc0c6dSGreg Kurz } 513