xref: /qemu/hw/intc/xics_kvm.c (revision 4c3539d491026a0cc68e3b886f16cb7f57efd46b) !
111ad93f6SDavid Gibson /*
211ad93f6SDavid Gibson  * QEMU PowerPC pSeries Logical Partition (aka sPAPR) hardware System Emulator
311ad93f6SDavid Gibson  *
411ad93f6SDavid Gibson  * PAPR Virtualized Interrupt System, aka ICS/ICP aka xics, in-kernel emulation
511ad93f6SDavid Gibson  *
611ad93f6SDavid Gibson  * Copyright (c) 2013 David Gibson, IBM Corporation.
711ad93f6SDavid Gibson  *
811ad93f6SDavid Gibson  * Permission is hereby granted, free of charge, to any person obtaining a copy
911ad93f6SDavid Gibson  * of this software and associated documentation files (the "Software"), to deal
1011ad93f6SDavid Gibson  * in the Software without restriction, including without limitation the rights
1111ad93f6SDavid Gibson  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
1211ad93f6SDavid Gibson  * copies of the Software, and to permit persons to whom the Software is
1311ad93f6SDavid Gibson  * furnished to do so, subject to the following conditions:
1411ad93f6SDavid Gibson  *
1511ad93f6SDavid Gibson  * The above copyright notice and this permission notice shall be included in
1611ad93f6SDavid Gibson  * all copies or substantial portions of the Software.
1711ad93f6SDavid Gibson  *
1811ad93f6SDavid Gibson  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
1911ad93f6SDavid Gibson  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
2011ad93f6SDavid Gibson  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
2111ad93f6SDavid Gibson  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
2211ad93f6SDavid Gibson  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
2311ad93f6SDavid Gibson  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
2411ad93f6SDavid Gibson  * THE SOFTWARE.
2511ad93f6SDavid Gibson  *
2611ad93f6SDavid Gibson  */
2711ad93f6SDavid Gibson 
280d75590dSPeter Maydell #include "qemu/osdep.h"
29da34e65cSMarkus Armbruster #include "qapi/error.h"
304771d756SPaolo Bonzini #include "qemu-common.h"
314771d756SPaolo Bonzini #include "cpu.h"
3211ad93f6SDavid Gibson #include "trace.h"
3377ac58ddSPaolo Bonzini #include "sysemu/kvm.h"
3411ad93f6SDavid Gibson #include "hw/ppc/spapr.h"
353f777abcSCédric Le Goater #include "hw/ppc/spapr_cpu_core.h"
3611ad93f6SDavid Gibson #include "hw/ppc/xics.h"
37a51d5afcSThomas Huth #include "hw/ppc/xics_spapr.h"
3811ad93f6SDavid Gibson #include "kvm_ppc.h"
3911ad93f6SDavid Gibson #include "qemu/config-file.h"
4011ad93f6SDavid Gibson #include "qemu/error-report.h"
4111ad93f6SDavid Gibson 
4211ad93f6SDavid Gibson #include <sys/ioctl.h>
4311ad93f6SDavid Gibson 
44729f8a4fSCédric Le Goater static int kernel_xics_fd = -1;
45729f8a4fSCédric Le Goater 
46de86ecccSGreg Kurz typedef struct KVMEnabledICP {
47de86ecccSGreg Kurz     unsigned long vcpu_id;
48de86ecccSGreg Kurz     QLIST_ENTRY(KVMEnabledICP) node;
49de86ecccSGreg Kurz } KVMEnabledICP;
50de86ecccSGreg Kurz 
51de86ecccSGreg Kurz static QLIST_HEAD(, KVMEnabledICP)
52de86ecccSGreg Kurz     kvm_enabled_icps = QLIST_HEAD_INITIALIZER(&kvm_enabled_icps);
53de86ecccSGreg Kurz 
5456b11587SCédric Le Goater static void kvm_disable_icps(void)
5556b11587SCédric Le Goater {
5656b11587SCédric Le Goater     KVMEnabledICP *enabled_icp, *next;
5756b11587SCédric Le Goater 
5856b11587SCédric Le Goater     QLIST_FOREACH_SAFE(enabled_icp, &kvm_enabled_icps, node, next) {
5956b11587SCédric Le Goater         QLIST_REMOVE(enabled_icp, node);
6056b11587SCédric Le Goater         g_free(enabled_icp);
6156b11587SCédric Le Goater     }
6256b11587SCédric Le Goater }
6356b11587SCédric Le Goater 
6411ad93f6SDavid Gibson /*
6511ad93f6SDavid Gibson  * ICP-KVM
6611ad93f6SDavid Gibson  */
670e5c7fadSGreg Kurz void icp_get_kvm_state(ICPState *icp)
6811ad93f6SDavid Gibson {
6911ad93f6SDavid Gibson     uint64_t state;
7011ad93f6SDavid Gibson     int ret;
7111ad93f6SDavid Gibson 
723bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
733bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
743bf84e99SCédric Le Goater         return;
753bf84e99SCédric Le Goater     }
763bf84e99SCédric Le Goater 
7711ad93f6SDavid Gibson     /* ICP for this CPU thread is not in use, exiting */
788e4fba20SCédric Le Goater     if (!icp->cs) {
7911ad93f6SDavid Gibson         return;
8011ad93f6SDavid Gibson     }
8111ad93f6SDavid Gibson 
82bf358b54SCédric Le Goater     ret = kvm_get_one_reg(icp->cs, KVM_REG_PPC_ICP_STATE, &state);
8311ad93f6SDavid Gibson     if (ret != 0) {
8411ad93f6SDavid Gibson         error_report("Unable to retrieve KVM interrupt controller state"
858e4fba20SCédric Le Goater                 " for CPU %ld: %s", kvm_arch_vcpu_id(icp->cs), strerror(errno));
8611ad93f6SDavid Gibson         exit(1);
8711ad93f6SDavid Gibson     }
8811ad93f6SDavid Gibson 
898e4fba20SCédric Le Goater     icp->xirr = state >> KVM_REG_PPC_ICP_XISR_SHIFT;
908e4fba20SCédric Le Goater     icp->mfrr = (state >> KVM_REG_PPC_ICP_MFRR_SHIFT)
9111ad93f6SDavid Gibson         & KVM_REG_PPC_ICP_MFRR_MASK;
928e4fba20SCédric Le Goater     icp->pending_priority = (state >> KVM_REG_PPC_ICP_PPRI_SHIFT)
9311ad93f6SDavid Gibson         & KVM_REG_PPC_ICP_PPRI_MASK;
9411ad93f6SDavid Gibson }
9511ad93f6SDavid Gibson 
96dcb556fcSGreg Kurz static void do_icp_synchronize_state(CPUState *cpu, run_on_cpu_data arg)
97dcb556fcSGreg Kurz {
98dcb556fcSGreg Kurz     icp_get_kvm_state(arg.host_ptr);
99dcb556fcSGreg Kurz }
100dcb556fcSGreg Kurz 
1010e5c7fadSGreg Kurz void icp_synchronize_state(ICPState *icp)
102dcb556fcSGreg Kurz {
103dcb556fcSGreg Kurz     if (icp->cs) {
104dcb556fcSGreg Kurz         run_on_cpu(icp->cs, do_icp_synchronize_state, RUN_ON_CPU_HOST_PTR(icp));
105dcb556fcSGreg Kurz     }
106dcb556fcSGreg Kurz }
107dcb556fcSGreg Kurz 
108330a21e3SGreg Kurz int icp_set_kvm_state(ICPState *icp, Error **errp)
10911ad93f6SDavid Gibson {
11011ad93f6SDavid Gibson     uint64_t state;
11111ad93f6SDavid Gibson     int ret;
11211ad93f6SDavid Gibson 
1133bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
1143bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
1153bf84e99SCédric Le Goater         return 0;
1163bf84e99SCédric Le Goater     }
1173bf84e99SCédric Le Goater 
11811ad93f6SDavid Gibson     /* ICP for this CPU thread is not in use, exiting */
1198e4fba20SCédric Le Goater     if (!icp->cs) {
12011ad93f6SDavid Gibson         return 0;
12111ad93f6SDavid Gibson     }
12211ad93f6SDavid Gibson 
1238e4fba20SCédric Le Goater     state = ((uint64_t)icp->xirr << KVM_REG_PPC_ICP_XISR_SHIFT)
1248e4fba20SCédric Le Goater         | ((uint64_t)icp->mfrr << KVM_REG_PPC_ICP_MFRR_SHIFT)
1258e4fba20SCédric Le Goater         | ((uint64_t)icp->pending_priority << KVM_REG_PPC_ICP_PPRI_SHIFT);
12611ad93f6SDavid Gibson 
127bf358b54SCédric Le Goater     ret = kvm_set_one_reg(icp->cs, KVM_REG_PPC_ICP_STATE, &state);
128330a21e3SGreg Kurz     if (ret < 0) {
129330a21e3SGreg Kurz         error_setg_errno(errp, -ret,
130330a21e3SGreg Kurz                          "Unable to restore KVM interrupt controller state (0x%"
131330a21e3SGreg Kurz                          PRIx64 ") for CPU %ld", state,
132330a21e3SGreg Kurz                          kvm_arch_vcpu_id(icp->cs));
13311ad93f6SDavid Gibson         return ret;
13411ad93f6SDavid Gibson     }
13511ad93f6SDavid Gibson 
13611ad93f6SDavid Gibson     return 0;
13711ad93f6SDavid Gibson }
13811ad93f6SDavid Gibson 
1398e6e6efeSGreg Kurz void icp_kvm_realize(DeviceState *dev, Error **errp)
140f0232434SCédric Le Goater {
141a028dd42SCédric Le Goater     ICPState *icp = ICP(dev);
142a028dd42SCédric Le Goater     CPUState *cs;
143de86ecccSGreg Kurz     KVMEnabledICP *enabled_icp;
144a028dd42SCédric Le Goater     unsigned long vcpu_id;
145f0232434SCédric Le Goater     int ret;
146f0232434SCédric Le Goater 
1473bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
148f0232434SCédric Le Goater     if (kernel_xics_fd == -1) {
1493bf84e99SCédric Le Goater         return;
150f0232434SCédric Le Goater     }
151f0232434SCédric Le Goater 
152a028dd42SCédric Le Goater     cs = icp->cs;
153a028dd42SCédric Le Goater     vcpu_id = kvm_arch_vcpu_id(cs);
154a028dd42SCédric Le Goater 
155f0232434SCédric Le Goater     /*
156f0232434SCédric Le Goater      * If we are reusing a parked vCPU fd corresponding to the CPU
157f0232434SCédric Le Goater      * which was hot-removed earlier we don't have to renable
158f0232434SCédric Le Goater      * KVM_CAP_IRQ_XICS capability again.
159f0232434SCédric Le Goater      */
160de86ecccSGreg Kurz     QLIST_FOREACH(enabled_icp, &kvm_enabled_icps, node) {
161de86ecccSGreg Kurz         if (enabled_icp->vcpu_id == vcpu_id) {
162f0232434SCédric Le Goater             return;
163f0232434SCédric Le Goater         }
164de86ecccSGreg Kurz     }
165f0232434SCédric Le Goater 
166de86ecccSGreg Kurz     ret = kvm_vcpu_enable_cap(cs, KVM_CAP_IRQ_XICS, 0, kernel_xics_fd, vcpu_id);
167f0232434SCédric Le Goater     if (ret < 0) {
168b1fd36c3SGreg Kurz         error_setg(errp, "Unable to connect CPU%ld to kernel XICS: %s", vcpu_id,
169de86ecccSGreg Kurz                    strerror(errno));
170b1fd36c3SGreg Kurz         return;
171f0232434SCédric Le Goater     }
172de86ecccSGreg Kurz     enabled_icp = g_malloc(sizeof(*enabled_icp));
173de86ecccSGreg Kurz     enabled_icp->vcpu_id = vcpu_id;
174de86ecccSGreg Kurz     QLIST_INSERT_HEAD(&kvm_enabled_icps, enabled_icp, node);
175f0232434SCédric Le Goater }
176f0232434SCédric Le Goater 
17711ad93f6SDavid Gibson /*
17811ad93f6SDavid Gibson  * ICS-KVM
17911ad93f6SDavid Gibson  */
180d80b2ccfSGreg Kurz void ics_get_kvm_state(ICSState *ics)
18111ad93f6SDavid Gibson {
18211ad93f6SDavid Gibson     uint64_t state;
18311ad93f6SDavid Gibson     int i;
18411ad93f6SDavid Gibson 
1853bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
1863bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
1873bf84e99SCédric Le Goater         return;
1883bf84e99SCédric Le Goater     }
1893bf84e99SCédric Le Goater 
19011ad93f6SDavid Gibson     for (i = 0; i < ics->nr_irqs; i++) {
19111ad93f6SDavid Gibson         ICSIRQState *irq = &ics->irqs[i];
19211ad93f6SDavid Gibson 
193*4c3539d4SCédric Le Goater         if (ics_irq_free(ics, i)) {
194*4c3539d4SCédric Le Goater             continue;
195*4c3539d4SCédric Le Goater         }
196*4c3539d4SCédric Le Goater 
197bf358b54SCédric Le Goater         kvm_device_access(kernel_xics_fd, KVM_DEV_XICS_GRP_SOURCES,
19850beeb68SMarkus Armbruster                           i + ics->offset, &state, false, &error_fatal);
19911ad93f6SDavid Gibson 
20011ad93f6SDavid Gibson         irq->server = state & KVM_XICS_DESTINATION_MASK;
20111ad93f6SDavid Gibson         irq->saved_priority = (state >> KVM_XICS_PRIORITY_SHIFT)
20211ad93f6SDavid Gibson             & KVM_XICS_PRIORITY_MASK;
20311ad93f6SDavid Gibson         /*
20411ad93f6SDavid Gibson          * To be consistent with the software emulation in xics.c, we
20511ad93f6SDavid Gibson          * split out the masked state + priority that we get from the
20611ad93f6SDavid Gibson          * kernel into 'current priority' (0xff if masked) and
20711ad93f6SDavid Gibson          * 'saved priority' (if masked, this is the priority the
20811ad93f6SDavid Gibson          * interrupt had before it was masked).  Masking and unmasking
20911ad93f6SDavid Gibson          * are done with the ibm,int-off and ibm,int-on RTAS calls.
21011ad93f6SDavid Gibson          */
21111ad93f6SDavid Gibson         if (state & KVM_XICS_MASKED) {
21211ad93f6SDavid Gibson             irq->priority = 0xff;
21311ad93f6SDavid Gibson         } else {
21411ad93f6SDavid Gibson             irq->priority = irq->saved_priority;
21511ad93f6SDavid Gibson         }
21611ad93f6SDavid Gibson 
217063cb7cbSSam Bobroff         irq->status = 0;
21811ad93f6SDavid Gibson         if (state & KVM_XICS_PENDING) {
21911ad93f6SDavid Gibson             if (state & KVM_XICS_LEVEL_SENSITIVE) {
22011ad93f6SDavid Gibson                 irq->status |= XICS_STATUS_ASSERTED;
22111ad93f6SDavid Gibson             } else {
22211ad93f6SDavid Gibson                 /*
22311ad93f6SDavid Gibson                  * A pending edge-triggered interrupt (or MSI)
22411ad93f6SDavid Gibson                  * must have been rejected previously when we
22511ad93f6SDavid Gibson                  * first detected it and tried to deliver it,
22611ad93f6SDavid Gibson                  * so mark it as pending and previously rejected
22711ad93f6SDavid Gibson                  * for consistency with how xics.c works.
22811ad93f6SDavid Gibson                  */
22911ad93f6SDavid Gibson                 irq->status |= XICS_STATUS_MASKED_PENDING
23011ad93f6SDavid Gibson                     | XICS_STATUS_REJECTED;
23111ad93f6SDavid Gibson             }
23211ad93f6SDavid Gibson         }
233229e16fdSSam Bobroff         if (state & KVM_XICS_PRESENTED) {
234229e16fdSSam Bobroff                 irq->status |= XICS_STATUS_PRESENTED;
235229e16fdSSam Bobroff         }
236229e16fdSSam Bobroff         if (state & KVM_XICS_QUEUED) {
237229e16fdSSam Bobroff                 irq->status |= XICS_STATUS_QUEUED;
238229e16fdSSam Bobroff         }
23911ad93f6SDavid Gibson     }
24011ad93f6SDavid Gibson }
24111ad93f6SDavid Gibson 
242d80b2ccfSGreg Kurz void ics_synchronize_state(ICSState *ics)
243dcb556fcSGreg Kurz {
244dcb556fcSGreg Kurz     ics_get_kvm_state(ics);
245dcb556fcSGreg Kurz }
246dcb556fcSGreg Kurz 
247330a21e3SGreg Kurz int ics_set_kvm_state_one(ICSState *ics, int srcno, Error **errp)
24811ad93f6SDavid Gibson {
24911ad93f6SDavid Gibson     uint64_t state;
2506cead90cSGreg Kurz     ICSIRQState *irq = &ics->irqs[srcno];
25111ad93f6SDavid Gibson     int ret;
25211ad93f6SDavid Gibson 
2533bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
2543bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
2553bf84e99SCédric Le Goater         return 0;
2563bf84e99SCédric Le Goater     }
2573bf84e99SCédric Le Goater 
25811ad93f6SDavid Gibson     state = irq->server;
25911ad93f6SDavid Gibson     state |= (uint64_t)(irq->saved_priority & KVM_XICS_PRIORITY_MASK)
26011ad93f6SDavid Gibson         << KVM_XICS_PRIORITY_SHIFT;
26111ad93f6SDavid Gibson     if (irq->priority != irq->saved_priority) {
26211ad93f6SDavid Gibson         assert(irq->priority == 0xff);
26338298611SGreg Kurz     }
26438298611SGreg Kurz 
26538298611SGreg Kurz     if (irq->priority == 0xff) {
26611ad93f6SDavid Gibson         state |= KVM_XICS_MASKED;
26711ad93f6SDavid Gibson     }
26811ad93f6SDavid Gibson 
2696cead90cSGreg Kurz     if (irq->flags & XICS_FLAGS_IRQ_LSI) {
27011ad93f6SDavid Gibson         state |= KVM_XICS_LEVEL_SENSITIVE;
27111ad93f6SDavid Gibson         if (irq->status & XICS_STATUS_ASSERTED) {
27211ad93f6SDavid Gibson             state |= KVM_XICS_PENDING;
27311ad93f6SDavid Gibson         }
27411ad93f6SDavid Gibson     } else {
27511ad93f6SDavid Gibson         if (irq->status & XICS_STATUS_MASKED_PENDING) {
27611ad93f6SDavid Gibson             state |= KVM_XICS_PENDING;
27711ad93f6SDavid Gibson         }
27811ad93f6SDavid Gibson     }
279229e16fdSSam Bobroff     if (irq->status & XICS_STATUS_PRESENTED) {
280229e16fdSSam Bobroff         state |= KVM_XICS_PRESENTED;
281229e16fdSSam Bobroff     }
282229e16fdSSam Bobroff     if (irq->status & XICS_STATUS_QUEUED) {
283229e16fdSSam Bobroff         state |= KVM_XICS_QUEUED;
284229e16fdSSam Bobroff     }
28511ad93f6SDavid Gibson 
28652b43881SCédric Le Goater     ret = kvm_device_access(kernel_xics_fd, KVM_DEV_XICS_GRP_SOURCES,
287330a21e3SGreg Kurz                             srcno + ics->offset, &state, true, errp);
288330a21e3SGreg Kurz     if (ret < 0) {
28911ad93f6SDavid Gibson         return ret;
29011ad93f6SDavid Gibson     }
2916cead90cSGreg Kurz 
2926cead90cSGreg Kurz     return 0;
2936cead90cSGreg Kurz }
2946cead90cSGreg Kurz 
295330a21e3SGreg Kurz int ics_set_kvm_state(ICSState *ics, Error **errp)
2966cead90cSGreg Kurz {
2976cead90cSGreg Kurz     int i;
2986cead90cSGreg Kurz 
2993bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
3003bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
3013bf84e99SCédric Le Goater         return 0;
3023bf84e99SCédric Le Goater     }
3033bf84e99SCédric Le Goater 
3046cead90cSGreg Kurz     for (i = 0; i < ics->nr_irqs; i++) {
305330a21e3SGreg Kurz         Error *local_err = NULL;
3066cead90cSGreg Kurz         int ret;
3076cead90cSGreg Kurz 
308*4c3539d4SCédric Le Goater         if (ics_irq_free(ics, i)) {
309*4c3539d4SCédric Le Goater             continue;
310*4c3539d4SCédric Le Goater         }
311*4c3539d4SCédric Le Goater 
312330a21e3SGreg Kurz         ret = ics_set_kvm_state_one(ics, i, &local_err);
313330a21e3SGreg Kurz         if (ret < 0) {
314330a21e3SGreg Kurz             error_propagate(errp, local_err);
3156cead90cSGreg Kurz             return ret;
3166cead90cSGreg Kurz         }
31711ad93f6SDavid Gibson     }
31811ad93f6SDavid Gibson 
31911ad93f6SDavid Gibson     return 0;
32011ad93f6SDavid Gibson }
32111ad93f6SDavid Gibson 
322557b4567SGreg Kurz void ics_kvm_set_irq(ICSState *ics, int srcno, int val)
32311ad93f6SDavid Gibson {
32411ad93f6SDavid Gibson     struct kvm_irq_level args;
32511ad93f6SDavid Gibson     int rc;
32611ad93f6SDavid Gibson 
3273bf84e99SCédric Le Goater     /* The KVM XICS device should be in use */
3283bf84e99SCédric Le Goater     assert(kernel_xics_fd != -1);
3293bf84e99SCédric Le Goater 
33011ad93f6SDavid Gibson     args.irq = srcno + ics->offset;
3314af88944SAlexey Kardashevskiy     if (ics->irqs[srcno].flags & XICS_FLAGS_IRQ_MSI) {
33211ad93f6SDavid Gibson         if (!val) {
33311ad93f6SDavid Gibson             return;
33411ad93f6SDavid Gibson         }
33511ad93f6SDavid Gibson         args.level = KVM_INTERRUPT_SET;
33611ad93f6SDavid Gibson     } else {
33711ad93f6SDavid Gibson         args.level = val ? KVM_INTERRUPT_SET_LEVEL : KVM_INTERRUPT_UNSET;
33811ad93f6SDavid Gibson     }
33911ad93f6SDavid Gibson     rc = kvm_vm_ioctl(kvm_state, KVM_IRQ_LINE, &args);
34011ad93f6SDavid Gibson     if (rc < 0) {
34111ad93f6SDavid Gibson         perror("kvm_irq_line");
34211ad93f6SDavid Gibson     }
34311ad93f6SDavid Gibson }
34411ad93f6SDavid Gibson 
345eab9f191SGreg Kurz int xics_kvm_connect(SpaprMachineState *spapr, Error **errp)
34611ad93f6SDavid Gibson {
347817bb6a4SCédric Le Goater     int rc;
3483f777abcSCédric Le Goater     CPUState *cs;
3493f777abcSCédric Le Goater     Error *local_err = NULL;
3503f777abcSCédric Le Goater 
3513f777abcSCédric Le Goater     /*
3523f777abcSCédric Le Goater      * The KVM XICS device already in use. This is the case when
3533f777abcSCédric Le Goater      * rebooting under the XICS-only interrupt mode.
3543f777abcSCédric Le Goater      */
3553f777abcSCédric Le Goater     if (kernel_xics_fd != -1) {
3563f777abcSCédric Le Goater         return 0;
3573f777abcSCédric Le Goater     }
35811ad93f6SDavid Gibson 
35911ad93f6SDavid Gibson     if (!kvm_enabled() || !kvm_check_extension(kvm_state, KVM_CAP_IRQ_XICS)) {
36011ad93f6SDavid Gibson         error_setg(errp,
36111ad93f6SDavid Gibson                    "KVM and IRQ_XICS capability must be present for in-kernel XICS");
36264fb9621SGreg Kurz         return -1;
36311ad93f6SDavid Gibson     }
36411ad93f6SDavid Gibson 
3653a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_SET_XIVE, "ibm,set-xive");
36611ad93f6SDavid Gibson     if (rc < 0) {
367ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
368ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,set-xive");
36911ad93f6SDavid Gibson         goto fail;
37011ad93f6SDavid Gibson     }
37111ad93f6SDavid Gibson 
3723a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_GET_XIVE, "ibm,get-xive");
37311ad93f6SDavid Gibson     if (rc < 0) {
374ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
375ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,get-xive");
37611ad93f6SDavid Gibson         goto fail;
37711ad93f6SDavid Gibson     }
37811ad93f6SDavid Gibson 
3793a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_INT_ON, "ibm,int-on");
38011ad93f6SDavid Gibson     if (rc < 0) {
381ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
382ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,int-on");
38311ad93f6SDavid Gibson         goto fail;
38411ad93f6SDavid Gibson     }
38511ad93f6SDavid Gibson 
3863a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_INT_OFF, "ibm,int-off");
38711ad93f6SDavid Gibson     if (rc < 0) {
388ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
389ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,int-off");
39011ad93f6SDavid Gibson         goto fail;
39111ad93f6SDavid Gibson     }
39211ad93f6SDavid Gibson 
393bf358b54SCédric Le Goater     /* Create the KVM XICS device */
394bf358b54SCédric Le Goater     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
39511ad93f6SDavid Gibson     if (rc < 0) {
396ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc, "Error on KVM_CREATE_DEVICE for XICS");
39711ad93f6SDavid Gibson         goto fail;
39811ad93f6SDavid Gibson     }
39911ad93f6SDavid Gibson 
400bf358b54SCédric Le Goater     kernel_xics_fd = rc;
4019554233cSAlexey Kardashevskiy     kvm_kernel_irqchip = true;
4029554233cSAlexey Kardashevskiy     kvm_msi_via_irqfd_allowed = true;
4039554233cSAlexey Kardashevskiy     kvm_gsi_direct_mapping = true;
4049554233cSAlexey Kardashevskiy 
4053f777abcSCédric Le Goater     /* Create the presenters */
4063f777abcSCédric Le Goater     CPU_FOREACH(cs) {
4073f777abcSCédric Le Goater         PowerPCCPU *cpu = POWERPC_CPU(cs);
4083f777abcSCédric Le Goater 
4093f777abcSCédric Le Goater         icp_kvm_realize(DEVICE(spapr_cpu_state(cpu)->icp), &local_err);
4103f777abcSCédric Le Goater         if (local_err) {
4113f777abcSCédric Le Goater             goto fail;
4123f777abcSCédric Le Goater         }
4133f777abcSCédric Le Goater     }
4143f777abcSCédric Le Goater 
4153f777abcSCédric Le Goater     /* Update the KVM sources */
416330a21e3SGreg Kurz     ics_set_kvm_state(spapr->ics, &local_err);
417330a21e3SGreg Kurz     if (local_err) {
418330a21e3SGreg Kurz         goto fail;
419330a21e3SGreg Kurz     }
4203f777abcSCédric Le Goater 
4213f777abcSCédric Le Goater     /* Connect the presenters to the initial VCPUs of the machine */
4223f777abcSCédric Le Goater     CPU_FOREACH(cs) {
4233f777abcSCédric Le Goater         PowerPCCPU *cpu = POWERPC_CPU(cs);
424330a21e3SGreg Kurz         icp_set_kvm_state(spapr_cpu_state(cpu)->icp, &local_err);
425330a21e3SGreg Kurz         if (local_err) {
426330a21e3SGreg Kurz             goto fail;
427330a21e3SGreg Kurz         }
4283f777abcSCédric Le Goater     }
4293f777abcSCédric Le Goater 
430bf358b54SCédric Le Goater     return 0;
43111ad93f6SDavid Gibson 
43211ad93f6SDavid Gibson fail:
433ab3d15faSGreg Kurz     error_propagate(errp, local_err);
4344812f261SGreg Kurz     xics_kvm_disconnect(spapr, NULL);
4352192a930SCédric Le Goater     return -1;
43611ad93f6SDavid Gibson }
43756b11587SCédric Le Goater 
43856b11587SCédric Le Goater void xics_kvm_disconnect(SpaprMachineState *spapr, Error **errp)
43956b11587SCédric Le Goater {
44056b11587SCédric Le Goater     /*
44156b11587SCédric Le Goater      * Only on P9 using the XICS-on XIVE KVM device:
44256b11587SCédric Le Goater      *
44356b11587SCédric Le Goater      * When the KVM device fd is closed, the device is destroyed and
44456b11587SCédric Le Goater      * removed from the list of devices of the VM. The VCPU presenters
44556b11587SCédric Le Goater      * are also detached from the device.
44656b11587SCédric Le Goater      */
4474812f261SGreg Kurz     if (kernel_xics_fd != -1) {
44856b11587SCédric Le Goater         close(kernel_xics_fd);
44956b11587SCédric Le Goater         kernel_xics_fd = -1;
4504812f261SGreg Kurz     }
45156b11587SCédric Le Goater 
45256b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,set-xive");
45356b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,get-xive");
45456b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,int-on");
45556b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,int-off");
45656b11587SCédric Le Goater 
45756b11587SCédric Le Goater     kvm_kernel_irqchip = false;
45856b11587SCédric Le Goater     kvm_msi_via_irqfd_allowed = false;
45956b11587SCédric Le Goater     kvm_gsi_direct_mapping = false;
46056b11587SCédric Le Goater 
46156b11587SCédric Le Goater     /* Clear the presenter from the VCPUs */
46256b11587SCédric Le Goater     kvm_disable_icps();
46356b11587SCédric Le Goater }
4647abc0c6dSGreg Kurz 
4657abc0c6dSGreg Kurz /*
4667abc0c6dSGreg Kurz  * This is a heuristic to detect older KVMs on POWER9 hosts that don't
4677abc0c6dSGreg Kurz  * support destruction of a KVM XICS device while the VM is running.
4687abc0c6dSGreg Kurz  * Required to start a spapr machine with ic-mode=dual,kernel-irqchip=on.
4697abc0c6dSGreg Kurz  */
4707abc0c6dSGreg Kurz bool xics_kvm_has_broken_disconnect(SpaprMachineState *spapr)
4717abc0c6dSGreg Kurz {
4727abc0c6dSGreg Kurz     int rc;
4737abc0c6dSGreg Kurz 
4747abc0c6dSGreg Kurz     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
4757abc0c6dSGreg Kurz     if (rc < 0) {
4767abc0c6dSGreg Kurz         /*
4777abc0c6dSGreg Kurz          * The error is ignored on purpose. The KVM XICS setup code
4787abc0c6dSGreg Kurz          * will catch it again anyway. The goal here is to see if
4797abc0c6dSGreg Kurz          * close() actually destroys the device or not.
4807abc0c6dSGreg Kurz          */
4817abc0c6dSGreg Kurz         return false;
4827abc0c6dSGreg Kurz     }
4837abc0c6dSGreg Kurz 
4847abc0c6dSGreg Kurz     close(rc);
4857abc0c6dSGreg Kurz 
4867abc0c6dSGreg Kurz     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
4877abc0c6dSGreg Kurz     if (rc >= 0) {
4887abc0c6dSGreg Kurz         close(rc);
4897abc0c6dSGreg Kurz         return false;
4907abc0c6dSGreg Kurz     }
4917abc0c6dSGreg Kurz 
4927abc0c6dSGreg Kurz     return errno == EEXIST;
4937abc0c6dSGreg Kurz }
494