xref: /qemu/hw/intc/xics_kvm.c (revision 668f62ec621e4e2919fb7d4caa5d805764c5852d)
/*
 * QEMU PowerPC pSeries Logical Partition (aka sPAPR) hardware System Emulator
 *
 * PAPR Virtualized Interrupt System, aka ICS/ICP aka xics, in-kernel emulation
 *
 * Copyright (c) 2013 David Gibson, IBM Corporation.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 *
 */
2711ad93f6SDavid Gibson 
280d75590dSPeter Maydell #include "qemu/osdep.h"
29da34e65cSMarkus Armbruster #include "qapi/error.h"
304771d756SPaolo Bonzini #include "qemu-common.h"
314771d756SPaolo Bonzini #include "cpu.h"
3211ad93f6SDavid Gibson #include "trace.h"
3377ac58ddSPaolo Bonzini #include "sysemu/kvm.h"
3411ad93f6SDavid Gibson #include "hw/ppc/spapr.h"
353f777abcSCédric Le Goater #include "hw/ppc/spapr_cpu_core.h"
3611ad93f6SDavid Gibson #include "hw/ppc/xics.h"
37a51d5afcSThomas Huth #include "hw/ppc/xics_spapr.h"
3811ad93f6SDavid Gibson #include "kvm_ppc.h"
3911ad93f6SDavid Gibson #include "qemu/config-file.h"
4011ad93f6SDavid Gibson #include "qemu/error-report.h"
4111ad93f6SDavid Gibson 
4211ad93f6SDavid Gibson #include <sys/ioctl.h>
4311ad93f6SDavid Gibson 
44729f8a4fSCédric Le Goater static int kernel_xics_fd = -1;
45729f8a4fSCédric Le Goater 
46de86ecccSGreg Kurz typedef struct KVMEnabledICP {
47de86ecccSGreg Kurz     unsigned long vcpu_id;
48de86ecccSGreg Kurz     QLIST_ENTRY(KVMEnabledICP) node;
49de86ecccSGreg Kurz } KVMEnabledICP;
50de86ecccSGreg Kurz 
51de86ecccSGreg Kurz static QLIST_HEAD(, KVMEnabledICP)
52de86ecccSGreg Kurz     kvm_enabled_icps = QLIST_HEAD_INITIALIZER(&kvm_enabled_icps);
53de86ecccSGreg Kurz 
5456b11587SCédric Le Goater static void kvm_disable_icps(void)
5556b11587SCédric Le Goater {
5656b11587SCédric Le Goater     KVMEnabledICP *enabled_icp, *next;
5756b11587SCédric Le Goater 
5856b11587SCédric Le Goater     QLIST_FOREACH_SAFE(enabled_icp, &kvm_enabled_icps, node, next) {
5956b11587SCédric Le Goater         QLIST_REMOVE(enabled_icp, node);
6056b11587SCédric Le Goater         g_free(enabled_icp);
6156b11587SCédric Le Goater     }
6256b11587SCédric Le Goater }
6356b11587SCédric Le Goater 
/*
 * ICP-KVM
 */
670e5c7fadSGreg Kurz void icp_get_kvm_state(ICPState *icp)
6811ad93f6SDavid Gibson {
6911ad93f6SDavid Gibson     uint64_t state;
7011ad93f6SDavid Gibson     int ret;
7111ad93f6SDavid Gibson 
723bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
733bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
743bf84e99SCédric Le Goater         return;
753bf84e99SCédric Le Goater     }
763bf84e99SCédric Le Goater 
7711ad93f6SDavid Gibson     /* ICP for this CPU thread is not in use, exiting */
788e4fba20SCédric Le Goater     if (!icp->cs) {
7911ad93f6SDavid Gibson         return;
8011ad93f6SDavid Gibson     }
8111ad93f6SDavid Gibson 
82bf358b54SCédric Le Goater     ret = kvm_get_one_reg(icp->cs, KVM_REG_PPC_ICP_STATE, &state);
8311ad93f6SDavid Gibson     if (ret != 0) {
8411ad93f6SDavid Gibson         error_report("Unable to retrieve KVM interrupt controller state"
858e4fba20SCédric Le Goater                 " for CPU %ld: %s", kvm_arch_vcpu_id(icp->cs), strerror(errno));
8611ad93f6SDavid Gibson         exit(1);
8711ad93f6SDavid Gibson     }
8811ad93f6SDavid Gibson 
898e4fba20SCédric Le Goater     icp->xirr = state >> KVM_REG_PPC_ICP_XISR_SHIFT;
908e4fba20SCédric Le Goater     icp->mfrr = (state >> KVM_REG_PPC_ICP_MFRR_SHIFT)
9111ad93f6SDavid Gibson         & KVM_REG_PPC_ICP_MFRR_MASK;
928e4fba20SCédric Le Goater     icp->pending_priority = (state >> KVM_REG_PPC_ICP_PPRI_SHIFT)
9311ad93f6SDavid Gibson         & KVM_REG_PPC_ICP_PPRI_MASK;
9411ad93f6SDavid Gibson }
9511ad93f6SDavid Gibson 
96dcb556fcSGreg Kurz static void do_icp_synchronize_state(CPUState *cpu, run_on_cpu_data arg)
97dcb556fcSGreg Kurz {
98dcb556fcSGreg Kurz     icp_get_kvm_state(arg.host_ptr);
99dcb556fcSGreg Kurz }
100dcb556fcSGreg Kurz 
1010e5c7fadSGreg Kurz void icp_synchronize_state(ICPState *icp)
102dcb556fcSGreg Kurz {
103dcb556fcSGreg Kurz     if (icp->cs) {
104dcb556fcSGreg Kurz         run_on_cpu(icp->cs, do_icp_synchronize_state, RUN_ON_CPU_HOST_PTR(icp));
105dcb556fcSGreg Kurz     }
106dcb556fcSGreg Kurz }
107dcb556fcSGreg Kurz 
108330a21e3SGreg Kurz int icp_set_kvm_state(ICPState *icp, Error **errp)
10911ad93f6SDavid Gibson {
11011ad93f6SDavid Gibson     uint64_t state;
11111ad93f6SDavid Gibson     int ret;
11211ad93f6SDavid Gibson 
1133bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
1143bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
1153bf84e99SCédric Le Goater         return 0;
1163bf84e99SCédric Le Goater     }
1173bf84e99SCédric Le Goater 
11811ad93f6SDavid Gibson     /* ICP for this CPU thread is not in use, exiting */
1198e4fba20SCédric Le Goater     if (!icp->cs) {
12011ad93f6SDavid Gibson         return 0;
12111ad93f6SDavid Gibson     }
12211ad93f6SDavid Gibson 
1238e4fba20SCédric Le Goater     state = ((uint64_t)icp->xirr << KVM_REG_PPC_ICP_XISR_SHIFT)
1248e4fba20SCédric Le Goater         | ((uint64_t)icp->mfrr << KVM_REG_PPC_ICP_MFRR_SHIFT)
1258e4fba20SCédric Le Goater         | ((uint64_t)icp->pending_priority << KVM_REG_PPC_ICP_PPRI_SHIFT);
12611ad93f6SDavid Gibson 
127bf358b54SCédric Le Goater     ret = kvm_set_one_reg(icp->cs, KVM_REG_PPC_ICP_STATE, &state);
128330a21e3SGreg Kurz     if (ret < 0) {
129330a21e3SGreg Kurz         error_setg_errno(errp, -ret,
130330a21e3SGreg Kurz                          "Unable to restore KVM interrupt controller state (0x%"
131330a21e3SGreg Kurz                          PRIx64 ") for CPU %ld", state,
132330a21e3SGreg Kurz                          kvm_arch_vcpu_id(icp->cs));
13311ad93f6SDavid Gibson         return ret;
13411ad93f6SDavid Gibson     }
13511ad93f6SDavid Gibson 
13611ad93f6SDavid Gibson     return 0;
13711ad93f6SDavid Gibson }
13811ad93f6SDavid Gibson 
1398e6e6efeSGreg Kurz void icp_kvm_realize(DeviceState *dev, Error **errp)
140f0232434SCédric Le Goater {
141a028dd42SCédric Le Goater     ICPState *icp = ICP(dev);
142a028dd42SCédric Le Goater     CPUState *cs;
143de86ecccSGreg Kurz     KVMEnabledICP *enabled_icp;
144a028dd42SCédric Le Goater     unsigned long vcpu_id;
145f0232434SCédric Le Goater     int ret;
146f0232434SCédric Le Goater 
1473bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
148f0232434SCédric Le Goater     if (kernel_xics_fd == -1) {
1493bf84e99SCédric Le Goater         return;
150f0232434SCédric Le Goater     }
151f0232434SCédric Le Goater 
152a028dd42SCédric Le Goater     cs = icp->cs;
153a028dd42SCédric Le Goater     vcpu_id = kvm_arch_vcpu_id(cs);
154a028dd42SCédric Le Goater 
155f0232434SCédric Le Goater     /*
156f0232434SCédric Le Goater      * If we are reusing a parked vCPU fd corresponding to the CPU
157f0232434SCédric Le Goater      * which was hot-removed earlier we don't have to renable
158f0232434SCédric Le Goater      * KVM_CAP_IRQ_XICS capability again.
159f0232434SCédric Le Goater      */
160de86ecccSGreg Kurz     QLIST_FOREACH(enabled_icp, &kvm_enabled_icps, node) {
161de86ecccSGreg Kurz         if (enabled_icp->vcpu_id == vcpu_id) {
162f0232434SCédric Le Goater             return;
163f0232434SCédric Le Goater         }
164de86ecccSGreg Kurz     }
165f0232434SCédric Le Goater 
166de86ecccSGreg Kurz     ret = kvm_vcpu_enable_cap(cs, KVM_CAP_IRQ_XICS, 0, kernel_xics_fd, vcpu_id);
167f0232434SCédric Le Goater     if (ret < 0) {
168894ea3ecSGreg Kurz         Error *local_err = NULL;
169894ea3ecSGreg Kurz 
170894ea3ecSGreg Kurz         error_setg(&local_err, "Unable to connect CPU%ld to kernel XICS: %s",
171894ea3ecSGreg Kurz                    vcpu_id, strerror(errno));
172894ea3ecSGreg Kurz         if (errno == ENOSPC) {
173894ea3ecSGreg Kurz             error_append_hint(&local_err, "Try -smp maxcpus=N with N < %u\n",
174894ea3ecSGreg Kurz                               MACHINE(qdev_get_machine())->smp.max_cpus);
175894ea3ecSGreg Kurz         }
176894ea3ecSGreg Kurz         error_propagate(errp, local_err);
177b1fd36c3SGreg Kurz         return;
178f0232434SCédric Le Goater     }
179de86ecccSGreg Kurz     enabled_icp = g_malloc(sizeof(*enabled_icp));
180de86ecccSGreg Kurz     enabled_icp->vcpu_id = vcpu_id;
181de86ecccSGreg Kurz     QLIST_INSERT_HEAD(&kvm_enabled_icps, enabled_icp, node);
182f0232434SCédric Le Goater }
183f0232434SCédric Le Goater 
/*
 * ICS-KVM
 */
187d80b2ccfSGreg Kurz void ics_get_kvm_state(ICSState *ics)
18811ad93f6SDavid Gibson {
18911ad93f6SDavid Gibson     uint64_t state;
19011ad93f6SDavid Gibson     int i;
19111ad93f6SDavid Gibson 
1923bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
1933bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
1943bf84e99SCédric Le Goater         return;
1953bf84e99SCédric Le Goater     }
1963bf84e99SCédric Le Goater 
19711ad93f6SDavid Gibson     for (i = 0; i < ics->nr_irqs; i++) {
19811ad93f6SDavid Gibson         ICSIRQState *irq = &ics->irqs[i];
19911ad93f6SDavid Gibson 
2004c3539d4SCédric Le Goater         if (ics_irq_free(ics, i)) {
2014c3539d4SCédric Le Goater             continue;
2024c3539d4SCédric Le Goater         }
2034c3539d4SCédric Le Goater 
204bf358b54SCédric Le Goater         kvm_device_access(kernel_xics_fd, KVM_DEV_XICS_GRP_SOURCES,
20550beeb68SMarkus Armbruster                           i + ics->offset, &state, false, &error_fatal);
20611ad93f6SDavid Gibson 
20711ad93f6SDavid Gibson         irq->server = state & KVM_XICS_DESTINATION_MASK;
20811ad93f6SDavid Gibson         irq->saved_priority = (state >> KVM_XICS_PRIORITY_SHIFT)
20911ad93f6SDavid Gibson             & KVM_XICS_PRIORITY_MASK;
21011ad93f6SDavid Gibson         /*
21111ad93f6SDavid Gibson          * To be consistent with the software emulation in xics.c, we
21211ad93f6SDavid Gibson          * split out the masked state + priority that we get from the
21311ad93f6SDavid Gibson          * kernel into 'current priority' (0xff if masked) and
21411ad93f6SDavid Gibson          * 'saved priority' (if masked, this is the priority the
21511ad93f6SDavid Gibson          * interrupt had before it was masked).  Masking and unmasking
21611ad93f6SDavid Gibson          * are done with the ibm,int-off and ibm,int-on RTAS calls.
21711ad93f6SDavid Gibson          */
21811ad93f6SDavid Gibson         if (state & KVM_XICS_MASKED) {
21911ad93f6SDavid Gibson             irq->priority = 0xff;
22011ad93f6SDavid Gibson         } else {
22111ad93f6SDavid Gibson             irq->priority = irq->saved_priority;
22211ad93f6SDavid Gibson         }
22311ad93f6SDavid Gibson 
224063cb7cbSSam Bobroff         irq->status = 0;
22511ad93f6SDavid Gibson         if (state & KVM_XICS_PENDING) {
22611ad93f6SDavid Gibson             if (state & KVM_XICS_LEVEL_SENSITIVE) {
22711ad93f6SDavid Gibson                 irq->status |= XICS_STATUS_ASSERTED;
22811ad93f6SDavid Gibson             } else {
22911ad93f6SDavid Gibson                 /*
23011ad93f6SDavid Gibson                  * A pending edge-triggered interrupt (or MSI)
23111ad93f6SDavid Gibson                  * must have been rejected previously when we
23211ad93f6SDavid Gibson                  * first detected it and tried to deliver it,
23311ad93f6SDavid Gibson                  * so mark it as pending and previously rejected
23411ad93f6SDavid Gibson                  * for consistency with how xics.c works.
23511ad93f6SDavid Gibson                  */
23611ad93f6SDavid Gibson                 irq->status |= XICS_STATUS_MASKED_PENDING
23711ad93f6SDavid Gibson                     | XICS_STATUS_REJECTED;
23811ad93f6SDavid Gibson             }
23911ad93f6SDavid Gibson         }
240229e16fdSSam Bobroff         if (state & KVM_XICS_PRESENTED) {
241229e16fdSSam Bobroff                 irq->status |= XICS_STATUS_PRESENTED;
242229e16fdSSam Bobroff         }
243229e16fdSSam Bobroff         if (state & KVM_XICS_QUEUED) {
244229e16fdSSam Bobroff                 irq->status |= XICS_STATUS_QUEUED;
245229e16fdSSam Bobroff         }
24611ad93f6SDavid Gibson     }
24711ad93f6SDavid Gibson }
24811ad93f6SDavid Gibson 
249d80b2ccfSGreg Kurz void ics_synchronize_state(ICSState *ics)
250dcb556fcSGreg Kurz {
251dcb556fcSGreg Kurz     ics_get_kvm_state(ics);
252dcb556fcSGreg Kurz }
253dcb556fcSGreg Kurz 
254330a21e3SGreg Kurz int ics_set_kvm_state_one(ICSState *ics, int srcno, Error **errp)
25511ad93f6SDavid Gibson {
25611ad93f6SDavid Gibson     uint64_t state;
2576cead90cSGreg Kurz     ICSIRQState *irq = &ics->irqs[srcno];
25811ad93f6SDavid Gibson     int ret;
25911ad93f6SDavid Gibson 
2603bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
2613bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
2623bf84e99SCédric Le Goater         return 0;
2633bf84e99SCédric Le Goater     }
2643bf84e99SCédric Le Goater 
26511ad93f6SDavid Gibson     state = irq->server;
26611ad93f6SDavid Gibson     state |= (uint64_t)(irq->saved_priority & KVM_XICS_PRIORITY_MASK)
26711ad93f6SDavid Gibson         << KVM_XICS_PRIORITY_SHIFT;
26811ad93f6SDavid Gibson     if (irq->priority != irq->saved_priority) {
26911ad93f6SDavid Gibson         assert(irq->priority == 0xff);
27038298611SGreg Kurz     }
27138298611SGreg Kurz 
27238298611SGreg Kurz     if (irq->priority == 0xff) {
27311ad93f6SDavid Gibson         state |= KVM_XICS_MASKED;
27411ad93f6SDavid Gibson     }
27511ad93f6SDavid Gibson 
2766cead90cSGreg Kurz     if (irq->flags & XICS_FLAGS_IRQ_LSI) {
27711ad93f6SDavid Gibson         state |= KVM_XICS_LEVEL_SENSITIVE;
27811ad93f6SDavid Gibson         if (irq->status & XICS_STATUS_ASSERTED) {
27911ad93f6SDavid Gibson             state |= KVM_XICS_PENDING;
28011ad93f6SDavid Gibson         }
28111ad93f6SDavid Gibson     } else {
28211ad93f6SDavid Gibson         if (irq->status & XICS_STATUS_MASKED_PENDING) {
28311ad93f6SDavid Gibson             state |= KVM_XICS_PENDING;
28411ad93f6SDavid Gibson         }
28511ad93f6SDavid Gibson     }
286229e16fdSSam Bobroff     if (irq->status & XICS_STATUS_PRESENTED) {
287229e16fdSSam Bobroff         state |= KVM_XICS_PRESENTED;
288229e16fdSSam Bobroff     }
289229e16fdSSam Bobroff     if (irq->status & XICS_STATUS_QUEUED) {
290229e16fdSSam Bobroff         state |= KVM_XICS_QUEUED;
291229e16fdSSam Bobroff     }
29211ad93f6SDavid Gibson 
29352b43881SCédric Le Goater     ret = kvm_device_access(kernel_xics_fd, KVM_DEV_XICS_GRP_SOURCES,
294330a21e3SGreg Kurz                             srcno + ics->offset, &state, true, errp);
295330a21e3SGreg Kurz     if (ret < 0) {
29611ad93f6SDavid Gibson         return ret;
29711ad93f6SDavid Gibson     }
2986cead90cSGreg Kurz 
2996cead90cSGreg Kurz     return 0;
3006cead90cSGreg Kurz }
3016cead90cSGreg Kurz 
302330a21e3SGreg Kurz int ics_set_kvm_state(ICSState *ics, Error **errp)
3036cead90cSGreg Kurz {
3046cead90cSGreg Kurz     int i;
3056cead90cSGreg Kurz 
3063bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
3073bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
3083bf84e99SCédric Le Goater         return 0;
3093bf84e99SCédric Le Goater     }
3103bf84e99SCédric Le Goater 
3116cead90cSGreg Kurz     for (i = 0; i < ics->nr_irqs; i++) {
3126cead90cSGreg Kurz         int ret;
3136cead90cSGreg Kurz 
3144c3539d4SCédric Le Goater         if (ics_irq_free(ics, i)) {
3154c3539d4SCédric Le Goater             continue;
3164c3539d4SCédric Le Goater         }
3174c3539d4SCédric Le Goater 
318*668f62ecSMarkus Armbruster         ret = ics_set_kvm_state_one(ics, i, errp);
319330a21e3SGreg Kurz         if (ret < 0) {
3206cead90cSGreg Kurz             return ret;
3216cead90cSGreg Kurz         }
32211ad93f6SDavid Gibson     }
32311ad93f6SDavid Gibson 
32411ad93f6SDavid Gibson     return 0;
32511ad93f6SDavid Gibson }
32611ad93f6SDavid Gibson 
327557b4567SGreg Kurz void ics_kvm_set_irq(ICSState *ics, int srcno, int val)
32811ad93f6SDavid Gibson {
32911ad93f6SDavid Gibson     struct kvm_irq_level args;
33011ad93f6SDavid Gibson     int rc;
33111ad93f6SDavid Gibson 
3323bf84e99SCédric Le Goater     /* The KVM XICS device should be in use */
3333bf84e99SCédric Le Goater     assert(kernel_xics_fd != -1);
3343bf84e99SCédric Le Goater 
33511ad93f6SDavid Gibson     args.irq = srcno + ics->offset;
3364af88944SAlexey Kardashevskiy     if (ics->irqs[srcno].flags & XICS_FLAGS_IRQ_MSI) {
33711ad93f6SDavid Gibson         if (!val) {
33811ad93f6SDavid Gibson             return;
33911ad93f6SDavid Gibson         }
34011ad93f6SDavid Gibson         args.level = KVM_INTERRUPT_SET;
34111ad93f6SDavid Gibson     } else {
34211ad93f6SDavid Gibson         args.level = val ? KVM_INTERRUPT_SET_LEVEL : KVM_INTERRUPT_UNSET;
34311ad93f6SDavid Gibson     }
34411ad93f6SDavid Gibson     rc = kvm_vm_ioctl(kvm_state, KVM_IRQ_LINE, &args);
34511ad93f6SDavid Gibson     if (rc < 0) {
34611ad93f6SDavid Gibson         perror("kvm_irq_line");
34711ad93f6SDavid Gibson     }
34811ad93f6SDavid Gibson }
34911ad93f6SDavid Gibson 
3504ffb7496SGreg Kurz int xics_kvm_connect(SpaprInterruptController *intc, uint32_t nr_servers,
3514ffb7496SGreg Kurz                      Error **errp)
35211ad93f6SDavid Gibson {
35398a39a79SDavid Gibson     ICSState *ics = ICS_SPAPR(intc);
354817bb6a4SCédric Le Goater     int rc;
3553f777abcSCédric Le Goater     CPUState *cs;
3563f777abcSCédric Le Goater     Error *local_err = NULL;
3573f777abcSCédric Le Goater 
3583f777abcSCédric Le Goater     /*
3593f777abcSCédric Le Goater      * The KVM XICS device already in use. This is the case when
3603f777abcSCédric Le Goater      * rebooting under the XICS-only interrupt mode.
3613f777abcSCédric Le Goater      */
3623f777abcSCédric Le Goater     if (kernel_xics_fd != -1) {
3633f777abcSCédric Le Goater         return 0;
3643f777abcSCédric Le Goater     }
36511ad93f6SDavid Gibson 
36611ad93f6SDavid Gibson     if (!kvm_enabled() || !kvm_check_extension(kvm_state, KVM_CAP_IRQ_XICS)) {
36711ad93f6SDavid Gibson         error_setg(errp,
36811ad93f6SDavid Gibson                    "KVM and IRQ_XICS capability must be present for in-kernel XICS");
36964fb9621SGreg Kurz         return -1;
37011ad93f6SDavid Gibson     }
37111ad93f6SDavid Gibson 
3723a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_SET_XIVE, "ibm,set-xive");
37311ad93f6SDavid Gibson     if (rc < 0) {
374ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
375ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,set-xive");
37611ad93f6SDavid Gibson         goto fail;
37711ad93f6SDavid Gibson     }
37811ad93f6SDavid Gibson 
3793a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_GET_XIVE, "ibm,get-xive");
38011ad93f6SDavid Gibson     if (rc < 0) {
381ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
382ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,get-xive");
38311ad93f6SDavid Gibson         goto fail;
38411ad93f6SDavid Gibson     }
38511ad93f6SDavid Gibson 
3863a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_INT_ON, "ibm,int-on");
38711ad93f6SDavid Gibson     if (rc < 0) {
388ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
389ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,int-on");
39011ad93f6SDavid Gibson         goto fail;
39111ad93f6SDavid Gibson     }
39211ad93f6SDavid Gibson 
3933a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_INT_OFF, "ibm,int-off");
39411ad93f6SDavid Gibson     if (rc < 0) {
395ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
396ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,int-off");
39711ad93f6SDavid Gibson         goto fail;
39811ad93f6SDavid Gibson     }
39911ad93f6SDavid Gibson 
400bf358b54SCédric Le Goater     /* Create the KVM XICS device */
401bf358b54SCédric Le Goater     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
40211ad93f6SDavid Gibson     if (rc < 0) {
403ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc, "Error on KVM_CREATE_DEVICE for XICS");
40411ad93f6SDavid Gibson         goto fail;
40511ad93f6SDavid Gibson     }
40611ad93f6SDavid Gibson 
407894ea3ecSGreg Kurz     /* Tell KVM about the # of VCPUs we may have (POWER9 and newer only) */
408894ea3ecSGreg Kurz     if (kvm_device_check_attr(rc, KVM_DEV_XICS_GRP_CTRL,
409894ea3ecSGreg Kurz                               KVM_DEV_XICS_NR_SERVERS)) {
410894ea3ecSGreg Kurz         if (kvm_device_access(rc, KVM_DEV_XICS_GRP_CTRL,
411894ea3ecSGreg Kurz                               KVM_DEV_XICS_NR_SERVERS, &nr_servers, true,
412894ea3ecSGreg Kurz                               &local_err)) {
413894ea3ecSGreg Kurz             goto fail;
414894ea3ecSGreg Kurz         }
415894ea3ecSGreg Kurz     }
416894ea3ecSGreg Kurz 
417bf358b54SCédric Le Goater     kernel_xics_fd = rc;
4189554233cSAlexey Kardashevskiy     kvm_kernel_irqchip = true;
4199554233cSAlexey Kardashevskiy     kvm_msi_via_irqfd_allowed = true;
4209554233cSAlexey Kardashevskiy     kvm_gsi_direct_mapping = true;
4219554233cSAlexey Kardashevskiy 
4223f777abcSCédric Le Goater     /* Create the presenters */
4233f777abcSCédric Le Goater     CPU_FOREACH(cs) {
4243f777abcSCédric Le Goater         PowerPCCPU *cpu = POWERPC_CPU(cs);
4253f777abcSCédric Le Goater 
4263f777abcSCédric Le Goater         icp_kvm_realize(DEVICE(spapr_cpu_state(cpu)->icp), &local_err);
4273f777abcSCédric Le Goater         if (local_err) {
4283f777abcSCédric Le Goater             goto fail;
4293f777abcSCédric Le Goater         }
4303f777abcSCédric Le Goater     }
4313f777abcSCédric Le Goater 
4323f777abcSCédric Le Goater     /* Update the KVM sources */
43398a39a79SDavid Gibson     ics_set_kvm_state(ics, &local_err);
434330a21e3SGreg Kurz     if (local_err) {
435330a21e3SGreg Kurz         goto fail;
436330a21e3SGreg Kurz     }
4373f777abcSCédric Le Goater 
4383f777abcSCédric Le Goater     /* Connect the presenters to the initial VCPUs of the machine */
4393f777abcSCédric Le Goater     CPU_FOREACH(cs) {
4403f777abcSCédric Le Goater         PowerPCCPU *cpu = POWERPC_CPU(cs);
441330a21e3SGreg Kurz         icp_set_kvm_state(spapr_cpu_state(cpu)->icp, &local_err);
442330a21e3SGreg Kurz         if (local_err) {
443330a21e3SGreg Kurz             goto fail;
444330a21e3SGreg Kurz         }
4453f777abcSCédric Le Goater     }
4463f777abcSCédric Le Goater 
447bf358b54SCédric Le Goater     return 0;
44811ad93f6SDavid Gibson 
44911ad93f6SDavid Gibson fail:
450ab3d15faSGreg Kurz     error_propagate(errp, local_err);
45198a39a79SDavid Gibson     xics_kvm_disconnect(intc);
4522192a930SCédric Le Goater     return -1;
45311ad93f6SDavid Gibson }
45456b11587SCédric Le Goater 
45598a39a79SDavid Gibson void xics_kvm_disconnect(SpaprInterruptController *intc)
45656b11587SCédric Le Goater {
45756b11587SCédric Le Goater     /*
45856b11587SCédric Le Goater      * Only on P9 using the XICS-on XIVE KVM device:
45956b11587SCédric Le Goater      *
46056b11587SCédric Le Goater      * When the KVM device fd is closed, the device is destroyed and
46156b11587SCédric Le Goater      * removed from the list of devices of the VM. The VCPU presenters
46256b11587SCédric Le Goater      * are also detached from the device.
46356b11587SCédric Le Goater      */
4644812f261SGreg Kurz     if (kernel_xics_fd != -1) {
46556b11587SCédric Le Goater         close(kernel_xics_fd);
46656b11587SCédric Le Goater         kernel_xics_fd = -1;
4674812f261SGreg Kurz     }
46856b11587SCédric Le Goater 
46956b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,set-xive");
47056b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,get-xive");
47156b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,int-on");
47256b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,int-off");
47356b11587SCédric Le Goater 
47456b11587SCédric Le Goater     kvm_kernel_irqchip = false;
47556b11587SCédric Le Goater     kvm_msi_via_irqfd_allowed = false;
47656b11587SCédric Le Goater     kvm_gsi_direct_mapping = false;
47756b11587SCédric Le Goater 
47856b11587SCédric Le Goater     /* Clear the presenter from the VCPUs */
47956b11587SCédric Le Goater     kvm_disable_icps();
48056b11587SCédric Le Goater }
4817abc0c6dSGreg Kurz 
4827abc0c6dSGreg Kurz /*
4837abc0c6dSGreg Kurz  * This is a heuristic to detect older KVMs on POWER9 hosts that don't
4847abc0c6dSGreg Kurz  * support destruction of a KVM XICS device while the VM is running.
4857abc0c6dSGreg Kurz  * Required to start a spapr machine with ic-mode=dual,kernel-irqchip=on.
4867abc0c6dSGreg Kurz  */
4877abc0c6dSGreg Kurz bool xics_kvm_has_broken_disconnect(SpaprMachineState *spapr)
4887abc0c6dSGreg Kurz {
4897abc0c6dSGreg Kurz     int rc;
4907abc0c6dSGreg Kurz 
4917abc0c6dSGreg Kurz     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
4927abc0c6dSGreg Kurz     if (rc < 0) {
4937abc0c6dSGreg Kurz         /*
4947abc0c6dSGreg Kurz          * The error is ignored on purpose. The KVM XICS setup code
4957abc0c6dSGreg Kurz          * will catch it again anyway. The goal here is to see if
4967abc0c6dSGreg Kurz          * close() actually destroys the device or not.
4977abc0c6dSGreg Kurz          */
4987abc0c6dSGreg Kurz         return false;
4997abc0c6dSGreg Kurz     }
5007abc0c6dSGreg Kurz 
5017abc0c6dSGreg Kurz     close(rc);
5027abc0c6dSGreg Kurz 
5037abc0c6dSGreg Kurz     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
5047abc0c6dSGreg Kurz     if (rc >= 0) {
5057abc0c6dSGreg Kurz         close(rc);
5067abc0c6dSGreg Kurz         return false;
5077abc0c6dSGreg Kurz     }
5087abc0c6dSGreg Kurz 
5097abc0c6dSGreg Kurz     return errno == EEXIST;
5107abc0c6dSGreg Kurz }
511