xref: /qemu/hw/intc/xics_kvm.c (revision 894ea3ecd38f4d09353cea19bb20002892d2b8b3)
/*
 * QEMU PowerPC pSeries Logical Partition (aka sPAPR) hardware System Emulator
 *
 * PAPR Virtualized Interrupt System, aka ICS/ICP aka xics, in-kernel emulation
 *
 * Copyright (c) 2013 David Gibson, IBM Corporation.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 *
 */
2711ad93f6SDavid Gibson 
280d75590dSPeter Maydell #include "qemu/osdep.h"
29da34e65cSMarkus Armbruster #include "qapi/error.h"
304771d756SPaolo Bonzini #include "qemu-common.h"
314771d756SPaolo Bonzini #include "cpu.h"
3211ad93f6SDavid Gibson #include "trace.h"
3377ac58ddSPaolo Bonzini #include "sysemu/kvm.h"
3411ad93f6SDavid Gibson #include "hw/ppc/spapr.h"
353f777abcSCédric Le Goater #include "hw/ppc/spapr_cpu_core.h"
3611ad93f6SDavid Gibson #include "hw/ppc/xics.h"
37a51d5afcSThomas Huth #include "hw/ppc/xics_spapr.h"
3811ad93f6SDavid Gibson #include "kvm_ppc.h"
3911ad93f6SDavid Gibson #include "qemu/config-file.h"
4011ad93f6SDavid Gibson #include "qemu/error-report.h"
4111ad93f6SDavid Gibson 
4211ad93f6SDavid Gibson #include <sys/ioctl.h>
4311ad93f6SDavid Gibson 
44729f8a4fSCédric Le Goater static int kernel_xics_fd = -1;
45729f8a4fSCédric Le Goater 
46de86ecccSGreg Kurz typedef struct KVMEnabledICP {
47de86ecccSGreg Kurz     unsigned long vcpu_id;
48de86ecccSGreg Kurz     QLIST_ENTRY(KVMEnabledICP) node;
49de86ecccSGreg Kurz } KVMEnabledICP;
50de86ecccSGreg Kurz 
51de86ecccSGreg Kurz static QLIST_HEAD(, KVMEnabledICP)
52de86ecccSGreg Kurz     kvm_enabled_icps = QLIST_HEAD_INITIALIZER(&kvm_enabled_icps);
53de86ecccSGreg Kurz 
5456b11587SCédric Le Goater static void kvm_disable_icps(void)
5556b11587SCédric Le Goater {
5656b11587SCédric Le Goater     KVMEnabledICP *enabled_icp, *next;
5756b11587SCédric Le Goater 
5856b11587SCédric Le Goater     QLIST_FOREACH_SAFE(enabled_icp, &kvm_enabled_icps, node, next) {
5956b11587SCédric Le Goater         QLIST_REMOVE(enabled_icp, node);
6056b11587SCédric Le Goater         g_free(enabled_icp);
6156b11587SCédric Le Goater     }
6256b11587SCédric Le Goater }
6356b11587SCédric Le Goater 
/*
 * ICP-KVM
 */
670e5c7fadSGreg Kurz void icp_get_kvm_state(ICPState *icp)
6811ad93f6SDavid Gibson {
6911ad93f6SDavid Gibson     uint64_t state;
7011ad93f6SDavid Gibson     int ret;
7111ad93f6SDavid Gibson 
723bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
733bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
743bf84e99SCédric Le Goater         return;
753bf84e99SCédric Le Goater     }
763bf84e99SCédric Le Goater 
7711ad93f6SDavid Gibson     /* ICP for this CPU thread is not in use, exiting */
788e4fba20SCédric Le Goater     if (!icp->cs) {
7911ad93f6SDavid Gibson         return;
8011ad93f6SDavid Gibson     }
8111ad93f6SDavid Gibson 
82bf358b54SCédric Le Goater     ret = kvm_get_one_reg(icp->cs, KVM_REG_PPC_ICP_STATE, &state);
8311ad93f6SDavid Gibson     if (ret != 0) {
8411ad93f6SDavid Gibson         error_report("Unable to retrieve KVM interrupt controller state"
858e4fba20SCédric Le Goater                 " for CPU %ld: %s", kvm_arch_vcpu_id(icp->cs), strerror(errno));
8611ad93f6SDavid Gibson         exit(1);
8711ad93f6SDavid Gibson     }
8811ad93f6SDavid Gibson 
898e4fba20SCédric Le Goater     icp->xirr = state >> KVM_REG_PPC_ICP_XISR_SHIFT;
908e4fba20SCédric Le Goater     icp->mfrr = (state >> KVM_REG_PPC_ICP_MFRR_SHIFT)
9111ad93f6SDavid Gibson         & KVM_REG_PPC_ICP_MFRR_MASK;
928e4fba20SCédric Le Goater     icp->pending_priority = (state >> KVM_REG_PPC_ICP_PPRI_SHIFT)
9311ad93f6SDavid Gibson         & KVM_REG_PPC_ICP_PPRI_MASK;
9411ad93f6SDavid Gibson }
9511ad93f6SDavid Gibson 
96dcb556fcSGreg Kurz static void do_icp_synchronize_state(CPUState *cpu, run_on_cpu_data arg)
97dcb556fcSGreg Kurz {
98dcb556fcSGreg Kurz     icp_get_kvm_state(arg.host_ptr);
99dcb556fcSGreg Kurz }
100dcb556fcSGreg Kurz 
1010e5c7fadSGreg Kurz void icp_synchronize_state(ICPState *icp)
102dcb556fcSGreg Kurz {
103dcb556fcSGreg Kurz     if (icp->cs) {
104dcb556fcSGreg Kurz         run_on_cpu(icp->cs, do_icp_synchronize_state, RUN_ON_CPU_HOST_PTR(icp));
105dcb556fcSGreg Kurz     }
106dcb556fcSGreg Kurz }
107dcb556fcSGreg Kurz 
108330a21e3SGreg Kurz int icp_set_kvm_state(ICPState *icp, Error **errp)
10911ad93f6SDavid Gibson {
11011ad93f6SDavid Gibson     uint64_t state;
11111ad93f6SDavid Gibson     int ret;
11211ad93f6SDavid Gibson 
1133bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
1143bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
1153bf84e99SCédric Le Goater         return 0;
1163bf84e99SCédric Le Goater     }
1173bf84e99SCédric Le Goater 
11811ad93f6SDavid Gibson     /* ICP for this CPU thread is not in use, exiting */
1198e4fba20SCédric Le Goater     if (!icp->cs) {
12011ad93f6SDavid Gibson         return 0;
12111ad93f6SDavid Gibson     }
12211ad93f6SDavid Gibson 
1238e4fba20SCédric Le Goater     state = ((uint64_t)icp->xirr << KVM_REG_PPC_ICP_XISR_SHIFT)
1248e4fba20SCédric Le Goater         | ((uint64_t)icp->mfrr << KVM_REG_PPC_ICP_MFRR_SHIFT)
1258e4fba20SCédric Le Goater         | ((uint64_t)icp->pending_priority << KVM_REG_PPC_ICP_PPRI_SHIFT);
12611ad93f6SDavid Gibson 
127bf358b54SCédric Le Goater     ret = kvm_set_one_reg(icp->cs, KVM_REG_PPC_ICP_STATE, &state);
128330a21e3SGreg Kurz     if (ret < 0) {
129330a21e3SGreg Kurz         error_setg_errno(errp, -ret,
130330a21e3SGreg Kurz                          "Unable to restore KVM interrupt controller state (0x%"
131330a21e3SGreg Kurz                          PRIx64 ") for CPU %ld", state,
132330a21e3SGreg Kurz                          kvm_arch_vcpu_id(icp->cs));
13311ad93f6SDavid Gibson         return ret;
13411ad93f6SDavid Gibson     }
13511ad93f6SDavid Gibson 
13611ad93f6SDavid Gibson     return 0;
13711ad93f6SDavid Gibson }
13811ad93f6SDavid Gibson 
1398e6e6efeSGreg Kurz void icp_kvm_realize(DeviceState *dev, Error **errp)
140f0232434SCédric Le Goater {
141a028dd42SCédric Le Goater     ICPState *icp = ICP(dev);
142a028dd42SCédric Le Goater     CPUState *cs;
143de86ecccSGreg Kurz     KVMEnabledICP *enabled_icp;
144a028dd42SCédric Le Goater     unsigned long vcpu_id;
145f0232434SCédric Le Goater     int ret;
146f0232434SCédric Le Goater 
1473bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
148f0232434SCédric Le Goater     if (kernel_xics_fd == -1) {
1493bf84e99SCédric Le Goater         return;
150f0232434SCédric Le Goater     }
151f0232434SCédric Le Goater 
152a028dd42SCédric Le Goater     cs = icp->cs;
153a028dd42SCédric Le Goater     vcpu_id = kvm_arch_vcpu_id(cs);
154a028dd42SCédric Le Goater 
155f0232434SCédric Le Goater     /*
156f0232434SCédric Le Goater      * If we are reusing a parked vCPU fd corresponding to the CPU
157f0232434SCédric Le Goater      * which was hot-removed earlier we don't have to renable
158f0232434SCédric Le Goater      * KVM_CAP_IRQ_XICS capability again.
159f0232434SCédric Le Goater      */
160de86ecccSGreg Kurz     QLIST_FOREACH(enabled_icp, &kvm_enabled_icps, node) {
161de86ecccSGreg Kurz         if (enabled_icp->vcpu_id == vcpu_id) {
162f0232434SCédric Le Goater             return;
163f0232434SCédric Le Goater         }
164de86ecccSGreg Kurz     }
165f0232434SCédric Le Goater 
166de86ecccSGreg Kurz     ret = kvm_vcpu_enable_cap(cs, KVM_CAP_IRQ_XICS, 0, kernel_xics_fd, vcpu_id);
167f0232434SCédric Le Goater     if (ret < 0) {
168*894ea3ecSGreg Kurz         Error *local_err = NULL;
169*894ea3ecSGreg Kurz 
170*894ea3ecSGreg Kurz         error_setg(&local_err, "Unable to connect CPU%ld to kernel XICS: %s",
171*894ea3ecSGreg Kurz                    vcpu_id, strerror(errno));
172*894ea3ecSGreg Kurz         if (errno == ENOSPC) {
173*894ea3ecSGreg Kurz             error_append_hint(&local_err, "Try -smp maxcpus=N with N < %u\n",
174*894ea3ecSGreg Kurz                               MACHINE(qdev_get_machine())->smp.max_cpus);
175*894ea3ecSGreg Kurz         }
176*894ea3ecSGreg Kurz         error_propagate(errp, local_err);
177b1fd36c3SGreg Kurz         return;
178f0232434SCédric Le Goater     }
179de86ecccSGreg Kurz     enabled_icp = g_malloc(sizeof(*enabled_icp));
180de86ecccSGreg Kurz     enabled_icp->vcpu_id = vcpu_id;
181de86ecccSGreg Kurz     QLIST_INSERT_HEAD(&kvm_enabled_icps, enabled_icp, node);
182f0232434SCédric Le Goater }
183f0232434SCédric Le Goater 
/*
 * ICS-KVM
 */
187d80b2ccfSGreg Kurz void ics_get_kvm_state(ICSState *ics)
18811ad93f6SDavid Gibson {
18911ad93f6SDavid Gibson     uint64_t state;
19011ad93f6SDavid Gibson     int i;
19111ad93f6SDavid Gibson 
1923bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
1933bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
1943bf84e99SCédric Le Goater         return;
1953bf84e99SCédric Le Goater     }
1963bf84e99SCédric Le Goater 
19711ad93f6SDavid Gibson     for (i = 0; i < ics->nr_irqs; i++) {
19811ad93f6SDavid Gibson         ICSIRQState *irq = &ics->irqs[i];
19911ad93f6SDavid Gibson 
2004c3539d4SCédric Le Goater         if (ics_irq_free(ics, i)) {
2014c3539d4SCédric Le Goater             continue;
2024c3539d4SCédric Le Goater         }
2034c3539d4SCédric Le Goater 
204bf358b54SCédric Le Goater         kvm_device_access(kernel_xics_fd, KVM_DEV_XICS_GRP_SOURCES,
20550beeb68SMarkus Armbruster                           i + ics->offset, &state, false, &error_fatal);
20611ad93f6SDavid Gibson 
20711ad93f6SDavid Gibson         irq->server = state & KVM_XICS_DESTINATION_MASK;
20811ad93f6SDavid Gibson         irq->saved_priority = (state >> KVM_XICS_PRIORITY_SHIFT)
20911ad93f6SDavid Gibson             & KVM_XICS_PRIORITY_MASK;
21011ad93f6SDavid Gibson         /*
21111ad93f6SDavid Gibson          * To be consistent with the software emulation in xics.c, we
21211ad93f6SDavid Gibson          * split out the masked state + priority that we get from the
21311ad93f6SDavid Gibson          * kernel into 'current priority' (0xff if masked) and
21411ad93f6SDavid Gibson          * 'saved priority' (if masked, this is the priority the
21511ad93f6SDavid Gibson          * interrupt had before it was masked).  Masking and unmasking
21611ad93f6SDavid Gibson          * are done with the ibm,int-off and ibm,int-on RTAS calls.
21711ad93f6SDavid Gibson          */
21811ad93f6SDavid Gibson         if (state & KVM_XICS_MASKED) {
21911ad93f6SDavid Gibson             irq->priority = 0xff;
22011ad93f6SDavid Gibson         } else {
22111ad93f6SDavid Gibson             irq->priority = irq->saved_priority;
22211ad93f6SDavid Gibson         }
22311ad93f6SDavid Gibson 
224063cb7cbSSam Bobroff         irq->status = 0;
22511ad93f6SDavid Gibson         if (state & KVM_XICS_PENDING) {
22611ad93f6SDavid Gibson             if (state & KVM_XICS_LEVEL_SENSITIVE) {
22711ad93f6SDavid Gibson                 irq->status |= XICS_STATUS_ASSERTED;
22811ad93f6SDavid Gibson             } else {
22911ad93f6SDavid Gibson                 /*
23011ad93f6SDavid Gibson                  * A pending edge-triggered interrupt (or MSI)
23111ad93f6SDavid Gibson                  * must have been rejected previously when we
23211ad93f6SDavid Gibson                  * first detected it and tried to deliver it,
23311ad93f6SDavid Gibson                  * so mark it as pending and previously rejected
23411ad93f6SDavid Gibson                  * for consistency with how xics.c works.
23511ad93f6SDavid Gibson                  */
23611ad93f6SDavid Gibson                 irq->status |= XICS_STATUS_MASKED_PENDING
23711ad93f6SDavid Gibson                     | XICS_STATUS_REJECTED;
23811ad93f6SDavid Gibson             }
23911ad93f6SDavid Gibson         }
240229e16fdSSam Bobroff         if (state & KVM_XICS_PRESENTED) {
241229e16fdSSam Bobroff                 irq->status |= XICS_STATUS_PRESENTED;
242229e16fdSSam Bobroff         }
243229e16fdSSam Bobroff         if (state & KVM_XICS_QUEUED) {
244229e16fdSSam Bobroff                 irq->status |= XICS_STATUS_QUEUED;
245229e16fdSSam Bobroff         }
24611ad93f6SDavid Gibson     }
24711ad93f6SDavid Gibson }
24811ad93f6SDavid Gibson 
249d80b2ccfSGreg Kurz void ics_synchronize_state(ICSState *ics)
250dcb556fcSGreg Kurz {
251dcb556fcSGreg Kurz     ics_get_kvm_state(ics);
252dcb556fcSGreg Kurz }
253dcb556fcSGreg Kurz 
254330a21e3SGreg Kurz int ics_set_kvm_state_one(ICSState *ics, int srcno, Error **errp)
25511ad93f6SDavid Gibson {
25611ad93f6SDavid Gibson     uint64_t state;
2576cead90cSGreg Kurz     ICSIRQState *irq = &ics->irqs[srcno];
25811ad93f6SDavid Gibson     int ret;
25911ad93f6SDavid Gibson 
2603bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
2613bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
2623bf84e99SCédric Le Goater         return 0;
2633bf84e99SCédric Le Goater     }
2643bf84e99SCédric Le Goater 
26511ad93f6SDavid Gibson     state = irq->server;
26611ad93f6SDavid Gibson     state |= (uint64_t)(irq->saved_priority & KVM_XICS_PRIORITY_MASK)
26711ad93f6SDavid Gibson         << KVM_XICS_PRIORITY_SHIFT;
26811ad93f6SDavid Gibson     if (irq->priority != irq->saved_priority) {
26911ad93f6SDavid Gibson         assert(irq->priority == 0xff);
27038298611SGreg Kurz     }
27138298611SGreg Kurz 
27238298611SGreg Kurz     if (irq->priority == 0xff) {
27311ad93f6SDavid Gibson         state |= KVM_XICS_MASKED;
27411ad93f6SDavid Gibson     }
27511ad93f6SDavid Gibson 
2766cead90cSGreg Kurz     if (irq->flags & XICS_FLAGS_IRQ_LSI) {
27711ad93f6SDavid Gibson         state |= KVM_XICS_LEVEL_SENSITIVE;
27811ad93f6SDavid Gibson         if (irq->status & XICS_STATUS_ASSERTED) {
27911ad93f6SDavid Gibson             state |= KVM_XICS_PENDING;
28011ad93f6SDavid Gibson         }
28111ad93f6SDavid Gibson     } else {
28211ad93f6SDavid Gibson         if (irq->status & XICS_STATUS_MASKED_PENDING) {
28311ad93f6SDavid Gibson             state |= KVM_XICS_PENDING;
28411ad93f6SDavid Gibson         }
28511ad93f6SDavid Gibson     }
286229e16fdSSam Bobroff     if (irq->status & XICS_STATUS_PRESENTED) {
287229e16fdSSam Bobroff         state |= KVM_XICS_PRESENTED;
288229e16fdSSam Bobroff     }
289229e16fdSSam Bobroff     if (irq->status & XICS_STATUS_QUEUED) {
290229e16fdSSam Bobroff         state |= KVM_XICS_QUEUED;
291229e16fdSSam Bobroff     }
29211ad93f6SDavid Gibson 
29352b43881SCédric Le Goater     ret = kvm_device_access(kernel_xics_fd, KVM_DEV_XICS_GRP_SOURCES,
294330a21e3SGreg Kurz                             srcno + ics->offset, &state, true, errp);
295330a21e3SGreg Kurz     if (ret < 0) {
29611ad93f6SDavid Gibson         return ret;
29711ad93f6SDavid Gibson     }
2986cead90cSGreg Kurz 
2996cead90cSGreg Kurz     return 0;
3006cead90cSGreg Kurz }
3016cead90cSGreg Kurz 
302330a21e3SGreg Kurz int ics_set_kvm_state(ICSState *ics, Error **errp)
3036cead90cSGreg Kurz {
3046cead90cSGreg Kurz     int i;
3056cead90cSGreg Kurz 
3063bf84e99SCédric Le Goater     /* The KVM XICS device is not in use */
3073bf84e99SCédric Le Goater     if (kernel_xics_fd == -1) {
3083bf84e99SCédric Le Goater         return 0;
3093bf84e99SCédric Le Goater     }
3103bf84e99SCédric Le Goater 
3116cead90cSGreg Kurz     for (i = 0; i < ics->nr_irqs; i++) {
312330a21e3SGreg Kurz         Error *local_err = NULL;
3136cead90cSGreg Kurz         int ret;
3146cead90cSGreg Kurz 
3154c3539d4SCédric Le Goater         if (ics_irq_free(ics, i)) {
3164c3539d4SCédric Le Goater             continue;
3174c3539d4SCédric Le Goater         }
3184c3539d4SCédric Le Goater 
319330a21e3SGreg Kurz         ret = ics_set_kvm_state_one(ics, i, &local_err);
320330a21e3SGreg Kurz         if (ret < 0) {
321330a21e3SGreg Kurz             error_propagate(errp, local_err);
3226cead90cSGreg Kurz             return ret;
3236cead90cSGreg Kurz         }
32411ad93f6SDavid Gibson     }
32511ad93f6SDavid Gibson 
32611ad93f6SDavid Gibson     return 0;
32711ad93f6SDavid Gibson }
32811ad93f6SDavid Gibson 
329557b4567SGreg Kurz void ics_kvm_set_irq(ICSState *ics, int srcno, int val)
33011ad93f6SDavid Gibson {
33111ad93f6SDavid Gibson     struct kvm_irq_level args;
33211ad93f6SDavid Gibson     int rc;
33311ad93f6SDavid Gibson 
3343bf84e99SCédric Le Goater     /* The KVM XICS device should be in use */
3353bf84e99SCédric Le Goater     assert(kernel_xics_fd != -1);
3363bf84e99SCédric Le Goater 
33711ad93f6SDavid Gibson     args.irq = srcno + ics->offset;
3384af88944SAlexey Kardashevskiy     if (ics->irqs[srcno].flags & XICS_FLAGS_IRQ_MSI) {
33911ad93f6SDavid Gibson         if (!val) {
34011ad93f6SDavid Gibson             return;
34111ad93f6SDavid Gibson         }
34211ad93f6SDavid Gibson         args.level = KVM_INTERRUPT_SET;
34311ad93f6SDavid Gibson     } else {
34411ad93f6SDavid Gibson         args.level = val ? KVM_INTERRUPT_SET_LEVEL : KVM_INTERRUPT_UNSET;
34511ad93f6SDavid Gibson     }
34611ad93f6SDavid Gibson     rc = kvm_vm_ioctl(kvm_state, KVM_IRQ_LINE, &args);
34711ad93f6SDavid Gibson     if (rc < 0) {
34811ad93f6SDavid Gibson         perror("kvm_irq_line");
34911ad93f6SDavid Gibson     }
35011ad93f6SDavid Gibson }
35111ad93f6SDavid Gibson 
3524ffb7496SGreg Kurz int xics_kvm_connect(SpaprInterruptController *intc, uint32_t nr_servers,
3534ffb7496SGreg Kurz                      Error **errp)
35411ad93f6SDavid Gibson {
35598a39a79SDavid Gibson     ICSState *ics = ICS_SPAPR(intc);
356817bb6a4SCédric Le Goater     int rc;
3573f777abcSCédric Le Goater     CPUState *cs;
3583f777abcSCédric Le Goater     Error *local_err = NULL;
3593f777abcSCédric Le Goater 
3603f777abcSCédric Le Goater     /*
3613f777abcSCédric Le Goater      * The KVM XICS device already in use. This is the case when
3623f777abcSCédric Le Goater      * rebooting under the XICS-only interrupt mode.
3633f777abcSCédric Le Goater      */
3643f777abcSCédric Le Goater     if (kernel_xics_fd != -1) {
3653f777abcSCédric Le Goater         return 0;
3663f777abcSCédric Le Goater     }
36711ad93f6SDavid Gibson 
36811ad93f6SDavid Gibson     if (!kvm_enabled() || !kvm_check_extension(kvm_state, KVM_CAP_IRQ_XICS)) {
36911ad93f6SDavid Gibson         error_setg(errp,
37011ad93f6SDavid Gibson                    "KVM and IRQ_XICS capability must be present for in-kernel XICS");
37164fb9621SGreg Kurz         return -1;
37211ad93f6SDavid Gibson     }
37311ad93f6SDavid Gibson 
3743a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_SET_XIVE, "ibm,set-xive");
37511ad93f6SDavid Gibson     if (rc < 0) {
376ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
377ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,set-xive");
37811ad93f6SDavid Gibson         goto fail;
37911ad93f6SDavid Gibson     }
38011ad93f6SDavid Gibson 
3813a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_GET_XIVE, "ibm,get-xive");
38211ad93f6SDavid Gibson     if (rc < 0) {
383ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
384ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,get-xive");
38511ad93f6SDavid Gibson         goto fail;
38611ad93f6SDavid Gibson     }
38711ad93f6SDavid Gibson 
3883a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_INT_ON, "ibm,int-on");
38911ad93f6SDavid Gibson     if (rc < 0) {
390ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
391ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,int-on");
39211ad93f6SDavid Gibson         goto fail;
39311ad93f6SDavid Gibson     }
39411ad93f6SDavid Gibson 
3953a3b8502SAlexey Kardashevskiy     rc = kvmppc_define_rtas_kernel_token(RTAS_IBM_INT_OFF, "ibm,int-off");
39611ad93f6SDavid Gibson     if (rc < 0) {
397ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc,
398ab3d15faSGreg Kurz                          "kvmppc_define_rtas_kernel_token: ibm,int-off");
39911ad93f6SDavid Gibson         goto fail;
40011ad93f6SDavid Gibson     }
40111ad93f6SDavid Gibson 
402bf358b54SCédric Le Goater     /* Create the KVM XICS device */
403bf358b54SCédric Le Goater     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
40411ad93f6SDavid Gibson     if (rc < 0) {
405ab3d15faSGreg Kurz         error_setg_errno(&local_err, -rc, "Error on KVM_CREATE_DEVICE for XICS");
40611ad93f6SDavid Gibson         goto fail;
40711ad93f6SDavid Gibson     }
40811ad93f6SDavid Gibson 
409*894ea3ecSGreg Kurz     /* Tell KVM about the # of VCPUs we may have (POWER9 and newer only) */
410*894ea3ecSGreg Kurz     if (kvm_device_check_attr(rc, KVM_DEV_XICS_GRP_CTRL,
411*894ea3ecSGreg Kurz                               KVM_DEV_XICS_NR_SERVERS)) {
412*894ea3ecSGreg Kurz         if (kvm_device_access(rc, KVM_DEV_XICS_GRP_CTRL,
413*894ea3ecSGreg Kurz                               KVM_DEV_XICS_NR_SERVERS, &nr_servers, true,
414*894ea3ecSGreg Kurz                               &local_err)) {
415*894ea3ecSGreg Kurz             goto fail;
416*894ea3ecSGreg Kurz         }
417*894ea3ecSGreg Kurz     }
418*894ea3ecSGreg Kurz 
419bf358b54SCédric Le Goater     kernel_xics_fd = rc;
4209554233cSAlexey Kardashevskiy     kvm_kernel_irqchip = true;
4219554233cSAlexey Kardashevskiy     kvm_msi_via_irqfd_allowed = true;
4229554233cSAlexey Kardashevskiy     kvm_gsi_direct_mapping = true;
4239554233cSAlexey Kardashevskiy 
4243f777abcSCédric Le Goater     /* Create the presenters */
4253f777abcSCédric Le Goater     CPU_FOREACH(cs) {
4263f777abcSCédric Le Goater         PowerPCCPU *cpu = POWERPC_CPU(cs);
4273f777abcSCédric Le Goater 
4283f777abcSCédric Le Goater         icp_kvm_realize(DEVICE(spapr_cpu_state(cpu)->icp), &local_err);
4293f777abcSCédric Le Goater         if (local_err) {
4303f777abcSCédric Le Goater             goto fail;
4313f777abcSCédric Le Goater         }
4323f777abcSCédric Le Goater     }
4333f777abcSCédric Le Goater 
4343f777abcSCédric Le Goater     /* Update the KVM sources */
43598a39a79SDavid Gibson     ics_set_kvm_state(ics, &local_err);
436330a21e3SGreg Kurz     if (local_err) {
437330a21e3SGreg Kurz         goto fail;
438330a21e3SGreg Kurz     }
4393f777abcSCédric Le Goater 
4403f777abcSCédric Le Goater     /* Connect the presenters to the initial VCPUs of the machine */
4413f777abcSCédric Le Goater     CPU_FOREACH(cs) {
4423f777abcSCédric Le Goater         PowerPCCPU *cpu = POWERPC_CPU(cs);
443330a21e3SGreg Kurz         icp_set_kvm_state(spapr_cpu_state(cpu)->icp, &local_err);
444330a21e3SGreg Kurz         if (local_err) {
445330a21e3SGreg Kurz             goto fail;
446330a21e3SGreg Kurz         }
4473f777abcSCédric Le Goater     }
4483f777abcSCédric Le Goater 
449bf358b54SCédric Le Goater     return 0;
45011ad93f6SDavid Gibson 
45111ad93f6SDavid Gibson fail:
452ab3d15faSGreg Kurz     error_propagate(errp, local_err);
45398a39a79SDavid Gibson     xics_kvm_disconnect(intc);
4542192a930SCédric Le Goater     return -1;
45511ad93f6SDavid Gibson }
45656b11587SCédric Le Goater 
45798a39a79SDavid Gibson void xics_kvm_disconnect(SpaprInterruptController *intc)
45856b11587SCédric Le Goater {
45956b11587SCédric Le Goater     /*
46056b11587SCédric Le Goater      * Only on P9 using the XICS-on XIVE KVM device:
46156b11587SCédric Le Goater      *
46256b11587SCédric Le Goater      * When the KVM device fd is closed, the device is destroyed and
46356b11587SCédric Le Goater      * removed from the list of devices of the VM. The VCPU presenters
46456b11587SCédric Le Goater      * are also detached from the device.
46556b11587SCédric Le Goater      */
4664812f261SGreg Kurz     if (kernel_xics_fd != -1) {
46756b11587SCédric Le Goater         close(kernel_xics_fd);
46856b11587SCédric Le Goater         kernel_xics_fd = -1;
4694812f261SGreg Kurz     }
47056b11587SCédric Le Goater 
47156b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,set-xive");
47256b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,get-xive");
47356b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,int-on");
47456b11587SCédric Le Goater     kvmppc_define_rtas_kernel_token(0, "ibm,int-off");
47556b11587SCédric Le Goater 
47656b11587SCédric Le Goater     kvm_kernel_irqchip = false;
47756b11587SCédric Le Goater     kvm_msi_via_irqfd_allowed = false;
47856b11587SCédric Le Goater     kvm_gsi_direct_mapping = false;
47956b11587SCédric Le Goater 
48056b11587SCédric Le Goater     /* Clear the presenter from the VCPUs */
48156b11587SCédric Le Goater     kvm_disable_icps();
48256b11587SCédric Le Goater }
4837abc0c6dSGreg Kurz 
4847abc0c6dSGreg Kurz /*
4857abc0c6dSGreg Kurz  * This is a heuristic to detect older KVMs on POWER9 hosts that don't
4867abc0c6dSGreg Kurz  * support destruction of a KVM XICS device while the VM is running.
4877abc0c6dSGreg Kurz  * Required to start a spapr machine with ic-mode=dual,kernel-irqchip=on.
4887abc0c6dSGreg Kurz  */
4897abc0c6dSGreg Kurz bool xics_kvm_has_broken_disconnect(SpaprMachineState *spapr)
4907abc0c6dSGreg Kurz {
4917abc0c6dSGreg Kurz     int rc;
4927abc0c6dSGreg Kurz 
4937abc0c6dSGreg Kurz     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
4947abc0c6dSGreg Kurz     if (rc < 0) {
4957abc0c6dSGreg Kurz         /*
4967abc0c6dSGreg Kurz          * The error is ignored on purpose. The KVM XICS setup code
4977abc0c6dSGreg Kurz          * will catch it again anyway. The goal here is to see if
4987abc0c6dSGreg Kurz          * close() actually destroys the device or not.
4997abc0c6dSGreg Kurz          */
5007abc0c6dSGreg Kurz         return false;
5017abc0c6dSGreg Kurz     }
5027abc0c6dSGreg Kurz 
5037abc0c6dSGreg Kurz     close(rc);
5047abc0c6dSGreg Kurz 
5057abc0c6dSGreg Kurz     rc = kvm_create_device(kvm_state, KVM_DEV_TYPE_XICS, false);
5067abc0c6dSGreg Kurz     if (rc >= 0) {
5077abc0c6dSGreg Kurz         close(rc);
5087abc0c6dSGreg Kurz         return false;
5097abc0c6dSGreg Kurz     }
5107abc0c6dSGreg Kurz 
5117abc0c6dSGreg Kurz     return errno == EEXIST;
5127abc0c6dSGreg Kurz }
513