1f5cc5a5cSClaudio Fontana /* 2f5cc5a5cSClaudio Fontana * x86 KVM CPU type initialization 3f5cc5a5cSClaudio Fontana * 4f5cc5a5cSClaudio Fontana * Copyright 2021 SUSE LLC 5f5cc5a5cSClaudio Fontana * 6f5cc5a5cSClaudio Fontana * This work is licensed under the terms of the GNU GPL, version 2 or later. 7f5cc5a5cSClaudio Fontana * See the COPYING file in the top-level directory. 8f5cc5a5cSClaudio Fontana */ 9f5cc5a5cSClaudio Fontana 10f5cc5a5cSClaudio Fontana #include "qemu/osdep.h" 11f5cc5a5cSClaudio Fontana #include "cpu.h" 12f5cc5a5cSClaudio Fontana #include "host-cpu.h" 13f5cc5a5cSClaudio Fontana #include "qapi/error.h" 1432cad1ffSPhilippe Mathieu-Daudé #include "system/system.h" 15f5cc5a5cSClaudio Fontana #include "hw/boards.h" 16f5cc5a5cSClaudio Fontana 17f5cc5a5cSClaudio Fontana #include "kvm_i386.h" 18b12a0f85SPhilippe Mathieu-Daudé #include "accel/accel-cpu-target.h" 19f5cc5a5cSClaudio Fontana 200d08c423SGerd Hoffmann static void kvm_set_guest_phys_bits(CPUState *cs) 210d08c423SGerd Hoffmann { 220d08c423SGerd Hoffmann X86CPU *cpu = X86_CPU(cs); 230d08c423SGerd Hoffmann uint32_t eax, guest_phys_bits; 240d08c423SGerd Hoffmann 250d08c423SGerd Hoffmann eax = kvm_arch_get_supported_cpuid(cs->kvm_state, 0x80000008, 0, R_EAX); 260d08c423SGerd Hoffmann guest_phys_bits = (eax >> 16) & 0xff; 270d08c423SGerd Hoffmann if (!guest_phys_bits) { 280d08c423SGerd Hoffmann return; 290d08c423SGerd Hoffmann } 300d08c423SGerd Hoffmann cpu->guest_phys_bits = guest_phys_bits; 310d08c423SGerd Hoffmann if (cpu->guest_phys_bits > cpu->phys_bits) { 320d08c423SGerd Hoffmann cpu->guest_phys_bits = cpu->phys_bits; 330d08c423SGerd Hoffmann } 340d08c423SGerd Hoffmann 350d08c423SGerd Hoffmann if (cpu->host_phys_bits && cpu->host_phys_bits_limit && 360d08c423SGerd Hoffmann cpu->guest_phys_bits > cpu->host_phys_bits_limit) { 370d08c423SGerd Hoffmann cpu->guest_phys_bits = cpu->host_phys_bits_limit; 380d08c423SGerd Hoffmann } 390d08c423SGerd Hoffmann } 400d08c423SGerd Hoffmann 419ea057dcSClaudio Fontana static bool kvm_cpu_realizefn(CPUState *cs, Error **errp) 42f5cc5a5cSClaudio Fontana { 43f5cc5a5cSClaudio Fontana X86CPU *cpu = X86_CPU(cs); 44f5cc5a5cSClaudio Fontana CPUX86State *env = &cpu->env; 450d08c423SGerd Hoffmann bool ret; 46f5cc5a5cSClaudio Fontana 47f5cc5a5cSClaudio Fontana /* 48f5cc5a5cSClaudio Fontana * The realize order is important, since x86_cpu_realize() checks if 49f5cc5a5cSClaudio Fontana * nothing else has been set by the user (or by accelerators) in 50662175b9SClaudio Fontana * cpu->ucode_rev and cpu->phys_bits, and updates the CPUID results in 51662175b9SClaudio Fontana * mwait.ecx. 52662175b9SClaudio Fontana * This accel realization code also assumes cpu features are already expanded. 53f5cc5a5cSClaudio Fontana * 54f5cc5a5cSClaudio Fontana * realize order: 55662175b9SClaudio Fontana * 560d08c423SGerd Hoffmann * x86_cpu_realizefn(): 570d08c423SGerd Hoffmann * x86_cpu_expand_features() 580d08c423SGerd Hoffmann * cpu_exec_realizefn(): 590d08c423SGerd Hoffmann * accel_cpu_common_realize() 600d08c423SGerd Hoffmann * kvm_cpu_realizefn() 610d08c423SGerd Hoffmann * host_cpu_realizefn() 620d08c423SGerd Hoffmann * kvm_set_guest_phys_bits() 630d08c423SGerd Hoffmann * check/update ucode_rev, phys_bits, guest_phys_bits, mwait 640d08c423SGerd Hoffmann * cpu_common_realizefn() (via xcc->parent_realize) 65f5cc5a5cSClaudio Fontana */ 66f5cc5a5cSClaudio Fontana if (cpu->max_features) { 6705fc711cSZide Chen if (enable_cpu_pm) { 6805fc711cSZide Chen if (kvm_has_waitpkg()) { 69f5cc5a5cSClaudio Fontana env->features[FEAT_7_0_ECX] |= CPUID_7_0_ECX_WAITPKG; 70f5cc5a5cSClaudio Fontana } 7105fc711cSZide Chen 7205fc711cSZide Chen if (env->features[FEAT_1_ECX] & CPUID_EXT_MONITOR) { 7305fc711cSZide Chen host_cpuid(5, 0, &cpu->mwait.eax, &cpu->mwait.ebx, 7405fc711cSZide Chen &cpu->mwait.ecx, &cpu->mwait.edx); 7505fc711cSZide Chen } 7605fc711cSZide Chen } 77f5cc5a5cSClaudio Fontana if (cpu->ucode_rev == 0) { 78f5cc5a5cSClaudio Fontana cpu->ucode_rev = 79f5cc5a5cSClaudio Fontana kvm_arch_get_supported_msr_feature(kvm_state, 80f5cc5a5cSClaudio Fontana MSR_IA32_UCODE_REV); 81f5cc5a5cSClaudio Fontana } 82f5cc5a5cSClaudio Fontana } 830d08c423SGerd Hoffmann ret = host_cpu_realizefn(cs, errp); 840d08c423SGerd Hoffmann if (!ret) { 850d08c423SGerd Hoffmann return ret; 860d08c423SGerd Hoffmann } 870d08c423SGerd Hoffmann 880d08c423SGerd Hoffmann if ((env->features[FEAT_8000_0001_EDX] & CPUID_EXT2_LM) && 890d08c423SGerd Hoffmann cpu->guest_phys_bits == -1) { 900d08c423SGerd Hoffmann kvm_set_guest_phys_bits(cs); 910d08c423SGerd Hoffmann } 920d08c423SGerd Hoffmann 930d08c423SGerd Hoffmann return true; 94f5cc5a5cSClaudio Fontana } 95f5cc5a5cSClaudio Fontana 96f5cc5a5cSClaudio Fontana static bool lmce_supported(void) 97f5cc5a5cSClaudio Fontana { 98f5cc5a5cSClaudio Fontana uint64_t mce_cap = 0; 99f5cc5a5cSClaudio Fontana 100f5cc5a5cSClaudio Fontana if (kvm_ioctl(kvm_state, KVM_X86_GET_MCE_CAP_SUPPORTED, &mce_cap) < 0) { 101f5cc5a5cSClaudio Fontana return false; 102f5cc5a5cSClaudio Fontana } 103f5cc5a5cSClaudio Fontana return !!(mce_cap & MCG_LMCE_P); 104f5cc5a5cSClaudio Fontana } 105f5cc5a5cSClaudio Fontana 106f5cc5a5cSClaudio Fontana static void kvm_cpu_max_instance_init(X86CPU *cpu) 107f5cc5a5cSClaudio Fontana { 108f5cc5a5cSClaudio Fontana CPUX86State *env = &cpu->env; 109f5cc5a5cSClaudio Fontana KVMState *s = kvm_state; 110f5cc5a5cSClaudio Fontana 111f5cc5a5cSClaudio Fontana host_cpu_max_instance_init(cpu); 112f5cc5a5cSClaudio Fontana 113f5cc5a5cSClaudio Fontana if (lmce_supported()) { 114f5cc5a5cSClaudio Fontana object_property_set_bool(OBJECT(cpu), "lmce", true, &error_abort); 115f5cc5a5cSClaudio Fontana } 116f5cc5a5cSClaudio Fontana 117f5cc5a5cSClaudio Fontana env->cpuid_min_level = 118f5cc5a5cSClaudio Fontana kvm_arch_get_supported_cpuid(s, 0x0, 0, R_EAX); 119f5cc5a5cSClaudio Fontana env->cpuid_min_xlevel = 120f5cc5a5cSClaudio Fontana kvm_arch_get_supported_cpuid(s, 0x80000000, 0, R_EAX); 121f5cc5a5cSClaudio Fontana env->cpuid_min_xlevel2 = 122f5cc5a5cSClaudio Fontana kvm_arch_get_supported_cpuid(s, 0xC0000000, 0, R_EAX); 123f5cc5a5cSClaudio Fontana } 124f5cc5a5cSClaudio Fontana 125fea45008SDavid Edmondson static void kvm_cpu_xsave_init(void) 126fea45008SDavid Edmondson { 127fea45008SDavid Edmondson static bool first = true; 12819db68caSYang Zhong uint32_t eax, ebx, ecx, edx; 129fea45008SDavid Edmondson int i; 130fea45008SDavid Edmondson 131fea45008SDavid Edmondson if (!first) { 132fea45008SDavid Edmondson return; 133fea45008SDavid Edmondson } 134fea45008SDavid Edmondson first = false; 135fea45008SDavid Edmondson 136fea45008SDavid Edmondson /* x87 and SSE states are in the legacy region of the XSAVE area. */ 137fea45008SDavid Edmondson x86_ext_save_areas[XSTATE_FP_BIT].offset = 0; 138fea45008SDavid Edmondson x86_ext_save_areas[XSTATE_SSE_BIT].offset = 0; 139fea45008SDavid Edmondson 140fea45008SDavid Edmondson for (i = XSTATE_SSE_BIT + 1; i < XSAVE_STATE_AREA_COUNT; i++) { 141fea45008SDavid Edmondson ExtSaveArea *esa = &x86_ext_save_areas[i]; 142fea45008SDavid Edmondson 14358f7db26SPaolo Bonzini if (!esa->size) { 14458f7db26SPaolo Bonzini continue; 14558f7db26SPaolo Bonzini } 14619db68caSYang Zhong host_cpuid(0xd, i, &eax, &ebx, &ecx, &edx); 14719db68caSYang Zhong if (eax != 0) { 14819db68caSYang Zhong assert(esa->size == eax); 14919db68caSYang Zhong esa->offset = ebx; 15019db68caSYang Zhong esa->ecx = ecx; 151fea45008SDavid Edmondson } 152fea45008SDavid Edmondson } 153fea45008SDavid Edmondson } 154fea45008SDavid Edmondson 1555b8978d8SClaudio Fontana /* 1565b8978d8SClaudio Fontana * KVM-specific features that are automatically added/removed 1575b8978d8SClaudio Fontana * from cpudef models when KVM is enabled. 1585b8978d8SClaudio Fontana * Only for builtin_x86_defs models initialized with x86_register_cpudef_types. 1595b8978d8SClaudio Fontana * 1605b8978d8SClaudio Fontana * NOTE: features can be enabled by default only if they were 1615b8978d8SClaudio Fontana * already available in the oldest kernel version supported 1625b8978d8SClaudio Fontana * by the KVM accelerator (see "OS requirements" section at 1635b8978d8SClaudio Fontana * docs/system/target-i386.rst) 1645b8978d8SClaudio Fontana */ 1655b8978d8SClaudio Fontana static PropValue kvm_default_props[] = { 1665b8978d8SClaudio Fontana { "kvmclock", "on" }, 1675b8978d8SClaudio Fontana { "kvm-nopiodelay", "on" }, 1685b8978d8SClaudio Fontana { "kvm-asyncpf", "on" }, 1695b8978d8SClaudio Fontana { "kvm-steal-time", "on" }, 1705b8978d8SClaudio Fontana { "kvm-pv-eoi", "on" }, 1715b8978d8SClaudio Fontana { "kvmclock-stable-bit", "on" }, 1725b8978d8SClaudio Fontana { "x2apic", "on" }, 1735b8978d8SClaudio Fontana { "kvm-msi-ext-dest-id", "off" }, 1745b8978d8SClaudio Fontana { "acpi", "off" }, 1755b8978d8SClaudio Fontana { "monitor", "off" }, 1765b8978d8SClaudio Fontana { "svm", "off" }, 1775b8978d8SClaudio Fontana { NULL, NULL }, 1785b8978d8SClaudio Fontana }; 1795b8978d8SClaudio Fontana 1805b8978d8SClaudio Fontana /* 1815b8978d8SClaudio Fontana * Only for builtin_x86_defs models initialized with x86_register_cpudef_types. 1825b8978d8SClaudio Fontana */ 18363f16d97SPhilippe Mathieu-Daudé static void x86_cpu_change_kvm_default(const char *prop, const char *value) 1845b8978d8SClaudio Fontana { 1855b8978d8SClaudio Fontana PropValue *pv; 1865b8978d8SClaudio Fontana for (pv = kvm_default_props; pv->prop; pv++) { 1875b8978d8SClaudio Fontana if (!strcmp(pv->prop, prop)) { 1885b8978d8SClaudio Fontana pv->value = value; 1895b8978d8SClaudio Fontana break; 1905b8978d8SClaudio Fontana } 1915b8978d8SClaudio Fontana } 1925b8978d8SClaudio Fontana 1935b8978d8SClaudio Fontana /* 1945b8978d8SClaudio Fontana * It is valid to call this function only for properties that 1955b8978d8SClaudio Fontana * are already present in the kvm_default_props table. 1965b8978d8SClaudio Fontana */ 1975b8978d8SClaudio Fontana assert(pv->prop); 1985b8978d8SClaudio Fontana } 1995b8978d8SClaudio Fontana 200f5cc5a5cSClaudio Fontana static void kvm_cpu_instance_init(CPUState *cs) 201f5cc5a5cSClaudio Fontana { 202f5cc5a5cSClaudio Fontana X86CPU *cpu = X86_CPU(cs); 2035b8978d8SClaudio Fontana X86CPUClass *xcc = X86_CPU_GET_CLASS(cpu); 204f5cc5a5cSClaudio Fontana 205f5cc5a5cSClaudio Fontana host_cpu_instance_init(cpu); 206f5cc5a5cSClaudio Fontana 2075b8978d8SClaudio Fontana if (xcc->model) { 2085b8978d8SClaudio Fontana /* only applies to builtin_x86_defs cpus */ 209f5cc5a5cSClaudio Fontana if (!kvm_irqchip_in_kernel()) { 210f5cc5a5cSClaudio Fontana x86_cpu_change_kvm_default("x2apic", "off"); 211dc89f32dSDavid Woodhouse } else if (kvm_irqchip_is_split()) { 212f5cc5a5cSClaudio Fontana x86_cpu_change_kvm_default("kvm-msi-ext-dest-id", "on"); 213f5cc5a5cSClaudio Fontana } 214f5cc5a5cSClaudio Fontana 215f5cc5a5cSClaudio Fontana /* Special cases not set in the X86CPUDefinition structs: */ 216f5cc5a5cSClaudio Fontana x86_cpu_apply_props(cpu, kvm_default_props); 2175b8978d8SClaudio Fontana } 218f5cc5a5cSClaudio Fontana 219f5cc5a5cSClaudio Fontana if (cpu->max_features) { 220f5cc5a5cSClaudio Fontana kvm_cpu_max_instance_init(cpu); 221f5cc5a5cSClaudio Fontana } 222fea45008SDavid Edmondson 223fea45008SDavid Edmondson kvm_cpu_xsave_init(); 224f5cc5a5cSClaudio Fontana } 225f5cc5a5cSClaudio Fontana 226*12d1a768SPhilippe Mathieu-Daudé static void kvm_cpu_accel_class_init(ObjectClass *oc, const void *data) 227f5cc5a5cSClaudio Fontana { 228f5cc5a5cSClaudio Fontana AccelCPUClass *acc = ACCEL_CPU_CLASS(oc); 229f5cc5a5cSClaudio Fontana 2306294e502SPhilippe Mathieu-Daudé acc->cpu_target_realize = kvm_cpu_realizefn; 231f5cc5a5cSClaudio Fontana acc->cpu_instance_init = kvm_cpu_instance_init; 232f5cc5a5cSClaudio Fontana } 233f5cc5a5cSClaudio Fontana static const TypeInfo kvm_cpu_accel_type_info = { 234f5cc5a5cSClaudio Fontana .name = ACCEL_CPU_NAME("kvm"), 235f5cc5a5cSClaudio Fontana 236f5cc5a5cSClaudio Fontana .parent = TYPE_ACCEL_CPU, 237f5cc5a5cSClaudio Fontana .class_init = kvm_cpu_accel_class_init, 238f5cc5a5cSClaudio Fontana .abstract = true, 239f5cc5a5cSClaudio Fontana }; 240f5cc5a5cSClaudio Fontana static void kvm_cpu_accel_register_types(void) 241f5cc5a5cSClaudio Fontana { 242f5cc5a5cSClaudio Fontana type_register_static(&kvm_cpu_accel_type_info); 243f5cc5a5cSClaudio Fontana } 244f5cc5a5cSClaudio Fontana type_init(kvm_cpu_accel_register_types); 245