/*
 * QEMU Host Memory Backend
 *
 * Copyright (C) 2013-2014 Red Hat Inc
 *
 * Authors:
 *   Igor Mammedov <imammedo@redhat.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2 or later.
 * See the COPYING file in the top-level directory.
 */

#include "qemu/osdep.h"
#include "sysemu/hostmem.h"
#include "hw/boards.h"
#include "qapi/error.h"
#include "qapi/qapi-builtin-visit.h"
#include "qapi/visitor.h"
#include "qemu/config-file.h"
#include "qom/object_interfaces.h"
#include "qemu/mmap-alloc.h"
#include "qemu/madvise.h"

#ifdef CONFIG_NUMA
#include <numaif.h>
#include <numa.h>
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_DEFAULT != MPOL_DEFAULT);
/*
 * HOST_MEM_POLICY_PREFERRED may either translate to MPOL_PREFERRED or
 * MPOL_PREFERRED_MANY, see comments further below.
 */
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_PREFERRED != MPOL_PREFERRED);
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_BIND != MPOL_BIND);
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_INTERLEAVE != MPOL_INTERLEAVE);
#endif

char *
host_memory_backend_get_name(HostMemoryBackend *backend)
{
    if (!backend->use_canonical_path) {
        return g_strdup(object_get_canonical_path_component(OBJECT(backend)));
    }

    return object_get_canonical_path(OBJECT(backend));
}

static void
host_memory_backend_get_size(Object *obj, Visitor *v, const char *name,
                             void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint64_t value = backend->size;

    visit_type_size(v, name, &value, errp);
}

static void
host_memory_backend_set_size(Object *obj, Visitor *v, const char *name,
                             void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint64_t value;

    if (host_memory_backend_mr_inited(backend)) {
        error_setg(errp, "cannot change property %s of %s ", name,
                   object_get_typename(obj));
        return;
    }

    if (!visit_type_size(v, name, &value, errp)) {
        return;
    }
    if (!value) {
        error_setg(errp,
                   "property '%s' of %s doesn't take value '%" PRIu64 "'",
                   name, object_get_typename(obj), value);
        return;
    }
    backend->size = value;
}

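/*
 * The "host-nodes" property is visited as a list of node numbers; the getter
 * below rebuilds that list from the backend's host_nodes bitmap, the setter
 * validates each entry against MAX_NODES before marking it in the bitmap.
 */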
static void
host_memory_backend_get_host_nodes(Object *obj, Visitor *v, const char *name,
                                   void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint16List *host_nodes = NULL;
    uint16List **tail = &host_nodes;
    unsigned long value;

    value = find_first_bit(backend->host_nodes, MAX_NODES);
    if (value == MAX_NODES) {
        goto ret;
    }

    QAPI_LIST_APPEND(tail, value);

    do {
        value = find_next_bit(backend->host_nodes, MAX_NODES, value + 1);
        if (value == MAX_NODES) {
            break;
        }

        QAPI_LIST_APPEND(tail, value);
    } while (true);

ret:
    visit_type_uint16List(v, name, &host_nodes, errp);
    qapi_free_uint16List(host_nodes);
}

static void
host_memory_backend_set_host_nodes(Object *obj, Visitor *v, const char *name,
                                   void *opaque, Error **errp)
{
#ifdef CONFIG_NUMA
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint16List *l, *host_nodes = NULL;

    visit_type_uint16List(v, name, &host_nodes, errp);

    for (l = host_nodes; l; l = l->next) {
        if (l->value >= MAX_NODES) {
            error_setg(errp, "Invalid host-nodes value: %d", l->value);
            goto out;
        }
    }

    for (l = host_nodes; l; l = l->next) {
        bitmap_set(backend->host_nodes, l->value, 1);
    }

out:
    qapi_free_uint16List(host_nodes);
#else
    error_setg(errp, "NUMA node binding is not supported by this QEMU");
#endif
}

static int
host_memory_backend_get_policy(Object *obj, Error **errp G_GNUC_UNUSED)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    return backend->policy;
}

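/*
 * Record the requested NUMA policy; builds without CONFIG_NUMA only accept
 * the default policy and report an error for anything else.
 */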
static void
host_memory_backend_set_policy(Object *obj, int policy, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    backend->policy = policy;

#ifndef CONFIG_NUMA
    if (policy != HOST_MEM_POLICY_DEFAULT) {
        error_setg(errp, "NUMA policies are not supported by this QEMU");
    }
#endif
}

static bool host_memory_backend_get_merge(Object *obj, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    return backend->merge;
}

static void host_memory_backend_set_merge(Object *obj, bool value, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    if (!host_memory_backend_mr_inited(backend)) {
        backend->merge = value;
        return;
    }

    if (value != backend->merge) {
        void *ptr = memory_region_get_ram_ptr(&backend->mr);
        uint64_t sz = memory_region_size(&backend->mr);

        qemu_madvise(ptr, sz,
                     value ? QEMU_MADV_MERGEABLE : QEMU_MADV_UNMERGEABLE);
        backend->merge = value;
    }
}

static bool host_memory_backend_get_dump(Object *obj, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    return backend->dump;
}

static void host_memory_backend_set_dump(Object *obj, bool value, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    if (!host_memory_backend_mr_inited(backend)) {
        backend->dump = value;
        return;
    }

    if (value != backend->dump) {
        void *ptr = memory_region_get_ram_ptr(&backend->mr);
        uint64_t sz = memory_region_size(&backend->mr);

        qemu_madvise(ptr, sz,
                     value ? QEMU_MADV_DODUMP : QEMU_MADV_DONTDUMP);
        backend->dump = value;
    }
}

static bool host_memory_backend_get_prealloc(Object *obj, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    return backend->prealloc;
}

static void host_memory_backend_set_prealloc(Object *obj, bool value,
                                             Error **errp)
{
    Error *local_err = NULL;
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    if (!backend->reserve && value) {
        error_setg(errp, "'prealloc=on' and 'reserve=off' are incompatible");
        return;
    }

    if (!host_memory_backend_mr_inited(backend)) {
        backend->prealloc = value;
        return;
    }

    if (value && !backend->prealloc) {
        int fd = memory_region_get_fd(&backend->mr);
        void *ptr = memory_region_get_ram_ptr(&backend->mr);
        uint64_t sz = memory_region_size(&backend->mr);

        qemu_prealloc_mem(fd, ptr, sz, backend->prealloc_threads,
                          backend->prealloc_context, &local_err);
        if (local_err) {
            error_propagate(errp, local_err);
            return;
        }
        backend->prealloc = true;
    }
}

static void host_memory_backend_get_prealloc_threads(Object *obj, Visitor *v,
    const char *name, void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    visit_type_uint32(v, name, &backend->prealloc_threads, errp);
}

static void host_memory_backend_set_prealloc_threads(Object *obj, Visitor *v,
    const char *name, void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint32_t value;

    if (!visit_type_uint32(v, name, &value, errp)) {
        return;
    }
    if (value <= 0) {
        error_setg(errp, "property '%s' of %s doesn't take value '%d'", name,
                   object_get_typename(obj), value);
        return;
    }
    backend->prealloc_threads = value;
}

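/*
 * Instance initializer: property defaults are taken from the current machine
 * state (mem-merge, dump-guest-core, number of CPUs for prealloc threads).
 */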
static void host_memory_backend_init(Object *obj)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    MachineState *machine = MACHINE(qdev_get_machine());

    /* TODO: convert access to globals to compat properties */
    backend->merge = machine_mem_merge(machine);
    backend->dump = machine_dump_guest_core(machine);
    backend->reserve = true;
    backend->prealloc_threads = machine->smp.cpus;
}

static void host_memory_backend_post_init(Object *obj)
{
    object_apply_compat_props(obj);
}

bool host_memory_backend_mr_inited(HostMemoryBackend *backend)
{
    /*
     * NOTE: We forbid zero-length memory backend, so here zero means
     * "we haven't inited the backend memory region yet".
     */
    return memory_region_size(&backend->mr) != 0;
}

MemoryRegion *host_memory_backend_get_memory(HostMemoryBackend *backend)
{
    return host_memory_backend_mr_inited(backend) ? &backend->mr : NULL;
}

void host_memory_backend_set_mapped(HostMemoryBackend *backend, bool mapped)
{
    backend->is_mapped = mapped;
}

bool host_memory_backend_is_mapped(HostMemoryBackend *backend)
{
    return backend->is_mapped;
}

size_t host_memory_backend_pagesize(HostMemoryBackend *memdev)
{
    size_t pagesize = qemu_ram_pagesize(memdev->mr.ram_block);
    g_assert(pagesize >= qemu_real_host_page_size());
    return pagesize;
}

static void
host_memory_backend_memory_complete(UserCreatable *uc, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(uc);
    HostMemoryBackendClass *bc = MEMORY_BACKEND_GET_CLASS(uc);
    Error *local_err = NULL;
    void *ptr;
    uint64_t sz;

    if (!bc->alloc) {
        return;
    }
    if (!bc->alloc(backend, errp)) {
        return;
    }

    ptr = memory_region_get_ram_ptr(&backend->mr);
    sz = memory_region_size(&backend->mr);

    if (backend->merge) {
        qemu_madvise(ptr, sz, QEMU_MADV_MERGEABLE);
    }
    if (!backend->dump) {
        qemu_madvise(ptr, sz, QEMU_MADV_DONTDUMP);
    }
#ifdef CONFIG_NUMA
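    /*
     * Apply the host-nodes/policy binding with mbind(2) before the optional
     * preallocation below, so pages are faulted in on the requested nodes.
     */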
    unsigned long lastbit = find_last_bit(backend->host_nodes, MAX_NODES);
    /* lastbit == MAX_NODES means maxnode = 0 */
    unsigned long maxnode = (lastbit + 1) % (MAX_NODES + 1);
    /* ensure policy won't be ignored in case memory is preallocated
     * before mbind(). note: MPOL_MF_STRICT is ignored on hugepages so
     * this doesn't catch hugepage case. */
    unsigned flags = MPOL_MF_STRICT | MPOL_MF_MOVE;
    int mode = backend->policy;

    /* check for invalid host-nodes and policies and give more verbose
     * error messages than mbind(). */
    if (maxnode && backend->policy == MPOL_DEFAULT) {
        error_setg(errp, "host-nodes must be empty for policy default,"
                   " or you should explicitly specify a policy other"
                   " than default");
        return;
    } else if (maxnode == 0 && backend->policy != MPOL_DEFAULT) {
        error_setg(errp, "host-nodes must be set for policy %s",
                   HostMemPolicy_str(backend->policy));
        return;
    }

    /* We can have up to MAX_NODES nodes, but we need to pass maxnode+1
     * as argument to mbind() due to an old Linux bug (feature?) which
     * cuts off the last specified node. This means backend->host_nodes
     * must have MAX_NODES+1 bits available.
     */
    assert(sizeof(backend->host_nodes) >=
           BITS_TO_LONGS(MAX_NODES + 1) * sizeof(unsigned long));
    assert(maxnode <= MAX_NODES);

#ifdef HAVE_NUMA_HAS_PREFERRED_MANY
    if (mode == MPOL_PREFERRED && numa_has_preferred_many() > 0) {
        /*
         * Replace with MPOL_PREFERRED_MANY otherwise the mbind() below
         * silently picks the first node.
         */
        mode = MPOL_PREFERRED_MANY;
    }
#endif

    if (maxnode &&
        mbind(ptr, sz, mode, backend->host_nodes, maxnode + 1, flags)) {
        if (backend->policy != MPOL_DEFAULT || errno != ENOSYS) {
            error_setg_errno(errp, errno,
                             "cannot bind memory to host NUMA nodes");
            return;
        }
    }
#endif
    /* Preallocate memory after the NUMA policy has been instantiated.
     * This is necessary to guarantee memory is allocated with
     * specified NUMA policy in place.
     */
    if (backend->prealloc) {
        qemu_prealloc_mem(memory_region_get_fd(&backend->mr), ptr, sz,
                          backend->prealloc_threads,
                          backend->prealloc_context, &local_err);
        if (local_err) {
            goto out;
        }
    }
out:
    error_propagate(errp, local_err);
}

static bool
host_memory_backend_can_be_deleted(UserCreatable *uc)
{
    if (host_memory_backend_is_mapped(MEMORY_BACKEND(uc))) {
        return false;
    } else {
        return true;
    }
}

static bool host_memory_backend_get_share(Object *o, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(o);

    return backend->share;
}

static void host_memory_backend_set_share(Object *o, bool value, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(o);

    if (host_memory_backend_mr_inited(backend)) {
        error_setg(errp, "cannot change property value");
        return;
    }
    backend->share = value;
}

#ifdef CONFIG_LINUX
static bool host_memory_backend_get_reserve(Object *o, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(o);

    return backend->reserve;
}

static void host_memory_backend_set_reserve(Object *o, bool value, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(o);

    if (host_memory_backend_mr_inited(backend)) {
        error_setg(errp, "cannot change property value");
        return;
    }
    if (backend->prealloc && !value) {
        error_setg(errp, "'prealloc=on' and 'reserve=off' are incompatible");
        return;
    }
    backend->reserve = value;
}
#endif /* CONFIG_LINUX */

static bool
host_memory_backend_get_use_canonical_path(Object *obj, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    return backend->use_canonical_path;
}

static void
host_memory_backend_set_use_canonical_path(Object *obj, bool value,
                                           Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    backend->use_canonical_path = value;
}

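/*
 * Class initializer: wire up the UserCreatable hooks and register the QOM
 * properties shared by every host memory backend type.
 */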
static void
host_memory_backend_class_init(ObjectClass *oc, void *data)
{
    UserCreatableClass *ucc = USER_CREATABLE_CLASS(oc);

    ucc->complete = host_memory_backend_memory_complete;
    ucc->can_be_deleted = host_memory_backend_can_be_deleted;

    object_class_property_add_bool(oc, "merge",
        host_memory_backend_get_merge,
        host_memory_backend_set_merge);
    object_class_property_set_description(oc, "merge",
        "Mark memory as mergeable");
    object_class_property_add_bool(oc, "dump",
        host_memory_backend_get_dump,
        host_memory_backend_set_dump);
    object_class_property_set_description(oc, "dump",
        "Set to 'off' to exclude from core dump");
    object_class_property_add_bool(oc, "prealloc",
        host_memory_backend_get_prealloc,
        host_memory_backend_set_prealloc);
    object_class_property_set_description(oc, "prealloc",
        "Preallocate memory");
    object_class_property_add(oc, "prealloc-threads", "int",
        host_memory_backend_get_prealloc_threads,
        host_memory_backend_set_prealloc_threads,
        NULL, NULL);
    object_class_property_set_description(oc, "prealloc-threads",
        "Number of CPU threads to use for prealloc");
    object_class_property_add_link(oc, "prealloc-context",
        TYPE_THREAD_CONTEXT, offsetof(HostMemoryBackend, prealloc_context),
        object_property_allow_set_link, OBJ_PROP_LINK_STRONG);
    object_class_property_set_description(oc, "prealloc-context",
        "Context to use for creating CPU threads for preallocation");
    object_class_property_add(oc, "size", "int",
        host_memory_backend_get_size,
        host_memory_backend_set_size,
        NULL, NULL);
    object_class_property_set_description(oc, "size",
        "Size of the memory region (ex: 500M)");
    object_class_property_add(oc, "host-nodes", "int",
        host_memory_backend_get_host_nodes,
        host_memory_backend_set_host_nodes,
        NULL, NULL);
    object_class_property_set_description(oc, "host-nodes",
        "Binds memory to the list of NUMA host nodes");
    object_class_property_add_enum(oc, "policy", "HostMemPolicy",
        &HostMemPolicy_lookup,
        host_memory_backend_get_policy,
        host_memory_backend_set_policy);
    object_class_property_set_description(oc, "policy",
        "Set the NUMA policy");
    object_class_property_add_bool(oc, "share",
        host_memory_backend_get_share, host_memory_backend_set_share);
    object_class_property_set_description(oc, "share",
        "Mark the memory as private to QEMU or shared");
#ifdef CONFIG_LINUX
    object_class_property_add_bool(oc, "reserve",
        host_memory_backend_get_reserve, host_memory_backend_set_reserve);
    object_class_property_set_description(oc, "reserve",
        "Reserve swap space (or huge pages) if applicable");
#endif /* CONFIG_LINUX */
    /*
     * Do not delete/rename option. This option must be considered stable
     * (as if it didn't have the 'x-' prefix including deprecation period) as
     * long as 4.0 and older machine types exist.
     * Option will be used by upper layers to override (disable) canonical path
     * for ramblock-id set by compat properties on old machine types (<= 4.0),
     * to keep migration working when backend is used for main RAM with
     * -machine memory-backend= option (main RAM historically used prefix-less
     * ramblock-id).
     */
    object_class_property_add_bool(oc, "x-use-canonical-path-for-ramblock-id",
        host_memory_backend_get_use_canonical_path,
        host_memory_backend_set_use_canonical_path);
}

static const TypeInfo host_memory_backend_info = {
    .name = TYPE_MEMORY_BACKEND,
    .parent = TYPE_OBJECT,
    .abstract = true,
    .class_size = sizeof(HostMemoryBackendClass),
    .class_init = host_memory_backend_class_init,
    .instance_size = sizeof(HostMemoryBackend),
    .instance_init = host_memory_backend_init,
    .instance_post_init = host_memory_backend_post_init,
    .interfaces = (InterfaceInfo[]) {
        { TYPE_USER_CREATABLE },
        { }
    }
};

static void register_types(void)
{
    type_register_static(&host_memory_backend_info);
}

type_init(register_types);