xref: /qemu/backends/hostmem.c (revision fdb63cf3b57a230f4cc530ea2515229aeada0998)
11f070489SIgor Mammedov /*
21f070489SIgor Mammedov  * QEMU Host Memory Backend
31f070489SIgor Mammedov  *
41f070489SIgor Mammedov  * Copyright (C) 2013-2014 Red Hat Inc
51f070489SIgor Mammedov  *
61f070489SIgor Mammedov  * Authors:
71f070489SIgor Mammedov  *   Igor Mammedov <imammedo@redhat.com>
81f070489SIgor Mammedov  *
91f070489SIgor Mammedov  * This work is licensed under the terms of the GNU GPL, version 2 or later.
101f070489SIgor Mammedov  * See the COPYING file in the top-level directory.
111f070489SIgor Mammedov  */
129af23989SMarkus Armbruster 
139c058332SPeter Maydell #include "qemu/osdep.h"
141f070489SIgor Mammedov #include "sysemu/hostmem.h"
156b269967SEduardo Habkost #include "hw/boards.h"
16da34e65cSMarkus Armbruster #include "qapi/error.h"
17eb815e24SMarkus Armbruster #include "qapi/qapi-builtin-visit.h"
181f070489SIgor Mammedov #include "qapi/visitor.h"
191f070489SIgor Mammedov #include "qemu/config-file.h"
201f070489SIgor Mammedov #include "qom/object_interfaces.h"
212b108085SDavid Gibson #include "qemu/mmap-alloc.h"
22b85ea5faSPeter Maydell #include "qemu/madvise.h"
231f070489SIgor Mammedov 
#ifdef CONFIG_NUMA
#include <numaif.h>
#include <numa.h>

/*
 * backend->policy (a HOST_MEM_POLICY_* value) is handed to mbind() as its
 * mode argument, so each enum value must be numerically equal to the
 * corresponding MPOL_* constant.
 */
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_DEFAULT != MPOL_DEFAULT);
/*
 * HOST_MEM_POLICY_PREFERRED may translate to either MPOL_PREFERRED or
 * MPOL_PREFERRED_MANY; see the comments further below.
 */
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_PREFERRED != MPOL_PREFERRED);
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_BIND != MPOL_BIND);
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_INTERLEAVE != MPOL_INTERLEAVE);
#endif /* CONFIG_NUMA */
364cf1b76bSHu Tao 
37fa0cb34dSMarc-André Lureau char *
38fa0cb34dSMarc-André Lureau host_memory_backend_get_name(HostMemoryBackend *backend)
39fa0cb34dSMarc-André Lureau {
40fa0cb34dSMarc-André Lureau     if (!backend->use_canonical_path) {
417a309cc9SMarkus Armbruster         return g_strdup(object_get_canonical_path_component(OBJECT(backend)));
42fa0cb34dSMarc-André Lureau     }
43fa0cb34dSMarc-André Lureau 
44fa0cb34dSMarc-André Lureau     return object_get_canonical_path(OBJECT(backend));
45fa0cb34dSMarc-André Lureau }
46fa0cb34dSMarc-André Lureau 
471f070489SIgor Mammedov static void
48d7bce999SEric Blake host_memory_backend_get_size(Object *obj, Visitor *v, const char *name,
49d7bce999SEric Blake                              void *opaque, Error **errp)
501f070489SIgor Mammedov {
511f070489SIgor Mammedov     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
521f070489SIgor Mammedov     uint64_t value = backend->size;
531f070489SIgor Mammedov 
5451e72bc1SEric Blake     visit_type_size(v, name, &value, errp);
551f070489SIgor Mammedov }
561f070489SIgor Mammedov 
571f070489SIgor Mammedov static void
58d7bce999SEric Blake host_memory_backend_set_size(Object *obj, Visitor *v, const char *name,
59d7bce999SEric Blake                              void *opaque, Error **errp)
601f070489SIgor Mammedov {
611f070489SIgor Mammedov     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
621f070489SIgor Mammedov     uint64_t value;
631f070489SIgor Mammedov 
646f4c60e4SPeter Xu     if (host_memory_backend_mr_inited(backend)) {
65dcfe4805SMarkus Armbruster         error_setg(errp, "cannot change property %s of %s ", name,
66dcfe4805SMarkus Armbruster                    object_get_typename(obj));
67dcfe4805SMarkus Armbruster         return;
681f070489SIgor Mammedov     }
691f070489SIgor Mammedov 
70668f62ecSMarkus Armbruster     if (!visit_type_size(v, name, &value, errp)) {
71dcfe4805SMarkus Armbruster         return;
721f070489SIgor Mammedov     }
731f070489SIgor Mammedov     if (!value) {
74dcfe4805SMarkus Armbruster         error_setg(errp,
7521d16836SZhang Yi                    "property '%s' of %s doesn't take value '%" PRIu64 "'",
7621d16836SZhang Yi                    name, object_get_typename(obj), value);
77dcfe4805SMarkus Armbruster         return;
781f070489SIgor Mammedov     }
791f070489SIgor Mammedov     backend->size = value;
801f070489SIgor Mammedov }
811f070489SIgor Mammedov 
824cf1b76bSHu Tao static void
83d7bce999SEric Blake host_memory_backend_get_host_nodes(Object *obj, Visitor *v, const char *name,
84d7bce999SEric Blake                                    void *opaque, Error **errp)
854cf1b76bSHu Tao {
864cf1b76bSHu Tao     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
874cf1b76bSHu Tao     uint16List *host_nodes = NULL;
88c3033fd3SEric Blake     uint16List **tail = &host_nodes;
894cf1b76bSHu Tao     unsigned long value;
904cf1b76bSHu Tao 
914cf1b76bSHu Tao     value = find_first_bit(backend->host_nodes, MAX_NODES);
921454d33fSXiao Guangrong     if (value == MAX_NODES) {
9315160ab7SIgor Mammedov         goto ret;
941454d33fSXiao Guangrong     }
954cf1b76bSHu Tao 
96c3033fd3SEric Blake     QAPI_LIST_APPEND(tail, value);
97658ae5a7SMarkus Armbruster 
984cf1b76bSHu Tao     do {
994cf1b76bSHu Tao         value = find_next_bit(backend->host_nodes, MAX_NODES, value + 1);
1004cf1b76bSHu Tao         if (value == MAX_NODES) {
1014cf1b76bSHu Tao             break;
1024cf1b76bSHu Tao         }
1034cf1b76bSHu Tao 
104c3033fd3SEric Blake         QAPI_LIST_APPEND(tail, value);
1054cf1b76bSHu Tao     } while (true);
1064cf1b76bSHu Tao 
10715160ab7SIgor Mammedov ret:
10851e72bc1SEric Blake     visit_type_uint16List(v, name, &host_nodes, errp);
109bdd5ce05SKeqian Zhu     qapi_free_uint16List(host_nodes);
1104cf1b76bSHu Tao }
1114cf1b76bSHu Tao 
1124cf1b76bSHu Tao static void
113d7bce999SEric Blake host_memory_backend_set_host_nodes(Object *obj, Visitor *v, const char *name,
114d7bce999SEric Blake                                    void *opaque, Error **errp)
1154cf1b76bSHu Tao {
1164cf1b76bSHu Tao #ifdef CONFIG_NUMA
1174cf1b76bSHu Tao     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
118ffa144b3SEduardo Habkost     uint16List *l, *host_nodes = NULL;
1194cf1b76bSHu Tao 
120ffa144b3SEduardo Habkost     visit_type_uint16List(v, name, &host_nodes, errp);
1214cf1b76bSHu Tao 
122ffa144b3SEduardo Habkost     for (l = host_nodes; l; l = l->next) {
123ffa144b3SEduardo Habkost         if (l->value >= MAX_NODES) {
124ffa144b3SEduardo Habkost             error_setg(errp, "Invalid host-nodes value: %d", l->value);
125ffa144b3SEduardo Habkost             goto out;
1264cf1b76bSHu Tao         }
127ffa144b3SEduardo Habkost     }
128ffa144b3SEduardo Habkost 
129ffa144b3SEduardo Habkost     for (l = host_nodes; l; l = l->next) {
130ffa144b3SEduardo Habkost         bitmap_set(backend->host_nodes, l->value, 1);
131ffa144b3SEduardo Habkost     }
132ffa144b3SEduardo Habkost 
133ffa144b3SEduardo Habkost out:
134ffa144b3SEduardo Habkost     qapi_free_uint16List(host_nodes);
1354cf1b76bSHu Tao #else
1364cf1b76bSHu Tao     error_setg(errp, "NUMA node binding are not supported by this QEMU");
1374cf1b76bSHu Tao #endif
1384cf1b76bSHu Tao }
1394cf1b76bSHu Tao 
140a3590dacSDaniel P. Berrange static int
141a3590dacSDaniel P. Berrange host_memory_backend_get_policy(Object *obj, Error **errp G_GNUC_UNUSED)
1424cf1b76bSHu Tao {
1434cf1b76bSHu Tao     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
144a3590dacSDaniel P. Berrange     return backend->policy;
1454cf1b76bSHu Tao }
1464cf1b76bSHu Tao 
1474cf1b76bSHu Tao static void
148a3590dacSDaniel P. Berrange host_memory_backend_set_policy(Object *obj, int policy, Error **errp)
1494cf1b76bSHu Tao {
1504cf1b76bSHu Tao     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
1514cf1b76bSHu Tao     backend->policy = policy;
1524cf1b76bSHu Tao 
1534cf1b76bSHu Tao #ifndef CONFIG_NUMA
1544cf1b76bSHu Tao     if (policy != HOST_MEM_POLICY_DEFAULT) {
1554cf1b76bSHu Tao         error_setg(errp, "NUMA policies are not supported by this QEMU");
1564cf1b76bSHu Tao     }
1574cf1b76bSHu Tao #endif
1584cf1b76bSHu Tao }
1594cf1b76bSHu Tao 
160605d0a94SPaolo Bonzini static bool host_memory_backend_get_merge(Object *obj, Error **errp)
161605d0a94SPaolo Bonzini {
162605d0a94SPaolo Bonzini     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
163605d0a94SPaolo Bonzini 
164605d0a94SPaolo Bonzini     return backend->merge;
165605d0a94SPaolo Bonzini }
166605d0a94SPaolo Bonzini 
167605d0a94SPaolo Bonzini static void host_memory_backend_set_merge(Object *obj, bool value, Error **errp)
168605d0a94SPaolo Bonzini {
169605d0a94SPaolo Bonzini     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
170605d0a94SPaolo Bonzini 
1716f4c60e4SPeter Xu     if (!host_memory_backend_mr_inited(backend)) {
172605d0a94SPaolo Bonzini         backend->merge = value;
173605d0a94SPaolo Bonzini         return;
174605d0a94SPaolo Bonzini     }
175605d0a94SPaolo Bonzini 
176605d0a94SPaolo Bonzini     if (value != backend->merge) {
177605d0a94SPaolo Bonzini         void *ptr = memory_region_get_ram_ptr(&backend->mr);
178605d0a94SPaolo Bonzini         uint64_t sz = memory_region_size(&backend->mr);
179605d0a94SPaolo Bonzini 
180605d0a94SPaolo Bonzini         qemu_madvise(ptr, sz,
181605d0a94SPaolo Bonzini                      value ? QEMU_MADV_MERGEABLE : QEMU_MADV_UNMERGEABLE);
182605d0a94SPaolo Bonzini         backend->merge = value;
183605d0a94SPaolo Bonzini     }
184605d0a94SPaolo Bonzini }
185605d0a94SPaolo Bonzini 
186605d0a94SPaolo Bonzini static bool host_memory_backend_get_dump(Object *obj, Error **errp)
187605d0a94SPaolo Bonzini {
188605d0a94SPaolo Bonzini     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
189605d0a94SPaolo Bonzini 
190605d0a94SPaolo Bonzini     return backend->dump;
191605d0a94SPaolo Bonzini }
192605d0a94SPaolo Bonzini 
193605d0a94SPaolo Bonzini static void host_memory_backend_set_dump(Object *obj, bool value, Error **errp)
194605d0a94SPaolo Bonzini {
195605d0a94SPaolo Bonzini     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
196605d0a94SPaolo Bonzini 
1976f4c60e4SPeter Xu     if (!host_memory_backend_mr_inited(backend)) {
198605d0a94SPaolo Bonzini         backend->dump = value;
199605d0a94SPaolo Bonzini         return;
200605d0a94SPaolo Bonzini     }
201605d0a94SPaolo Bonzini 
202605d0a94SPaolo Bonzini     if (value != backend->dump) {
203605d0a94SPaolo Bonzini         void *ptr = memory_region_get_ram_ptr(&backend->mr);
204605d0a94SPaolo Bonzini         uint64_t sz = memory_region_size(&backend->mr);
205605d0a94SPaolo Bonzini 
206605d0a94SPaolo Bonzini         qemu_madvise(ptr, sz,
207605d0a94SPaolo Bonzini                      value ? QEMU_MADV_DODUMP : QEMU_MADV_DONTDUMP);
208605d0a94SPaolo Bonzini         backend->dump = value;
209605d0a94SPaolo Bonzini     }
210605d0a94SPaolo Bonzini }
211605d0a94SPaolo Bonzini 
212a35ba7beSPaolo Bonzini static bool host_memory_backend_get_prealloc(Object *obj, Error **errp)
213a35ba7beSPaolo Bonzini {
214a35ba7beSPaolo Bonzini     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
215a35ba7beSPaolo Bonzini 
2164ebc74dbSIgor Mammedov     return backend->prealloc;
217a35ba7beSPaolo Bonzini }
218a35ba7beSPaolo Bonzini 
219a35ba7beSPaolo Bonzini static void host_memory_backend_set_prealloc(Object *obj, bool value,
220a35ba7beSPaolo Bonzini                                              Error **errp)
221a35ba7beSPaolo Bonzini {
222056b68afSIgor Mammedov     Error *local_err = NULL;
223a35ba7beSPaolo Bonzini     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
224a35ba7beSPaolo Bonzini 
2259181fb70SDavid Hildenbrand     if (!backend->reserve && value) {
2269181fb70SDavid Hildenbrand         error_setg(errp, "'prealloc=on' and 'reserve=off' are incompatible");
2279181fb70SDavid Hildenbrand         return;
2289181fb70SDavid Hildenbrand     }
2299181fb70SDavid Hildenbrand 
2306f4c60e4SPeter Xu     if (!host_memory_backend_mr_inited(backend)) {
231a35ba7beSPaolo Bonzini         backend->prealloc = value;
232a35ba7beSPaolo Bonzini         return;
233a35ba7beSPaolo Bonzini     }
234a35ba7beSPaolo Bonzini 
235a35ba7beSPaolo Bonzini     if (value && !backend->prealloc) {
236a35ba7beSPaolo Bonzini         int fd = memory_region_get_fd(&backend->mr);
237a35ba7beSPaolo Bonzini         void *ptr = memory_region_get_ram_ptr(&backend->mr);
238a35ba7beSPaolo Bonzini         uint64_t sz = memory_region_size(&backend->mr);
239a35ba7beSPaolo Bonzini 
240e6816458SDavid Hildenbrand         qemu_prealloc_mem(fd, ptr, sz, backend->prealloc_threads,
241e6816458SDavid Hildenbrand                           backend->prealloc_context, &local_err);
242056b68afSIgor Mammedov         if (local_err) {
243056b68afSIgor Mammedov             error_propagate(errp, local_err);
244056b68afSIgor Mammedov             return;
245056b68afSIgor Mammedov         }
246a35ba7beSPaolo Bonzini         backend->prealloc = true;
247a35ba7beSPaolo Bonzini     }
248a35ba7beSPaolo Bonzini }
249a35ba7beSPaolo Bonzini 
250ffac16faSIgor Mammedov static void host_memory_backend_get_prealloc_threads(Object *obj, Visitor *v,
251ffac16faSIgor Mammedov     const char *name, void *opaque, Error **errp)
252ffac16faSIgor Mammedov {
253ffac16faSIgor Mammedov     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
254ffac16faSIgor Mammedov     visit_type_uint32(v, name, &backend->prealloc_threads, errp);
255ffac16faSIgor Mammedov }
256ffac16faSIgor Mammedov 
257ffac16faSIgor Mammedov static void host_memory_backend_set_prealloc_threads(Object *obj, Visitor *v,
258ffac16faSIgor Mammedov     const char *name, void *opaque, Error **errp)
259ffac16faSIgor Mammedov {
260ffac16faSIgor Mammedov     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
261ffac16faSIgor Mammedov     uint32_t value;
262ffac16faSIgor Mammedov 
263668f62ecSMarkus Armbruster     if (!visit_type_uint32(v, name, &value, errp)) {
264dcfe4805SMarkus Armbruster         return;
265ffac16faSIgor Mammedov     }
266ffac16faSIgor Mammedov     if (value <= 0) {
267dcfe4805SMarkus Armbruster         error_setg(errp, "property '%s' of %s doesn't take value '%d'", name,
268dcfe4805SMarkus Armbruster                    object_get_typename(obj), value);
269dcfe4805SMarkus Armbruster         return;
270ffac16faSIgor Mammedov     }
271ffac16faSIgor Mammedov     backend->prealloc_threads = value;
272ffac16faSIgor Mammedov }
273ffac16faSIgor Mammedov 
27458f4662cSHu Tao static void host_memory_backend_init(Object *obj)
2751f070489SIgor Mammedov {
276605d0a94SPaolo Bonzini     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
2776b269967SEduardo Habkost     MachineState *machine = MACHINE(qdev_get_machine());
278605d0a94SPaolo Bonzini 
279ffac16faSIgor Mammedov     /* TODO: convert access to globals to compat properties */
2806b269967SEduardo Habkost     backend->merge = machine_mem_merge(machine);
2816b269967SEduardo Habkost     backend->dump = machine_dump_guest_core(machine);
2829181fb70SDavid Hildenbrand     backend->reserve = true;
283f8d426a6SJaroslav Jindrak     backend->prealloc_threads = machine->smp.cpus;
2841f070489SIgor Mammedov }
2851f070489SIgor Mammedov 
286fa0cb34dSMarc-André Lureau static void host_memory_backend_post_init(Object *obj)
287fa0cb34dSMarc-André Lureau {
288fa0cb34dSMarc-André Lureau     object_apply_compat_props(obj);
289fa0cb34dSMarc-André Lureau }
290fa0cb34dSMarc-André Lureau 
2914728b574SPeter Xu bool host_memory_backend_mr_inited(HostMemoryBackend *backend)
2924728b574SPeter Xu {
2934728b574SPeter Xu     /*
2944728b574SPeter Xu      * NOTE: We forbid zero-length memory backend, so here zero means
2954728b574SPeter Xu      * "we haven't inited the backend memory region yet".
2964728b574SPeter Xu      */
2974728b574SPeter Xu     return memory_region_size(&backend->mr) != 0;
2984728b574SPeter Xu }
2994728b574SPeter Xu 
3007943e97bSDavid Hildenbrand MemoryRegion *host_memory_backend_get_memory(HostMemoryBackend *backend)
3011f070489SIgor Mammedov {
3026f4c60e4SPeter Xu     return host_memory_backend_mr_inited(backend) ? &backend->mr : NULL;
3031f070489SIgor Mammedov }
3041f070489SIgor Mammedov 
3052aece63cSXiao Guangrong void host_memory_backend_set_mapped(HostMemoryBackend *backend, bool mapped)
3062aece63cSXiao Guangrong {
3072aece63cSXiao Guangrong     backend->is_mapped = mapped;
3082aece63cSXiao Guangrong }
3092aece63cSXiao Guangrong 
3102aece63cSXiao Guangrong bool host_memory_backend_is_mapped(HostMemoryBackend *backend)
3112aece63cSXiao Guangrong {
3122aece63cSXiao Guangrong     return backend->is_mapped;
3132aece63cSXiao Guangrong }
3142aece63cSXiao Guangrong 
3152b108085SDavid Gibson size_t host_memory_backend_pagesize(HostMemoryBackend *memdev)
3162b108085SDavid Gibson {
3178be934b7SThomas Huth     size_t pagesize = qemu_ram_pagesize(memdev->mr.ram_block);
3188be934b7SThomas Huth     g_assert(pagesize >= qemu_real_host_page_size());
3192b108085SDavid Gibson     return pagesize;
3202b108085SDavid Gibson }
3212b108085SDavid Gibson 
322bd9262d9SHu Tao static void
323bd9262d9SHu Tao host_memory_backend_memory_complete(UserCreatable *uc, Error **errp)
324bd9262d9SHu Tao {
325bd9262d9SHu Tao     HostMemoryBackend *backend = MEMORY_BACKEND(uc);
326bd9262d9SHu Tao     HostMemoryBackendClass *bc = MEMORY_BACKEND_GET_CLASS(uc);
327605d0a94SPaolo Bonzini     Error *local_err = NULL;
328605d0a94SPaolo Bonzini     void *ptr;
329605d0a94SPaolo Bonzini     uint64_t sz;
330bd9262d9SHu Tao 
331e199f7adSPhilippe Mathieu-Daudé     if (!bc->alloc) {
332e199f7adSPhilippe Mathieu-Daudé         return;
333e199f7adSPhilippe Mathieu-Daudé     }
334*fdb63cf3SPhilippe Mathieu-Daudé     if (!bc->alloc(backend, errp)) {
335*fdb63cf3SPhilippe Mathieu-Daudé         return;
336605d0a94SPaolo Bonzini     }
337605d0a94SPaolo Bonzini 
338605d0a94SPaolo Bonzini     ptr = memory_region_get_ram_ptr(&backend->mr);
339605d0a94SPaolo Bonzini     sz = memory_region_size(&backend->mr);
340605d0a94SPaolo Bonzini 
341605d0a94SPaolo Bonzini     if (backend->merge) {
342605d0a94SPaolo Bonzini         qemu_madvise(ptr, sz, QEMU_MADV_MERGEABLE);
343605d0a94SPaolo Bonzini     }
344605d0a94SPaolo Bonzini     if (!backend->dump) {
345605d0a94SPaolo Bonzini         qemu_madvise(ptr, sz, QEMU_MADV_DONTDUMP);
346605d0a94SPaolo Bonzini     }
3474cf1b76bSHu Tao #ifdef CONFIG_NUMA
3484cf1b76bSHu Tao     unsigned long lastbit = find_last_bit(backend->host_nodes, MAX_NODES);
3494cf1b76bSHu Tao     /* lastbit == MAX_NODES means maxnode = 0 */
3504cf1b76bSHu Tao     unsigned long maxnode = (lastbit + 1) % (MAX_NODES + 1);
3514cf1b76bSHu Tao     /* ensure policy won't be ignored in case memory is preallocated
3524cf1b76bSHu Tao      * before mbind(). note: MPOL_MF_STRICT is ignored on hugepages so
3534cf1b76bSHu Tao      * this doesn't catch hugepage case. */
354288d3322SMichael S. Tsirkin     unsigned flags = MPOL_MF_STRICT | MPOL_MF_MOVE;
3556bb613f0SMichal Privoznik     int mode = backend->policy;
3564cf1b76bSHu Tao 
3574cf1b76bSHu Tao     /* check for invalid host-nodes and policies and give more verbose
3584cf1b76bSHu Tao      * error messages than mbind(). */
3594cf1b76bSHu Tao     if (maxnode && backend->policy == MPOL_DEFAULT) {
3604cf1b76bSHu Tao         error_setg(errp, "host-nodes must be empty for policy default,"
3614cf1b76bSHu Tao                    " or you should explicitly specify a policy other"
3624cf1b76bSHu Tao                    " than default");
3634cf1b76bSHu Tao         return;
3644cf1b76bSHu Tao     } else if (maxnode == 0 && backend->policy != MPOL_DEFAULT) {
3654cf1b76bSHu Tao         error_setg(errp, "host-nodes must be set for policy %s",
366977c736fSMarkus Armbruster                    HostMemPolicy_str(backend->policy));
3674cf1b76bSHu Tao         return;
3684cf1b76bSHu Tao     }
3694cf1b76bSHu Tao 
3704cf1b76bSHu Tao     /* We can have up to MAX_NODES nodes, but we need to pass maxnode+1
3714cf1b76bSHu Tao      * as argument to mbind() due to an old Linux bug (feature?) which
3724cf1b76bSHu Tao      * cuts off the last specified node. This means backend->host_nodes
3734cf1b76bSHu Tao      * must have MAX_NODES+1 bits available.
3744cf1b76bSHu Tao      */
3754cf1b76bSHu Tao     assert(sizeof(backend->host_nodes) >=
3764cf1b76bSHu Tao            BITS_TO_LONGS(MAX_NODES + 1) * sizeof(unsigned long));
3774cf1b76bSHu Tao     assert(maxnode <= MAX_NODES);
37870b6d525SIgor Mammedov 
3796bb613f0SMichal Privoznik #ifdef HAVE_NUMA_HAS_PREFERRED_MANY
3806bb613f0SMichal Privoznik     if (mode == MPOL_PREFERRED && numa_has_preferred_many() > 0) {
3816bb613f0SMichal Privoznik         /*
3826bb613f0SMichal Privoznik          * Replace with MPOL_PREFERRED_MANY otherwise the mbind() below
3836bb613f0SMichal Privoznik          * silently picks the first node.
3846bb613f0SMichal Privoznik          */
3856bb613f0SMichal Privoznik         mode = MPOL_PREFERRED_MANY;
3866bb613f0SMichal Privoznik     }
3876bb613f0SMichal Privoznik #endif
3886bb613f0SMichal Privoznik 
38970b6d525SIgor Mammedov     if (maxnode &&
3906bb613f0SMichal Privoznik         mbind(ptr, sz, mode, backend->host_nodes, maxnode + 1, flags)) {
391a3567ba1SPavel Fedin         if (backend->policy != MPOL_DEFAULT || errno != ENOSYS) {
3924cf1b76bSHu Tao             error_setg_errno(errp, errno,
3934cf1b76bSHu Tao                              "cannot bind memory to host NUMA nodes");
3944cf1b76bSHu Tao             return;
3954cf1b76bSHu Tao         }
396a3567ba1SPavel Fedin     }
3974cf1b76bSHu Tao #endif
3984cf1b76bSHu Tao     /* Preallocate memory after the NUMA policy has been instantiated.
3994cf1b76bSHu Tao      * This is necessary to guarantee memory is allocated with
4004cf1b76bSHu Tao      * specified NUMA policy in place.
4014cf1b76bSHu Tao      */
402a35ba7beSPaolo Bonzini     if (backend->prealloc) {
4036556aadcSDavid Hildenbrand         qemu_prealloc_mem(memory_region_get_fd(&backend->mr), ptr, sz,
404e6816458SDavid Hildenbrand                           backend->prealloc_threads,
405e6816458SDavid Hildenbrand                           backend->prealloc_context, &local_err);
406056b68afSIgor Mammedov         if (local_err) {
407056b68afSIgor Mammedov             goto out;
408a35ba7beSPaolo Bonzini         }
409bd9262d9SHu Tao     }
410056b68afSIgor Mammedov out:
411056b68afSIgor Mammedov     error_propagate(errp, local_err);
412056b68afSIgor Mammedov }
413bd9262d9SHu Tao 
41436bce5caSLin Ma static bool
4153beacfb9SEduardo Habkost host_memory_backend_can_be_deleted(UserCreatable *uc)
41636bce5caSLin Ma {
4172aece63cSXiao Guangrong     if (host_memory_backend_is_mapped(MEMORY_BACKEND(uc))) {
41836bce5caSLin Ma         return false;
41936bce5caSLin Ma     } else {
42036bce5caSLin Ma         return true;
42136bce5caSLin Ma     }
42236bce5caSLin Ma }
42336bce5caSLin Ma 
42406329cceSMarcel Apfelbaum static bool host_memory_backend_get_share(Object *o, Error **errp)
42506329cceSMarcel Apfelbaum {
42606329cceSMarcel Apfelbaum     HostMemoryBackend *backend = MEMORY_BACKEND(o);
42706329cceSMarcel Apfelbaum 
42806329cceSMarcel Apfelbaum     return backend->share;
42906329cceSMarcel Apfelbaum }
43006329cceSMarcel Apfelbaum 
43106329cceSMarcel Apfelbaum static void host_memory_backend_set_share(Object *o, bool value, Error **errp)
43206329cceSMarcel Apfelbaum {
43306329cceSMarcel Apfelbaum     HostMemoryBackend *backend = MEMORY_BACKEND(o);
43406329cceSMarcel Apfelbaum 
43506329cceSMarcel Apfelbaum     if (host_memory_backend_mr_inited(backend)) {
43606329cceSMarcel Apfelbaum         error_setg(errp, "cannot change property value");
43706329cceSMarcel Apfelbaum         return;
43806329cceSMarcel Apfelbaum     }
43906329cceSMarcel Apfelbaum     backend->share = value;
44006329cceSMarcel Apfelbaum }
44106329cceSMarcel Apfelbaum 
4429181fb70SDavid Hildenbrand #ifdef CONFIG_LINUX
4439181fb70SDavid Hildenbrand static bool host_memory_backend_get_reserve(Object *o, Error **errp)
4449181fb70SDavid Hildenbrand {
4459181fb70SDavid Hildenbrand     HostMemoryBackend *backend = MEMORY_BACKEND(o);
4469181fb70SDavid Hildenbrand 
4479181fb70SDavid Hildenbrand     return backend->reserve;
4489181fb70SDavid Hildenbrand }
4499181fb70SDavid Hildenbrand 
4509181fb70SDavid Hildenbrand static void host_memory_backend_set_reserve(Object *o, bool value, Error **errp)
4519181fb70SDavid Hildenbrand {
4529181fb70SDavid Hildenbrand     HostMemoryBackend *backend = MEMORY_BACKEND(o);
4539181fb70SDavid Hildenbrand 
4549181fb70SDavid Hildenbrand     if (host_memory_backend_mr_inited(backend)) {
4559181fb70SDavid Hildenbrand         error_setg(errp, "cannot change property value");
4569181fb70SDavid Hildenbrand         return;
4579181fb70SDavid Hildenbrand     }
4589181fb70SDavid Hildenbrand     if (backend->prealloc && !value) {
4599181fb70SDavid Hildenbrand         error_setg(errp, "'prealloc=on' and 'reserve=off' are incompatible");
4609181fb70SDavid Hildenbrand         return;
4619181fb70SDavid Hildenbrand     }
4629181fb70SDavid Hildenbrand     backend->reserve = value;
4639181fb70SDavid Hildenbrand }
4649181fb70SDavid Hildenbrand #endif /* CONFIG_LINUX */
4659181fb70SDavid Hildenbrand 
466fa0cb34dSMarc-André Lureau static bool
467fa0cb34dSMarc-André Lureau host_memory_backend_get_use_canonical_path(Object *obj, Error **errp)
468fa0cb34dSMarc-André Lureau {
469fa0cb34dSMarc-André Lureau     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
470fa0cb34dSMarc-André Lureau 
471fa0cb34dSMarc-André Lureau     return backend->use_canonical_path;
472fa0cb34dSMarc-André Lureau }
473fa0cb34dSMarc-André Lureau 
474fa0cb34dSMarc-André Lureau static void
475fa0cb34dSMarc-André Lureau host_memory_backend_set_use_canonical_path(Object *obj, bool value,
476fa0cb34dSMarc-André Lureau                                            Error **errp)
477fa0cb34dSMarc-André Lureau {
478fa0cb34dSMarc-André Lureau     HostMemoryBackend *backend = MEMORY_BACKEND(obj);
479fa0cb34dSMarc-André Lureau 
480fa0cb34dSMarc-André Lureau     backend->use_canonical_path = value;
481fa0cb34dSMarc-André Lureau }
482fa0cb34dSMarc-André Lureau 
483bd9262d9SHu Tao static void
484bd9262d9SHu Tao host_memory_backend_class_init(ObjectClass *oc, void *data)
485bd9262d9SHu Tao {
486bd9262d9SHu Tao     UserCreatableClass *ucc = USER_CREATABLE_CLASS(oc);
487bd9262d9SHu Tao 
488bd9262d9SHu Tao     ucc->complete = host_memory_backend_memory_complete;
48936bce5caSLin Ma     ucc->can_be_deleted = host_memory_backend_can_be_deleted;
490e62834caSEduardo Habkost 
491e62834caSEduardo Habkost     object_class_property_add_bool(oc, "merge",
492e62834caSEduardo Habkost         host_memory_backend_get_merge,
493d2623129SMarkus Armbruster         host_memory_backend_set_merge);
494033bfc5eSMarc-André Lureau     object_class_property_set_description(oc, "merge",
4957eecec7dSMarkus Armbruster         "Mark memory as mergeable");
496e62834caSEduardo Habkost     object_class_property_add_bool(oc, "dump",
497e62834caSEduardo Habkost         host_memory_backend_get_dump,
498d2623129SMarkus Armbruster         host_memory_backend_set_dump);
499033bfc5eSMarc-André Lureau     object_class_property_set_description(oc, "dump",
5007eecec7dSMarkus Armbruster         "Set to 'off' to exclude from core dump");
501e62834caSEduardo Habkost     object_class_property_add_bool(oc, "prealloc",
502e62834caSEduardo Habkost         host_memory_backend_get_prealloc,
503d2623129SMarkus Armbruster         host_memory_backend_set_prealloc);
504033bfc5eSMarc-André Lureau     object_class_property_set_description(oc, "prealloc",
5057eecec7dSMarkus Armbruster         "Preallocate memory");
506ffac16faSIgor Mammedov     object_class_property_add(oc, "prealloc-threads", "int",
507ffac16faSIgor Mammedov         host_memory_backend_get_prealloc_threads,
508ffac16faSIgor Mammedov         host_memory_backend_set_prealloc_threads,
509d2623129SMarkus Armbruster         NULL, NULL);
510ffac16faSIgor Mammedov     object_class_property_set_description(oc, "prealloc-threads",
5117eecec7dSMarkus Armbruster         "Number of CPU threads to use for prealloc");
512e6816458SDavid Hildenbrand     object_class_property_add_link(oc, "prealloc-context",
513e6816458SDavid Hildenbrand         TYPE_THREAD_CONTEXT, offsetof(HostMemoryBackend, prealloc_context),
514e6816458SDavid Hildenbrand         object_property_allow_set_link, OBJ_PROP_LINK_STRONG);
515e6816458SDavid Hildenbrand     object_class_property_set_description(oc, "prealloc-context",
516e6816458SDavid Hildenbrand         "Context to use for creating CPU threads for preallocation");
517e62834caSEduardo Habkost     object_class_property_add(oc, "size", "int",
518e62834caSEduardo Habkost         host_memory_backend_get_size,
519e62834caSEduardo Habkost         host_memory_backend_set_size,
520d2623129SMarkus Armbruster         NULL, NULL);
521033bfc5eSMarc-André Lureau     object_class_property_set_description(oc, "size",
5227eecec7dSMarkus Armbruster         "Size of the memory region (ex: 500M)");
523e62834caSEduardo Habkost     object_class_property_add(oc, "host-nodes", "int",
524e62834caSEduardo Habkost         host_memory_backend_get_host_nodes,
525e62834caSEduardo Habkost         host_memory_backend_set_host_nodes,
526d2623129SMarkus Armbruster         NULL, NULL);
527033bfc5eSMarc-André Lureau     object_class_property_set_description(oc, "host-nodes",
5287eecec7dSMarkus Armbruster         "Binds memory to the list of NUMA host nodes");
529e62834caSEduardo Habkost     object_class_property_add_enum(oc, "policy", "HostMemPolicy",
530f7abe0ecSMarc-André Lureau         &HostMemPolicy_lookup,
531e62834caSEduardo Habkost         host_memory_backend_get_policy,
532d2623129SMarkus Armbruster         host_memory_backend_set_policy);
533033bfc5eSMarc-André Lureau     object_class_property_set_description(oc, "policy",
5347eecec7dSMarkus Armbruster         "Set the NUMA policy");
53506329cceSMarcel Apfelbaum     object_class_property_add_bool(oc, "share",
536d2623129SMarkus Armbruster         host_memory_backend_get_share, host_memory_backend_set_share);
537033bfc5eSMarc-André Lureau     object_class_property_set_description(oc, "share",
5387eecec7dSMarkus Armbruster         "Mark the memory as private to QEMU or shared");
5399181fb70SDavid Hildenbrand #ifdef CONFIG_LINUX
5409181fb70SDavid Hildenbrand     object_class_property_add_bool(oc, "reserve",
5419181fb70SDavid Hildenbrand         host_memory_backend_get_reserve, host_memory_backend_set_reserve);
5429181fb70SDavid Hildenbrand     object_class_property_set_description(oc, "reserve",
5439181fb70SDavid Hildenbrand         "Reserve swap space (or huge pages) if applicable");
5449181fb70SDavid Hildenbrand #endif /* CONFIG_LINUX */
5458db0b204SIgor Mammedov     /*
5468db0b204SIgor Mammedov      * Do not delete/rename option. This option must be considered stable
5478db0b204SIgor Mammedov      * (as if it didn't have the 'x-' prefix including deprecation period) as
5488db0b204SIgor Mammedov      * long as 4.0 and older machine types exists.
5498db0b204SIgor Mammedov      * Option will be used by upper layers to override (disable) canonical path
5508db0b204SIgor Mammedov      * for ramblock-id set by compat properties on old machine types ( <= 4.0),
5518db0b204SIgor Mammedov      * to keep migration working when backend is used for main RAM with
5528db0b204SIgor Mammedov      * -machine memory-backend= option (main RAM historically used prefix-less
5538db0b204SIgor Mammedov      * ramblock-id).
5548db0b204SIgor Mammedov      */
555fa0cb34dSMarc-André Lureau     object_class_property_add_bool(oc, "x-use-canonical-path-for-ramblock-id",
556fa0cb34dSMarc-André Lureau         host_memory_backend_get_use_canonical_path,
557d2623129SMarkus Armbruster         host_memory_backend_set_use_canonical_path);
558e1ff3c67SIgor Mammedov }
559e1ff3c67SIgor Mammedov 
56058f4662cSHu Tao static const TypeInfo host_memory_backend_info = {
5611f070489SIgor Mammedov     .name = TYPE_MEMORY_BACKEND,
5621f070489SIgor Mammedov     .parent = TYPE_OBJECT,
5631f070489SIgor Mammedov     .abstract = true,
5641f070489SIgor Mammedov     .class_size = sizeof(HostMemoryBackendClass),
565bd9262d9SHu Tao     .class_init = host_memory_backend_class_init,
5661f070489SIgor Mammedov     .instance_size = sizeof(HostMemoryBackend),
56758f4662cSHu Tao     .instance_init = host_memory_backend_init,
568fa0cb34dSMarc-André Lureau     .instance_post_init = host_memory_backend_post_init,
5691f070489SIgor Mammedov     .interfaces = (InterfaceInfo[]) {
5701f070489SIgor Mammedov         { TYPE_USER_CREATABLE },
5711f070489SIgor Mammedov         { }
5721f070489SIgor Mammedov     }
5731f070489SIgor Mammedov };
5741f070489SIgor Mammedov 
5751f070489SIgor Mammedov static void register_types(void)
5761f070489SIgor Mammedov {
57758f4662cSHu Tao     type_register_static(&host_memory_backend_info);
5781f070489SIgor Mammedov }
5791f070489SIgor Mammedov 
5801f070489SIgor Mammedov type_init(register_types);
581