/*
 * QEMU Host Memory Backend
 *
 * Copyright (C) 2013-2014 Red Hat Inc
 *
 * Authors:
 *   Igor Mammedov <imammedo@redhat.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2 or later.
 * See the COPYING file in the top-level directory.
 */

#include "qemu/osdep.h"
#include "sysemu/hostmem.h"
#include "hw/boards.h"
#include "qapi/error.h"
#include "qapi/qapi-builtin-visit.h"
#include "qapi/visitor.h"
#include "qemu/config-file.h"
#include "qom/object_interfaces.h"
#include "qemu/mmap-alloc.h"
#include "qemu/madvise.h"
#include "qemu/cutils.h"
#include "hw/qdev-core.h"

#ifdef CONFIG_NUMA
#include <numaif.h>
#include <numa.h>
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_DEFAULT != MPOL_DEFAULT);
/*
 * HOST_MEM_POLICY_PREFERRED may either translate to MPOL_PREFERRED or
 * MPOL_PREFERRED_MANY, see comments further below.
 */
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_PREFERRED != MPOL_PREFERRED);
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_BIND != MPOL_BIND);
QEMU_BUILD_BUG_ON(HOST_MEM_POLICY_INTERLEAVE != MPOL_INTERLEAVE);
#endif

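/*
 * Return the name used for the backend's memory region (and thus its
 * RAMBlock): either the plain QOM id or the full canonical path, depending
 * on x-use-canonical-path-for-ramblock-id.  The caller owns (and must
 * g_free()) the returned string.
 */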
char *
host_memory_backend_get_name(HostMemoryBackend *backend)
{
    if (!backend->use_canonical_path) {
        return g_strdup(object_get_canonical_path_component(OBJECT(backend)));
    }

    return object_get_canonical_path(OBJECT(backend));
}

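/*
 * "size" property accessors.  The size must be non-zero and can only be
 * changed while the backing memory region has not been created yet.
 */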
static void
host_memory_backend_get_size(Object *obj, Visitor *v, const char *name,
                             void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint64_t value = backend->size;

    visit_type_size(v, name, &value, errp);
}

static void
host_memory_backend_set_size(Object *obj, Visitor *v, const char *name,
                             void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint64_t value;

    if (host_memory_backend_mr_inited(backend)) {
        error_setg(errp, "cannot change property %s of %s", name,
                   object_get_typename(obj));
        return;
    }

    if (!visit_type_size(v, name, &value, errp)) {
        return;
    }
    if (!value) {
        error_setg(errp,
                   "property '%s' of %s doesn't take value '%" PRIu64 "'",
                   name, object_get_typename(obj), value);
        return;
    }
    backend->size = value;
}

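/*
 * "host-nodes" property accessors.  The getter converts the host_nodes
 * bitmap into a uint16List for the QAPI visitor; the setter validates the
 * node IDs against MAX_NODES and merges them into the bitmap.
 */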
static void
host_memory_backend_get_host_nodes(Object *obj, Visitor *v, const char *name,
                                   void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint16List *host_nodes = NULL;
    uint16List **tail = &host_nodes;
    unsigned long value;

    value = find_first_bit(backend->host_nodes, MAX_NODES);
    if (value == MAX_NODES) {
        goto ret;
    }

    QAPI_LIST_APPEND(tail, value);

    do {
        value = find_next_bit(backend->host_nodes, MAX_NODES, value + 1);
        if (value == MAX_NODES) {
            break;
        }

        QAPI_LIST_APPEND(tail, value);
    } while (true);

ret:
    visit_type_uint16List(v, name, &host_nodes, errp);
    qapi_free_uint16List(host_nodes);
}

static void
host_memory_backend_set_host_nodes(Object *obj, Visitor *v, const char *name,
                                   void *opaque, Error **errp)
{
#ifdef CONFIG_NUMA
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint16List *l, *host_nodes = NULL;

    if (!visit_type_uint16List(v, name, &host_nodes, errp)) {
        return;
    }

    for (l = host_nodes; l; l = l->next) {
        if (l->value >= MAX_NODES) {
            error_setg(errp, "Invalid host-nodes value: %d", l->value);
            goto out;
        }
    }

    for (l = host_nodes; l; l = l->next) {
        bitmap_set(backend->host_nodes, l->value, 1);
    }

out:
    qapi_free_uint16List(host_nodes);
#else
    error_setg(errp, "NUMA node binding is not supported by this QEMU");
#endif
}

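/*
 * "policy" property accessors (HostMemPolicy enum).  Without CONFIG_NUMA
 * only the 'default' policy is accepted.
 */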
static int
host_memory_backend_get_policy(Object *obj, Error **errp G_GNUC_UNUSED)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    return backend->policy;
}

static void
host_memory_backend_set_policy(Object *obj, int policy, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    backend->policy = policy;

#ifndef CONFIG_NUMA
    if (policy != HOST_MEM_POLICY_DEFAULT) {
        error_setg(errp, "NUMA policies are not supported by this QEMU");
    }
#endif
}

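/*
 * "merge" and "dump" property accessors.  When the backing memory region
 * already exists, a change is applied immediately via qemu_madvise();
 * otherwise the value is only recorded and applied at allocation time in
 * host_memory_backend_memory_complete().
 */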
static bool host_memory_backend_get_merge(Object *obj, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    return backend->merge;
}

static void host_memory_backend_set_merge(Object *obj, bool value, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    if (QEMU_MADV_MERGEABLE == QEMU_MADV_INVALID) {
        if (value) {
            error_setg(errp, "Memory merging is not supported on this host");
        }
        assert(!backend->merge);
        return;
    }

    if (host_memory_backend_mr_inited(backend) &&
        value != backend->merge) {
        void *ptr = memory_region_get_ram_ptr(&backend->mr);
        uint64_t sz = memory_region_size(&backend->mr);

        qemu_madvise(ptr, sz,
                     value ? QEMU_MADV_MERGEABLE : QEMU_MADV_UNMERGEABLE);
    }

    backend->merge = value;
}

static bool host_memory_backend_get_dump(Object *obj, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    return backend->dump;
}

static void host_memory_backend_set_dump(Object *obj, bool value, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    if (QEMU_MADV_DONTDUMP == QEMU_MADV_INVALID) {
        if (!value) {
            error_setg(errp, "Dumping guest memory cannot be disabled on this host");
        }
        assert(backend->dump);
        return;
    }

    if (host_memory_backend_mr_inited(backend) &&
        value != backend->dump) {
        void *ptr = memory_region_get_ram_ptr(&backend->mr);
        uint64_t sz = memory_region_size(&backend->mr);

        qemu_madvise(ptr, sz,
                     value ? QEMU_MADV_DODUMP : QEMU_MADV_DONTDUMP);
    }

    backend->dump = value;
}

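/*
 * "prealloc" property accessors.  prealloc=on is rejected together with
 * reserve=off; enabling it on an already allocated backend preallocates
 * the memory right away.
 */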
static bool host_memory_backend_get_prealloc(Object *obj, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    return backend->prealloc;
}

static void host_memory_backend_set_prealloc(Object *obj, bool value,
                                             Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    if (!backend->reserve && value) {
        error_setg(errp, "'prealloc=on' and 'reserve=off' are incompatible");
        return;
    }

    if (!host_memory_backend_mr_inited(backend)) {
        backend->prealloc = value;
        return;
    }

    if (value && !backend->prealloc) {
        int fd = memory_region_get_fd(&backend->mr);
        void *ptr = memory_region_get_ram_ptr(&backend->mr);
        uint64_t sz = memory_region_size(&backend->mr);

        if (!qemu_prealloc_mem(fd, ptr, sz, backend->prealloc_threads,
                               backend->prealloc_context, false, errp)) {
            return;
        }
        backend->prealloc = true;
    }
}

static void host_memory_backend_get_prealloc_threads(Object *obj, Visitor *v,
    const char *name, void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    visit_type_uint32(v, name, &backend->prealloc_threads, errp);
}

static void host_memory_backend_set_prealloc_threads(Object *obj, Visitor *v,
    const char *name, void *opaque, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    uint32_t value;

    if (!visit_type_uint32(v, name, &value, errp)) {
        return;
    }
    if (value == 0) {
        error_setg(errp,
                   "property '%s' of %s doesn't take value '%" PRIu32 "'",
                   name, object_get_typename(obj), value);
        return;
    }
    backend->prealloc_threads = value;
}

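/*
 * Instance init: seed defaults from the machine's global settings
 * (mem-merge, dump-guest-core, guest_memfd requirement, number of prealloc
 * threads) before the user-supplied properties are applied.
 */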
static void host_memory_backend_init(Object *obj)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);
    MachineState *machine = MACHINE(qdev_get_machine());

    /* TODO: convert access to globals to compat properties */
    backend->merge = machine_mem_merge(machine);
    backend->dump = machine_dump_guest_core(machine);
    backend->guest_memfd = machine_require_guest_memfd(machine);
    backend->reserve = true;
    backend->prealloc_threads = machine->smp.cpus;
}

static void host_memory_backend_post_init(Object *obj)
{
    object_apply_compat_props(obj);
}

bool host_memory_backend_mr_inited(HostMemoryBackend *backend)
{
    /*
     * NOTE: We forbid zero-length memory backend, so here zero means
     * "we haven't inited the backend memory region yet".
     */
    return memory_region_size(&backend->mr) != 0;
}

MemoryRegion *host_memory_backend_get_memory(HostMemoryBackend *backend)
{
    return host_memory_backend_mr_inited(backend) ? &backend->mr : NULL;
}

void host_memory_backend_set_mapped(HostMemoryBackend *backend, bool mapped)
{
    backend->is_mapped = mapped;
}

bool host_memory_backend_is_mapped(HostMemoryBackend *backend)
{
    return backend->is_mapped;
}

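/*
 * Return the page size of the RAM block backing @memdev, e.g. the hugepage
 * size for hugetlb-backed memory.  Never smaller than the host's real page
 * size.
 */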
size_t host_memory_backend_pagesize(HostMemoryBackend *memdev)
{
    size_t pagesize = qemu_ram_pagesize(memdev->mr.ram_block);
    g_assert(pagesize >= qemu_real_host_page_size());
    return pagesize;
}

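/*
 * UserCreatable::complete handler: the actual allocation path.  Order
 * matters here: the concrete backend's alloc() creates the memory region,
 * merge/dump madvise hints are applied, the NUMA policy is installed with
 * mbind(), and only then is the memory optionally preallocated so that
 * pages are faulted in under the requested policy.
 */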
static void
host_memory_backend_memory_complete(UserCreatable *uc, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(uc);
    HostMemoryBackendClass *bc = MEMORY_BACKEND_GET_CLASS(uc);
    void *ptr;
    uint64_t sz;
    size_t pagesize;
    bool async = !phase_check(PHASE_LATE_BACKENDS_CREATED);

    if (!bc->alloc) {
        return;
    }
    if (!bc->alloc(backend, errp)) {
        return;
    }

    ptr = memory_region_get_ram_ptr(&backend->mr);
    sz = memory_region_size(&backend->mr);
    pagesize = qemu_ram_pagesize(backend->mr.ram_block);

    if (backend->aligned && !QEMU_IS_ALIGNED(sz, pagesize)) {
        g_autofree char *pagesize_str = size_to_str(pagesize);
        error_setg(errp, "backend '%s' memory size must be multiple of %s",
                   object_get_typename(OBJECT(uc)), pagesize_str);
        return;
    }

    if (backend->merge) {
        qemu_madvise(ptr, sz, QEMU_MADV_MERGEABLE);
    }
    if (!backend->dump) {
        qemu_madvise(ptr, sz, QEMU_MADV_DONTDUMP);
    }
#ifdef CONFIG_NUMA
    unsigned long lastbit = find_last_bit(backend->host_nodes, MAX_NODES);
    /* lastbit == MAX_NODES means maxnode = 0 */
    unsigned long maxnode = (lastbit + 1) % (MAX_NODES + 1);
    /*
     * Ensure policy won't be ignored in case memory is preallocated
     * before mbind().  Note: MPOL_MF_STRICT is ignored on hugepages, so
     * this doesn't catch the hugepage case.
     */
    unsigned flags = MPOL_MF_STRICT | MPOL_MF_MOVE;
    int mode = backend->policy;

    /*
     * Check for invalid host-nodes and policies and give more verbose
     * error messages than mbind().
     */
    if (maxnode && backend->policy == MPOL_DEFAULT) {
        error_setg(errp, "host-nodes must be empty for policy default,"
                   " or you should explicitly specify a policy other"
                   " than default");
        return;
    } else if (maxnode == 0 && backend->policy != MPOL_DEFAULT) {
        error_setg(errp, "host-nodes must be set for policy %s",
                   HostMemPolicy_str(backend->policy));
        return;
    }

    /*
     * We can have up to MAX_NODES nodes, but we need to pass maxnode+1
     * as argument to mbind() due to an old Linux bug (feature?) which
     * cuts off the last specified node. This means backend->host_nodes
     * must have MAX_NODES+1 bits available.
     */
    assert(sizeof(backend->host_nodes) >=
           BITS_TO_LONGS(MAX_NODES + 1) * sizeof(unsigned long));
    assert(maxnode <= MAX_NODES);

#ifdef HAVE_NUMA_HAS_PREFERRED_MANY
    if (mode == MPOL_PREFERRED && numa_has_preferred_many() > 0) {
        /*
         * Replace with MPOL_PREFERRED_MANY otherwise the mbind() below
         * silently picks the first node.
         */
        mode = MPOL_PREFERRED_MANY;
    }
#endif

    if (maxnode &&
        mbind(ptr, sz, mode, backend->host_nodes, maxnode + 1, flags)) {
        if (backend->policy != MPOL_DEFAULT || errno != ENOSYS) {
            error_setg_errno(errp, errno,
                             "cannot bind memory to host NUMA nodes");
            return;
        }
    }
#endif
    /*
     * Preallocate memory after the NUMA policy has been instantiated.
     * This is necessary to guarantee memory is allocated with
     * specified NUMA policy in place.
     */
    if (backend->prealloc && !qemu_prealloc_mem(memory_region_get_fd(&backend->mr),
                                                ptr, sz,
                                                backend->prealloc_threads,
                                                backend->prealloc_context,
                                                async, errp)) {
        return;
    }
}

static bool
host_memory_backend_can_be_deleted(UserCreatable *uc)
{
    return !host_memory_backend_is_mapped(MEMORY_BACKEND(uc));
}

static bool host_memory_backend_get_share(Object *o, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(o);

    return backend->share;
}

static void host_memory_backend_set_share(Object *o, bool value, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(o);

    if (host_memory_backend_mr_inited(backend)) {
        error_setg(errp, "cannot change property value");
        return;
    }
    backend->share = value;
}

#ifdef CONFIG_LINUX
static bool host_memory_backend_get_reserve(Object *o, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(o);

    return backend->reserve;
}

static void host_memory_backend_set_reserve(Object *o, bool value, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(o);

    if (host_memory_backend_mr_inited(backend)) {
        error_setg(errp, "cannot change property value");
        return;
    }
    if (backend->prealloc && !value) {
        error_setg(errp, "'prealloc=on' and 'reserve=off' are incompatible");
        return;
    }
    backend->reserve = value;
}
#endif /* CONFIG_LINUX */

static bool
host_memory_backend_get_use_canonical_path(Object *obj, Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    return backend->use_canonical_path;
}

static void
host_memory_backend_set_use_canonical_path(Object *obj, bool value,
                                           Error **errp)
{
    HostMemoryBackend *backend = MEMORY_BACKEND(obj);

    backend->use_canonical_path = value;
}

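/*
 * Class init: register the user-visible properties shared by all host
 * memory backends and hook up the UserCreatable callbacks.
 */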
static void
host_memory_backend_class_init(ObjectClass *oc, void *data)
{
    UserCreatableClass *ucc = USER_CREATABLE_CLASS(oc);

    ucc->complete = host_memory_backend_memory_complete;
    ucc->can_be_deleted = host_memory_backend_can_be_deleted;

    object_class_property_add_bool(oc, "merge",
        host_memory_backend_get_merge,
        host_memory_backend_set_merge);
    object_class_property_set_description(oc, "merge",
        "Mark memory as mergeable");
    object_class_property_add_bool(oc, "dump",
        host_memory_backend_get_dump,
        host_memory_backend_set_dump);
    object_class_property_set_description(oc, "dump",
        "Set to 'off' to exclude from core dump");
    object_class_property_add_bool(oc, "prealloc",
        host_memory_backend_get_prealloc,
        host_memory_backend_set_prealloc);
    object_class_property_set_description(oc, "prealloc",
        "Preallocate memory");
    object_class_property_add(oc, "prealloc-threads", "int",
        host_memory_backend_get_prealloc_threads,
        host_memory_backend_set_prealloc_threads,
        NULL, NULL);
    object_class_property_set_description(oc, "prealloc-threads",
        "Number of CPU threads to use for prealloc");
    object_class_property_add_link(oc, "prealloc-context",
        TYPE_THREAD_CONTEXT, offsetof(HostMemoryBackend, prealloc_context),
        object_property_allow_set_link, OBJ_PROP_LINK_STRONG);
    object_class_property_set_description(oc, "prealloc-context",
        "Context to use for creating CPU threads for preallocation");
    object_class_property_add(oc, "size", "int",
        host_memory_backend_get_size,
        host_memory_backend_set_size,
        NULL, NULL);
    object_class_property_set_description(oc, "size",
        "Size of the memory region (ex: 500M)");
    object_class_property_add(oc, "host-nodes", "int",
        host_memory_backend_get_host_nodes,
        host_memory_backend_set_host_nodes,
        NULL, NULL);
    object_class_property_set_description(oc, "host-nodes",
        "Binds memory to the list of NUMA host nodes");
    object_class_property_add_enum(oc, "policy", "HostMemPolicy",
        &HostMemPolicy_lookup,
        host_memory_backend_get_policy,
        host_memory_backend_set_policy);
    object_class_property_set_description(oc, "policy",
        "Set the NUMA policy");
    object_class_property_add_bool(oc, "share",
        host_memory_backend_get_share, host_memory_backend_set_share);
    object_class_property_set_description(oc, "share",
        "Mark the memory as private to QEMU or shared");
#ifdef CONFIG_LINUX
    object_class_property_add_bool(oc, "reserve",
        host_memory_backend_get_reserve, host_memory_backend_set_reserve);
    object_class_property_set_description(oc, "reserve",
        "Reserve swap space (or huge pages) if applicable");
#endif /* CONFIG_LINUX */
    /*
     * Do not delete/rename this option.  It must be considered stable
     * (as if it didn't have the 'x-' prefix, including a deprecation period)
     * as long as 4.0 and older machine types exist.
     * The option is used by upper layers to override (disable) the canonical
     * path for ramblock-id set by compat properties on old machine types
     * (<= 4.0), to keep migration working when the backend is used for main
     * RAM with the -machine memory-backend= option (main RAM historically
     * used a prefix-less ramblock-id).
     */
    object_class_property_add_bool(oc, "x-use-canonical-path-for-ramblock-id",
        host_memory_backend_get_use_canonical_path,
        host_memory_backend_set_use_canonical_path);
}

static const TypeInfo host_memory_backend_info = {
    .name = TYPE_MEMORY_BACKEND,
    .parent = TYPE_OBJECT,
    .abstract = true,
    .class_size = sizeof(HostMemoryBackendClass),
    .class_init = host_memory_backend_class_init,
    .instance_size = sizeof(HostMemoryBackend),
    .instance_init = host_memory_backend_init,
    .instance_post_init = host_memory_backend_post_init,
    .interfaces = (InterfaceInfo[]) {
        { TYPE_USER_CREATABLE },
        { }
    }
};

static void register_types(void)
{
    type_register_static(&host_memory_backend_info);
}

type_init(register_types);