1 /* 2 * Memory Device Interface 3 * 4 * Copyright ProfitBricks GmbH 2012 5 * Copyright (C) 2014 Red Hat Inc 6 * Copyright (c) 2018 Red Hat Inc 7 * 8 * This work is licensed under the terms of the GNU GPL, version 2 or later. 9 * See the COPYING file in the top-level directory. 10 */ 11 12 #include "qemu/osdep.h" 13 #include "hw/mem/memory-device.h" 14 #include "qapi/error.h" 15 #include "hw/boards.h" 16 #include "qemu/range.h" 17 #include "hw/virtio/vhost.h" 18 #include "sysemu/kvm.h" 19 #include "trace.h" 20 21 static gint memory_device_addr_sort(gconstpointer a, gconstpointer b) 22 { 23 const MemoryDeviceState *md_a = MEMORY_DEVICE(a); 24 const MemoryDeviceState *md_b = MEMORY_DEVICE(b); 25 const MemoryDeviceClass *mdc_a = MEMORY_DEVICE_GET_CLASS(a); 26 const MemoryDeviceClass *mdc_b = MEMORY_DEVICE_GET_CLASS(b); 27 const uint64_t addr_a = mdc_a->get_addr(md_a); 28 const uint64_t addr_b = mdc_b->get_addr(md_b); 29 30 if (addr_a > addr_b) { 31 return 1; 32 } else if (addr_a < addr_b) { 33 return -1; 34 } 35 return 0; 36 } 37 38 static int memory_device_build_list(Object *obj, void *opaque) 39 { 40 GSList **list = opaque; 41 42 if (object_dynamic_cast(obj, TYPE_MEMORY_DEVICE)) { 43 DeviceState *dev = DEVICE(obj); 44 if (dev->realized) { /* only realized memory devices matter */ 45 *list = g_slist_insert_sorted(*list, dev, memory_device_addr_sort); 46 } 47 } 48 49 object_child_foreach(obj, memory_device_build_list, opaque); 50 return 0; 51 } 52 53 static int memory_device_used_region_size(Object *obj, void *opaque) 54 { 55 uint64_t *size = opaque; 56 57 if (object_dynamic_cast(obj, TYPE_MEMORY_DEVICE)) { 58 const DeviceState *dev = DEVICE(obj); 59 const MemoryDeviceState *md = MEMORY_DEVICE(obj); 60 61 if (dev->realized) { 62 *size += memory_device_get_region_size(md, &error_abort); 63 } 64 } 65 66 object_child_foreach(obj, memory_device_used_region_size, opaque); 67 return 0; 68 } 69 70 static void memory_device_check_addable(MachineState *ms, uint64_t size, 71 Error **errp) 72 { 73 uint64_t used_region_size = 0; 74 75 /* we will need a new memory slot for kvm and vhost */ 76 if (kvm_enabled() && !kvm_has_free_slot(ms)) { 77 error_setg(errp, "hypervisor has no free memory slots left"); 78 return; 79 } 80 if (!vhost_has_free_slot()) { 81 error_setg(errp, "a used vhost backend has no free memory slots left"); 82 return; 83 } 84 85 /* will we exceed the total amount of memory specified */ 86 memory_device_used_region_size(OBJECT(ms), &used_region_size); 87 if (used_region_size + size < used_region_size || 88 used_region_size + size > ms->maxram_size - ms->ram_size) { 89 error_setg(errp, "not enough space, currently 0x%" PRIx64 90 " in use of total space for memory devices 0x" RAM_ADDR_FMT, 91 used_region_size, ms->maxram_size - ms->ram_size); 92 return; 93 } 94 95 } 96 97 static uint64_t memory_device_get_free_addr(MachineState *ms, 98 const uint64_t *hint, 99 uint64_t align, uint64_t size, 100 Error **errp) 101 { 102 Error *err = NULL; 103 GSList *list = NULL, *item; 104 Range as, new = range_empty; 105 106 if (!ms->device_memory) { 107 error_setg(errp, "memory devices (e.g. for memory hotplug) are not " 108 "supported by the machine"); 109 return 0; 110 } 111 112 if (!memory_region_size(&ms->device_memory->mr)) { 113 error_setg(errp, "memory devices (e.g. for memory hotplug) are not " 114 "enabled, please specify the maxmem option"); 115 return 0; 116 } 117 range_init_nofail(&as, ms->device_memory->base, 118 memory_region_size(&ms->device_memory->mr)); 119 120 /* start of address space indicates the maximum alignment we expect */ 121 if (!QEMU_IS_ALIGNED(range_lob(&as), align)) { 122 warn_report("the alignment (0x%" PRIx64 ") exceeds the expected" 123 " maximum alignment, memory will get fragmented and not" 124 " all 'maxmem' might be usable for memory devices.", 125 align); 126 } 127 128 memory_device_check_addable(ms, size, &err); 129 if (err) { 130 error_propagate(errp, err); 131 return 0; 132 } 133 134 if (hint && !QEMU_IS_ALIGNED(*hint, align)) { 135 error_setg(errp, "address must be aligned to 0x%" PRIx64 " bytes", 136 align); 137 return 0; 138 } 139 140 if (!QEMU_IS_ALIGNED(size, align)) { 141 error_setg(errp, "backend memory size must be multiple of 0x%" 142 PRIx64, align); 143 return 0; 144 } 145 146 if (hint) { 147 if (range_init(&new, *hint, size) || !range_contains_range(&as, &new)) { 148 error_setg(errp, "can't add memory device [0x%" PRIx64 ":0x%" PRIx64 149 "], usable range for memory devices [0x%" PRIx64 ":0x%" 150 PRIx64 "]", *hint, size, range_lob(&as), 151 range_size(&as)); 152 return 0; 153 } 154 } else { 155 if (range_init(&new, QEMU_ALIGN_UP(range_lob(&as), align), size)) { 156 error_setg(errp, "can't add memory device, device too big"); 157 return 0; 158 } 159 } 160 161 /* find address range that will fit new memory device */ 162 object_child_foreach(OBJECT(ms), memory_device_build_list, &list); 163 for (item = list; item; item = g_slist_next(item)) { 164 const MemoryDeviceState *md = item->data; 165 const MemoryDeviceClass *mdc = MEMORY_DEVICE_GET_CLASS(OBJECT(md)); 166 uint64_t next_addr; 167 Range tmp; 168 169 range_init_nofail(&tmp, mdc->get_addr(md), 170 memory_device_get_region_size(md, &error_abort)); 171 172 if (range_overlaps_range(&tmp, &new)) { 173 if (hint) { 174 const DeviceState *d = DEVICE(md); 175 error_setg(errp, "address range conflicts with memory device" 176 " id='%s'", d->id ? d->id : "(unnamed)"); 177 goto out; 178 } 179 180 next_addr = QEMU_ALIGN_UP(range_upb(&tmp) + 1, align); 181 if (!next_addr || range_init(&new, next_addr, range_size(&new))) { 182 range_make_empty(&new); 183 break; 184 } 185 } else if (range_lob(&tmp) > range_upb(&new)) { 186 break; 187 } 188 } 189 190 if (!range_contains_range(&as, &new)) { 191 error_setg(errp, "could not find position in guest address space for " 192 "memory device - memory fragmented due to alignments"); 193 } 194 out: 195 g_slist_free(list); 196 return range_lob(&new); 197 } 198 199 MemoryDeviceInfoList *qmp_memory_device_list(void) 200 { 201 GSList *devices = NULL, *item; 202 MemoryDeviceInfoList *list = NULL, *prev = NULL; 203 204 object_child_foreach(qdev_get_machine(), memory_device_build_list, 205 &devices); 206 207 for (item = devices; item; item = g_slist_next(item)) { 208 const MemoryDeviceState *md = MEMORY_DEVICE(item->data); 209 const MemoryDeviceClass *mdc = MEMORY_DEVICE_GET_CLASS(item->data); 210 MemoryDeviceInfoList *elem = g_new0(MemoryDeviceInfoList, 1); 211 MemoryDeviceInfo *info = g_new0(MemoryDeviceInfo, 1); 212 213 mdc->fill_device_info(md, info); 214 215 elem->value = info; 216 elem->next = NULL; 217 if (prev) { 218 prev->next = elem; 219 } else { 220 list = elem; 221 } 222 prev = elem; 223 } 224 225 g_slist_free(devices); 226 227 return list; 228 } 229 230 static int memory_device_plugged_size(Object *obj, void *opaque) 231 { 232 uint64_t *size = opaque; 233 234 if (object_dynamic_cast(obj, TYPE_MEMORY_DEVICE)) { 235 const DeviceState *dev = DEVICE(obj); 236 const MemoryDeviceState *md = MEMORY_DEVICE(obj); 237 const MemoryDeviceClass *mdc = MEMORY_DEVICE_GET_CLASS(obj); 238 239 if (dev->realized) { 240 *size += mdc->get_plugged_size(md, &error_abort); 241 } 242 } 243 244 object_child_foreach(obj, memory_device_plugged_size, opaque); 245 return 0; 246 } 247 248 uint64_t get_plugged_memory_size(void) 249 { 250 uint64_t size = 0; 251 252 memory_device_plugged_size(qdev_get_machine(), &size); 253 254 return size; 255 } 256 257 void memory_device_pre_plug(MemoryDeviceState *md, MachineState *ms, 258 const uint64_t *legacy_align, Error **errp) 259 { 260 const MemoryDeviceClass *mdc = MEMORY_DEVICE_GET_CLASS(md); 261 Error *local_err = NULL; 262 uint64_t addr, align = 0; 263 MemoryRegion *mr; 264 265 mr = mdc->get_memory_region(md, &local_err); 266 if (local_err) { 267 goto out; 268 } 269 270 if (legacy_align) { 271 align = *legacy_align; 272 } else { 273 if (mdc->get_min_alignment) { 274 align = mdc->get_min_alignment(md); 275 } 276 align = MAX(align, memory_region_get_alignment(mr)); 277 } 278 addr = mdc->get_addr(md); 279 addr = memory_device_get_free_addr(ms, !addr ? NULL : &addr, align, 280 memory_region_size(mr), &local_err); 281 if (local_err) { 282 goto out; 283 } 284 mdc->set_addr(md, addr, &local_err); 285 if (!local_err) { 286 trace_memory_device_pre_plug(DEVICE(md)->id ? DEVICE(md)->id : "", 287 addr); 288 } 289 out: 290 error_propagate(errp, local_err); 291 } 292 293 void memory_device_plug(MemoryDeviceState *md, MachineState *ms) 294 { 295 const MemoryDeviceClass *mdc = MEMORY_DEVICE_GET_CLASS(md); 296 const uint64_t addr = mdc->get_addr(md); 297 MemoryRegion *mr; 298 299 /* 300 * We expect that a previous call to memory_device_pre_plug() succeeded, so 301 * it can't fail at this point. 302 */ 303 mr = mdc->get_memory_region(md, &error_abort); 304 g_assert(ms->device_memory); 305 306 memory_region_add_subregion(&ms->device_memory->mr, 307 addr - ms->device_memory->base, mr); 308 trace_memory_device_plug(DEVICE(md)->id ? DEVICE(md)->id : "", addr); 309 } 310 311 void memory_device_unplug(MemoryDeviceState *md, MachineState *ms) 312 { 313 const MemoryDeviceClass *mdc = MEMORY_DEVICE_GET_CLASS(md); 314 MemoryRegion *mr; 315 316 /* 317 * We expect that a previous call to memory_device_pre_plug() succeeded, so 318 * it can't fail at this point. 319 */ 320 mr = mdc->get_memory_region(md, &error_abort); 321 g_assert(ms->device_memory); 322 323 memory_region_del_subregion(&ms->device_memory->mr, mr); 324 trace_memory_device_unplug(DEVICE(md)->id ? DEVICE(md)->id : "", 325 mdc->get_addr(md)); 326 } 327 328 uint64_t memory_device_get_region_size(const MemoryDeviceState *md, 329 Error **errp) 330 { 331 const MemoryDeviceClass *mdc = MEMORY_DEVICE_GET_CLASS(md); 332 MemoryRegion *mr; 333 334 /* dropping const here is fine as we don't touch the memory region */ 335 mr = mdc->get_memory_region((MemoryDeviceState *)md, errp); 336 if (!mr) { 337 return 0; 338 } 339 340 return memory_region_size(mr); 341 } 342 343 static const TypeInfo memory_device_info = { 344 .name = TYPE_MEMORY_DEVICE, 345 .parent = TYPE_INTERFACE, 346 .class_size = sizeof(MemoryDeviceClass), 347 }; 348 349 static void memory_device_register_types(void) 350 { 351 type_register_static(&memory_device_info); 352 } 353 354 type_init(memory_device_register_types) 355