xref: /openbmc/qemu/hw/ppc/spapr_nvdimm.c (revision ac12b601)
1 /*
2  * QEMU PAPR Storage Class Memory Interfaces
3  *
4  * Copyright (c) 2019-2020, IBM Corporation.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a copy
7  * of this software and associated documentation files (the "Software"), to deal
8  * in the Software without restriction, including without limitation the rights
9  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10  * copies of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22  * THE SOFTWARE.
23  */
24 #include "qemu/osdep.h"
25 #include "qapi/error.h"
26 #include "hw/ppc/spapr_drc.h"
27 #include "hw/ppc/spapr_nvdimm.h"
28 #include "hw/mem/nvdimm.h"
29 #include "qemu/nvdimm-utils.h"
30 #include "hw/ppc/fdt.h"
31 #include "qemu/range.h"
32 #include "hw/ppc/spapr_numa.h"
33 
34 /* DIMM health bitmap bitmap indicators. Taken from kernel's papr_scm.c */
35 /* SCM device is unable to persist memory contents */
36 #define PAPR_PMEM_UNARMED PPC_BIT(0)
37 
38 bool spapr_nvdimm_validate(HotplugHandler *hotplug_dev, NVDIMMDevice *nvdimm,
39                            uint64_t size, Error **errp)
40 {
41     const MachineClass *mc = MACHINE_GET_CLASS(hotplug_dev);
42     const MachineState *ms = MACHINE(hotplug_dev);
43     g_autofree char *uuidstr = NULL;
44     QemuUUID uuid;
45     int ret;
46 
47     if (!mc->nvdimm_supported) {
48         error_setg(errp, "NVDIMM hotplug not supported for this machine");
49         return false;
50     }
51 
52     if (!ms->nvdimms_state->is_enabled) {
53         error_setg(errp, "nvdimm device found but 'nvdimm=off' was set");
54         return false;
55     }
56 
57     if (object_property_get_int(OBJECT(nvdimm), NVDIMM_LABEL_SIZE_PROP,
58                                 &error_abort) == 0) {
59         error_setg(errp, "PAPR requires NVDIMM devices to have label-size set");
60         return false;
61     }
62 
63     if (size % SPAPR_MINIMUM_SCM_BLOCK_SIZE) {
64         error_setg(errp, "PAPR requires NVDIMM memory size (excluding label)"
65                    " to be a multiple of %" PRIu64 "MB",
66                    SPAPR_MINIMUM_SCM_BLOCK_SIZE / MiB);
67         return false;
68     }
69 
70     uuidstr = object_property_get_str(OBJECT(nvdimm), NVDIMM_UUID_PROP,
71                                       &error_abort);
72     ret = qemu_uuid_parse(uuidstr, &uuid);
73     g_assert(!ret);
74 
75     if (qemu_uuid_is_null(&uuid)) {
76         error_setg(errp, "NVDIMM device requires the uuid to be set");
77         return false;
78     }
79 
80     return true;
81 }
82 
83 
84 void spapr_add_nvdimm(DeviceState *dev, uint64_t slot)
85 {
86     SpaprDrc *drc;
87     bool hotplugged = spapr_drc_hotplugged(dev);
88 
89     drc = spapr_drc_by_id(TYPE_SPAPR_DRC_PMEM, slot);
90     g_assert(drc);
91 
92     /*
93      * pc_dimm_get_free_slot() provided a free slot at pre-plug. The
94      * corresponding DRC is thus assumed to be attachable.
95      */
96     spapr_drc_attach(drc, dev);
97 
98     if (hotplugged) {
99         spapr_hotplug_req_add_by_index(drc);
100     }
101 }
102 
103 static int spapr_dt_nvdimm(SpaprMachineState *spapr, void *fdt,
104                            int parent_offset, NVDIMMDevice *nvdimm)
105 {
106     int child_offset;
107     char *buf;
108     SpaprDrc *drc;
109     uint32_t drc_idx;
110     uint32_t node = object_property_get_uint(OBJECT(nvdimm), PC_DIMM_NODE_PROP,
111                                              &error_abort);
112     uint64_t slot = object_property_get_uint(OBJECT(nvdimm), PC_DIMM_SLOT_PROP,
113                                              &error_abort);
114     uint64_t lsize = nvdimm->label_size;
115     uint64_t size = object_property_get_int(OBJECT(nvdimm), PC_DIMM_SIZE_PROP,
116                                             NULL);
117 
118     drc = spapr_drc_by_id(TYPE_SPAPR_DRC_PMEM, slot);
119     g_assert(drc);
120 
121     drc_idx = spapr_drc_index(drc);
122 
123     buf = g_strdup_printf("ibm,pmemory@%x", drc_idx);
124     child_offset = fdt_add_subnode(fdt, parent_offset, buf);
125     g_free(buf);
126 
127     _FDT(child_offset);
128 
129     _FDT((fdt_setprop_cell(fdt, child_offset, "reg", drc_idx)));
130     _FDT((fdt_setprop_string(fdt, child_offset, "compatible", "ibm,pmemory")));
131     _FDT((fdt_setprop_string(fdt, child_offset, "device_type", "ibm,pmemory")));
132 
133     spapr_numa_write_associativity_dt(spapr, fdt, child_offset, node);
134 
135     buf = qemu_uuid_unparse_strdup(&nvdimm->uuid);
136     _FDT((fdt_setprop_string(fdt, child_offset, "ibm,unit-guid", buf)));
137     g_free(buf);
138 
139     _FDT((fdt_setprop_cell(fdt, child_offset, "ibm,my-drc-index", drc_idx)));
140 
141     _FDT((fdt_setprop_u64(fdt, child_offset, "ibm,block-size",
142                           SPAPR_MINIMUM_SCM_BLOCK_SIZE)));
143     _FDT((fdt_setprop_u64(fdt, child_offset, "ibm,number-of-blocks",
144                           size / SPAPR_MINIMUM_SCM_BLOCK_SIZE)));
145     _FDT((fdt_setprop_cell(fdt, child_offset, "ibm,metadata-size", lsize)));
146 
147     _FDT((fdt_setprop_string(fdt, child_offset, "ibm,pmem-application",
148                              "operating-system")));
149     _FDT(fdt_setprop(fdt, child_offset, "ibm,cache-flush-required", NULL, 0));
150 
151     return child_offset;
152 }
153 
154 int spapr_pmem_dt_populate(SpaprDrc *drc, SpaprMachineState *spapr,
155                            void *fdt, int *fdt_start_offset, Error **errp)
156 {
157     NVDIMMDevice *nvdimm = NVDIMM(drc->dev);
158 
159     *fdt_start_offset = spapr_dt_nvdimm(spapr, fdt, 0, nvdimm);
160 
161     return 0;
162 }
163 
164 void spapr_dt_persistent_memory(SpaprMachineState *spapr, void *fdt)
165 {
166     int offset = fdt_subnode_offset(fdt, 0, "persistent-memory");
167     GSList *iter, *nvdimms = nvdimm_get_device_list();
168 
169     if (offset < 0) {
170         offset = fdt_add_subnode(fdt, 0, "persistent-memory");
171         _FDT(offset);
172         _FDT((fdt_setprop_cell(fdt, offset, "#address-cells", 0x1)));
173         _FDT((fdt_setprop_cell(fdt, offset, "#size-cells", 0x0)));
174         _FDT((fdt_setprop_string(fdt, offset, "device_type",
175                                  "ibm,persistent-memory")));
176     }
177 
178     /* Create DT entries for cold plugged NVDIMM devices */
179     for (iter = nvdimms; iter; iter = iter->next) {
180         NVDIMMDevice *nvdimm = iter->data;
181 
182         spapr_dt_nvdimm(spapr, fdt, offset, nvdimm);
183     }
184     g_slist_free(nvdimms);
185 
186     return;
187 }
188 
189 static target_ulong h_scm_read_metadata(PowerPCCPU *cpu,
190                                         SpaprMachineState *spapr,
191                                         target_ulong opcode,
192                                         target_ulong *args)
193 {
194     uint32_t drc_index = args[0];
195     uint64_t offset = args[1];
196     uint64_t len = args[2];
197     SpaprDrc *drc = spapr_drc_by_index(drc_index);
198     NVDIMMDevice *nvdimm;
199     NVDIMMClass *ddc;
200     uint64_t data = 0;
201     uint8_t buf[8] = { 0 };
202 
203     if (!drc || !drc->dev ||
204         spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
205         return H_PARAMETER;
206     }
207 
208     if (len != 1 && len != 2 &&
209         len != 4 && len != 8) {
210         return H_P3;
211     }
212 
213     nvdimm = NVDIMM(drc->dev);
214     if ((offset + len < offset) ||
215         (nvdimm->label_size < len + offset)) {
216         return H_P2;
217     }
218 
219     ddc = NVDIMM_GET_CLASS(nvdimm);
220     ddc->read_label_data(nvdimm, buf, len, offset);
221 
222     switch (len) {
223     case 1:
224         data = ldub_p(buf);
225         break;
226     case 2:
227         data = lduw_be_p(buf);
228         break;
229     case 4:
230         data = ldl_be_p(buf);
231         break;
232     case 8:
233         data = ldq_be_p(buf);
234         break;
235     default:
236         g_assert_not_reached();
237     }
238 
239     args[0] = data;
240 
241     return H_SUCCESS;
242 }
243 
244 static target_ulong h_scm_write_metadata(PowerPCCPU *cpu,
245                                          SpaprMachineState *spapr,
246                                          target_ulong opcode,
247                                          target_ulong *args)
248 {
249     uint32_t drc_index = args[0];
250     uint64_t offset = args[1];
251     uint64_t data = args[2];
252     uint64_t len = args[3];
253     SpaprDrc *drc = spapr_drc_by_index(drc_index);
254     NVDIMMDevice *nvdimm;
255     NVDIMMClass *ddc;
256     uint8_t buf[8] = { 0 };
257 
258     if (!drc || !drc->dev ||
259         spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
260         return H_PARAMETER;
261     }
262 
263     if (len != 1 && len != 2 &&
264         len != 4 && len != 8) {
265         return H_P4;
266     }
267 
268     nvdimm = NVDIMM(drc->dev);
269     if ((offset + len < offset) ||
270         (nvdimm->label_size < len + offset)) {
271         return H_P2;
272     }
273 
274     switch (len) {
275     case 1:
276         if (data & 0xffffffffffffff00) {
277             return H_P2;
278         }
279         stb_p(buf, data);
280         break;
281     case 2:
282         if (data & 0xffffffffffff0000) {
283             return H_P2;
284         }
285         stw_be_p(buf, data);
286         break;
287     case 4:
288         if (data & 0xffffffff00000000) {
289             return H_P2;
290         }
291         stl_be_p(buf, data);
292         break;
293     case 8:
294         stq_be_p(buf, data);
295         break;
296     default:
297             g_assert_not_reached();
298     }
299 
300     ddc = NVDIMM_GET_CLASS(nvdimm);
301     ddc->write_label_data(nvdimm, buf, len, offset);
302 
303     return H_SUCCESS;
304 }
305 
306 static target_ulong h_scm_bind_mem(PowerPCCPU *cpu, SpaprMachineState *spapr,
307                                    target_ulong opcode, target_ulong *args)
308 {
309     uint32_t drc_index = args[0];
310     uint64_t starting_idx = args[1];
311     uint64_t no_of_scm_blocks_to_bind = args[2];
312     uint64_t target_logical_mem_addr = args[3];
313     uint64_t continue_token = args[4];
314     uint64_t size;
315     uint64_t total_no_of_scm_blocks;
316     SpaprDrc *drc = spapr_drc_by_index(drc_index);
317     hwaddr addr;
318     NVDIMMDevice *nvdimm;
319 
320     if (!drc || !drc->dev ||
321         spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
322         return H_PARAMETER;
323     }
324 
325     /*
326      * Currently continue token should be zero qemu has already bound
327      * everything and this hcall doesnt return H_BUSY.
328      */
329     if (continue_token > 0) {
330         return H_P5;
331     }
332 
333     /* Currently qemu assigns the address. */
334     if (target_logical_mem_addr != 0xffffffffffffffff) {
335         return H_OVERLAP;
336     }
337 
338     nvdimm = NVDIMM(drc->dev);
339 
340     size = object_property_get_uint(OBJECT(nvdimm),
341                                     PC_DIMM_SIZE_PROP, &error_abort);
342 
343     total_no_of_scm_blocks = size / SPAPR_MINIMUM_SCM_BLOCK_SIZE;
344 
345     if (starting_idx > total_no_of_scm_blocks) {
346         return H_P2;
347     }
348 
349     if (((starting_idx + no_of_scm_blocks_to_bind) < starting_idx) ||
350         ((starting_idx + no_of_scm_blocks_to_bind) > total_no_of_scm_blocks)) {
351         return H_P3;
352     }
353 
354     addr = object_property_get_uint(OBJECT(nvdimm),
355                                     PC_DIMM_ADDR_PROP, &error_abort);
356 
357     addr += starting_idx * SPAPR_MINIMUM_SCM_BLOCK_SIZE;
358 
359     /* Already bound, Return target logical address in R5 */
360     args[1] = addr;
361     args[2] = no_of_scm_blocks_to_bind;
362 
363     return H_SUCCESS;
364 }
365 
366 static target_ulong h_scm_unbind_mem(PowerPCCPU *cpu, SpaprMachineState *spapr,
367                                      target_ulong opcode, target_ulong *args)
368 {
369     uint32_t drc_index = args[0];
370     uint64_t starting_scm_logical_addr = args[1];
371     uint64_t no_of_scm_blocks_to_unbind = args[2];
372     uint64_t continue_token = args[3];
373     uint64_t size_to_unbind;
374     Range blockrange = range_empty;
375     Range nvdimmrange = range_empty;
376     SpaprDrc *drc = spapr_drc_by_index(drc_index);
377     NVDIMMDevice *nvdimm;
378     uint64_t size, addr;
379 
380     if (!drc || !drc->dev ||
381         spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
382         return H_PARAMETER;
383     }
384 
385     /* continue_token should be zero as this hcall doesn't return H_BUSY. */
386     if (continue_token > 0) {
387         return H_P4;
388     }
389 
390     /* Check if starting_scm_logical_addr is block aligned */
391     if (!QEMU_IS_ALIGNED(starting_scm_logical_addr,
392                          SPAPR_MINIMUM_SCM_BLOCK_SIZE)) {
393         return H_P2;
394     }
395 
396     size_to_unbind = no_of_scm_blocks_to_unbind * SPAPR_MINIMUM_SCM_BLOCK_SIZE;
397     if (no_of_scm_blocks_to_unbind == 0 || no_of_scm_blocks_to_unbind !=
398                                size_to_unbind / SPAPR_MINIMUM_SCM_BLOCK_SIZE) {
399         return H_P3;
400     }
401 
402     nvdimm = NVDIMM(drc->dev);
403     size = object_property_get_int(OBJECT(nvdimm), PC_DIMM_SIZE_PROP,
404                                    &error_abort);
405     addr = object_property_get_int(OBJECT(nvdimm), PC_DIMM_ADDR_PROP,
406                                    &error_abort);
407 
408     range_init_nofail(&nvdimmrange, addr, size);
409     range_init_nofail(&blockrange, starting_scm_logical_addr, size_to_unbind);
410 
411     if (!range_contains_range(&nvdimmrange, &blockrange)) {
412         return H_P3;
413     }
414 
415     args[1] = no_of_scm_blocks_to_unbind;
416 
417     /* let unplug take care of actual unbind */
418     return H_SUCCESS;
419 }
420 
421 #define H_UNBIND_SCOPE_ALL 0x1
422 #define H_UNBIND_SCOPE_DRC 0x2
423 
424 static target_ulong h_scm_unbind_all(PowerPCCPU *cpu, SpaprMachineState *spapr,
425                                      target_ulong opcode, target_ulong *args)
426 {
427     uint64_t target_scope = args[0];
428     uint32_t drc_index = args[1];
429     uint64_t continue_token = args[2];
430     NVDIMMDevice *nvdimm;
431     uint64_t size;
432     uint64_t no_of_scm_blocks_unbound = 0;
433 
434     /* continue_token should be zero as this hcall doesn't return H_BUSY. */
435     if (continue_token > 0) {
436         return H_P4;
437     }
438 
439     if (target_scope == H_UNBIND_SCOPE_DRC) {
440         SpaprDrc *drc = spapr_drc_by_index(drc_index);
441 
442         if (!drc || !drc->dev ||
443             spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
444             return H_P2;
445         }
446 
447         nvdimm = NVDIMM(drc->dev);
448         size = object_property_get_int(OBJECT(nvdimm), PC_DIMM_SIZE_PROP,
449                                        &error_abort);
450 
451         no_of_scm_blocks_unbound = size / SPAPR_MINIMUM_SCM_BLOCK_SIZE;
452     } else if (target_scope ==  H_UNBIND_SCOPE_ALL) {
453         GSList *list, *nvdimms;
454 
455         nvdimms = nvdimm_get_device_list();
456         for (list = nvdimms; list; list = list->next) {
457             nvdimm = list->data;
458             size = object_property_get_int(OBJECT(nvdimm), PC_DIMM_SIZE_PROP,
459                                            &error_abort);
460 
461             no_of_scm_blocks_unbound += size / SPAPR_MINIMUM_SCM_BLOCK_SIZE;
462         }
463         g_slist_free(nvdimms);
464     } else {
465         return H_PARAMETER;
466     }
467 
468     args[1] = no_of_scm_blocks_unbound;
469 
470     /* let unplug take care of actual unbind */
471     return H_SUCCESS;
472 }
473 
474 static target_ulong h_scm_health(PowerPCCPU *cpu, SpaprMachineState *spapr,
475                                  target_ulong opcode, target_ulong *args)
476 {
477 
478     NVDIMMDevice *nvdimm;
479     uint64_t hbitmap = 0;
480     uint32_t drc_index = args[0];
481     SpaprDrc *drc = spapr_drc_by_index(drc_index);
482     const uint64_t hbitmap_mask = PAPR_PMEM_UNARMED;
483 
484 
485     /* Ensure that the drc is valid & is valid PMEM dimm and is plugged in */
486     if (!drc || !drc->dev ||
487         spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
488         return H_PARAMETER;
489     }
490 
491     nvdimm = NVDIMM(drc->dev);
492 
493     /* Update if the nvdimm is unarmed and send its status via health bitmaps */
494     if (object_property_get_bool(OBJECT(nvdimm), NVDIMM_UNARMED_PROP, NULL)) {
495         hbitmap |= PAPR_PMEM_UNARMED;
496     }
497 
498     /* Update the out args with health bitmap/mask */
499     args[0] = hbitmap;
500     args[1] = hbitmap_mask;
501 
502     return H_SUCCESS;
503 }
504 
505 static void spapr_scm_register_types(void)
506 {
507     /* qemu/scm specific hcalls */
508     spapr_register_hypercall(H_SCM_READ_METADATA, h_scm_read_metadata);
509     spapr_register_hypercall(H_SCM_WRITE_METADATA, h_scm_write_metadata);
510     spapr_register_hypercall(H_SCM_BIND_MEM, h_scm_bind_mem);
511     spapr_register_hypercall(H_SCM_UNBIND_MEM, h_scm_unbind_mem);
512     spapr_register_hypercall(H_SCM_UNBIND_ALL, h_scm_unbind_all);
513     spapr_register_hypercall(H_SCM_HEALTH, h_scm_health);
514 }
515 
516 type_init(spapr_scm_register_types)
517