1 /*
2 * QEMU NVM Express Subsystem: nvme-subsys
3 *
4 * Copyright (c) 2021 Minwoo Im <minwoo.im.dev@gmail.com>
5 *
6 * This code is licensed under the GNU GPL v2. Refer COPYING.
7 */
8
9 #include "qemu/osdep.h"
10 #include "qemu/units.h"
11 #include "qapi/error.h"
12
13 #include "nvme.h"
14
15 #define NVME_DEFAULT_RU_SIZE (96 * MiB)
16
nvme_subsys_reserve_cntlids(NvmeCtrl * n,int start,int num)17 static int nvme_subsys_reserve_cntlids(NvmeCtrl *n, int start, int num)
18 {
19 NvmeSubsystem *subsys = n->subsys;
20 NvmeSecCtrlEntry *list = n->sec_ctrl_list;
21 NvmeSecCtrlEntry *sctrl;
22 int i, cnt = 0;
23
24 for (i = start; i < ARRAY_SIZE(subsys->ctrls) && cnt < num; i++) {
25 if (!subsys->ctrls[i]) {
26 sctrl = &list[cnt];
27 sctrl->scid = cpu_to_le16(i);
28 subsys->ctrls[i] = SUBSYS_SLOT_RSVD;
29 cnt++;
30 }
31 }
32
33 return cnt;
34 }
35
nvme_subsys_unreserve_cntlids(NvmeCtrl * n)36 static void nvme_subsys_unreserve_cntlids(NvmeCtrl *n)
37 {
38 NvmeSubsystem *subsys = n->subsys;
39 NvmeSecCtrlEntry *list = n->sec_ctrl_list;
40 NvmeSecCtrlEntry *sctrl;
41 int i, cntlid;
42
43 for (i = 0; i < n->params.sriov_max_vfs; i++) {
44 sctrl = &list[i];
45 cntlid = le16_to_cpu(sctrl->scid);
46
47 if (cntlid) {
48 assert(subsys->ctrls[cntlid] == SUBSYS_SLOT_RSVD);
49 subsys->ctrls[cntlid] = NULL;
50 sctrl->scid = 0;
51 }
52 }
53 }
54
nvme_subsys_register_ctrl(NvmeCtrl * n,Error ** errp)55 int nvme_subsys_register_ctrl(NvmeCtrl *n, Error **errp)
56 {
57 NvmeSubsystem *subsys = n->subsys;
58 NvmeSecCtrlEntry *sctrl = nvme_sctrl(n);
59 int cntlid, nsid, num_rsvd, num_vfs = n->params.sriov_max_vfs;
60
61 if (pci_is_vf(&n->parent_obj)) {
62 cntlid = le16_to_cpu(sctrl->scid);
63 } else {
64 n->sec_ctrl_list = g_new0(NvmeSecCtrlEntry, num_vfs);
65
66 for (cntlid = 0; cntlid < ARRAY_SIZE(subsys->ctrls); cntlid++) {
67 if (!subsys->ctrls[cntlid]) {
68 break;
69 }
70 }
71
72 if (cntlid == ARRAY_SIZE(subsys->ctrls)) {
73 error_setg(errp, "no more free controller id");
74 return -1;
75 }
76
77 num_rsvd = nvme_subsys_reserve_cntlids(n, cntlid + 1, num_vfs);
78 if (num_rsvd != num_vfs) {
79 nvme_subsys_unreserve_cntlids(n);
80 error_setg(errp,
81 "no more free controller ids for secondary controllers");
82 return -1;
83 }
84 }
85
86 if (!subsys->serial) {
87 subsys->serial = g_strdup(n->params.serial);
88 } else if (strcmp(subsys->serial, n->params.serial)) {
89 error_setg(errp, "invalid controller serial");
90 return -1;
91 }
92
93 subsys->ctrls[cntlid] = n;
94
95 for (nsid = 1; nsid < ARRAY_SIZE(subsys->namespaces); nsid++) {
96 NvmeNamespace *ns = subsys->namespaces[nsid];
97 if (ns && ns->params.shared && !ns->params.detached) {
98 nvme_attach_ns(n, ns);
99 }
100 }
101
102 return cntlid;
103 }
104
nvme_subsys_unregister_ctrl(NvmeSubsystem * subsys,NvmeCtrl * n)105 void nvme_subsys_unregister_ctrl(NvmeSubsystem *subsys, NvmeCtrl *n)
106 {
107 if (pci_is_vf(&n->parent_obj)) {
108 subsys->ctrls[n->cntlid] = SUBSYS_SLOT_RSVD;
109 } else {
110 subsys->ctrls[n->cntlid] = NULL;
111 nvme_subsys_unreserve_cntlids(n);
112 }
113
114 n->cntlid = -1;
115 }
116
nvme_calc_rgif(uint16_t nruh,uint16_t nrg,uint8_t * rgif)117 static bool nvme_calc_rgif(uint16_t nruh, uint16_t nrg, uint8_t *rgif)
118 {
119 uint16_t val;
120 unsigned int i;
121
122 if (unlikely(nrg == 1)) {
123 /* PIDRG_NORGI scenario, all of pid is used for PHID */
124 *rgif = 0;
125 return true;
126 }
127
128 val = nrg;
129 i = 0;
130 while (val) {
131 val >>= 1;
132 i++;
133 }
134 *rgif = i;
135
136 /* ensure remaining bits suffice to represent number of phids in a RG */
137 if (unlikely((UINT16_MAX >> i) < nruh)) {
138 *rgif = 0;
139 return false;
140 }
141
142 return true;
143 }
144
nvme_subsys_setup_fdp(NvmeSubsystem * subsys,Error ** errp)145 static bool nvme_subsys_setup_fdp(NvmeSubsystem *subsys, Error **errp)
146 {
147 NvmeEnduranceGroup *endgrp = &subsys->endgrp;
148
149 if (!subsys->params.fdp.runs) {
150 error_setg(errp, "fdp.runs must be non-zero");
151 return false;
152 }
153
154 endgrp->fdp.runs = subsys->params.fdp.runs;
155
156 if (!subsys->params.fdp.nrg) {
157 error_setg(errp, "fdp.nrg must be non-zero");
158 return false;
159 }
160
161 endgrp->fdp.nrg = subsys->params.fdp.nrg;
162
163 if (!subsys->params.fdp.nruh ||
164 subsys->params.fdp.nruh > NVME_FDP_MAXPIDS) {
165 error_setg(errp, "fdp.nruh must be non-zero and less than %u",
166 NVME_FDP_MAXPIDS);
167 return false;
168 }
169
170 endgrp->fdp.nruh = subsys->params.fdp.nruh;
171
172 if (!nvme_calc_rgif(endgrp->fdp.nruh, endgrp->fdp.nrg, &endgrp->fdp.rgif)) {
173 error_setg(errp,
174 "cannot derive a valid rgif (nruh %"PRIu16" nrg %"PRIu32")",
175 endgrp->fdp.nruh, endgrp->fdp.nrg);
176 return false;
177 }
178
179 endgrp->fdp.ruhs = g_new(NvmeRuHandle, endgrp->fdp.nruh);
180
181 for (uint16_t ruhid = 0; ruhid < endgrp->fdp.nruh; ruhid++) {
182 endgrp->fdp.ruhs[ruhid] = (NvmeRuHandle) {
183 .ruht = NVME_RUHT_INITIALLY_ISOLATED,
184 .ruha = NVME_RUHA_UNUSED,
185 };
186
187 endgrp->fdp.ruhs[ruhid].rus = g_new(NvmeReclaimUnit, endgrp->fdp.nrg);
188 }
189
190 endgrp->fdp.enabled = true;
191
192 return true;
193 }
194
nvme_subsys_setup(NvmeSubsystem * subsys,Error ** errp)195 static bool nvme_subsys_setup(NvmeSubsystem *subsys, Error **errp)
196 {
197 const char *nqn = subsys->params.nqn ?
198 subsys->params.nqn : subsys->parent_obj.id;
199
200 snprintf((char *)subsys->subnqn, sizeof(subsys->subnqn),
201 "nqn.2019-08.org.qemu:%s", nqn);
202
203 if (subsys->params.fdp.enabled && !nvme_subsys_setup_fdp(subsys, errp)) {
204 return false;
205 }
206
207 return true;
208 }
209
nvme_subsys_realize(DeviceState * dev,Error ** errp)210 static void nvme_subsys_realize(DeviceState *dev, Error **errp)
211 {
212 NvmeSubsystem *subsys = NVME_SUBSYS(dev);
213
214 qbus_init(&subsys->bus, sizeof(NvmeBus), TYPE_NVME_BUS, dev, dev->id);
215
216 nvme_subsys_setup(subsys, errp);
217 }
218
219 static Property nvme_subsystem_props[] = {
220 DEFINE_PROP_STRING("nqn", NvmeSubsystem, params.nqn),
221 DEFINE_PROP_BOOL("fdp", NvmeSubsystem, params.fdp.enabled, false),
222 DEFINE_PROP_SIZE("fdp.runs", NvmeSubsystem, params.fdp.runs,
223 NVME_DEFAULT_RU_SIZE),
224 DEFINE_PROP_UINT32("fdp.nrg", NvmeSubsystem, params.fdp.nrg, 1),
225 DEFINE_PROP_UINT16("fdp.nruh", NvmeSubsystem, params.fdp.nruh, 0),
226 DEFINE_PROP_END_OF_LIST(),
227 };
228
nvme_subsys_class_init(ObjectClass * oc,void * data)229 static void nvme_subsys_class_init(ObjectClass *oc, void *data)
230 {
231 DeviceClass *dc = DEVICE_CLASS(oc);
232
233 set_bit(DEVICE_CATEGORY_STORAGE, dc->categories);
234
235 dc->realize = nvme_subsys_realize;
236 dc->desc = "Virtual NVMe subsystem";
237 dc->hotpluggable = false;
238
239 device_class_set_props(dc, nvme_subsystem_props);
240 }
241
242 static const TypeInfo nvme_subsys_info = {
243 .name = TYPE_NVME_SUBSYS,
244 .parent = TYPE_DEVICE,
245 .class_init = nvme_subsys_class_init,
246 .instance_size = sizeof(NvmeSubsystem),
247 };
248
nvme_subsys_register_types(void)249 static void nvme_subsys_register_types(void)
250 {
251 type_register_static(&nvme_subsys_info);
252 }
253
254 type_init(nvme_subsys_register_types)
255