/* xref: /openbmc/qemu/hw/nvme/nvme.h (revision 73064edfb864743cde2c08f319609344af02aeb3) */
/*
 * QEMU NVM Express
 *
 * Copyright (c) 2012 Intel Corporation
 * Copyright (c) 2021 Minwoo Im
 * Copyright (c) 2021 Samsung Electronics Co., Ltd.
 *
 * Authors:
 *   Keith Busch            <kbusch@kernel.org>
 *   Klaus Jensen           <k.jensen@samsung.com>
 *   Gollu Appalanaidu      <anaidu.gollu@samsung.com>
 *   Dmitry Fomichev        <dmitry.fomichev@wdc.com>
 *   Minwoo Im              <minwoo.im.dev@gmail.com>
 *
 * This code is licensed under the GNU GPL v2 or later.
 */

1852581c71SMarkus Armbruster #ifndef HW_NVME_NVME_H
1952581c71SMarkus Armbruster #define HW_NVME_NVME_H
2088eea45cSKlaus Jensen 
2188eea45cSKlaus Jensen #include "qemu/uuid.h"
22edf5ca5dSMarkus Armbruster #include "hw/pci/pci_device.h"
2388eea45cSKlaus Jensen #include "hw/block/block.h"
2488eea45cSKlaus Jensen 
2588eea45cSKlaus Jensen #include "block/nvme.h"
2688eea45cSKlaus Jensen 
/* Number of entries in NvmeSubsystem.ctrls[]; valid controller IDs are below it. */
#define NVME_MAX_CONTROLLERS 256
/* Highest namespace ID accepted by the lookup helpers in this header. */
#define NVME_MAX_NAMESPACES  256
/* NOTE(review): presumably the base for a namespace's default EUI-64 - confirm. */
#define NVME_EUI64_DEFAULT ((uint64_t)0x5254000000000000)
/* Capacity of NvmeFdpEventBuffer.events[]. */
#define NVME_FDP_MAX_EVENTS 63
/* Not referenced in this header; NOTE(review): presumably a placement ID limit. */
#define NVME_FDP_MAXPIDS 128

3338f4ac65SKlaus Jensen QEMU_BUILD_BUG_ON(NVME_MAX_NAMESPACES > NVME_NSID_BROADCAST - 1);
3438f4ac65SKlaus Jensen 
/*
 * Forward declarations, so the structures below can hold pointers to the
 * controller and namespace types before these are fully defined.
 */
typedef struct NvmeCtrl NvmeCtrl;
typedef struct NvmeNamespace NvmeNamespace;

385ffbaeedSKlaus Jensen #define TYPE_NVME_BUS "nvme-bus"
395ffbaeedSKlaus Jensen OBJECT_DECLARE_SIMPLE_TYPE(NvmeBus, NVME_BUS)
405ffbaeedSKlaus Jensen 
415ffbaeedSKlaus Jensen typedef struct NvmeBus {
425ffbaeedSKlaus Jensen     BusState parent_bus;
435ffbaeedSKlaus Jensen } NvmeBus;
445ffbaeedSKlaus Jensen 
/* QOM type name of the NVMe subsystem device and its checked cast. */
#define TYPE_NVME_SUBSYS "nvme-subsys"
#define NVME_SUBSYS(obj) \
    OBJECT_CHECK(NvmeSubsystem, (obj), TYPE_NVME_SUBSYS)
/*
 * Marker stored in NvmeSubsystem.ctrls[] for a slot that is reserved but
 * holds no controller; nvme_subsys_ctrl() reports such slots as NULL.
 * Fully parenthesised so it expands safely inside any expression.
 */
#define SUBSYS_SLOT_RSVD ((void *)0xFFFF)

/*
 * State of a single reclaim unit.
 *
 * NOTE(review): ruamw presumably is the NVMe FDP "reclaim unit available
 * media writes" counter - confirm against the specification.
 */
typedef struct NvmeReclaimUnit {
    uint64_t ruamw;
} NvmeReclaimUnit;

54*73064edfSJesper Devantier typedef struct NvmeRuHandle {
55*73064edfSJesper Devantier     uint8_t  ruht;
56*73064edfSJesper Devantier     uint8_t  ruha;
57*73064edfSJesper Devantier     uint64_t event_filter;
58*73064edfSJesper Devantier     uint8_t  lbafi;
59*73064edfSJesper Devantier     uint64_t ruamw;
60*73064edfSJesper Devantier 
61*73064edfSJesper Devantier     /* reclaim units indexed by reclaim group */
62*73064edfSJesper Devantier     NvmeReclaimUnit *rus;
63*73064edfSJesper Devantier } NvmeRuHandle;
64*73064edfSJesper Devantier 
65*73064edfSJesper Devantier typedef struct NvmeFdpEventBuffer {
66*73064edfSJesper Devantier     NvmeFdpEvent     events[NVME_FDP_MAX_EVENTS];
67*73064edfSJesper Devantier     unsigned int     nelems;
68*73064edfSJesper Devantier     unsigned int     start;
69*73064edfSJesper Devantier     unsigned int     next;
70*73064edfSJesper Devantier } NvmeFdpEventBuffer;
71*73064edfSJesper Devantier 
72771dbc3aSKlaus Jensen typedef struct NvmeEnduranceGroup {
73771dbc3aSKlaus Jensen     uint8_t event_conf;
74*73064edfSJesper Devantier 
75*73064edfSJesper Devantier     struct {
76*73064edfSJesper Devantier         NvmeFdpEventBuffer host_events, ctrl_events;
77*73064edfSJesper Devantier 
78*73064edfSJesper Devantier         uint16_t nruh;
79*73064edfSJesper Devantier         uint16_t nrg;
80*73064edfSJesper Devantier         uint8_t  rgif;
81*73064edfSJesper Devantier         uint64_t runs;
82*73064edfSJesper Devantier 
83*73064edfSJesper Devantier         uint64_t hbmw;
84*73064edfSJesper Devantier         uint64_t mbmw;
85*73064edfSJesper Devantier         uint64_t mbe;
86*73064edfSJesper Devantier 
87*73064edfSJesper Devantier         bool enabled;
88*73064edfSJesper Devantier 
89*73064edfSJesper Devantier         NvmeRuHandle *ruhs;
90*73064edfSJesper Devantier     } fdp;
91771dbc3aSKlaus Jensen } NvmeEnduranceGroup;
92771dbc3aSKlaus Jensen 
9388eea45cSKlaus Jensen typedef struct NvmeSubsystem {
9488eea45cSKlaus Jensen     DeviceState parent_obj;
955ffbaeedSKlaus Jensen     NvmeBus     bus;
9688eea45cSKlaus Jensen     uint8_t     subnqn[256];
97a859eb9fSKlaus Jensen     char        *serial;
9888eea45cSKlaus Jensen 
9988eea45cSKlaus Jensen     NvmeCtrl           *ctrls[NVME_MAX_CONTROLLERS];
10088eea45cSKlaus Jensen     NvmeNamespace      *namespaces[NVME_MAX_NAMESPACES + 1];
101*73064edfSJesper Devantier     NvmeEnduranceGroup endgrp;
10288eea45cSKlaus Jensen 
10388eea45cSKlaus Jensen     struct {
10488eea45cSKlaus Jensen         char *nqn;
105*73064edfSJesper Devantier 
106*73064edfSJesper Devantier         struct {
107*73064edfSJesper Devantier             bool     enabled;
108*73064edfSJesper Devantier             uint64_t runs;
109*73064edfSJesper Devantier             uint16_t nruh;
110*73064edfSJesper Devantier             uint32_t nrg;
111*73064edfSJesper Devantier         } fdp;
11288eea45cSKlaus Jensen     } params;
11388eea45cSKlaus Jensen } NvmeSubsystem;
11488eea45cSKlaus Jensen 
11588eea45cSKlaus Jensen int nvme_subsys_register_ctrl(NvmeCtrl *n, Error **errp);
116b0fde9e8SKlaus Jensen void nvme_subsys_unregister_ctrl(NvmeSubsystem *subsys, NvmeCtrl *n);
11788eea45cSKlaus Jensen 
11888eea45cSKlaus Jensen static inline NvmeCtrl *nvme_subsys_ctrl(NvmeSubsystem *subsys,
11988eea45cSKlaus Jensen                                          uint32_t cntlid)
12088eea45cSKlaus Jensen {
12188eea45cSKlaus Jensen     if (!subsys || cntlid >= NVME_MAX_CONTROLLERS) {
12288eea45cSKlaus Jensen         return NULL;
12388eea45cSKlaus Jensen     }
12488eea45cSKlaus Jensen 
12599f48ae7SLukasz Maniak     if (subsys->ctrls[cntlid] == SUBSYS_SLOT_RSVD) {
12699f48ae7SLukasz Maniak         return NULL;
12799f48ae7SLukasz Maniak     }
12899f48ae7SLukasz Maniak 
12988eea45cSKlaus Jensen     return subsys->ctrls[cntlid];
13088eea45cSKlaus Jensen }
13188eea45cSKlaus Jensen 
13288eea45cSKlaus Jensen static inline NvmeNamespace *nvme_subsys_ns(NvmeSubsystem *subsys,
13388eea45cSKlaus Jensen                                             uint32_t nsid)
13488eea45cSKlaus Jensen {
13588eea45cSKlaus Jensen     if (!subsys || !nsid || nsid > NVME_MAX_NAMESPACES) {
13688eea45cSKlaus Jensen         return NULL;
13788eea45cSKlaus Jensen     }
13888eea45cSKlaus Jensen 
13988eea45cSKlaus Jensen     return subsys->namespaces[nsid];
14088eea45cSKlaus Jensen }
14188eea45cSKlaus Jensen 
/* QOM type name of the NVMe namespace device and its checked cast. */
#define TYPE_NVME_NS "nvme-ns"
#define NVME_NS(obj) \
    OBJECT_CHECK(NvmeNamespace, (obj), TYPE_NVME_NS)

14688eea45cSKlaus Jensen typedef struct NvmeZone {
14788eea45cSKlaus Jensen     NvmeZoneDescr   d;
14888eea45cSKlaus Jensen     uint64_t        w_ptr;
14988eea45cSKlaus Jensen     QTAILQ_ENTRY(NvmeZone) entry;
15088eea45cSKlaus Jensen } NvmeZone;
15188eea45cSKlaus Jensen 
/* Used to size the nvme_fdp_evf_shifts[] lookup table. */
#define FDP_EVT_MAX 0xff
/* Not referenced in this header; NOTE(review): presumably a per-namespace RUH limit. */
#define NVME_FDP_MAX_NS_RUHS 32u
/* Not referenced in this header; NOTE(review): presumably the FDP vendor specific size. */
#define FDPVSS 0

156*73064edfSJesper Devantier static const uint8_t nvme_fdp_evf_shifts[FDP_EVT_MAX] = {
157*73064edfSJesper Devantier     /* Host events */
158*73064edfSJesper Devantier     [FDP_EVT_RU_NOT_FULLY_WRITTEN]      = 0,
159*73064edfSJesper Devantier     [FDP_EVT_RU_ATL_EXCEEDED]           = 1,
160*73064edfSJesper Devantier     [FDP_EVT_CTRL_RESET_RUH]            = 2,
161*73064edfSJesper Devantier     [FDP_EVT_INVALID_PID]               = 3,
162*73064edfSJesper Devantier     /* CTRL events */
163*73064edfSJesper Devantier     [FDP_EVT_MEDIA_REALLOC]             = 32,
164*73064edfSJesper Devantier     [FDP_EVT_RUH_IMPLICIT_RU_CHANGE]    = 33,
165*73064edfSJesper Devantier };
166*73064edfSJesper Devantier 
16788eea45cSKlaus Jensen typedef struct NvmeNamespaceParams {
16888eea45cSKlaus Jensen     bool     detached;
16988eea45cSKlaus Jensen     bool     shared;
17088eea45cSKlaus Jensen     uint32_t nsid;
17188eea45cSKlaus Jensen     QemuUUID uuid;
1726870cfb8SHeinrich Schuchardt     uint64_t eui64;
1733276dde4SHeinrich Schuchardt     bool     eui64_default;
17488eea45cSKlaus Jensen 
17588eea45cSKlaus Jensen     uint16_t ms;
17688eea45cSKlaus Jensen     uint8_t  mset;
17788eea45cSKlaus Jensen     uint8_t  pi;
17888eea45cSKlaus Jensen     uint8_t  pil;
17944219b60SNaveen Nagar     uint8_t  pif;
18088eea45cSKlaus Jensen 
18188eea45cSKlaus Jensen     uint16_t mssrl;
18288eea45cSKlaus Jensen     uint32_t mcl;
18388eea45cSKlaus Jensen     uint8_t  msrc;
18488eea45cSKlaus Jensen 
18588eea45cSKlaus Jensen     bool     zoned;
18688eea45cSKlaus Jensen     bool     cross_zone_read;
18788eea45cSKlaus Jensen     uint64_t zone_size_bs;
18888eea45cSKlaus Jensen     uint64_t zone_cap_bs;
18988eea45cSKlaus Jensen     uint32_t max_active_zones;
19088eea45cSKlaus Jensen     uint32_t max_open_zones;
19188eea45cSKlaus Jensen     uint32_t zd_extension_size;
192e321b4cdSKlaus Jensen 
193e321b4cdSKlaus Jensen     uint32_t numzrwa;
194e321b4cdSKlaus Jensen     uint64_t zrwas;
195e321b4cdSKlaus Jensen     uint64_t zrwafg;
196*73064edfSJesper Devantier 
197*73064edfSJesper Devantier     struct {
198*73064edfSJesper Devantier         char *ruhs;
199*73064edfSJesper Devantier     } fdp;
20088eea45cSKlaus Jensen } NvmeNamespaceParams;
20188eea45cSKlaus Jensen 
20288eea45cSKlaus Jensen typedef struct NvmeNamespace {
20388eea45cSKlaus Jensen     DeviceState  parent_obj;
20488eea45cSKlaus Jensen     BlockConf    blkconf;
20588eea45cSKlaus Jensen     int32_t      bootindex;
20688eea45cSKlaus Jensen     int64_t      size;
20788eea45cSKlaus Jensen     int64_t      moff;
20888eea45cSKlaus Jensen     NvmeIdNs     id_ns;
20944219b60SNaveen Nagar     NvmeIdNsNvm  id_ns_nvm;
21088eea45cSKlaus Jensen     NvmeLBAF     lbaf;
211763c05dfSNaveen Nagar     unsigned int nlbaf;
21288eea45cSKlaus Jensen     size_t       lbasz;
21388eea45cSKlaus Jensen     const uint32_t *iocs;
21488eea45cSKlaus Jensen     uint8_t      csi;
21588eea45cSKlaus Jensen     uint16_t     status;
21688eea45cSKlaus Jensen     int          attached;
21744219b60SNaveen Nagar     uint8_t      pif;
21888eea45cSKlaus Jensen 
219e321b4cdSKlaus Jensen     struct {
220e321b4cdSKlaus Jensen         uint16_t zrwas;
221e321b4cdSKlaus Jensen         uint16_t zrwafg;
222e321b4cdSKlaus Jensen         uint32_t numzrwa;
223e321b4cdSKlaus Jensen     } zns;
224e321b4cdSKlaus Jensen 
22588eea45cSKlaus Jensen     QTAILQ_ENTRY(NvmeNamespace) entry;
22688eea45cSKlaus Jensen 
22788eea45cSKlaus Jensen     NvmeIdNsZoned   *id_ns_zoned;
22888eea45cSKlaus Jensen     NvmeZone        *zone_array;
22988eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeZone) exp_open_zones;
23088eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeZone) imp_open_zones;
23188eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeZone) closed_zones;
23288eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeZone) full_zones;
23388eea45cSKlaus Jensen     uint32_t        num_zones;
23488eea45cSKlaus Jensen     uint64_t        zone_size;
23588eea45cSKlaus Jensen     uint64_t        zone_capacity;
23688eea45cSKlaus Jensen     uint32_t        zone_size_log2;
23788eea45cSKlaus Jensen     uint8_t         *zd_extensions;
23888eea45cSKlaus Jensen     int32_t         nr_open_zones;
23988eea45cSKlaus Jensen     int32_t         nr_active_zones;
24088eea45cSKlaus Jensen 
24188eea45cSKlaus Jensen     NvmeNamespaceParams params;
242534a93d3SNiklas Cassel     NvmeSubsystem *subsys;
243*73064edfSJesper Devantier     NvmeEnduranceGroup *endgrp;
24488eea45cSKlaus Jensen 
24588eea45cSKlaus Jensen     struct {
24688eea45cSKlaus Jensen         uint32_t err_rec;
24788eea45cSKlaus Jensen     } features;
248*73064edfSJesper Devantier 
249*73064edfSJesper Devantier     struct {
250*73064edfSJesper Devantier         uint16_t nphs;
251*73064edfSJesper Devantier         /* reclaim unit handle identifiers indexed by placement handle */
252*73064edfSJesper Devantier         uint16_t *phs;
253*73064edfSJesper Devantier     } fdp;
25488eea45cSKlaus Jensen } NvmeNamespace;
25588eea45cSKlaus Jensen 
25688eea45cSKlaus Jensen static inline uint32_t nvme_nsid(NvmeNamespace *ns)
25788eea45cSKlaus Jensen {
25888eea45cSKlaus Jensen     if (ns) {
25988eea45cSKlaus Jensen         return ns->params.nsid;
26088eea45cSKlaus Jensen     }
26188eea45cSKlaus Jensen 
26288eea45cSKlaus Jensen     return 0;
26388eea45cSKlaus Jensen }
26488eea45cSKlaus Jensen 
26588eea45cSKlaus Jensen static inline size_t nvme_l2b(NvmeNamespace *ns, uint64_t lba)
26688eea45cSKlaus Jensen {
26788eea45cSKlaus Jensen     return lba << ns->lbaf.ds;
26888eea45cSKlaus Jensen }
26988eea45cSKlaus Jensen 
27088eea45cSKlaus Jensen static inline size_t nvme_m2b(NvmeNamespace *ns, uint64_t lba)
27188eea45cSKlaus Jensen {
27288eea45cSKlaus Jensen     return ns->lbaf.ms * lba;
27388eea45cSKlaus Jensen }
27488eea45cSKlaus Jensen 
27588eea45cSKlaus Jensen static inline int64_t nvme_moff(NvmeNamespace *ns, uint64_t lba)
27688eea45cSKlaus Jensen {
27788eea45cSKlaus Jensen     return ns->moff + nvme_m2b(ns, lba);
27888eea45cSKlaus Jensen }
27988eea45cSKlaus Jensen 
28088eea45cSKlaus Jensen static inline bool nvme_ns_ext(NvmeNamespace *ns)
28188eea45cSKlaus Jensen {
28288eea45cSKlaus Jensen     return !!NVME_ID_NS_FLBAS_EXTENDED(ns->id_ns.flbas);
28388eea45cSKlaus Jensen }
28488eea45cSKlaus Jensen 
28588eea45cSKlaus Jensen static inline NvmeZoneState nvme_get_zone_state(NvmeZone *zone)
28688eea45cSKlaus Jensen {
28788eea45cSKlaus Jensen     return zone->d.zs >> 4;
28888eea45cSKlaus Jensen }
28988eea45cSKlaus Jensen 
29088eea45cSKlaus Jensen static inline void nvme_set_zone_state(NvmeZone *zone, NvmeZoneState state)
29188eea45cSKlaus Jensen {
29288eea45cSKlaus Jensen     zone->d.zs = state << 4;
29388eea45cSKlaus Jensen }
29488eea45cSKlaus Jensen 
29588eea45cSKlaus Jensen static inline uint64_t nvme_zone_rd_boundary(NvmeNamespace *ns, NvmeZone *zone)
29688eea45cSKlaus Jensen {
29788eea45cSKlaus Jensen     return zone->d.zslba + ns->zone_size;
29888eea45cSKlaus Jensen }
29988eea45cSKlaus Jensen 
30088eea45cSKlaus Jensen static inline uint64_t nvme_zone_wr_boundary(NvmeZone *zone)
30188eea45cSKlaus Jensen {
30288eea45cSKlaus Jensen     return zone->d.zslba + zone->d.zcap;
30388eea45cSKlaus Jensen }
30488eea45cSKlaus Jensen 
30588eea45cSKlaus Jensen static inline bool nvme_wp_is_valid(NvmeZone *zone)
30688eea45cSKlaus Jensen {
30788eea45cSKlaus Jensen     uint8_t st = nvme_get_zone_state(zone);
30888eea45cSKlaus Jensen 
30988eea45cSKlaus Jensen     return st != NVME_ZONE_STATE_FULL &&
31088eea45cSKlaus Jensen            st != NVME_ZONE_STATE_READ_ONLY &&
31188eea45cSKlaus Jensen            st != NVME_ZONE_STATE_OFFLINE;
31288eea45cSKlaus Jensen }
31388eea45cSKlaus Jensen 
31488eea45cSKlaus Jensen static inline uint8_t *nvme_get_zd_extension(NvmeNamespace *ns,
31588eea45cSKlaus Jensen                                              uint32_t zone_idx)
31688eea45cSKlaus Jensen {
31788eea45cSKlaus Jensen     return &ns->zd_extensions[zone_idx * ns->params.zd_extension_size];
31888eea45cSKlaus Jensen }
31988eea45cSKlaus Jensen 
32088eea45cSKlaus Jensen static inline void nvme_aor_inc_open(NvmeNamespace *ns)
32188eea45cSKlaus Jensen {
32288eea45cSKlaus Jensen     assert(ns->nr_open_zones >= 0);
32388eea45cSKlaus Jensen     if (ns->params.max_open_zones) {
32488eea45cSKlaus Jensen         ns->nr_open_zones++;
32588eea45cSKlaus Jensen         assert(ns->nr_open_zones <= ns->params.max_open_zones);
32688eea45cSKlaus Jensen     }
32788eea45cSKlaus Jensen }
32888eea45cSKlaus Jensen 
32988eea45cSKlaus Jensen static inline void nvme_aor_dec_open(NvmeNamespace *ns)
33088eea45cSKlaus Jensen {
33188eea45cSKlaus Jensen     if (ns->params.max_open_zones) {
33288eea45cSKlaus Jensen         assert(ns->nr_open_zones > 0);
33388eea45cSKlaus Jensen         ns->nr_open_zones--;
33488eea45cSKlaus Jensen     }
33588eea45cSKlaus Jensen     assert(ns->nr_open_zones >= 0);
33688eea45cSKlaus Jensen }
33788eea45cSKlaus Jensen 
33888eea45cSKlaus Jensen static inline void nvme_aor_inc_active(NvmeNamespace *ns)
33988eea45cSKlaus Jensen {
34088eea45cSKlaus Jensen     assert(ns->nr_active_zones >= 0);
34188eea45cSKlaus Jensen     if (ns->params.max_active_zones) {
34288eea45cSKlaus Jensen         ns->nr_active_zones++;
34388eea45cSKlaus Jensen         assert(ns->nr_active_zones <= ns->params.max_active_zones);
34488eea45cSKlaus Jensen     }
34588eea45cSKlaus Jensen }
34688eea45cSKlaus Jensen 
34788eea45cSKlaus Jensen static inline void nvme_aor_dec_active(NvmeNamespace *ns)
34888eea45cSKlaus Jensen {
34988eea45cSKlaus Jensen     if (ns->params.max_active_zones) {
35088eea45cSKlaus Jensen         assert(ns->nr_active_zones > 0);
35188eea45cSKlaus Jensen         ns->nr_active_zones--;
35288eea45cSKlaus Jensen         assert(ns->nr_active_zones >= ns->nr_open_zones);
35388eea45cSKlaus Jensen     }
35488eea45cSKlaus Jensen     assert(ns->nr_active_zones >= 0);
35588eea45cSKlaus Jensen }
35688eea45cSKlaus Jensen 
/*
 * Saturating add for 64-bit statistics counters: add @b to *@a, clamping
 * the result to UINT64_MAX instead of wrapping around.
 */
static inline void nvme_fdp_stat_inc(uint64_t *a, uint64_t b)
{
    /* the sum would overflow exactly when b exceeds the remaining headroom */
    if (b > UINT64_MAX - *a) {
        *a = UINT64_MAX;
        return;
    }

    *a += b;
}

36388eea45cSKlaus Jensen void nvme_ns_init_format(NvmeNamespace *ns);
3645e4f6bccSKlaus Jensen int nvme_ns_setup(NvmeNamespace *ns, Error **errp);
36588eea45cSKlaus Jensen void nvme_ns_drain(NvmeNamespace *ns);
36688eea45cSKlaus Jensen void nvme_ns_shutdown(NvmeNamespace *ns);
36788eea45cSKlaus Jensen void nvme_ns_cleanup(NvmeNamespace *ns);
36888eea45cSKlaus Jensen 
36988eea45cSKlaus Jensen typedef struct NvmeAsyncEvent {
37088eea45cSKlaus Jensen     QTAILQ_ENTRY(NvmeAsyncEvent) entry;
37188eea45cSKlaus Jensen     NvmeAerResult result;
37288eea45cSKlaus Jensen } NvmeAsyncEvent;
37388eea45cSKlaus Jensen 
/*
 * Single-bit flags.
 * NOTE(review): presumably stored in NvmeSg.flags, with NVME_SG_DMA
 * selecting the qsg member of the union - confirm against the users.
 */
enum {
    NVME_SG_ALLOC = 1 << 0,
    NVME_SG_DMA   = 1 << 1,
};

37988eea45cSKlaus Jensen typedef struct NvmeSg {
38088eea45cSKlaus Jensen     int flags;
38188eea45cSKlaus Jensen 
38288eea45cSKlaus Jensen     union {
38388eea45cSKlaus Jensen         QEMUSGList   qsg;
38488eea45cSKlaus Jensen         QEMUIOVector iov;
38588eea45cSKlaus Jensen     };
38688eea45cSKlaus Jensen } NvmeSg;
38788eea45cSKlaus Jensen 
/* Direction of a data transfer, as passed to nvme_bounce_data()/_mdata(). */
typedef enum NvmeTxDirection {
    NVME_TX_DIRECTION_TO_DEVICE   = 0,
    NVME_TX_DIRECTION_FROM_DEVICE = 1,
} NvmeTxDirection;

39388eea45cSKlaus Jensen typedef struct NvmeRequest {
39488eea45cSKlaus Jensen     struct NvmeSQueue       *sq;
39588eea45cSKlaus Jensen     struct NvmeNamespace    *ns;
39688eea45cSKlaus Jensen     BlockAIOCB              *aiocb;
39788eea45cSKlaus Jensen     uint16_t                status;
39888eea45cSKlaus Jensen     void                    *opaque;
39988eea45cSKlaus Jensen     NvmeCqe                 cqe;
40088eea45cSKlaus Jensen     NvmeCmd                 cmd;
40188eea45cSKlaus Jensen     BlockAcctCookie         acct;
40288eea45cSKlaus Jensen     NvmeSg                  sg;
40388eea45cSKlaus Jensen     QTAILQ_ENTRY(NvmeRequest)entry;
40488eea45cSKlaus Jensen } NvmeRequest;
40588eea45cSKlaus Jensen 
40688eea45cSKlaus Jensen typedef struct NvmeBounceContext {
40788eea45cSKlaus Jensen     NvmeRequest *req;
40888eea45cSKlaus Jensen 
40988eea45cSKlaus Jensen     struct {
41088eea45cSKlaus Jensen         QEMUIOVector iov;
41188eea45cSKlaus Jensen         uint8_t *bounce;
41288eea45cSKlaus Jensen     } data, mdata;
41388eea45cSKlaus Jensen } NvmeBounceContext;
41488eea45cSKlaus Jensen 
41588eea45cSKlaus Jensen static inline const char *nvme_adm_opc_str(uint8_t opc)
41688eea45cSKlaus Jensen {
41788eea45cSKlaus Jensen     switch (opc) {
41888eea45cSKlaus Jensen     case NVME_ADM_CMD_DELETE_SQ:        return "NVME_ADM_CMD_DELETE_SQ";
41988eea45cSKlaus Jensen     case NVME_ADM_CMD_CREATE_SQ:        return "NVME_ADM_CMD_CREATE_SQ";
42088eea45cSKlaus Jensen     case NVME_ADM_CMD_GET_LOG_PAGE:     return "NVME_ADM_CMD_GET_LOG_PAGE";
42188eea45cSKlaus Jensen     case NVME_ADM_CMD_DELETE_CQ:        return "NVME_ADM_CMD_DELETE_CQ";
42288eea45cSKlaus Jensen     case NVME_ADM_CMD_CREATE_CQ:        return "NVME_ADM_CMD_CREATE_CQ";
42388eea45cSKlaus Jensen     case NVME_ADM_CMD_IDENTIFY:         return "NVME_ADM_CMD_IDENTIFY";
42488eea45cSKlaus Jensen     case NVME_ADM_CMD_ABORT:            return "NVME_ADM_CMD_ABORT";
42588eea45cSKlaus Jensen     case NVME_ADM_CMD_SET_FEATURES:     return "NVME_ADM_CMD_SET_FEATURES";
42688eea45cSKlaus Jensen     case NVME_ADM_CMD_GET_FEATURES:     return "NVME_ADM_CMD_GET_FEATURES";
42788eea45cSKlaus Jensen     case NVME_ADM_CMD_ASYNC_EV_REQ:     return "NVME_ADM_CMD_ASYNC_EV_REQ";
42888eea45cSKlaus Jensen     case NVME_ADM_CMD_NS_ATTACHMENT:    return "NVME_ADM_CMD_NS_ATTACHMENT";
429e181d3daSGollu Appalanaidu     case NVME_ADM_CMD_DIRECTIVE_SEND:   return "NVME_ADM_CMD_DIRECTIVE_SEND";
43011871f53SŁukasz Gieryk     case NVME_ADM_CMD_VIRT_MNGMT:       return "NVME_ADM_CMD_VIRT_MNGMT";
431e181d3daSGollu Appalanaidu     case NVME_ADM_CMD_DIRECTIVE_RECV:   return "NVME_ADM_CMD_DIRECTIVE_RECV";
4323f7fe8deSJinhao Fan     case NVME_ADM_CMD_DBBUF_CONFIG:     return "NVME_ADM_CMD_DBBUF_CONFIG";
43388eea45cSKlaus Jensen     case NVME_ADM_CMD_FORMAT_NVM:       return "NVME_ADM_CMD_FORMAT_NVM";
43488eea45cSKlaus Jensen     default:                            return "NVME_ADM_CMD_UNKNOWN";
43588eea45cSKlaus Jensen     }
43688eea45cSKlaus Jensen }
43788eea45cSKlaus Jensen 
43888eea45cSKlaus Jensen static inline const char *nvme_io_opc_str(uint8_t opc)
43988eea45cSKlaus Jensen {
44088eea45cSKlaus Jensen     switch (opc) {
44188eea45cSKlaus Jensen     case NVME_CMD_FLUSH:            return "NVME_NVM_CMD_FLUSH";
44288eea45cSKlaus Jensen     case NVME_CMD_WRITE:            return "NVME_NVM_CMD_WRITE";
44388eea45cSKlaus Jensen     case NVME_CMD_READ:             return "NVME_NVM_CMD_READ";
44488eea45cSKlaus Jensen     case NVME_CMD_COMPARE:          return "NVME_NVM_CMD_COMPARE";
44588eea45cSKlaus Jensen     case NVME_CMD_WRITE_ZEROES:     return "NVME_NVM_CMD_WRITE_ZEROES";
44688eea45cSKlaus Jensen     case NVME_CMD_DSM:              return "NVME_NVM_CMD_DSM";
44788eea45cSKlaus Jensen     case NVME_CMD_VERIFY:           return "NVME_NVM_CMD_VERIFY";
44888eea45cSKlaus Jensen     case NVME_CMD_COPY:             return "NVME_NVM_CMD_COPY";
44988eea45cSKlaus Jensen     case NVME_CMD_ZONE_MGMT_SEND:   return "NVME_ZONED_CMD_MGMT_SEND";
45088eea45cSKlaus Jensen     case NVME_CMD_ZONE_MGMT_RECV:   return "NVME_ZONED_CMD_MGMT_RECV";
45188eea45cSKlaus Jensen     case NVME_CMD_ZONE_APPEND:      return "NVME_ZONED_CMD_ZONE_APPEND";
45288eea45cSKlaus Jensen     default:                        return "NVME_NVM_CMD_UNKNOWN";
45388eea45cSKlaus Jensen     }
45488eea45cSKlaus Jensen }
45588eea45cSKlaus Jensen 
45688eea45cSKlaus Jensen typedef struct NvmeSQueue {
45788eea45cSKlaus Jensen     struct NvmeCtrl *ctrl;
45888eea45cSKlaus Jensen     uint16_t    sqid;
45988eea45cSKlaus Jensen     uint16_t    cqid;
46088eea45cSKlaus Jensen     uint32_t    head;
46188eea45cSKlaus Jensen     uint32_t    tail;
46288eea45cSKlaus Jensen     uint32_t    size;
46388eea45cSKlaus Jensen     uint64_t    dma_addr;
4643f7fe8deSJinhao Fan     uint64_t    db_addr;
4653f7fe8deSJinhao Fan     uint64_t    ei_addr;
466d38cc6fdSKlaus Jensen     QEMUBH      *bh;
4672e53b0b4SJinhao Fan     EventNotifier notifier;
4682e53b0b4SJinhao Fan     bool        ioeventfd_enabled;
46988eea45cSKlaus Jensen     NvmeRequest *io_req;
47088eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeRequest) req_list;
47188eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeRequest) out_req_list;
47288eea45cSKlaus Jensen     QTAILQ_ENTRY(NvmeSQueue) entry;
47388eea45cSKlaus Jensen } NvmeSQueue;
47488eea45cSKlaus Jensen 
47588eea45cSKlaus Jensen typedef struct NvmeCQueue {
47688eea45cSKlaus Jensen     struct NvmeCtrl *ctrl;
47788eea45cSKlaus Jensen     uint8_t     phase;
47888eea45cSKlaus Jensen     uint16_t    cqid;
47988eea45cSKlaus Jensen     uint16_t    irq_enabled;
48088eea45cSKlaus Jensen     uint32_t    head;
48188eea45cSKlaus Jensen     uint32_t    tail;
48288eea45cSKlaus Jensen     uint32_t    vector;
48388eea45cSKlaus Jensen     uint32_t    size;
48488eea45cSKlaus Jensen     uint64_t    dma_addr;
4853f7fe8deSJinhao Fan     uint64_t    db_addr;
4863f7fe8deSJinhao Fan     uint64_t    ei_addr;
487d38cc6fdSKlaus Jensen     QEMUBH      *bh;
4882e53b0b4SJinhao Fan     EventNotifier notifier;
4892e53b0b4SJinhao Fan     bool        ioeventfd_enabled;
49088eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeSQueue) sq_list;
49188eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeRequest) req_list;
49288eea45cSKlaus Jensen } NvmeCQueue;
49388eea45cSKlaus Jensen 
/* QOM type name of the NVMe controller device and its checked cast. */
#define TYPE_NVME "nvme"
#define NVME(obj) \
        OBJECT_CHECK(NvmeCtrl, (obj), TYPE_NVME)

/*
 * User-configurable controller parameters.
 */
typedef struct NvmeParams {
    char     *serial;
    uint32_t num_queues; /* deprecated since 5.1 */
    uint32_t max_ioqpairs;
    uint16_t msix_qsize;
    uint32_t cmb_size_mb;
    uint8_t  aerl;
    uint32_t aer_max_queued;
    uint8_t  mdts;
    uint8_t  vsl;
    bool     use_intel_id;
    uint8_t  zasl;
    bool     auto_transition_zones;
    bool     legacy_cmb;
    bool     ioeventfd;
    /* SR-IOV settings */
    uint8_t  sriov_max_vfs;
    uint16_t sriov_vq_flexible;
    uint16_t sriov_vi_flexible;
    uint8_t  sriov_max_vq_per_vf;
    uint8_t  sriov_max_vi_per_vf;
} NvmeParams;

52088eea45cSKlaus Jensen typedef struct NvmeCtrl {
52188eea45cSKlaus Jensen     PCIDevice    parent_obj;
52288eea45cSKlaus Jensen     MemoryRegion bar0;
52388eea45cSKlaus Jensen     MemoryRegion iomem;
52488eea45cSKlaus Jensen     NvmeBar      bar;
52588eea45cSKlaus Jensen     NvmeParams   params;
52688eea45cSKlaus Jensen     NvmeBus      bus;
52788eea45cSKlaus Jensen 
52888eea45cSKlaus Jensen     uint16_t    cntlid;
52988eea45cSKlaus Jensen     bool        qs_created;
53088eea45cSKlaus Jensen     uint32_t    page_size;
53188eea45cSKlaus Jensen     uint16_t    page_bits;
53288eea45cSKlaus Jensen     uint16_t    max_prp_ents;
53388eea45cSKlaus Jensen     uint16_t    cqe_size;
53488eea45cSKlaus Jensen     uint16_t    sqe_size;
53588eea45cSKlaus Jensen     uint32_t    max_q_ents;
53688eea45cSKlaus Jensen     uint8_t     outstanding_aers;
53788eea45cSKlaus Jensen     uint32_t    irq_status;
53883d7ed5cSKlaus Jensen     int         cq_pending;
53988eea45cSKlaus Jensen     uint64_t    host_timestamp;                 /* Timestamp sent by the host */
54088eea45cSKlaus Jensen     uint64_t    timestamp_set_qemu_clock_ms;    /* QEMU clock time */
54188eea45cSKlaus Jensen     uint64_t    starttime_ms;
54288eea45cSKlaus Jensen     uint16_t    temperature;
54388eea45cSKlaus Jensen     uint8_t     smart_critical_warning;
544decc0261SŁukasz Gieryk     uint32_t    conf_msix_qsize;
545decc0261SŁukasz Gieryk     uint32_t    conf_ioqpairs;
5463f7fe8deSJinhao Fan     uint64_t    dbbuf_dbs;
5473f7fe8deSJinhao Fan     uint64_t    dbbuf_eis;
5483f7fe8deSJinhao Fan     bool        dbbuf_enabled;
54988eea45cSKlaus Jensen 
55088eea45cSKlaus Jensen     struct {
55188eea45cSKlaus Jensen         MemoryRegion mem;
55288eea45cSKlaus Jensen         uint8_t      *buf;
55388eea45cSKlaus Jensen         bool         cmse;
55488eea45cSKlaus Jensen         hwaddr       cba;
55588eea45cSKlaus Jensen     } cmb;
55688eea45cSKlaus Jensen 
55788eea45cSKlaus Jensen     struct {
55888eea45cSKlaus Jensen         HostMemoryBackend *dev;
55988eea45cSKlaus Jensen         bool              cmse;
56088eea45cSKlaus Jensen         hwaddr            cba;
56188eea45cSKlaus Jensen     } pmr;
56288eea45cSKlaus Jensen 
56388eea45cSKlaus Jensen     uint8_t     aer_mask;
56488eea45cSKlaus Jensen     NvmeRequest **aer_reqs;
56588eea45cSKlaus Jensen     QTAILQ_HEAD(, NvmeAsyncEvent) aer_queue;
56688eea45cSKlaus Jensen     int         aer_queued;
56788eea45cSKlaus Jensen 
56888eea45cSKlaus Jensen     uint32_t    dmrsl;
56988eea45cSKlaus Jensen 
57088eea45cSKlaus Jensen     /* Namespace ID is started with 1 so bitmap should be 1-based */
57188eea45cSKlaus Jensen #define NVME_CHANGED_NSID_SIZE  (NVME_MAX_NAMESPACES + 1)
57288eea45cSKlaus Jensen     DECLARE_BITMAP(changed_nsids, NVME_CHANGED_NSID_SIZE);
57388eea45cSKlaus Jensen 
57488eea45cSKlaus Jensen     NvmeSubsystem   *subsys;
57588eea45cSKlaus Jensen 
57688eea45cSKlaus Jensen     NvmeNamespace   namespace;
57788eea45cSKlaus Jensen     NvmeNamespace   *namespaces[NVME_MAX_NAMESPACES + 1];
57888eea45cSKlaus Jensen     NvmeSQueue      **sq;
57988eea45cSKlaus Jensen     NvmeCQueue      **cq;
58088eea45cSKlaus Jensen     NvmeSQueue      admin_sq;
58188eea45cSKlaus Jensen     NvmeCQueue      admin_cq;
58288eea45cSKlaus Jensen     NvmeIdCtrl      id_ctrl;
58388eea45cSKlaus Jensen 
58488eea45cSKlaus Jensen     struct {
58588eea45cSKlaus Jensen         struct {
58688eea45cSKlaus Jensen             uint16_t temp_thresh_hi;
58788eea45cSKlaus Jensen             uint16_t temp_thresh_low;
58888eea45cSKlaus Jensen         };
589d0c0697bSNaveen Nagar 
59088eea45cSKlaus Jensen         uint32_t                async_config;
591d0c0697bSNaveen Nagar         NvmeHostBehaviorSupport hbs;
59288eea45cSKlaus Jensen     } features;
5935e6f963fSLukasz Maniak 
5945e6f963fSLukasz Maniak     NvmePriCtrlCap  pri_ctrl_cap;
59599f48ae7SLukasz Maniak     NvmeSecCtrlList sec_ctrl_list;
59611871f53SŁukasz Gieryk     struct {
59711871f53SŁukasz Gieryk         uint16_t    vqrfap;
59811871f53SŁukasz Gieryk         uint16_t    virfap;
59911871f53SŁukasz Gieryk     } next_pri_ctrl_cap;    /* These override pri_ctrl_cap after reset */
60088eea45cSKlaus Jensen } NvmeCtrl;
60188eea45cSKlaus Jensen 
/* Kind of reset; the code that interprets it is outside this header. */
typedef enum NvmeResetType {
    NVME_RESET_FUNCTION   = 0,
    NVME_RESET_CONTROLLER = 1,
} NvmeResetType;

60788eea45cSKlaus Jensen static inline NvmeNamespace *nvme_ns(NvmeCtrl *n, uint32_t nsid)
60888eea45cSKlaus Jensen {
60988eea45cSKlaus Jensen     if (!nsid || nsid > NVME_MAX_NAMESPACES) {
61088eea45cSKlaus Jensen         return NULL;
61188eea45cSKlaus Jensen     }
61288eea45cSKlaus Jensen 
61388eea45cSKlaus Jensen     return n->namespaces[nsid];
61488eea45cSKlaus Jensen }
61588eea45cSKlaus Jensen 
61688eea45cSKlaus Jensen static inline NvmeCQueue *nvme_cq(NvmeRequest *req)
61788eea45cSKlaus Jensen {
61888eea45cSKlaus Jensen     NvmeSQueue *sq = req->sq;
61988eea45cSKlaus Jensen     NvmeCtrl *n = sq->ctrl;
62088eea45cSKlaus Jensen 
62188eea45cSKlaus Jensen     return n->cq[sq->cqid];
62288eea45cSKlaus Jensen }
62388eea45cSKlaus Jensen 
62488eea45cSKlaus Jensen static inline NvmeCtrl *nvme_ctrl(NvmeRequest *req)
62588eea45cSKlaus Jensen {
62688eea45cSKlaus Jensen     NvmeSQueue *sq = req->sq;
62788eea45cSKlaus Jensen     return sq->ctrl;
62888eea45cSKlaus Jensen }
62988eea45cSKlaus Jensen 
63088eea45cSKlaus Jensen static inline uint16_t nvme_cid(NvmeRequest *req)
63188eea45cSKlaus Jensen {
63288eea45cSKlaus Jensen     if (!req) {
63388eea45cSKlaus Jensen         return 0xffff;
63488eea45cSKlaus Jensen     }
63588eea45cSKlaus Jensen 
63688eea45cSKlaus Jensen     return le16_to_cpu(req->cqe.cid);
63788eea45cSKlaus Jensen }
63888eea45cSKlaus Jensen 
63999f48ae7SLukasz Maniak static inline NvmeSecCtrlEntry *nvme_sctrl(NvmeCtrl *n)
64099f48ae7SLukasz Maniak {
64199f48ae7SLukasz Maniak     PCIDevice *pci_dev = &n->parent_obj;
64299f48ae7SLukasz Maniak     NvmeCtrl *pf = NVME(pcie_sriov_get_pf(pci_dev));
64399f48ae7SLukasz Maniak 
64499f48ae7SLukasz Maniak     if (pci_is_vf(pci_dev)) {
64599f48ae7SLukasz Maniak         return &pf->sec_ctrl_list.sec[pcie_sriov_vf_number(pci_dev)];
64699f48ae7SLukasz Maniak     }
64799f48ae7SLukasz Maniak 
64899f48ae7SLukasz Maniak     return NULL;
64999f48ae7SLukasz Maniak }
65099f48ae7SLukasz Maniak 
65111871f53SŁukasz Gieryk static inline NvmeSecCtrlEntry *nvme_sctrl_for_cntlid(NvmeCtrl *n,
65211871f53SŁukasz Gieryk                                                       uint16_t cntlid)
65311871f53SŁukasz Gieryk {
65411871f53SŁukasz Gieryk     NvmeSecCtrlList *list = &n->sec_ctrl_list;
65511871f53SŁukasz Gieryk     uint8_t i;
65611871f53SŁukasz Gieryk 
65711871f53SŁukasz Gieryk     for (i = 0; i < list->numcntl; i++) {
65811871f53SŁukasz Gieryk         if (le16_to_cpu(list->sec[i].scid) == cntlid) {
65911871f53SŁukasz Gieryk             return &list->sec[i];
66011871f53SŁukasz Gieryk         }
66111871f53SŁukasz Gieryk     }
66211871f53SŁukasz Gieryk 
66311871f53SŁukasz Gieryk     return NULL;
66411871f53SŁukasz Gieryk }
66511871f53SŁukasz Gieryk 
66688eea45cSKlaus Jensen void nvme_attach_ns(NvmeCtrl *n, NvmeNamespace *ns);
6678d3a17beSPhilippe Mathieu-Daudé uint16_t nvme_bounce_data(NvmeCtrl *n, void *ptr, uint32_t len,
66888eea45cSKlaus Jensen                           NvmeTxDirection dir, NvmeRequest *req);
6698d3a17beSPhilippe Mathieu-Daudé uint16_t nvme_bounce_mdata(NvmeCtrl *n, void *ptr, uint32_t len,
67088eea45cSKlaus Jensen                            NvmeTxDirection dir, NvmeRequest *req);
67188eea45cSKlaus Jensen void nvme_rw_complete_cb(void *opaque, int ret);
67288eea45cSKlaus Jensen uint16_t nvme_map_dptr(NvmeCtrl *n, NvmeSg *sg, size_t len,
67388eea45cSKlaus Jensen                        NvmeCmd *cmd);
67488eea45cSKlaus Jensen 
67552581c71SMarkus Armbruster #endif /* HW_NVME_NVME_H */
676