188eea45cSKlaus Jensen /* 288eea45cSKlaus Jensen * QEMU NVM Express 388eea45cSKlaus Jensen * 488eea45cSKlaus Jensen * Copyright (c) 2012 Intel Corporation 588eea45cSKlaus Jensen * Copyright (c) 2021 Minwoo Im 688eea45cSKlaus Jensen * Copyright (c) 2021 Samsung Electronics Co., Ltd. 788eea45cSKlaus Jensen * 888eea45cSKlaus Jensen * Authors: 988eea45cSKlaus Jensen * Keith Busch <kbusch@kernel.org> 1088eea45cSKlaus Jensen * Klaus Jensen <k.jensen@samsung.com> 1188eea45cSKlaus Jensen * Gollu Appalanaidu <anaidu.gollu@samsung.com> 1288eea45cSKlaus Jensen * Dmitry Fomichev <dmitry.fomichev@wdc.com> 1388eea45cSKlaus Jensen * Minwoo Im <minwoo.im.dev@gmail.com> 1488eea45cSKlaus Jensen * 1588eea45cSKlaus Jensen * This code is licensed under the GNU GPL v2 or later. 1688eea45cSKlaus Jensen */ 1788eea45cSKlaus Jensen 1852581c71SMarkus Armbruster #ifndef HW_NVME_NVME_H 1952581c71SMarkus Armbruster #define HW_NVME_NVME_H 2088eea45cSKlaus Jensen 2188eea45cSKlaus Jensen #include "qemu/uuid.h" 22edf5ca5dSMarkus Armbruster #include "hw/pci/pci_device.h" 2388eea45cSKlaus Jensen #include "hw/block/block.h" 2488eea45cSKlaus Jensen 2588eea45cSKlaus Jensen #include "block/nvme.h" 2688eea45cSKlaus Jensen 2744c2c094SLukasz Maniak #define NVME_MAX_CONTROLLERS 256 2888eea45cSKlaus Jensen #define NVME_MAX_NAMESPACES 256 293276dde4SHeinrich Schuchardt #define NVME_EUI64_DEFAULT ((uint64_t)0x5254000000000000) 30*73064edfSJesper Devantier #define NVME_FDP_MAX_EVENTS 63 31*73064edfSJesper Devantier #define NVME_FDP_MAXPIDS 128 3288eea45cSKlaus Jensen 3338f4ac65SKlaus Jensen QEMU_BUILD_BUG_ON(NVME_MAX_NAMESPACES > NVME_NSID_BROADCAST - 1); 3438f4ac65SKlaus Jensen 3588eea45cSKlaus Jensen typedef struct NvmeCtrl NvmeCtrl; 3688eea45cSKlaus Jensen typedef struct NvmeNamespace NvmeNamespace; 3788eea45cSKlaus Jensen 385ffbaeedSKlaus Jensen #define TYPE_NVME_BUS "nvme-bus" 395ffbaeedSKlaus Jensen OBJECT_DECLARE_SIMPLE_TYPE(NvmeBus, NVME_BUS) 405ffbaeedSKlaus Jensen 415ffbaeedSKlaus Jensen typedef struct NvmeBus { 425ffbaeedSKlaus Jensen BusState parent_bus; 435ffbaeedSKlaus Jensen } NvmeBus; 445ffbaeedSKlaus Jensen 4588eea45cSKlaus Jensen #define TYPE_NVME_SUBSYS "nvme-subsys" 4688eea45cSKlaus Jensen #define NVME_SUBSYS(obj) \ 4788eea45cSKlaus Jensen OBJECT_CHECK(NvmeSubsystem, (obj), TYPE_NVME_SUBSYS) 4899f48ae7SLukasz Maniak #define SUBSYS_SLOT_RSVD (void *)0xFFFF 4988eea45cSKlaus Jensen 50*73064edfSJesper Devantier typedef struct NvmeReclaimUnit { 51*73064edfSJesper Devantier uint64_t ruamw; 52*73064edfSJesper Devantier } NvmeReclaimUnit; 53*73064edfSJesper Devantier 54*73064edfSJesper Devantier typedef struct NvmeRuHandle { 55*73064edfSJesper Devantier uint8_t ruht; 56*73064edfSJesper Devantier uint8_t ruha; 57*73064edfSJesper Devantier uint64_t event_filter; 58*73064edfSJesper Devantier uint8_t lbafi; 59*73064edfSJesper Devantier uint64_t ruamw; 60*73064edfSJesper Devantier 61*73064edfSJesper Devantier /* reclaim units indexed by reclaim group */ 62*73064edfSJesper Devantier NvmeReclaimUnit *rus; 63*73064edfSJesper Devantier } NvmeRuHandle; 64*73064edfSJesper Devantier 65*73064edfSJesper Devantier typedef struct NvmeFdpEventBuffer { 66*73064edfSJesper Devantier NvmeFdpEvent events[NVME_FDP_MAX_EVENTS]; 67*73064edfSJesper Devantier unsigned int nelems; 68*73064edfSJesper Devantier unsigned int start; 69*73064edfSJesper Devantier unsigned int next; 70*73064edfSJesper Devantier } NvmeFdpEventBuffer; 71*73064edfSJesper Devantier 72771dbc3aSKlaus Jensen typedef struct NvmeEnduranceGroup { 73771dbc3aSKlaus Jensen uint8_t event_conf; 74*73064edfSJesper Devantier 75*73064edfSJesper Devantier struct { 76*73064edfSJesper Devantier NvmeFdpEventBuffer host_events, ctrl_events; 77*73064edfSJesper Devantier 78*73064edfSJesper Devantier uint16_t nruh; 79*73064edfSJesper Devantier uint16_t nrg; 80*73064edfSJesper Devantier uint8_t rgif; 81*73064edfSJesper Devantier uint64_t runs; 82*73064edfSJesper Devantier 83*73064edfSJesper Devantier uint64_t hbmw; 84*73064edfSJesper Devantier uint64_t mbmw; 85*73064edfSJesper Devantier uint64_t mbe; 86*73064edfSJesper Devantier 87*73064edfSJesper Devantier bool enabled; 88*73064edfSJesper Devantier 89*73064edfSJesper Devantier NvmeRuHandle *ruhs; 90*73064edfSJesper Devantier } fdp; 91771dbc3aSKlaus Jensen } NvmeEnduranceGroup; 92771dbc3aSKlaus Jensen 9388eea45cSKlaus Jensen typedef struct NvmeSubsystem { 9488eea45cSKlaus Jensen DeviceState parent_obj; 955ffbaeedSKlaus Jensen NvmeBus bus; 9688eea45cSKlaus Jensen uint8_t subnqn[256]; 97a859eb9fSKlaus Jensen char *serial; 9888eea45cSKlaus Jensen 9988eea45cSKlaus Jensen NvmeCtrl *ctrls[NVME_MAX_CONTROLLERS]; 10088eea45cSKlaus Jensen NvmeNamespace *namespaces[NVME_MAX_NAMESPACES + 1]; 101*73064edfSJesper Devantier NvmeEnduranceGroup endgrp; 10288eea45cSKlaus Jensen 10388eea45cSKlaus Jensen struct { 10488eea45cSKlaus Jensen char *nqn; 105*73064edfSJesper Devantier 106*73064edfSJesper Devantier struct { 107*73064edfSJesper Devantier bool enabled; 108*73064edfSJesper Devantier uint64_t runs; 109*73064edfSJesper Devantier uint16_t nruh; 110*73064edfSJesper Devantier uint32_t nrg; 111*73064edfSJesper Devantier } fdp; 11288eea45cSKlaus Jensen } params; 11388eea45cSKlaus Jensen } NvmeSubsystem; 11488eea45cSKlaus Jensen 11588eea45cSKlaus Jensen int nvme_subsys_register_ctrl(NvmeCtrl *n, Error **errp); 116b0fde9e8SKlaus Jensen void nvme_subsys_unregister_ctrl(NvmeSubsystem *subsys, NvmeCtrl *n); 11788eea45cSKlaus Jensen 11888eea45cSKlaus Jensen static inline NvmeCtrl *nvme_subsys_ctrl(NvmeSubsystem *subsys, 11988eea45cSKlaus Jensen uint32_t cntlid) 12088eea45cSKlaus Jensen { 12188eea45cSKlaus Jensen if (!subsys || cntlid >= NVME_MAX_CONTROLLERS) { 12288eea45cSKlaus Jensen return NULL; 12388eea45cSKlaus Jensen } 12488eea45cSKlaus Jensen 12599f48ae7SLukasz Maniak if (subsys->ctrls[cntlid] == SUBSYS_SLOT_RSVD) { 12699f48ae7SLukasz Maniak return NULL; 12799f48ae7SLukasz Maniak } 12899f48ae7SLukasz Maniak 12988eea45cSKlaus Jensen return subsys->ctrls[cntlid]; 13088eea45cSKlaus Jensen } 13188eea45cSKlaus Jensen 13288eea45cSKlaus Jensen static inline NvmeNamespace *nvme_subsys_ns(NvmeSubsystem *subsys, 13388eea45cSKlaus Jensen uint32_t nsid) 13488eea45cSKlaus Jensen { 13588eea45cSKlaus Jensen if (!subsys || !nsid || nsid > NVME_MAX_NAMESPACES) { 13688eea45cSKlaus Jensen return NULL; 13788eea45cSKlaus Jensen } 13888eea45cSKlaus Jensen 13988eea45cSKlaus Jensen return subsys->namespaces[nsid]; 14088eea45cSKlaus Jensen } 14188eea45cSKlaus Jensen 14288eea45cSKlaus Jensen #define TYPE_NVME_NS "nvme-ns" 14388eea45cSKlaus Jensen #define NVME_NS(obj) \ 14488eea45cSKlaus Jensen OBJECT_CHECK(NvmeNamespace, (obj), TYPE_NVME_NS) 14588eea45cSKlaus Jensen 14688eea45cSKlaus Jensen typedef struct NvmeZone { 14788eea45cSKlaus Jensen NvmeZoneDescr d; 14888eea45cSKlaus Jensen uint64_t w_ptr; 14988eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeZone) entry; 15088eea45cSKlaus Jensen } NvmeZone; 15188eea45cSKlaus Jensen 152*73064edfSJesper Devantier #define FDP_EVT_MAX 0xff 153*73064edfSJesper Devantier #define NVME_FDP_MAX_NS_RUHS 32u 154*73064edfSJesper Devantier #define FDPVSS 0 155*73064edfSJesper Devantier 156*73064edfSJesper Devantier static const uint8_t nvme_fdp_evf_shifts[FDP_EVT_MAX] = { 157*73064edfSJesper Devantier /* Host events */ 158*73064edfSJesper Devantier [FDP_EVT_RU_NOT_FULLY_WRITTEN] = 0, 159*73064edfSJesper Devantier [FDP_EVT_RU_ATL_EXCEEDED] = 1, 160*73064edfSJesper Devantier [FDP_EVT_CTRL_RESET_RUH] = 2, 161*73064edfSJesper Devantier [FDP_EVT_INVALID_PID] = 3, 162*73064edfSJesper Devantier /* CTRL events */ 163*73064edfSJesper Devantier [FDP_EVT_MEDIA_REALLOC] = 32, 164*73064edfSJesper Devantier [FDP_EVT_RUH_IMPLICIT_RU_CHANGE] = 33, 165*73064edfSJesper Devantier }; 166*73064edfSJesper Devantier 16788eea45cSKlaus Jensen typedef struct NvmeNamespaceParams { 16888eea45cSKlaus Jensen bool detached; 16988eea45cSKlaus Jensen bool shared; 17088eea45cSKlaus Jensen uint32_t nsid; 17188eea45cSKlaus Jensen QemuUUID uuid; 1726870cfb8SHeinrich Schuchardt uint64_t eui64; 1733276dde4SHeinrich Schuchardt bool eui64_default; 17488eea45cSKlaus Jensen 17588eea45cSKlaus Jensen uint16_t ms; 17688eea45cSKlaus Jensen uint8_t mset; 17788eea45cSKlaus Jensen uint8_t pi; 17888eea45cSKlaus Jensen uint8_t pil; 17944219b60SNaveen Nagar uint8_t pif; 18088eea45cSKlaus Jensen 18188eea45cSKlaus Jensen uint16_t mssrl; 18288eea45cSKlaus Jensen uint32_t mcl; 18388eea45cSKlaus Jensen uint8_t msrc; 18488eea45cSKlaus Jensen 18588eea45cSKlaus Jensen bool zoned; 18688eea45cSKlaus Jensen bool cross_zone_read; 18788eea45cSKlaus Jensen uint64_t zone_size_bs; 18888eea45cSKlaus Jensen uint64_t zone_cap_bs; 18988eea45cSKlaus Jensen uint32_t max_active_zones; 19088eea45cSKlaus Jensen uint32_t max_open_zones; 19188eea45cSKlaus Jensen uint32_t zd_extension_size; 192e321b4cdSKlaus Jensen 193e321b4cdSKlaus Jensen uint32_t numzrwa; 194e321b4cdSKlaus Jensen uint64_t zrwas; 195e321b4cdSKlaus Jensen uint64_t zrwafg; 196*73064edfSJesper Devantier 197*73064edfSJesper Devantier struct { 198*73064edfSJesper Devantier char *ruhs; 199*73064edfSJesper Devantier } fdp; 20088eea45cSKlaus Jensen } NvmeNamespaceParams; 20188eea45cSKlaus Jensen 20288eea45cSKlaus Jensen typedef struct NvmeNamespace { 20388eea45cSKlaus Jensen DeviceState parent_obj; 20488eea45cSKlaus Jensen BlockConf blkconf; 20588eea45cSKlaus Jensen int32_t bootindex; 20688eea45cSKlaus Jensen int64_t size; 20788eea45cSKlaus Jensen int64_t moff; 20888eea45cSKlaus Jensen NvmeIdNs id_ns; 20944219b60SNaveen Nagar NvmeIdNsNvm id_ns_nvm; 21088eea45cSKlaus Jensen NvmeLBAF lbaf; 211763c05dfSNaveen Nagar unsigned int nlbaf; 21288eea45cSKlaus Jensen size_t lbasz; 21388eea45cSKlaus Jensen const uint32_t *iocs; 21488eea45cSKlaus Jensen uint8_t csi; 21588eea45cSKlaus Jensen uint16_t status; 21688eea45cSKlaus Jensen int attached; 21744219b60SNaveen Nagar uint8_t pif; 21888eea45cSKlaus Jensen 219e321b4cdSKlaus Jensen struct { 220e321b4cdSKlaus Jensen uint16_t zrwas; 221e321b4cdSKlaus Jensen uint16_t zrwafg; 222e321b4cdSKlaus Jensen uint32_t numzrwa; 223e321b4cdSKlaus Jensen } zns; 224e321b4cdSKlaus Jensen 22588eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeNamespace) entry; 22688eea45cSKlaus Jensen 22788eea45cSKlaus Jensen NvmeIdNsZoned *id_ns_zoned; 22888eea45cSKlaus Jensen NvmeZone *zone_array; 22988eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeZone) exp_open_zones; 23088eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeZone) imp_open_zones; 23188eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeZone) closed_zones; 23288eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeZone) full_zones; 23388eea45cSKlaus Jensen uint32_t num_zones; 23488eea45cSKlaus Jensen uint64_t zone_size; 23588eea45cSKlaus Jensen uint64_t zone_capacity; 23688eea45cSKlaus Jensen uint32_t zone_size_log2; 23788eea45cSKlaus Jensen uint8_t *zd_extensions; 23888eea45cSKlaus Jensen int32_t nr_open_zones; 23988eea45cSKlaus Jensen int32_t nr_active_zones; 24088eea45cSKlaus Jensen 24188eea45cSKlaus Jensen NvmeNamespaceParams params; 242534a93d3SNiklas Cassel NvmeSubsystem *subsys; 243*73064edfSJesper Devantier NvmeEnduranceGroup *endgrp; 24488eea45cSKlaus Jensen 24588eea45cSKlaus Jensen struct { 24688eea45cSKlaus Jensen uint32_t err_rec; 24788eea45cSKlaus Jensen } features; 248*73064edfSJesper Devantier 249*73064edfSJesper Devantier struct { 250*73064edfSJesper Devantier uint16_t nphs; 251*73064edfSJesper Devantier /* reclaim unit handle identifiers indexed by placement handle */ 252*73064edfSJesper Devantier uint16_t *phs; 253*73064edfSJesper Devantier } fdp; 25488eea45cSKlaus Jensen } NvmeNamespace; 25588eea45cSKlaus Jensen 25688eea45cSKlaus Jensen static inline uint32_t nvme_nsid(NvmeNamespace *ns) 25788eea45cSKlaus Jensen { 25888eea45cSKlaus Jensen if (ns) { 25988eea45cSKlaus Jensen return ns->params.nsid; 26088eea45cSKlaus Jensen } 26188eea45cSKlaus Jensen 26288eea45cSKlaus Jensen return 0; 26388eea45cSKlaus Jensen } 26488eea45cSKlaus Jensen 26588eea45cSKlaus Jensen static inline size_t nvme_l2b(NvmeNamespace *ns, uint64_t lba) 26688eea45cSKlaus Jensen { 26788eea45cSKlaus Jensen return lba << ns->lbaf.ds; 26888eea45cSKlaus Jensen } 26988eea45cSKlaus Jensen 27088eea45cSKlaus Jensen static inline size_t nvme_m2b(NvmeNamespace *ns, uint64_t lba) 27188eea45cSKlaus Jensen { 27288eea45cSKlaus Jensen return ns->lbaf.ms * lba; 27388eea45cSKlaus Jensen } 27488eea45cSKlaus Jensen 27588eea45cSKlaus Jensen static inline int64_t nvme_moff(NvmeNamespace *ns, uint64_t lba) 27688eea45cSKlaus Jensen { 27788eea45cSKlaus Jensen return ns->moff + nvme_m2b(ns, lba); 27888eea45cSKlaus Jensen } 27988eea45cSKlaus Jensen 28088eea45cSKlaus Jensen static inline bool nvme_ns_ext(NvmeNamespace *ns) 28188eea45cSKlaus Jensen { 28288eea45cSKlaus Jensen return !!NVME_ID_NS_FLBAS_EXTENDED(ns->id_ns.flbas); 28388eea45cSKlaus Jensen } 28488eea45cSKlaus Jensen 28588eea45cSKlaus Jensen static inline NvmeZoneState nvme_get_zone_state(NvmeZone *zone) 28688eea45cSKlaus Jensen { 28788eea45cSKlaus Jensen return zone->d.zs >> 4; 28888eea45cSKlaus Jensen } 28988eea45cSKlaus Jensen 29088eea45cSKlaus Jensen static inline void nvme_set_zone_state(NvmeZone *zone, NvmeZoneState state) 29188eea45cSKlaus Jensen { 29288eea45cSKlaus Jensen zone->d.zs = state << 4; 29388eea45cSKlaus Jensen } 29488eea45cSKlaus Jensen 29588eea45cSKlaus Jensen static inline uint64_t nvme_zone_rd_boundary(NvmeNamespace *ns, NvmeZone *zone) 29688eea45cSKlaus Jensen { 29788eea45cSKlaus Jensen return zone->d.zslba + ns->zone_size; 29888eea45cSKlaus Jensen } 29988eea45cSKlaus Jensen 30088eea45cSKlaus Jensen static inline uint64_t nvme_zone_wr_boundary(NvmeZone *zone) 30188eea45cSKlaus Jensen { 30288eea45cSKlaus Jensen return zone->d.zslba + zone->d.zcap; 30388eea45cSKlaus Jensen } 30488eea45cSKlaus Jensen 30588eea45cSKlaus Jensen static inline bool nvme_wp_is_valid(NvmeZone *zone) 30688eea45cSKlaus Jensen { 30788eea45cSKlaus Jensen uint8_t st = nvme_get_zone_state(zone); 30888eea45cSKlaus Jensen 30988eea45cSKlaus Jensen return st != NVME_ZONE_STATE_FULL && 31088eea45cSKlaus Jensen st != NVME_ZONE_STATE_READ_ONLY && 31188eea45cSKlaus Jensen st != NVME_ZONE_STATE_OFFLINE; 31288eea45cSKlaus Jensen } 31388eea45cSKlaus Jensen 31488eea45cSKlaus Jensen static inline uint8_t *nvme_get_zd_extension(NvmeNamespace *ns, 31588eea45cSKlaus Jensen uint32_t zone_idx) 31688eea45cSKlaus Jensen { 31788eea45cSKlaus Jensen return &ns->zd_extensions[zone_idx * ns->params.zd_extension_size]; 31888eea45cSKlaus Jensen } 31988eea45cSKlaus Jensen 32088eea45cSKlaus Jensen static inline void nvme_aor_inc_open(NvmeNamespace *ns) 32188eea45cSKlaus Jensen { 32288eea45cSKlaus Jensen assert(ns->nr_open_zones >= 0); 32388eea45cSKlaus Jensen if (ns->params.max_open_zones) { 32488eea45cSKlaus Jensen ns->nr_open_zones++; 32588eea45cSKlaus Jensen assert(ns->nr_open_zones <= ns->params.max_open_zones); 32688eea45cSKlaus Jensen } 32788eea45cSKlaus Jensen } 32888eea45cSKlaus Jensen 32988eea45cSKlaus Jensen static inline void nvme_aor_dec_open(NvmeNamespace *ns) 33088eea45cSKlaus Jensen { 33188eea45cSKlaus Jensen if (ns->params.max_open_zones) { 33288eea45cSKlaus Jensen assert(ns->nr_open_zones > 0); 33388eea45cSKlaus Jensen ns->nr_open_zones--; 33488eea45cSKlaus Jensen } 33588eea45cSKlaus Jensen assert(ns->nr_open_zones >= 0); 33688eea45cSKlaus Jensen } 33788eea45cSKlaus Jensen 33888eea45cSKlaus Jensen static inline void nvme_aor_inc_active(NvmeNamespace *ns) 33988eea45cSKlaus Jensen { 34088eea45cSKlaus Jensen assert(ns->nr_active_zones >= 0); 34188eea45cSKlaus Jensen if (ns->params.max_active_zones) { 34288eea45cSKlaus Jensen ns->nr_active_zones++; 34388eea45cSKlaus Jensen assert(ns->nr_active_zones <= ns->params.max_active_zones); 34488eea45cSKlaus Jensen } 34588eea45cSKlaus Jensen } 34688eea45cSKlaus Jensen 34788eea45cSKlaus Jensen static inline void nvme_aor_dec_active(NvmeNamespace *ns) 34888eea45cSKlaus Jensen { 34988eea45cSKlaus Jensen if (ns->params.max_active_zones) { 35088eea45cSKlaus Jensen assert(ns->nr_active_zones > 0); 35188eea45cSKlaus Jensen ns->nr_active_zones--; 35288eea45cSKlaus Jensen assert(ns->nr_active_zones >= ns->nr_open_zones); 35388eea45cSKlaus Jensen } 35488eea45cSKlaus Jensen assert(ns->nr_active_zones >= 0); 35588eea45cSKlaus Jensen } 35688eea45cSKlaus Jensen 357*73064edfSJesper Devantier static inline void nvme_fdp_stat_inc(uint64_t *a, uint64_t b) 358*73064edfSJesper Devantier { 359*73064edfSJesper Devantier uint64_t ret = *a + b; 360*73064edfSJesper Devantier *a = ret < *a ? UINT64_MAX : ret; 361*73064edfSJesper Devantier } 362*73064edfSJesper Devantier 36388eea45cSKlaus Jensen void nvme_ns_init_format(NvmeNamespace *ns); 3645e4f6bccSKlaus Jensen int nvme_ns_setup(NvmeNamespace *ns, Error **errp); 36588eea45cSKlaus Jensen void nvme_ns_drain(NvmeNamespace *ns); 36688eea45cSKlaus Jensen void nvme_ns_shutdown(NvmeNamespace *ns); 36788eea45cSKlaus Jensen void nvme_ns_cleanup(NvmeNamespace *ns); 36888eea45cSKlaus Jensen 36988eea45cSKlaus Jensen typedef struct NvmeAsyncEvent { 37088eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeAsyncEvent) entry; 37188eea45cSKlaus Jensen NvmeAerResult result; 37288eea45cSKlaus Jensen } NvmeAsyncEvent; 37388eea45cSKlaus Jensen 37488eea45cSKlaus Jensen enum { 37588eea45cSKlaus Jensen NVME_SG_ALLOC = 1 << 0, 37688eea45cSKlaus Jensen NVME_SG_DMA = 1 << 1, 37788eea45cSKlaus Jensen }; 37888eea45cSKlaus Jensen 37988eea45cSKlaus Jensen typedef struct NvmeSg { 38088eea45cSKlaus Jensen int flags; 38188eea45cSKlaus Jensen 38288eea45cSKlaus Jensen union { 38388eea45cSKlaus Jensen QEMUSGList qsg; 38488eea45cSKlaus Jensen QEMUIOVector iov; 38588eea45cSKlaus Jensen }; 38688eea45cSKlaus Jensen } NvmeSg; 38788eea45cSKlaus Jensen 38888eea45cSKlaus Jensen typedef enum NvmeTxDirection { 38988eea45cSKlaus Jensen NVME_TX_DIRECTION_TO_DEVICE = 0, 39088eea45cSKlaus Jensen NVME_TX_DIRECTION_FROM_DEVICE = 1, 39188eea45cSKlaus Jensen } NvmeTxDirection; 39288eea45cSKlaus Jensen 39388eea45cSKlaus Jensen typedef struct NvmeRequest { 39488eea45cSKlaus Jensen struct NvmeSQueue *sq; 39588eea45cSKlaus Jensen struct NvmeNamespace *ns; 39688eea45cSKlaus Jensen BlockAIOCB *aiocb; 39788eea45cSKlaus Jensen uint16_t status; 39888eea45cSKlaus Jensen void *opaque; 39988eea45cSKlaus Jensen NvmeCqe cqe; 40088eea45cSKlaus Jensen NvmeCmd cmd; 40188eea45cSKlaus Jensen BlockAcctCookie acct; 40288eea45cSKlaus Jensen NvmeSg sg; 40388eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeRequest)entry; 40488eea45cSKlaus Jensen } NvmeRequest; 40588eea45cSKlaus Jensen 40688eea45cSKlaus Jensen typedef struct NvmeBounceContext { 40788eea45cSKlaus Jensen NvmeRequest *req; 40888eea45cSKlaus Jensen 40988eea45cSKlaus Jensen struct { 41088eea45cSKlaus Jensen QEMUIOVector iov; 41188eea45cSKlaus Jensen uint8_t *bounce; 41288eea45cSKlaus Jensen } data, mdata; 41388eea45cSKlaus Jensen } NvmeBounceContext; 41488eea45cSKlaus Jensen 41588eea45cSKlaus Jensen static inline const char *nvme_adm_opc_str(uint8_t opc) 41688eea45cSKlaus Jensen { 41788eea45cSKlaus Jensen switch (opc) { 41888eea45cSKlaus Jensen case NVME_ADM_CMD_DELETE_SQ: return "NVME_ADM_CMD_DELETE_SQ"; 41988eea45cSKlaus Jensen case NVME_ADM_CMD_CREATE_SQ: return "NVME_ADM_CMD_CREATE_SQ"; 42088eea45cSKlaus Jensen case NVME_ADM_CMD_GET_LOG_PAGE: return "NVME_ADM_CMD_GET_LOG_PAGE"; 42188eea45cSKlaus Jensen case NVME_ADM_CMD_DELETE_CQ: return "NVME_ADM_CMD_DELETE_CQ"; 42288eea45cSKlaus Jensen case NVME_ADM_CMD_CREATE_CQ: return "NVME_ADM_CMD_CREATE_CQ"; 42388eea45cSKlaus Jensen case NVME_ADM_CMD_IDENTIFY: return "NVME_ADM_CMD_IDENTIFY"; 42488eea45cSKlaus Jensen case NVME_ADM_CMD_ABORT: return "NVME_ADM_CMD_ABORT"; 42588eea45cSKlaus Jensen case NVME_ADM_CMD_SET_FEATURES: return "NVME_ADM_CMD_SET_FEATURES"; 42688eea45cSKlaus Jensen case NVME_ADM_CMD_GET_FEATURES: return "NVME_ADM_CMD_GET_FEATURES"; 42788eea45cSKlaus Jensen case NVME_ADM_CMD_ASYNC_EV_REQ: return "NVME_ADM_CMD_ASYNC_EV_REQ"; 42888eea45cSKlaus Jensen case NVME_ADM_CMD_NS_ATTACHMENT: return "NVME_ADM_CMD_NS_ATTACHMENT"; 429e181d3daSGollu Appalanaidu case NVME_ADM_CMD_DIRECTIVE_SEND: return "NVME_ADM_CMD_DIRECTIVE_SEND"; 43011871f53SŁukasz Gieryk case NVME_ADM_CMD_VIRT_MNGMT: return "NVME_ADM_CMD_VIRT_MNGMT"; 431e181d3daSGollu Appalanaidu case NVME_ADM_CMD_DIRECTIVE_RECV: return "NVME_ADM_CMD_DIRECTIVE_RECV"; 4323f7fe8deSJinhao Fan case NVME_ADM_CMD_DBBUF_CONFIG: return "NVME_ADM_CMD_DBBUF_CONFIG"; 43388eea45cSKlaus Jensen case NVME_ADM_CMD_FORMAT_NVM: return "NVME_ADM_CMD_FORMAT_NVM"; 43488eea45cSKlaus Jensen default: return "NVME_ADM_CMD_UNKNOWN"; 43588eea45cSKlaus Jensen } 43688eea45cSKlaus Jensen } 43788eea45cSKlaus Jensen 43888eea45cSKlaus Jensen static inline const char *nvme_io_opc_str(uint8_t opc) 43988eea45cSKlaus Jensen { 44088eea45cSKlaus Jensen switch (opc) { 44188eea45cSKlaus Jensen case NVME_CMD_FLUSH: return "NVME_NVM_CMD_FLUSH"; 44288eea45cSKlaus Jensen case NVME_CMD_WRITE: return "NVME_NVM_CMD_WRITE"; 44388eea45cSKlaus Jensen case NVME_CMD_READ: return "NVME_NVM_CMD_READ"; 44488eea45cSKlaus Jensen case NVME_CMD_COMPARE: return "NVME_NVM_CMD_COMPARE"; 44588eea45cSKlaus Jensen case NVME_CMD_WRITE_ZEROES: return "NVME_NVM_CMD_WRITE_ZEROES"; 44688eea45cSKlaus Jensen case NVME_CMD_DSM: return "NVME_NVM_CMD_DSM"; 44788eea45cSKlaus Jensen case NVME_CMD_VERIFY: return "NVME_NVM_CMD_VERIFY"; 44888eea45cSKlaus Jensen case NVME_CMD_COPY: return "NVME_NVM_CMD_COPY"; 44988eea45cSKlaus Jensen case NVME_CMD_ZONE_MGMT_SEND: return "NVME_ZONED_CMD_MGMT_SEND"; 45088eea45cSKlaus Jensen case NVME_CMD_ZONE_MGMT_RECV: return "NVME_ZONED_CMD_MGMT_RECV"; 45188eea45cSKlaus Jensen case NVME_CMD_ZONE_APPEND: return "NVME_ZONED_CMD_ZONE_APPEND"; 45288eea45cSKlaus Jensen default: return "NVME_NVM_CMD_UNKNOWN"; 45388eea45cSKlaus Jensen } 45488eea45cSKlaus Jensen } 45588eea45cSKlaus Jensen 45688eea45cSKlaus Jensen typedef struct NvmeSQueue { 45788eea45cSKlaus Jensen struct NvmeCtrl *ctrl; 45888eea45cSKlaus Jensen uint16_t sqid; 45988eea45cSKlaus Jensen uint16_t cqid; 46088eea45cSKlaus Jensen uint32_t head; 46188eea45cSKlaus Jensen uint32_t tail; 46288eea45cSKlaus Jensen uint32_t size; 46388eea45cSKlaus Jensen uint64_t dma_addr; 4643f7fe8deSJinhao Fan uint64_t db_addr; 4653f7fe8deSJinhao Fan uint64_t ei_addr; 466d38cc6fdSKlaus Jensen QEMUBH *bh; 4672e53b0b4SJinhao Fan EventNotifier notifier; 4682e53b0b4SJinhao Fan bool ioeventfd_enabled; 46988eea45cSKlaus Jensen NvmeRequest *io_req; 47088eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeRequest) req_list; 47188eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeRequest) out_req_list; 47288eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeSQueue) entry; 47388eea45cSKlaus Jensen } NvmeSQueue; 47488eea45cSKlaus Jensen 47588eea45cSKlaus Jensen typedef struct NvmeCQueue { 47688eea45cSKlaus Jensen struct NvmeCtrl *ctrl; 47788eea45cSKlaus Jensen uint8_t phase; 47888eea45cSKlaus Jensen uint16_t cqid; 47988eea45cSKlaus Jensen uint16_t irq_enabled; 48088eea45cSKlaus Jensen uint32_t head; 48188eea45cSKlaus Jensen uint32_t tail; 48288eea45cSKlaus Jensen uint32_t vector; 48388eea45cSKlaus Jensen uint32_t size; 48488eea45cSKlaus Jensen uint64_t dma_addr; 4853f7fe8deSJinhao Fan uint64_t db_addr; 4863f7fe8deSJinhao Fan uint64_t ei_addr; 487d38cc6fdSKlaus Jensen QEMUBH *bh; 4882e53b0b4SJinhao Fan EventNotifier notifier; 4892e53b0b4SJinhao Fan bool ioeventfd_enabled; 49088eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeSQueue) sq_list; 49188eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeRequest) req_list; 49288eea45cSKlaus Jensen } NvmeCQueue; 49388eea45cSKlaus Jensen 49488eea45cSKlaus Jensen #define TYPE_NVME "nvme" 49588eea45cSKlaus Jensen #define NVME(obj) \ 49688eea45cSKlaus Jensen OBJECT_CHECK(NvmeCtrl, (obj), TYPE_NVME) 49788eea45cSKlaus Jensen 49888eea45cSKlaus Jensen typedef struct NvmeParams { 49988eea45cSKlaus Jensen char *serial; 50088eea45cSKlaus Jensen uint32_t num_queues; /* deprecated since 5.1 */ 50188eea45cSKlaus Jensen uint32_t max_ioqpairs; 50288eea45cSKlaus Jensen uint16_t msix_qsize; 50388eea45cSKlaus Jensen uint32_t cmb_size_mb; 50488eea45cSKlaus Jensen uint8_t aerl; 50588eea45cSKlaus Jensen uint32_t aer_max_queued; 50688eea45cSKlaus Jensen uint8_t mdts; 50788eea45cSKlaus Jensen uint8_t vsl; 50888eea45cSKlaus Jensen bool use_intel_id; 50988eea45cSKlaus Jensen uint8_t zasl; 510cccc2651SNiklas Cassel bool auto_transition_zones; 51188eea45cSKlaus Jensen bool legacy_cmb; 5122e53b0b4SJinhao Fan bool ioeventfd; 51344c2c094SLukasz Maniak uint8_t sriov_max_vfs; 514746d42b1SŁukasz Gieryk uint16_t sriov_vq_flexible; 515746d42b1SŁukasz Gieryk uint16_t sriov_vi_flexible; 516746d42b1SŁukasz Gieryk uint8_t sriov_max_vq_per_vf; 517746d42b1SŁukasz Gieryk uint8_t sriov_max_vi_per_vf; 51888eea45cSKlaus Jensen } NvmeParams; 51988eea45cSKlaus Jensen 52088eea45cSKlaus Jensen typedef struct NvmeCtrl { 52188eea45cSKlaus Jensen PCIDevice parent_obj; 52288eea45cSKlaus Jensen MemoryRegion bar0; 52388eea45cSKlaus Jensen MemoryRegion iomem; 52488eea45cSKlaus Jensen NvmeBar bar; 52588eea45cSKlaus Jensen NvmeParams params; 52688eea45cSKlaus Jensen NvmeBus bus; 52788eea45cSKlaus Jensen 52888eea45cSKlaus Jensen uint16_t cntlid; 52988eea45cSKlaus Jensen bool qs_created; 53088eea45cSKlaus Jensen uint32_t page_size; 53188eea45cSKlaus Jensen uint16_t page_bits; 53288eea45cSKlaus Jensen uint16_t max_prp_ents; 53388eea45cSKlaus Jensen uint16_t cqe_size; 53488eea45cSKlaus Jensen uint16_t sqe_size; 53588eea45cSKlaus Jensen uint32_t max_q_ents; 53688eea45cSKlaus Jensen uint8_t outstanding_aers; 53788eea45cSKlaus Jensen uint32_t irq_status; 53883d7ed5cSKlaus Jensen int cq_pending; 53988eea45cSKlaus Jensen uint64_t host_timestamp; /* Timestamp sent by the host */ 54088eea45cSKlaus Jensen uint64_t timestamp_set_qemu_clock_ms; /* QEMU clock time */ 54188eea45cSKlaus Jensen uint64_t starttime_ms; 54288eea45cSKlaus Jensen uint16_t temperature; 54388eea45cSKlaus Jensen uint8_t smart_critical_warning; 544decc0261SŁukasz Gieryk uint32_t conf_msix_qsize; 545decc0261SŁukasz Gieryk uint32_t conf_ioqpairs; 5463f7fe8deSJinhao Fan uint64_t dbbuf_dbs; 5473f7fe8deSJinhao Fan uint64_t dbbuf_eis; 5483f7fe8deSJinhao Fan bool dbbuf_enabled; 54988eea45cSKlaus Jensen 55088eea45cSKlaus Jensen struct { 55188eea45cSKlaus Jensen MemoryRegion mem; 55288eea45cSKlaus Jensen uint8_t *buf; 55388eea45cSKlaus Jensen bool cmse; 55488eea45cSKlaus Jensen hwaddr cba; 55588eea45cSKlaus Jensen } cmb; 55688eea45cSKlaus Jensen 55788eea45cSKlaus Jensen struct { 55888eea45cSKlaus Jensen HostMemoryBackend *dev; 55988eea45cSKlaus Jensen bool cmse; 56088eea45cSKlaus Jensen hwaddr cba; 56188eea45cSKlaus Jensen } pmr; 56288eea45cSKlaus Jensen 56388eea45cSKlaus Jensen uint8_t aer_mask; 56488eea45cSKlaus Jensen NvmeRequest **aer_reqs; 56588eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeAsyncEvent) aer_queue; 56688eea45cSKlaus Jensen int aer_queued; 56788eea45cSKlaus Jensen 56888eea45cSKlaus Jensen uint32_t dmrsl; 56988eea45cSKlaus Jensen 57088eea45cSKlaus Jensen /* Namespace ID is started with 1 so bitmap should be 1-based */ 57188eea45cSKlaus Jensen #define NVME_CHANGED_NSID_SIZE (NVME_MAX_NAMESPACES + 1) 57288eea45cSKlaus Jensen DECLARE_BITMAP(changed_nsids, NVME_CHANGED_NSID_SIZE); 57388eea45cSKlaus Jensen 57488eea45cSKlaus Jensen NvmeSubsystem *subsys; 57588eea45cSKlaus Jensen 57688eea45cSKlaus Jensen NvmeNamespace namespace; 57788eea45cSKlaus Jensen NvmeNamespace *namespaces[NVME_MAX_NAMESPACES + 1]; 57888eea45cSKlaus Jensen NvmeSQueue **sq; 57988eea45cSKlaus Jensen NvmeCQueue **cq; 58088eea45cSKlaus Jensen NvmeSQueue admin_sq; 58188eea45cSKlaus Jensen NvmeCQueue admin_cq; 58288eea45cSKlaus Jensen NvmeIdCtrl id_ctrl; 58388eea45cSKlaus Jensen 58488eea45cSKlaus Jensen struct { 58588eea45cSKlaus Jensen struct { 58688eea45cSKlaus Jensen uint16_t temp_thresh_hi; 58788eea45cSKlaus Jensen uint16_t temp_thresh_low; 58888eea45cSKlaus Jensen }; 589d0c0697bSNaveen Nagar 59088eea45cSKlaus Jensen uint32_t async_config; 591d0c0697bSNaveen Nagar NvmeHostBehaviorSupport hbs; 59288eea45cSKlaus Jensen } features; 5935e6f963fSLukasz Maniak 5945e6f963fSLukasz Maniak NvmePriCtrlCap pri_ctrl_cap; 59599f48ae7SLukasz Maniak NvmeSecCtrlList sec_ctrl_list; 59611871f53SŁukasz Gieryk struct { 59711871f53SŁukasz Gieryk uint16_t vqrfap; 59811871f53SŁukasz Gieryk uint16_t virfap; 59911871f53SŁukasz Gieryk } next_pri_ctrl_cap; /* These override pri_ctrl_cap after reset */ 60088eea45cSKlaus Jensen } NvmeCtrl; 60188eea45cSKlaus Jensen 6021e9c685eSŁukasz Gieryk typedef enum NvmeResetType { 6031e9c685eSŁukasz Gieryk NVME_RESET_FUNCTION = 0, 6041e9c685eSŁukasz Gieryk NVME_RESET_CONTROLLER = 1, 6051e9c685eSŁukasz Gieryk } NvmeResetType; 6061e9c685eSŁukasz Gieryk 60788eea45cSKlaus Jensen static inline NvmeNamespace *nvme_ns(NvmeCtrl *n, uint32_t nsid) 60888eea45cSKlaus Jensen { 60988eea45cSKlaus Jensen if (!nsid || nsid > NVME_MAX_NAMESPACES) { 61088eea45cSKlaus Jensen return NULL; 61188eea45cSKlaus Jensen } 61288eea45cSKlaus Jensen 61388eea45cSKlaus Jensen return n->namespaces[nsid]; 61488eea45cSKlaus Jensen } 61588eea45cSKlaus Jensen 61688eea45cSKlaus Jensen static inline NvmeCQueue *nvme_cq(NvmeRequest *req) 61788eea45cSKlaus Jensen { 61888eea45cSKlaus Jensen NvmeSQueue *sq = req->sq; 61988eea45cSKlaus Jensen NvmeCtrl *n = sq->ctrl; 62088eea45cSKlaus Jensen 62188eea45cSKlaus Jensen return n->cq[sq->cqid]; 62288eea45cSKlaus Jensen } 62388eea45cSKlaus Jensen 62488eea45cSKlaus Jensen static inline NvmeCtrl *nvme_ctrl(NvmeRequest *req) 62588eea45cSKlaus Jensen { 62688eea45cSKlaus Jensen NvmeSQueue *sq = req->sq; 62788eea45cSKlaus Jensen return sq->ctrl; 62888eea45cSKlaus Jensen } 62988eea45cSKlaus Jensen 63088eea45cSKlaus Jensen static inline uint16_t nvme_cid(NvmeRequest *req) 63188eea45cSKlaus Jensen { 63288eea45cSKlaus Jensen if (!req) { 63388eea45cSKlaus Jensen return 0xffff; 63488eea45cSKlaus Jensen } 63588eea45cSKlaus Jensen 63688eea45cSKlaus Jensen return le16_to_cpu(req->cqe.cid); 63788eea45cSKlaus Jensen } 63888eea45cSKlaus Jensen 63999f48ae7SLukasz Maniak static inline NvmeSecCtrlEntry *nvme_sctrl(NvmeCtrl *n) 64099f48ae7SLukasz Maniak { 64199f48ae7SLukasz Maniak PCIDevice *pci_dev = &n->parent_obj; 64299f48ae7SLukasz Maniak NvmeCtrl *pf = NVME(pcie_sriov_get_pf(pci_dev)); 64399f48ae7SLukasz Maniak 64499f48ae7SLukasz Maniak if (pci_is_vf(pci_dev)) { 64599f48ae7SLukasz Maniak return &pf->sec_ctrl_list.sec[pcie_sriov_vf_number(pci_dev)]; 64699f48ae7SLukasz Maniak } 64799f48ae7SLukasz Maniak 64899f48ae7SLukasz Maniak return NULL; 64999f48ae7SLukasz Maniak } 65099f48ae7SLukasz Maniak 65111871f53SŁukasz Gieryk static inline NvmeSecCtrlEntry *nvme_sctrl_for_cntlid(NvmeCtrl *n, 65211871f53SŁukasz Gieryk uint16_t cntlid) 65311871f53SŁukasz Gieryk { 65411871f53SŁukasz Gieryk NvmeSecCtrlList *list = &n->sec_ctrl_list; 65511871f53SŁukasz Gieryk uint8_t i; 65611871f53SŁukasz Gieryk 65711871f53SŁukasz Gieryk for (i = 0; i < list->numcntl; i++) { 65811871f53SŁukasz Gieryk if (le16_to_cpu(list->sec[i].scid) == cntlid) { 65911871f53SŁukasz Gieryk return &list->sec[i]; 66011871f53SŁukasz Gieryk } 66111871f53SŁukasz Gieryk } 66211871f53SŁukasz Gieryk 66311871f53SŁukasz Gieryk return NULL; 66411871f53SŁukasz Gieryk } 66511871f53SŁukasz Gieryk 66688eea45cSKlaus Jensen void nvme_attach_ns(NvmeCtrl *n, NvmeNamespace *ns); 6678d3a17beSPhilippe Mathieu-Daudé uint16_t nvme_bounce_data(NvmeCtrl *n, void *ptr, uint32_t len, 66888eea45cSKlaus Jensen NvmeTxDirection dir, NvmeRequest *req); 6698d3a17beSPhilippe Mathieu-Daudé uint16_t nvme_bounce_mdata(NvmeCtrl *n, void *ptr, uint32_t len, 67088eea45cSKlaus Jensen NvmeTxDirection dir, NvmeRequest *req); 67188eea45cSKlaus Jensen void nvme_rw_complete_cb(void *opaque, int ret); 67288eea45cSKlaus Jensen uint16_t nvme_map_dptr(NvmeCtrl *n, NvmeSg *sg, size_t len, 67388eea45cSKlaus Jensen NvmeCmd *cmd); 67488eea45cSKlaus Jensen 67552581c71SMarkus Armbruster #endif /* HW_NVME_NVME_H */ 676