188eea45cSKlaus Jensen /* 288eea45cSKlaus Jensen * QEMU NVM Express 388eea45cSKlaus Jensen * 488eea45cSKlaus Jensen * Copyright (c) 2012 Intel Corporation 588eea45cSKlaus Jensen * Copyright (c) 2021 Minwoo Im 688eea45cSKlaus Jensen * Copyright (c) 2021 Samsung Electronics Co., Ltd. 788eea45cSKlaus Jensen * 888eea45cSKlaus Jensen * Authors: 988eea45cSKlaus Jensen * Keith Busch <kbusch@kernel.org> 1088eea45cSKlaus Jensen * Klaus Jensen <k.jensen@samsung.com> 1188eea45cSKlaus Jensen * Gollu Appalanaidu <anaidu.gollu@samsung.com> 1288eea45cSKlaus Jensen * Dmitry Fomichev <dmitry.fomichev@wdc.com> 1388eea45cSKlaus Jensen * Minwoo Im <minwoo.im.dev@gmail.com> 1488eea45cSKlaus Jensen * 1588eea45cSKlaus Jensen * This code is licensed under the GNU GPL v2 or later. 1688eea45cSKlaus Jensen */ 1788eea45cSKlaus Jensen 1852581c71SMarkus Armbruster #ifndef HW_NVME_NVME_H 1952581c71SMarkus Armbruster #define HW_NVME_NVME_H 2088eea45cSKlaus Jensen 2188eea45cSKlaus Jensen #include "qemu/uuid.h" 22edf5ca5dSMarkus Armbruster #include "hw/pci/pci_device.h" 2388eea45cSKlaus Jensen #include "hw/block/block.h" 2488eea45cSKlaus Jensen 2588eea45cSKlaus Jensen #include "block/nvme.h" 2688eea45cSKlaus Jensen 2744c2c094SLukasz Maniak #define NVME_MAX_CONTROLLERS 256 2888eea45cSKlaus Jensen #define NVME_MAX_NAMESPACES 256 293276dde4SHeinrich Schuchardt #define NVME_EUI64_DEFAULT ((uint64_t)0x5254000000000000) 3073064edfSJesper Devantier #define NVME_FDP_MAX_EVENTS 63 3173064edfSJesper Devantier #define NVME_FDP_MAXPIDS 128 3288eea45cSKlaus Jensen 336a33f2e9SKlaus Jensen /* 346a33f2e9SKlaus Jensen * The controller only supports Submission and Completion Queue Entry Sizes of 356a33f2e9SKlaus Jensen * 64 and 16 bytes respectively. 366a33f2e9SKlaus Jensen */ 376a33f2e9SKlaus Jensen #define NVME_SQES 6 386a33f2e9SKlaus Jensen #define NVME_CQES 4 396a33f2e9SKlaus Jensen 4038f4ac65SKlaus Jensen QEMU_BUILD_BUG_ON(NVME_MAX_NAMESPACES > NVME_NSID_BROADCAST - 1); 4138f4ac65SKlaus Jensen 4288eea45cSKlaus Jensen typedef struct NvmeCtrl NvmeCtrl; 4388eea45cSKlaus Jensen typedef struct NvmeNamespace NvmeNamespace; 4488eea45cSKlaus Jensen 455ffbaeedSKlaus Jensen #define TYPE_NVME_BUS "nvme-bus" 465ffbaeedSKlaus Jensen OBJECT_DECLARE_SIMPLE_TYPE(NvmeBus, NVME_BUS) 475ffbaeedSKlaus Jensen 485ffbaeedSKlaus Jensen typedef struct NvmeBus { 495ffbaeedSKlaus Jensen BusState parent_bus; 505ffbaeedSKlaus Jensen } NvmeBus; 515ffbaeedSKlaus Jensen 5288eea45cSKlaus Jensen #define TYPE_NVME_SUBSYS "nvme-subsys" 5388eea45cSKlaus Jensen #define NVME_SUBSYS(obj) \ 5488eea45cSKlaus Jensen OBJECT_CHECK(NvmeSubsystem, (obj), TYPE_NVME_SUBSYS) 5599f48ae7SLukasz Maniak #define SUBSYS_SLOT_RSVD (void *)0xFFFF 5688eea45cSKlaus Jensen 5773064edfSJesper Devantier typedef struct NvmeReclaimUnit { 5873064edfSJesper Devantier uint64_t ruamw; 5973064edfSJesper Devantier } NvmeReclaimUnit; 6073064edfSJesper Devantier 6173064edfSJesper Devantier typedef struct NvmeRuHandle { 6273064edfSJesper Devantier uint8_t ruht; 6373064edfSJesper Devantier uint8_t ruha; 6473064edfSJesper Devantier uint64_t event_filter; 6573064edfSJesper Devantier uint8_t lbafi; 6673064edfSJesper Devantier uint64_t ruamw; 6773064edfSJesper Devantier 6873064edfSJesper Devantier /* reclaim units indexed by reclaim group */ 6973064edfSJesper Devantier NvmeReclaimUnit *rus; 7073064edfSJesper Devantier } NvmeRuHandle; 7173064edfSJesper Devantier 7273064edfSJesper Devantier typedef struct NvmeFdpEventBuffer { 7373064edfSJesper Devantier NvmeFdpEvent events[NVME_FDP_MAX_EVENTS]; 7473064edfSJesper Devantier unsigned int nelems; 7573064edfSJesper Devantier unsigned int start; 7673064edfSJesper Devantier unsigned int next; 7773064edfSJesper Devantier } NvmeFdpEventBuffer; 7873064edfSJesper Devantier 79771dbc3aSKlaus Jensen typedef struct NvmeEnduranceGroup { 80771dbc3aSKlaus Jensen uint8_t event_conf; 8173064edfSJesper Devantier 8273064edfSJesper Devantier struct { 8373064edfSJesper Devantier NvmeFdpEventBuffer host_events, ctrl_events; 8473064edfSJesper Devantier 8573064edfSJesper Devantier uint16_t nruh; 8673064edfSJesper Devantier uint16_t nrg; 8773064edfSJesper Devantier uint8_t rgif; 8873064edfSJesper Devantier uint64_t runs; 8973064edfSJesper Devantier 9073064edfSJesper Devantier uint64_t hbmw; 9173064edfSJesper Devantier uint64_t mbmw; 9273064edfSJesper Devantier uint64_t mbe; 9373064edfSJesper Devantier 9473064edfSJesper Devantier bool enabled; 9573064edfSJesper Devantier 9673064edfSJesper Devantier NvmeRuHandle *ruhs; 9773064edfSJesper Devantier } fdp; 98771dbc3aSKlaus Jensen } NvmeEnduranceGroup; 99771dbc3aSKlaus Jensen 10088eea45cSKlaus Jensen typedef struct NvmeSubsystem { 10188eea45cSKlaus Jensen DeviceState parent_obj; 1025ffbaeedSKlaus Jensen NvmeBus bus; 10388eea45cSKlaus Jensen uint8_t subnqn[256]; 104a859eb9fSKlaus Jensen char *serial; 10588eea45cSKlaus Jensen 10688eea45cSKlaus Jensen NvmeCtrl *ctrls[NVME_MAX_CONTROLLERS]; 10788eea45cSKlaus Jensen NvmeNamespace *namespaces[NVME_MAX_NAMESPACES + 1]; 10873064edfSJesper Devantier NvmeEnduranceGroup endgrp; 10988eea45cSKlaus Jensen 11088eea45cSKlaus Jensen struct { 11188eea45cSKlaus Jensen char *nqn; 11273064edfSJesper Devantier 11373064edfSJesper Devantier struct { 11473064edfSJesper Devantier bool enabled; 11573064edfSJesper Devantier uint64_t runs; 11673064edfSJesper Devantier uint16_t nruh; 11773064edfSJesper Devantier uint32_t nrg; 11873064edfSJesper Devantier } fdp; 11988eea45cSKlaus Jensen } params; 12088eea45cSKlaus Jensen } NvmeSubsystem; 12188eea45cSKlaus Jensen 12288eea45cSKlaus Jensen int nvme_subsys_register_ctrl(NvmeCtrl *n, Error **errp); 123b0fde9e8SKlaus Jensen void nvme_subsys_unregister_ctrl(NvmeSubsystem *subsys, NvmeCtrl *n); 12488eea45cSKlaus Jensen 12588eea45cSKlaus Jensen static inline NvmeCtrl *nvme_subsys_ctrl(NvmeSubsystem *subsys, 12688eea45cSKlaus Jensen uint32_t cntlid) 12788eea45cSKlaus Jensen { 12888eea45cSKlaus Jensen if (!subsys || cntlid >= NVME_MAX_CONTROLLERS) { 12988eea45cSKlaus Jensen return NULL; 13088eea45cSKlaus Jensen } 13188eea45cSKlaus Jensen 13299f48ae7SLukasz Maniak if (subsys->ctrls[cntlid] == SUBSYS_SLOT_RSVD) { 13399f48ae7SLukasz Maniak return NULL; 13499f48ae7SLukasz Maniak } 13599f48ae7SLukasz Maniak 13688eea45cSKlaus Jensen return subsys->ctrls[cntlid]; 13788eea45cSKlaus Jensen } 13888eea45cSKlaus Jensen 13988eea45cSKlaus Jensen static inline NvmeNamespace *nvme_subsys_ns(NvmeSubsystem *subsys, 14088eea45cSKlaus Jensen uint32_t nsid) 14188eea45cSKlaus Jensen { 14288eea45cSKlaus Jensen if (!subsys || !nsid || nsid > NVME_MAX_NAMESPACES) { 14388eea45cSKlaus Jensen return NULL; 14488eea45cSKlaus Jensen } 14588eea45cSKlaus Jensen 14688eea45cSKlaus Jensen return subsys->namespaces[nsid]; 14788eea45cSKlaus Jensen } 14888eea45cSKlaus Jensen 14988eea45cSKlaus Jensen #define TYPE_NVME_NS "nvme-ns" 15088eea45cSKlaus Jensen #define NVME_NS(obj) \ 15188eea45cSKlaus Jensen OBJECT_CHECK(NvmeNamespace, (obj), TYPE_NVME_NS) 15288eea45cSKlaus Jensen 15388eea45cSKlaus Jensen typedef struct NvmeZone { 15488eea45cSKlaus Jensen NvmeZoneDescr d; 15588eea45cSKlaus Jensen uint64_t w_ptr; 15688eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeZone) entry; 15788eea45cSKlaus Jensen } NvmeZone; 15888eea45cSKlaus Jensen 15973064edfSJesper Devantier #define FDP_EVT_MAX 0xff 16073064edfSJesper Devantier #define NVME_FDP_MAX_NS_RUHS 32u 16173064edfSJesper Devantier #define FDPVSS 0 16273064edfSJesper Devantier 16373064edfSJesper Devantier static const uint8_t nvme_fdp_evf_shifts[FDP_EVT_MAX] = { 16473064edfSJesper Devantier /* Host events */ 16573064edfSJesper Devantier [FDP_EVT_RU_NOT_FULLY_WRITTEN] = 0, 16673064edfSJesper Devantier [FDP_EVT_RU_ATL_EXCEEDED] = 1, 16773064edfSJesper Devantier [FDP_EVT_CTRL_RESET_RUH] = 2, 16873064edfSJesper Devantier [FDP_EVT_INVALID_PID] = 3, 16973064edfSJesper Devantier /* CTRL events */ 17073064edfSJesper Devantier [FDP_EVT_MEDIA_REALLOC] = 32, 17173064edfSJesper Devantier [FDP_EVT_RUH_IMPLICIT_RU_CHANGE] = 33, 17273064edfSJesper Devantier }; 17373064edfSJesper Devantier 174*bdc31646SRoque Arcudia Hernandez #define NGUID_LEN 16 175*bdc31646SRoque Arcudia Hernandez 176*bdc31646SRoque Arcudia Hernandez typedef struct { 177*bdc31646SRoque Arcudia Hernandez uint8_t data[NGUID_LEN]; 178*bdc31646SRoque Arcudia Hernandez } NvmeNGUID; 179*bdc31646SRoque Arcudia Hernandez 180*bdc31646SRoque Arcudia Hernandez bool nvme_nguid_is_null(const NvmeNGUID *nguid); 181*bdc31646SRoque Arcudia Hernandez 182*bdc31646SRoque Arcudia Hernandez extern const PropertyInfo qdev_prop_nguid; 183*bdc31646SRoque Arcudia Hernandez 184*bdc31646SRoque Arcudia Hernandez #define DEFINE_PROP_NGUID_NODEFAULT(_name, _state, _field) \ 185*bdc31646SRoque Arcudia Hernandez DEFINE_PROP(_name, _state, _field, qdev_prop_nguid, NvmeNGUID) 186*bdc31646SRoque Arcudia Hernandez 18788eea45cSKlaus Jensen typedef struct NvmeNamespaceParams { 18888eea45cSKlaus Jensen bool detached; 18988eea45cSKlaus Jensen bool shared; 19088eea45cSKlaus Jensen uint32_t nsid; 19188eea45cSKlaus Jensen QemuUUID uuid; 192*bdc31646SRoque Arcudia Hernandez NvmeNGUID nguid; 1936870cfb8SHeinrich Schuchardt uint64_t eui64; 1943276dde4SHeinrich Schuchardt bool eui64_default; 19588eea45cSKlaus Jensen 19688eea45cSKlaus Jensen uint16_t ms; 19788eea45cSKlaus Jensen uint8_t mset; 19888eea45cSKlaus Jensen uint8_t pi; 19988eea45cSKlaus Jensen uint8_t pil; 20044219b60SNaveen Nagar uint8_t pif; 20188eea45cSKlaus Jensen 20288eea45cSKlaus Jensen uint16_t mssrl; 20388eea45cSKlaus Jensen uint32_t mcl; 20488eea45cSKlaus Jensen uint8_t msrc; 20588eea45cSKlaus Jensen 20688eea45cSKlaus Jensen bool zoned; 20788eea45cSKlaus Jensen bool cross_zone_read; 20888eea45cSKlaus Jensen uint64_t zone_size_bs; 20988eea45cSKlaus Jensen uint64_t zone_cap_bs; 21088eea45cSKlaus Jensen uint32_t max_active_zones; 21188eea45cSKlaus Jensen uint32_t max_open_zones; 21288eea45cSKlaus Jensen uint32_t zd_extension_size; 213e321b4cdSKlaus Jensen 214e321b4cdSKlaus Jensen uint32_t numzrwa; 215e321b4cdSKlaus Jensen uint64_t zrwas; 216e321b4cdSKlaus Jensen uint64_t zrwafg; 21773064edfSJesper Devantier 21873064edfSJesper Devantier struct { 21973064edfSJesper Devantier char *ruhs; 22073064edfSJesper Devantier } fdp; 22188eea45cSKlaus Jensen } NvmeNamespaceParams; 22288eea45cSKlaus Jensen 22388eea45cSKlaus Jensen typedef struct NvmeNamespace { 22488eea45cSKlaus Jensen DeviceState parent_obj; 22588eea45cSKlaus Jensen BlockConf blkconf; 22688eea45cSKlaus Jensen int32_t bootindex; 22788eea45cSKlaus Jensen int64_t size; 22888eea45cSKlaus Jensen int64_t moff; 22988eea45cSKlaus Jensen NvmeIdNs id_ns; 23044219b60SNaveen Nagar NvmeIdNsNvm id_ns_nvm; 23188eea45cSKlaus Jensen NvmeLBAF lbaf; 232763c05dfSNaveen Nagar unsigned int nlbaf; 23388eea45cSKlaus Jensen size_t lbasz; 23488eea45cSKlaus Jensen const uint32_t *iocs; 23588eea45cSKlaus Jensen uint8_t csi; 23688eea45cSKlaus Jensen uint16_t status; 23788eea45cSKlaus Jensen int attached; 23844219b60SNaveen Nagar uint8_t pif; 23988eea45cSKlaus Jensen 240e321b4cdSKlaus Jensen struct { 241e321b4cdSKlaus Jensen uint16_t zrwas; 242e321b4cdSKlaus Jensen uint16_t zrwafg; 243e321b4cdSKlaus Jensen uint32_t numzrwa; 244e321b4cdSKlaus Jensen } zns; 245e321b4cdSKlaus Jensen 24688eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeNamespace) entry; 24788eea45cSKlaus Jensen 24888eea45cSKlaus Jensen NvmeIdNsZoned *id_ns_zoned; 24988eea45cSKlaus Jensen NvmeZone *zone_array; 25088eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeZone) exp_open_zones; 25188eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeZone) imp_open_zones; 25288eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeZone) closed_zones; 25388eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeZone) full_zones; 25488eea45cSKlaus Jensen uint32_t num_zones; 25588eea45cSKlaus Jensen uint64_t zone_size; 25688eea45cSKlaus Jensen uint64_t zone_capacity; 25788eea45cSKlaus Jensen uint32_t zone_size_log2; 25888eea45cSKlaus Jensen uint8_t *zd_extensions; 25988eea45cSKlaus Jensen int32_t nr_open_zones; 26088eea45cSKlaus Jensen int32_t nr_active_zones; 26188eea45cSKlaus Jensen 26288eea45cSKlaus Jensen NvmeNamespaceParams params; 263534a93d3SNiklas Cassel NvmeSubsystem *subsys; 26473064edfSJesper Devantier NvmeEnduranceGroup *endgrp; 26588eea45cSKlaus Jensen 26688eea45cSKlaus Jensen struct { 26788eea45cSKlaus Jensen uint32_t err_rec; 26888eea45cSKlaus Jensen } features; 26973064edfSJesper Devantier 27073064edfSJesper Devantier struct { 27173064edfSJesper Devantier uint16_t nphs; 27273064edfSJesper Devantier /* reclaim unit handle identifiers indexed by placement handle */ 27373064edfSJesper Devantier uint16_t *phs; 27473064edfSJesper Devantier } fdp; 27588eea45cSKlaus Jensen } NvmeNamespace; 27688eea45cSKlaus Jensen 27788eea45cSKlaus Jensen static inline uint32_t nvme_nsid(NvmeNamespace *ns) 27888eea45cSKlaus Jensen { 27988eea45cSKlaus Jensen if (ns) { 28088eea45cSKlaus Jensen return ns->params.nsid; 28188eea45cSKlaus Jensen } 28288eea45cSKlaus Jensen 28388eea45cSKlaus Jensen return 0; 28488eea45cSKlaus Jensen } 28588eea45cSKlaus Jensen 28688eea45cSKlaus Jensen static inline size_t nvme_l2b(NvmeNamespace *ns, uint64_t lba) 28788eea45cSKlaus Jensen { 28888eea45cSKlaus Jensen return lba << ns->lbaf.ds; 28988eea45cSKlaus Jensen } 29088eea45cSKlaus Jensen 29188eea45cSKlaus Jensen static inline size_t nvme_m2b(NvmeNamespace *ns, uint64_t lba) 29288eea45cSKlaus Jensen { 29388eea45cSKlaus Jensen return ns->lbaf.ms * lba; 29488eea45cSKlaus Jensen } 29588eea45cSKlaus Jensen 29688eea45cSKlaus Jensen static inline int64_t nvme_moff(NvmeNamespace *ns, uint64_t lba) 29788eea45cSKlaus Jensen { 29888eea45cSKlaus Jensen return ns->moff + nvme_m2b(ns, lba); 29988eea45cSKlaus Jensen } 30088eea45cSKlaus Jensen 30188eea45cSKlaus Jensen static inline bool nvme_ns_ext(NvmeNamespace *ns) 30288eea45cSKlaus Jensen { 30388eea45cSKlaus Jensen return !!NVME_ID_NS_FLBAS_EXTENDED(ns->id_ns.flbas); 30488eea45cSKlaus Jensen } 30588eea45cSKlaus Jensen 30688eea45cSKlaus Jensen static inline NvmeZoneState nvme_get_zone_state(NvmeZone *zone) 30788eea45cSKlaus Jensen { 30888eea45cSKlaus Jensen return zone->d.zs >> 4; 30988eea45cSKlaus Jensen } 31088eea45cSKlaus Jensen 31188eea45cSKlaus Jensen static inline void nvme_set_zone_state(NvmeZone *zone, NvmeZoneState state) 31288eea45cSKlaus Jensen { 31388eea45cSKlaus Jensen zone->d.zs = state << 4; 31488eea45cSKlaus Jensen } 31588eea45cSKlaus Jensen 31688eea45cSKlaus Jensen static inline uint64_t nvme_zone_rd_boundary(NvmeNamespace *ns, NvmeZone *zone) 31788eea45cSKlaus Jensen { 31888eea45cSKlaus Jensen return zone->d.zslba + ns->zone_size; 31988eea45cSKlaus Jensen } 32088eea45cSKlaus Jensen 32188eea45cSKlaus Jensen static inline uint64_t nvme_zone_wr_boundary(NvmeZone *zone) 32288eea45cSKlaus Jensen { 32388eea45cSKlaus Jensen return zone->d.zslba + zone->d.zcap; 32488eea45cSKlaus Jensen } 32588eea45cSKlaus Jensen 32688eea45cSKlaus Jensen static inline bool nvme_wp_is_valid(NvmeZone *zone) 32788eea45cSKlaus Jensen { 32888eea45cSKlaus Jensen uint8_t st = nvme_get_zone_state(zone); 32988eea45cSKlaus Jensen 33088eea45cSKlaus Jensen return st != NVME_ZONE_STATE_FULL && 33188eea45cSKlaus Jensen st != NVME_ZONE_STATE_READ_ONLY && 33288eea45cSKlaus Jensen st != NVME_ZONE_STATE_OFFLINE; 33388eea45cSKlaus Jensen } 33488eea45cSKlaus Jensen 33588eea45cSKlaus Jensen static inline uint8_t *nvme_get_zd_extension(NvmeNamespace *ns, 33688eea45cSKlaus Jensen uint32_t zone_idx) 33788eea45cSKlaus Jensen { 33888eea45cSKlaus Jensen return &ns->zd_extensions[zone_idx * ns->params.zd_extension_size]; 33988eea45cSKlaus Jensen } 34088eea45cSKlaus Jensen 34188eea45cSKlaus Jensen static inline void nvme_aor_inc_open(NvmeNamespace *ns) 34288eea45cSKlaus Jensen { 34388eea45cSKlaus Jensen assert(ns->nr_open_zones >= 0); 34488eea45cSKlaus Jensen if (ns->params.max_open_zones) { 34588eea45cSKlaus Jensen ns->nr_open_zones++; 34688eea45cSKlaus Jensen assert(ns->nr_open_zones <= ns->params.max_open_zones); 34788eea45cSKlaus Jensen } 34888eea45cSKlaus Jensen } 34988eea45cSKlaus Jensen 35088eea45cSKlaus Jensen static inline void nvme_aor_dec_open(NvmeNamespace *ns) 35188eea45cSKlaus Jensen { 35288eea45cSKlaus Jensen if (ns->params.max_open_zones) { 35388eea45cSKlaus Jensen assert(ns->nr_open_zones > 0); 35488eea45cSKlaus Jensen ns->nr_open_zones--; 35588eea45cSKlaus Jensen } 35688eea45cSKlaus Jensen assert(ns->nr_open_zones >= 0); 35788eea45cSKlaus Jensen } 35888eea45cSKlaus Jensen 35988eea45cSKlaus Jensen static inline void nvme_aor_inc_active(NvmeNamespace *ns) 36088eea45cSKlaus Jensen { 36188eea45cSKlaus Jensen assert(ns->nr_active_zones >= 0); 36288eea45cSKlaus Jensen if (ns->params.max_active_zones) { 36388eea45cSKlaus Jensen ns->nr_active_zones++; 36488eea45cSKlaus Jensen assert(ns->nr_active_zones <= ns->params.max_active_zones); 36588eea45cSKlaus Jensen } 36688eea45cSKlaus Jensen } 36788eea45cSKlaus Jensen 36888eea45cSKlaus Jensen static inline void nvme_aor_dec_active(NvmeNamespace *ns) 36988eea45cSKlaus Jensen { 37088eea45cSKlaus Jensen if (ns->params.max_active_zones) { 37188eea45cSKlaus Jensen assert(ns->nr_active_zones > 0); 37288eea45cSKlaus Jensen ns->nr_active_zones--; 37388eea45cSKlaus Jensen assert(ns->nr_active_zones >= ns->nr_open_zones); 37488eea45cSKlaus Jensen } 37588eea45cSKlaus Jensen assert(ns->nr_active_zones >= 0); 37688eea45cSKlaus Jensen } 37788eea45cSKlaus Jensen 37873064edfSJesper Devantier static inline void nvme_fdp_stat_inc(uint64_t *a, uint64_t b) 37973064edfSJesper Devantier { 38073064edfSJesper Devantier uint64_t ret = *a + b; 38173064edfSJesper Devantier *a = ret < *a ? UINT64_MAX : ret; 38273064edfSJesper Devantier } 38373064edfSJesper Devantier 38488eea45cSKlaus Jensen void nvme_ns_init_format(NvmeNamespace *ns); 3855e4f6bccSKlaus Jensen int nvme_ns_setup(NvmeNamespace *ns, Error **errp); 38688eea45cSKlaus Jensen void nvme_ns_drain(NvmeNamespace *ns); 38788eea45cSKlaus Jensen void nvme_ns_shutdown(NvmeNamespace *ns); 38888eea45cSKlaus Jensen void nvme_ns_cleanup(NvmeNamespace *ns); 38988eea45cSKlaus Jensen 39088eea45cSKlaus Jensen typedef struct NvmeAsyncEvent { 39188eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeAsyncEvent) entry; 39288eea45cSKlaus Jensen NvmeAerResult result; 39388eea45cSKlaus Jensen } NvmeAsyncEvent; 39488eea45cSKlaus Jensen 39588eea45cSKlaus Jensen enum { 39688eea45cSKlaus Jensen NVME_SG_ALLOC = 1 << 0, 39788eea45cSKlaus Jensen NVME_SG_DMA = 1 << 1, 39888eea45cSKlaus Jensen }; 39988eea45cSKlaus Jensen 40088eea45cSKlaus Jensen typedef struct NvmeSg { 40188eea45cSKlaus Jensen int flags; 40288eea45cSKlaus Jensen 40388eea45cSKlaus Jensen union { 40488eea45cSKlaus Jensen QEMUSGList qsg; 40588eea45cSKlaus Jensen QEMUIOVector iov; 40688eea45cSKlaus Jensen }; 40788eea45cSKlaus Jensen } NvmeSg; 40888eea45cSKlaus Jensen 40988eea45cSKlaus Jensen typedef enum NvmeTxDirection { 41088eea45cSKlaus Jensen NVME_TX_DIRECTION_TO_DEVICE = 0, 41188eea45cSKlaus Jensen NVME_TX_DIRECTION_FROM_DEVICE = 1, 41288eea45cSKlaus Jensen } NvmeTxDirection; 41388eea45cSKlaus Jensen 41488eea45cSKlaus Jensen typedef struct NvmeRequest { 41588eea45cSKlaus Jensen struct NvmeSQueue *sq; 41688eea45cSKlaus Jensen struct NvmeNamespace *ns; 41788eea45cSKlaus Jensen BlockAIOCB *aiocb; 41888eea45cSKlaus Jensen uint16_t status; 41988eea45cSKlaus Jensen void *opaque; 42088eea45cSKlaus Jensen NvmeCqe cqe; 42188eea45cSKlaus Jensen NvmeCmd cmd; 42288eea45cSKlaus Jensen BlockAcctCookie acct; 42388eea45cSKlaus Jensen NvmeSg sg; 42488eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeRequest)entry; 42588eea45cSKlaus Jensen } NvmeRequest; 42688eea45cSKlaus Jensen 42788eea45cSKlaus Jensen typedef struct NvmeBounceContext { 42888eea45cSKlaus Jensen NvmeRequest *req; 42988eea45cSKlaus Jensen 43088eea45cSKlaus Jensen struct { 43188eea45cSKlaus Jensen QEMUIOVector iov; 43288eea45cSKlaus Jensen uint8_t *bounce; 43388eea45cSKlaus Jensen } data, mdata; 43488eea45cSKlaus Jensen } NvmeBounceContext; 43588eea45cSKlaus Jensen 43688eea45cSKlaus Jensen static inline const char *nvme_adm_opc_str(uint8_t opc) 43788eea45cSKlaus Jensen { 43888eea45cSKlaus Jensen switch (opc) { 43988eea45cSKlaus Jensen case NVME_ADM_CMD_DELETE_SQ: return "NVME_ADM_CMD_DELETE_SQ"; 44088eea45cSKlaus Jensen case NVME_ADM_CMD_CREATE_SQ: return "NVME_ADM_CMD_CREATE_SQ"; 44188eea45cSKlaus Jensen case NVME_ADM_CMD_GET_LOG_PAGE: return "NVME_ADM_CMD_GET_LOG_PAGE"; 44288eea45cSKlaus Jensen case NVME_ADM_CMD_DELETE_CQ: return "NVME_ADM_CMD_DELETE_CQ"; 44388eea45cSKlaus Jensen case NVME_ADM_CMD_CREATE_CQ: return "NVME_ADM_CMD_CREATE_CQ"; 44488eea45cSKlaus Jensen case NVME_ADM_CMD_IDENTIFY: return "NVME_ADM_CMD_IDENTIFY"; 44588eea45cSKlaus Jensen case NVME_ADM_CMD_ABORT: return "NVME_ADM_CMD_ABORT"; 44688eea45cSKlaus Jensen case NVME_ADM_CMD_SET_FEATURES: return "NVME_ADM_CMD_SET_FEATURES"; 44788eea45cSKlaus Jensen case NVME_ADM_CMD_GET_FEATURES: return "NVME_ADM_CMD_GET_FEATURES"; 44888eea45cSKlaus Jensen case NVME_ADM_CMD_ASYNC_EV_REQ: return "NVME_ADM_CMD_ASYNC_EV_REQ"; 44988eea45cSKlaus Jensen case NVME_ADM_CMD_NS_ATTACHMENT: return "NVME_ADM_CMD_NS_ATTACHMENT"; 450e181d3daSGollu Appalanaidu case NVME_ADM_CMD_DIRECTIVE_SEND: return "NVME_ADM_CMD_DIRECTIVE_SEND"; 45111871f53SŁukasz Gieryk case NVME_ADM_CMD_VIRT_MNGMT: return "NVME_ADM_CMD_VIRT_MNGMT"; 452e181d3daSGollu Appalanaidu case NVME_ADM_CMD_DIRECTIVE_RECV: return "NVME_ADM_CMD_DIRECTIVE_RECV"; 4533f7fe8deSJinhao Fan case NVME_ADM_CMD_DBBUF_CONFIG: return "NVME_ADM_CMD_DBBUF_CONFIG"; 45488eea45cSKlaus Jensen case NVME_ADM_CMD_FORMAT_NVM: return "NVME_ADM_CMD_FORMAT_NVM"; 45588eea45cSKlaus Jensen default: return "NVME_ADM_CMD_UNKNOWN"; 45688eea45cSKlaus Jensen } 45788eea45cSKlaus Jensen } 45888eea45cSKlaus Jensen 45988eea45cSKlaus Jensen static inline const char *nvme_io_opc_str(uint8_t opc) 46088eea45cSKlaus Jensen { 46188eea45cSKlaus Jensen switch (opc) { 46288eea45cSKlaus Jensen case NVME_CMD_FLUSH: return "NVME_NVM_CMD_FLUSH"; 46388eea45cSKlaus Jensen case NVME_CMD_WRITE: return "NVME_NVM_CMD_WRITE"; 46488eea45cSKlaus Jensen case NVME_CMD_READ: return "NVME_NVM_CMD_READ"; 46588eea45cSKlaus Jensen case NVME_CMD_COMPARE: return "NVME_NVM_CMD_COMPARE"; 46688eea45cSKlaus Jensen case NVME_CMD_WRITE_ZEROES: return "NVME_NVM_CMD_WRITE_ZEROES"; 46788eea45cSKlaus Jensen case NVME_CMD_DSM: return "NVME_NVM_CMD_DSM"; 46888eea45cSKlaus Jensen case NVME_CMD_VERIFY: return "NVME_NVM_CMD_VERIFY"; 46988eea45cSKlaus Jensen case NVME_CMD_COPY: return "NVME_NVM_CMD_COPY"; 47088eea45cSKlaus Jensen case NVME_CMD_ZONE_MGMT_SEND: return "NVME_ZONED_CMD_MGMT_SEND"; 47188eea45cSKlaus Jensen case NVME_CMD_ZONE_MGMT_RECV: return "NVME_ZONED_CMD_MGMT_RECV"; 47288eea45cSKlaus Jensen case NVME_CMD_ZONE_APPEND: return "NVME_ZONED_CMD_ZONE_APPEND"; 47388eea45cSKlaus Jensen default: return "NVME_NVM_CMD_UNKNOWN"; 47488eea45cSKlaus Jensen } 47588eea45cSKlaus Jensen } 47688eea45cSKlaus Jensen 47788eea45cSKlaus Jensen typedef struct NvmeSQueue { 47888eea45cSKlaus Jensen struct NvmeCtrl *ctrl; 47988eea45cSKlaus Jensen uint16_t sqid; 48088eea45cSKlaus Jensen uint16_t cqid; 48188eea45cSKlaus Jensen uint32_t head; 48288eea45cSKlaus Jensen uint32_t tail; 48388eea45cSKlaus Jensen uint32_t size; 48488eea45cSKlaus Jensen uint64_t dma_addr; 4853f7fe8deSJinhao Fan uint64_t db_addr; 4863f7fe8deSJinhao Fan uint64_t ei_addr; 487d38cc6fdSKlaus Jensen QEMUBH *bh; 4882e53b0b4SJinhao Fan EventNotifier notifier; 4892e53b0b4SJinhao Fan bool ioeventfd_enabled; 49088eea45cSKlaus Jensen NvmeRequest *io_req; 49188eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeRequest) req_list; 49288eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeRequest) out_req_list; 49388eea45cSKlaus Jensen QTAILQ_ENTRY(NvmeSQueue) entry; 49488eea45cSKlaus Jensen } NvmeSQueue; 49588eea45cSKlaus Jensen 49688eea45cSKlaus Jensen typedef struct NvmeCQueue { 49788eea45cSKlaus Jensen struct NvmeCtrl *ctrl; 49888eea45cSKlaus Jensen uint8_t phase; 49988eea45cSKlaus Jensen uint16_t cqid; 50088eea45cSKlaus Jensen uint16_t irq_enabled; 50188eea45cSKlaus Jensen uint32_t head; 50288eea45cSKlaus Jensen uint32_t tail; 50388eea45cSKlaus Jensen uint32_t vector; 50488eea45cSKlaus Jensen uint32_t size; 50588eea45cSKlaus Jensen uint64_t dma_addr; 5063f7fe8deSJinhao Fan uint64_t db_addr; 5073f7fe8deSJinhao Fan uint64_t ei_addr; 508d38cc6fdSKlaus Jensen QEMUBH *bh; 5092e53b0b4SJinhao Fan EventNotifier notifier; 5102e53b0b4SJinhao Fan bool ioeventfd_enabled; 51188eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeSQueue) sq_list; 51288eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeRequest) req_list; 51388eea45cSKlaus Jensen } NvmeCQueue; 51488eea45cSKlaus Jensen 51588eea45cSKlaus Jensen #define TYPE_NVME "nvme" 51688eea45cSKlaus Jensen #define NVME(obj) \ 51788eea45cSKlaus Jensen OBJECT_CHECK(NvmeCtrl, (obj), TYPE_NVME) 51888eea45cSKlaus Jensen 51988eea45cSKlaus Jensen typedef struct NvmeParams { 52088eea45cSKlaus Jensen char *serial; 52188eea45cSKlaus Jensen uint32_t num_queues; /* deprecated since 5.1 */ 52288eea45cSKlaus Jensen uint32_t max_ioqpairs; 52388eea45cSKlaus Jensen uint16_t msix_qsize; 52488eea45cSKlaus Jensen uint32_t cmb_size_mb; 52588eea45cSKlaus Jensen uint8_t aerl; 52688eea45cSKlaus Jensen uint32_t aer_max_queued; 52788eea45cSKlaus Jensen uint8_t mdts; 52888eea45cSKlaus Jensen uint8_t vsl; 52988eea45cSKlaus Jensen bool use_intel_id; 53088eea45cSKlaus Jensen uint8_t zasl; 531cccc2651SNiklas Cassel bool auto_transition_zones; 53288eea45cSKlaus Jensen bool legacy_cmb; 5332e53b0b4SJinhao Fan bool ioeventfd; 53444c2c094SLukasz Maniak uint8_t sriov_max_vfs; 535746d42b1SŁukasz Gieryk uint16_t sriov_vq_flexible; 536746d42b1SŁukasz Gieryk uint16_t sriov_vi_flexible; 537746d42b1SŁukasz Gieryk uint8_t sriov_max_vq_per_vf; 538746d42b1SŁukasz Gieryk uint8_t sriov_max_vi_per_vf; 53988eea45cSKlaus Jensen } NvmeParams; 54088eea45cSKlaus Jensen 54188eea45cSKlaus Jensen typedef struct NvmeCtrl { 54288eea45cSKlaus Jensen PCIDevice parent_obj; 54388eea45cSKlaus Jensen MemoryRegion bar0; 54488eea45cSKlaus Jensen MemoryRegion iomem; 54588eea45cSKlaus Jensen NvmeBar bar; 54688eea45cSKlaus Jensen NvmeParams params; 54788eea45cSKlaus Jensen NvmeBus bus; 54888eea45cSKlaus Jensen 54988eea45cSKlaus Jensen uint16_t cntlid; 55088eea45cSKlaus Jensen bool qs_created; 55188eea45cSKlaus Jensen uint32_t page_size; 55288eea45cSKlaus Jensen uint16_t page_bits; 55388eea45cSKlaus Jensen uint16_t max_prp_ents; 55488eea45cSKlaus Jensen uint32_t max_q_ents; 55588eea45cSKlaus Jensen uint8_t outstanding_aers; 55688eea45cSKlaus Jensen uint32_t irq_status; 55783d7ed5cSKlaus Jensen int cq_pending; 55888eea45cSKlaus Jensen uint64_t host_timestamp; /* Timestamp sent by the host */ 55988eea45cSKlaus Jensen uint64_t timestamp_set_qemu_clock_ms; /* QEMU clock time */ 56088eea45cSKlaus Jensen uint64_t starttime_ms; 56188eea45cSKlaus Jensen uint16_t temperature; 56288eea45cSKlaus Jensen uint8_t smart_critical_warning; 563decc0261SŁukasz Gieryk uint32_t conf_msix_qsize; 564decc0261SŁukasz Gieryk uint32_t conf_ioqpairs; 5653f7fe8deSJinhao Fan uint64_t dbbuf_dbs; 5663f7fe8deSJinhao Fan uint64_t dbbuf_eis; 5673f7fe8deSJinhao Fan bool dbbuf_enabled; 56888eea45cSKlaus Jensen 56988eea45cSKlaus Jensen struct { 57088eea45cSKlaus Jensen MemoryRegion mem; 57188eea45cSKlaus Jensen uint8_t *buf; 57288eea45cSKlaus Jensen bool cmse; 57388eea45cSKlaus Jensen hwaddr cba; 57488eea45cSKlaus Jensen } cmb; 57588eea45cSKlaus Jensen 57688eea45cSKlaus Jensen struct { 57788eea45cSKlaus Jensen HostMemoryBackend *dev; 57888eea45cSKlaus Jensen bool cmse; 57988eea45cSKlaus Jensen hwaddr cba; 58088eea45cSKlaus Jensen } pmr; 58188eea45cSKlaus Jensen 58288eea45cSKlaus Jensen uint8_t aer_mask; 58388eea45cSKlaus Jensen NvmeRequest **aer_reqs; 58488eea45cSKlaus Jensen QTAILQ_HEAD(, NvmeAsyncEvent) aer_queue; 58588eea45cSKlaus Jensen int aer_queued; 58688eea45cSKlaus Jensen 58788eea45cSKlaus Jensen uint32_t dmrsl; 58888eea45cSKlaus Jensen 58988eea45cSKlaus Jensen /* Namespace ID is started with 1 so bitmap should be 1-based */ 59088eea45cSKlaus Jensen #define NVME_CHANGED_NSID_SIZE (NVME_MAX_NAMESPACES + 1) 59188eea45cSKlaus Jensen DECLARE_BITMAP(changed_nsids, NVME_CHANGED_NSID_SIZE); 59288eea45cSKlaus Jensen 59388eea45cSKlaus Jensen NvmeSubsystem *subsys; 59488eea45cSKlaus Jensen 59588eea45cSKlaus Jensen NvmeNamespace namespace; 59688eea45cSKlaus Jensen NvmeNamespace *namespaces[NVME_MAX_NAMESPACES + 1]; 59788eea45cSKlaus Jensen NvmeSQueue **sq; 59888eea45cSKlaus Jensen NvmeCQueue **cq; 59988eea45cSKlaus Jensen NvmeSQueue admin_sq; 60088eea45cSKlaus Jensen NvmeCQueue admin_cq; 60188eea45cSKlaus Jensen NvmeIdCtrl id_ctrl; 60288eea45cSKlaus Jensen 60388eea45cSKlaus Jensen struct { 60488eea45cSKlaus Jensen struct { 60588eea45cSKlaus Jensen uint16_t temp_thresh_hi; 60688eea45cSKlaus Jensen uint16_t temp_thresh_low; 60788eea45cSKlaus Jensen }; 608d0c0697bSNaveen Nagar 60988eea45cSKlaus Jensen uint32_t async_config; 610d0c0697bSNaveen Nagar NvmeHostBehaviorSupport hbs; 61188eea45cSKlaus Jensen } features; 6125e6f963fSLukasz Maniak 6135e6f963fSLukasz Maniak NvmePriCtrlCap pri_ctrl_cap; 61499f48ae7SLukasz Maniak NvmeSecCtrlList sec_ctrl_list; 61511871f53SŁukasz Gieryk struct { 61611871f53SŁukasz Gieryk uint16_t vqrfap; 61711871f53SŁukasz Gieryk uint16_t virfap; 61811871f53SŁukasz Gieryk } next_pri_ctrl_cap; /* These override pri_ctrl_cap after reset */ 61988eea45cSKlaus Jensen } NvmeCtrl; 62088eea45cSKlaus Jensen 6211e9c685eSŁukasz Gieryk typedef enum NvmeResetType { 6221e9c685eSŁukasz Gieryk NVME_RESET_FUNCTION = 0, 6231e9c685eSŁukasz Gieryk NVME_RESET_CONTROLLER = 1, 6241e9c685eSŁukasz Gieryk } NvmeResetType; 6251e9c685eSŁukasz Gieryk 62688eea45cSKlaus Jensen static inline NvmeNamespace *nvme_ns(NvmeCtrl *n, uint32_t nsid) 62788eea45cSKlaus Jensen { 62888eea45cSKlaus Jensen if (!nsid || nsid > NVME_MAX_NAMESPACES) { 62988eea45cSKlaus Jensen return NULL; 63088eea45cSKlaus Jensen } 63188eea45cSKlaus Jensen 63288eea45cSKlaus Jensen return n->namespaces[nsid]; 63388eea45cSKlaus Jensen } 63488eea45cSKlaus Jensen 63588eea45cSKlaus Jensen static inline NvmeCQueue *nvme_cq(NvmeRequest *req) 63688eea45cSKlaus Jensen { 63788eea45cSKlaus Jensen NvmeSQueue *sq = req->sq; 63888eea45cSKlaus Jensen NvmeCtrl *n = sq->ctrl; 63988eea45cSKlaus Jensen 64088eea45cSKlaus Jensen return n->cq[sq->cqid]; 64188eea45cSKlaus Jensen } 64288eea45cSKlaus Jensen 64388eea45cSKlaus Jensen static inline NvmeCtrl *nvme_ctrl(NvmeRequest *req) 64488eea45cSKlaus Jensen { 64588eea45cSKlaus Jensen NvmeSQueue *sq = req->sq; 64688eea45cSKlaus Jensen return sq->ctrl; 64788eea45cSKlaus Jensen } 64888eea45cSKlaus Jensen 64988eea45cSKlaus Jensen static inline uint16_t nvme_cid(NvmeRequest *req) 65088eea45cSKlaus Jensen { 65188eea45cSKlaus Jensen if (!req) { 65288eea45cSKlaus Jensen return 0xffff; 65388eea45cSKlaus Jensen } 65488eea45cSKlaus Jensen 65588eea45cSKlaus Jensen return le16_to_cpu(req->cqe.cid); 65688eea45cSKlaus Jensen } 65788eea45cSKlaus Jensen 65899f48ae7SLukasz Maniak static inline NvmeSecCtrlEntry *nvme_sctrl(NvmeCtrl *n) 65999f48ae7SLukasz Maniak { 66099f48ae7SLukasz Maniak PCIDevice *pci_dev = &n->parent_obj; 66199f48ae7SLukasz Maniak NvmeCtrl *pf = NVME(pcie_sriov_get_pf(pci_dev)); 66299f48ae7SLukasz Maniak 66399f48ae7SLukasz Maniak if (pci_is_vf(pci_dev)) { 66499f48ae7SLukasz Maniak return &pf->sec_ctrl_list.sec[pcie_sriov_vf_number(pci_dev)]; 66599f48ae7SLukasz Maniak } 66699f48ae7SLukasz Maniak 66799f48ae7SLukasz Maniak return NULL; 66899f48ae7SLukasz Maniak } 66999f48ae7SLukasz Maniak 67011871f53SŁukasz Gieryk static inline NvmeSecCtrlEntry *nvme_sctrl_for_cntlid(NvmeCtrl *n, 67111871f53SŁukasz Gieryk uint16_t cntlid) 67211871f53SŁukasz Gieryk { 67311871f53SŁukasz Gieryk NvmeSecCtrlList *list = &n->sec_ctrl_list; 67411871f53SŁukasz Gieryk uint8_t i; 67511871f53SŁukasz Gieryk 67611871f53SŁukasz Gieryk for (i = 0; i < list->numcntl; i++) { 67711871f53SŁukasz Gieryk if (le16_to_cpu(list->sec[i].scid) == cntlid) { 67811871f53SŁukasz Gieryk return &list->sec[i]; 67911871f53SŁukasz Gieryk } 68011871f53SŁukasz Gieryk } 68111871f53SŁukasz Gieryk 68211871f53SŁukasz Gieryk return NULL; 68311871f53SŁukasz Gieryk } 68411871f53SŁukasz Gieryk 68588eea45cSKlaus Jensen void nvme_attach_ns(NvmeCtrl *n, NvmeNamespace *ns); 6868d3a17beSPhilippe Mathieu-Daudé uint16_t nvme_bounce_data(NvmeCtrl *n, void *ptr, uint32_t len, 68788eea45cSKlaus Jensen NvmeTxDirection dir, NvmeRequest *req); 6888d3a17beSPhilippe Mathieu-Daudé uint16_t nvme_bounce_mdata(NvmeCtrl *n, void *ptr, uint32_t len, 68988eea45cSKlaus Jensen NvmeTxDirection dir, NvmeRequest *req); 69088eea45cSKlaus Jensen void nvme_rw_complete_cb(void *opaque, int ret); 69188eea45cSKlaus Jensen uint16_t nvme_map_dptr(NvmeCtrl *n, NvmeSg *sg, size_t len, 69288eea45cSKlaus Jensen NvmeCmd *cmd); 69388eea45cSKlaus Jensen 69452581c71SMarkus Armbruster #endif /* HW_NVME_NVME_H */ 695