/* SPDX-License-Identifier: GPL-2.0 */
#ifndef INT_BLK_MQ_H
#define INT_BLK_MQ_H

#include "blk-stat.h"
#include "blk-mq-tag.h"

struct blk_mq_tag_set;

struct blk_mq_ctxs {
	struct kobject kobj;
	struct blk_mq_ctx __percpu	*queue_ctx;
};

/**
 * struct blk_mq_ctx - State for a software queue facing the submitting CPUs
 */
struct blk_mq_ctx {
	struct {
		spinlock_t		lock;
		struct list_head	rq_lists[HCTX_MAX_TYPES];
	} ____cacheline_aligned_in_smp;

	unsigned int		cpu;
	unsigned short		index_hw[HCTX_MAX_TYPES];
	struct blk_mq_hw_ctx	*hctxs[HCTX_MAX_TYPES];

	/* incremented at dispatch time */
	unsigned long		rq_dispatched[2];
	unsigned long		rq_merged;

	/* incremented at completion time */
	unsigned long		____cacheline_aligned_in_smp rq_completed[2];

	struct request_queue	*queue;
	struct blk_mq_ctxs	*ctxs;
	struct kobject		kobj;
} ____cacheline_aligned_in_smp;

void blk_mq_exit_queue(struct request_queue *q);
int blk_mq_update_nr_requests(struct request_queue *q, unsigned int nr);
void blk_mq_wake_waiters(struct request_queue *q);
bool blk_mq_dispatch_rq_list(struct request_queue *, struct list_head *, bool);
void blk_mq_add_to_requeue_list(struct request *rq, bool at_head,
				bool kick_requeue_list);
void blk_mq_flush_busy_ctxs(struct blk_mq_hw_ctx *hctx, struct list_head *list);
bool blk_mq_get_driver_tag(struct request *rq);
struct request *blk_mq_dequeue_from_ctx(struct blk_mq_hw_ctx *hctx,
					struct blk_mq_ctx *start);

/*
 * Internal helpers for allocating/freeing the request map
 */
void blk_mq_free_rqs(struct blk_mq_tag_set *set, struct blk_mq_tags *tags,
		     unsigned int hctx_idx);
void blk_mq_free_rq_map(struct blk_mq_tags *tags);
struct blk_mq_tags *blk_mq_alloc_rq_map(struct blk_mq_tag_set *set,
					unsigned int hctx_idx,
					unsigned int nr_tags,
					unsigned int reserved_tags);
int blk_mq_alloc_rqs(struct blk_mq_tag_set *set, struct blk_mq_tags *tags,
		     unsigned int hctx_idx, unsigned int depth);

/*
 * Internal helpers for request insertion into sw queues
 */
void __blk_mq_insert_request(struct blk_mq_hw_ctx *hctx, struct request *rq,
				bool at_head);
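/*
 * Illustrative sketch (not part of the kernel source): the request-map
 * helpers above are used in pairs.  blk_mq_alloc_rq_map() creates the tag
 * map for one hardware queue and blk_mq_alloc_rqs() populates it with
 * requests; teardown reverses the order.  The surrounding error handling,
 * hctx_idx and depth values below are assumptions for the example only.
 *
 *	struct blk_mq_tags *tags;
 *
 *	tags = blk_mq_alloc_rq_map(set, hctx_idx, set->queue_depth,
 *				   set->reserved_tags);
 *	if (!tags)
 *		return -ENOMEM;
 *	if (blk_mq_alloc_rqs(set, tags, hctx_idx, set->queue_depth)) {
 *		blk_mq_free_rq_map(tags);
 *		return -ENOMEM;
 *	}
 *	...
 *	blk_mq_free_rqs(set, tags, hctx_idx);
 *	blk_mq_free_rq_map(tags);
 */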
void blk_mq_request_bypass_insert(struct request *rq, bool run_queue);
void blk_mq_insert_requests(struct blk_mq_hw_ctx *hctx, struct blk_mq_ctx *ctx,
				struct list_head *list);

/* Used by blk_insert_cloned_request() to issue request directly */
blk_status_t blk_mq_request_issue_directly(struct request *rq, bool last);
void blk_mq_try_issue_list_directly(struct blk_mq_hw_ctx *hctx,
				    struct list_head *list);

/*
 * CPU -> queue mappings
 */
extern int blk_mq_hw_queue_to_node(struct blk_mq_queue_map *qmap, unsigned int);

/*
 * blk_mq_map_queue_type() - map (hctx_type, cpu) to hardware queue
 * @q: request queue
 * @type: the hctx type index
 * @cpu: CPU
 */
static inline struct blk_mq_hw_ctx *blk_mq_map_queue_type(struct request_queue *q,
							  enum hctx_type type,
							  unsigned int cpu)
{
	return q->queue_hw_ctx[q->tag_set->map[type].mq_map[cpu]];
}

/*
 * blk_mq_map_queue() - map (cmd_flags, type) to hardware queue
 * @q: request queue
 * @flags: request command flags
 * @ctx: software queue cpu ctx
 */
static inline struct blk_mq_hw_ctx *blk_mq_map_queue(struct request_queue *q,
						     unsigned int flags,
						     struct blk_mq_ctx *ctx)
{
	enum hctx_type type = HCTX_TYPE_DEFAULT;

	/*
	 * The caller ensures that polling is enabled if REQ_HIPRI is set.
	 */
	if (flags & REQ_HIPRI)
		type = HCTX_TYPE_POLL;
	else if ((flags & REQ_OP_MASK) == REQ_OP_READ)
		type = HCTX_TYPE_READ;

	return ctx->hctxs[type];
}

/*
 * sysfs helpers
 */
extern void blk_mq_sysfs_init(struct request_queue *q);
extern void blk_mq_sysfs_deinit(struct request_queue *q);
extern int __blk_mq_register_dev(struct device *dev, struct request_queue *q);
extern int blk_mq_sysfs_register(struct request_queue *q);
extern void blk_mq_sysfs_unregister(struct request_queue *q);
extern void blk_mq_hctx_kobj_init(struct blk_mq_hw_ctx *hctx);

void blk_mq_release(struct request_queue *q);

/**
 * blk_mq_rq_state() - read the current MQ_RQ_* state of a request
 * @rq: target request.
 */
static inline enum mq_rq_state blk_mq_rq_state(struct request *rq)
{
	return READ_ONCE(rq->state);
}
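/*
 * Illustrative sketch (not from the kernel source): blk_mq_rq_state() is a
 * lockless snapshot of the MQ_RQ_* state, so a typical use is a quick check
 * before acting on a request, e.g. when scanning for requests that are still
 * outstanding.  The helper name below is hypothetical.
 *
 *	static bool example_rq_is_in_flight(struct request *rq)
 *	{
 *		return blk_mq_rq_state(rq) == MQ_RQ_IN_FLIGHT;
 *	}
 */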
static inline struct blk_mq_ctx *__blk_mq_get_ctx(struct request_queue *q,
						  unsigned int cpu)
{
	return per_cpu_ptr(q->queue_ctx, cpu);
}

/*
 * This assumes per-cpu software queues; they could be per-node as well, for
 * instance.  For now this is hardcoded as-is.  Note that we don't care about
 * preemption, since we know the ctxs are persistent.  This does mean that we
 * can't rely on ctx always matching the currently running CPU.
 */
static inline struct blk_mq_ctx *blk_mq_get_ctx(struct request_queue *q)
{
	return __blk_mq_get_ctx(q, raw_smp_processor_id());
}

struct blk_mq_alloc_data {
	/* input parameter */
	struct request_queue *q;
	blk_mq_req_flags_t flags;
	unsigned int shallow_depth;
	unsigned int cmd_flags;

	/* input & output parameter */
	struct blk_mq_ctx *ctx;
	struct blk_mq_hw_ctx *hctx;
};

static inline struct blk_mq_tags *blk_mq_tags_from_data(struct blk_mq_alloc_data *data)
{
	if (data->flags & BLK_MQ_REQ_INTERNAL)
		return data->hctx->sched_tags;

	return data->hctx->tags;
}

static inline bool blk_mq_hctx_stopped(struct blk_mq_hw_ctx *hctx)
{
	return test_bit(BLK_MQ_S_STOPPED, &hctx->state);
}

static inline bool blk_mq_hw_queue_mapped(struct blk_mq_hw_ctx *hctx)
{
	return hctx->nr_ctx && hctx->tags;
}

unsigned int blk_mq_in_flight(struct request_queue *q, struct hd_struct *part);
void blk_mq_in_flight_rw(struct request_queue *q, struct hd_struct *part,
			 unsigned int inflight[2]);

static inline void blk_mq_put_dispatch_budget(struct blk_mq_hw_ctx *hctx)
{
	struct request_queue *q = hctx->queue;

	if (q->mq_ops->put_budget)
		q->mq_ops->put_budget(hctx);
}

static inline bool blk_mq_get_dispatch_budget(struct blk_mq_hw_ctx *hctx)
{
	struct request_queue *q = hctx->queue;

	if (q->mq_ops->get_budget)
		return q->mq_ops->get_budget(hctx);
	return true;
}

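/*
 * Illustrative sketch (not from the kernel source): dispatch paths are
 * expected to pair the budget helpers above, i.e. obtain a budget before
 * handing a request to the driver and give it back if the request is not
 * issued after all.  example_queue_rq() is a hypothetical stand-in for the
 * actual driver dispatch call.
 *
 *	if (!blk_mq_get_dispatch_budget(hctx))
 *		return false;	/- driver busy, try again later -/
 *
 *	if (!example_queue_rq(hctx, rq)) {
 *		/- request not issued: return the budget -/
 *		blk_mq_put_dispatch_budget(hctx);
 *		return false;
 *	}
 */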
static inline void __blk_mq_put_driver_tag(struct blk_mq_hw_ctx *hctx,
					   struct request *rq)
{
	blk_mq_put_tag(hctx, hctx->tags, rq->mq_ctx, rq->tag);
	rq->tag = -1;

	if (rq->rq_flags & RQF_MQ_INFLIGHT) {
		rq->rq_flags &= ~RQF_MQ_INFLIGHT;
		atomic_dec(&hctx->nr_active);
	}
}

static inline void blk_mq_put_driver_tag(struct request *rq)
{
	if (rq->tag == -1 || rq->internal_tag == -1)
		return;

	__blk_mq_put_driver_tag(rq->mq_hctx, rq);
}

static inline void blk_mq_clear_mq_map(struct blk_mq_queue_map *qmap)
{
	int cpu;

	for_each_possible_cpu(cpu)
		qmap->mq_map[cpu] = 0;
}

/*
 * blk_mq_plug() - Get caller context plug
 * @q: request queue
 * @bio: the bio being submitted by the caller context
 *
 * Plugging, by design, may delay the insertion of BIOs into the elevator in
 * order to increase BIO merging opportunities. This however can cause BIO
 * insertion order to change from the order in which submit_bio() is being
 * executed in the case of multiple contexts concurrently issuing BIOs to a
 * device, even if these contexts are synchronized to tightly control BIO
 * issuing order. While this is not a problem with regular block devices,
 * this ordering change can cause write BIO failures with zoned block devices
 * as these require sequential write patterns to zones. Prevent this from
 * happening by ignoring the plug state of a BIO issuing context if the
 * target request queue is for a zoned block device and the BIO to plug is a
 * write operation.
 *
 * Return current->plug if the bio can be plugged and NULL otherwise
 */
static inline struct blk_plug *blk_mq_plug(struct request_queue *q,
					   struct bio *bio)
{
	/*
	 * For regular block devices or read operations, use the context plug
	 * which may be NULL if blk_start_plug() was not executed.
	 */
	if (!blk_queue_is_zoned(q) || !op_is_write(bio_op(bio)))
		return current->plug;

	/* Zoned block device write operation case: do not plug the BIO */
	return NULL;
}

#endif