1d6d48196SJens Axboe /* 2d6d48196SJens Axboe * Functions related to segment and merge handling 3d6d48196SJens Axboe */ 4d6d48196SJens Axboe #include <linux/kernel.h> 5d6d48196SJens Axboe #include <linux/module.h> 6d6d48196SJens Axboe #include <linux/bio.h> 7d6d48196SJens Axboe #include <linux/blkdev.h> 8d6d48196SJens Axboe #include <linux/scatterlist.h> 9d6d48196SJens Axboe 10cda22646SMike Krinkin #include <trace/events/block.h> 11cda22646SMike Krinkin 12d6d48196SJens Axboe #include "blk.h" 13d6d48196SJens Axboe 1454efd50bSKent Overstreet static struct bio *blk_bio_discard_split(struct request_queue *q, 1554efd50bSKent Overstreet struct bio *bio, 16bdced438SMing Lei struct bio_set *bs, 17bdced438SMing Lei unsigned *nsegs) 1854efd50bSKent Overstreet { 1954efd50bSKent Overstreet unsigned int max_discard_sectors, granularity; 2054efd50bSKent Overstreet int alignment; 2154efd50bSKent Overstreet sector_t tmp; 2254efd50bSKent Overstreet unsigned split_sectors; 2354efd50bSKent Overstreet 24bdced438SMing Lei *nsegs = 1; 25bdced438SMing Lei 2654efd50bSKent Overstreet /* Zero-sector (unknown) and one-sector granularities are the same. */ 2754efd50bSKent Overstreet granularity = max(q->limits.discard_granularity >> 9, 1U); 2854efd50bSKent Overstreet 2954efd50bSKent Overstreet max_discard_sectors = min(q->limits.max_discard_sectors, UINT_MAX >> 9); 3054efd50bSKent Overstreet max_discard_sectors -= max_discard_sectors % granularity; 3154efd50bSKent Overstreet 3254efd50bSKent Overstreet if (unlikely(!max_discard_sectors)) { 3354efd50bSKent Overstreet /* XXX: warn */ 3454efd50bSKent Overstreet return NULL; 3554efd50bSKent Overstreet } 3654efd50bSKent Overstreet 3754efd50bSKent Overstreet if (bio_sectors(bio) <= max_discard_sectors) 3854efd50bSKent Overstreet return NULL; 3954efd50bSKent Overstreet 4054efd50bSKent Overstreet split_sectors = max_discard_sectors; 4154efd50bSKent Overstreet 4254efd50bSKent Overstreet /* 4354efd50bSKent Overstreet * If the next starting sector would be misaligned, stop the discard at 4454efd50bSKent Overstreet * the previous aligned sector. 4554efd50bSKent Overstreet */ 4654efd50bSKent Overstreet alignment = (q->limits.discard_alignment >> 9) % granularity; 4754efd50bSKent Overstreet 4854efd50bSKent Overstreet tmp = bio->bi_iter.bi_sector + split_sectors - alignment; 4954efd50bSKent Overstreet tmp = sector_div(tmp, granularity); 5054efd50bSKent Overstreet 5154efd50bSKent Overstreet if (split_sectors > tmp) 5254efd50bSKent Overstreet split_sectors -= tmp; 5354efd50bSKent Overstreet 5454efd50bSKent Overstreet return bio_split(bio, split_sectors, GFP_NOIO, bs); 5554efd50bSKent Overstreet } 5654efd50bSKent Overstreet 5754efd50bSKent Overstreet static struct bio *blk_bio_write_same_split(struct request_queue *q, 5854efd50bSKent Overstreet struct bio *bio, 59bdced438SMing Lei struct bio_set *bs, 60bdced438SMing Lei unsigned *nsegs) 6154efd50bSKent Overstreet { 62bdced438SMing Lei *nsegs = 1; 63bdced438SMing Lei 6454efd50bSKent Overstreet if (!q->limits.max_write_same_sectors) 6554efd50bSKent Overstreet return NULL; 6654efd50bSKent Overstreet 6754efd50bSKent Overstreet if (bio_sectors(bio) <= q->limits.max_write_same_sectors) 6854efd50bSKent Overstreet return NULL; 6954efd50bSKent Overstreet 7054efd50bSKent Overstreet return bio_split(bio, q->limits.max_write_same_sectors, GFP_NOIO, bs); 7154efd50bSKent Overstreet } 7254efd50bSKent Overstreet 73d0e5fbb0SMing Lei static inline unsigned get_max_io_size(struct request_queue *q, 74d0e5fbb0SMing Lei struct bio *bio) 75d0e5fbb0SMing Lei { 76d0e5fbb0SMing Lei unsigned sectors = blk_max_size_offset(q, bio->bi_iter.bi_sector); 77d0e5fbb0SMing Lei unsigned mask = queue_logical_block_size(q) - 1; 78d0e5fbb0SMing Lei 79d0e5fbb0SMing Lei /* aligned to logical block size */ 80d0e5fbb0SMing Lei sectors &= ~(mask >> 9); 81d0e5fbb0SMing Lei 82d0e5fbb0SMing Lei return sectors; 83d0e5fbb0SMing Lei } 84d0e5fbb0SMing Lei 8554efd50bSKent Overstreet static struct bio *blk_bio_segment_split(struct request_queue *q, 8654efd50bSKent Overstreet struct bio *bio, 87bdced438SMing Lei struct bio_set *bs, 88bdced438SMing Lei unsigned *segs) 8954efd50bSKent Overstreet { 905014c311SJens Axboe struct bio_vec bv, bvprv, *bvprvp = NULL; 9154efd50bSKent Overstreet struct bvec_iter iter; 928ae12666SKent Overstreet unsigned seg_size = 0, nsegs = 0, sectors = 0; 9302e70742SMing Lei unsigned front_seg_size = bio->bi_seg_front_size; 9402e70742SMing Lei bool do_split = true; 9502e70742SMing Lei struct bio *new = NULL; 96d0e5fbb0SMing Lei const unsigned max_sectors = get_max_io_size(q, bio); 9754efd50bSKent Overstreet 9854efd50bSKent Overstreet bio_for_each_segment(bv, bio, iter) { 9954efd50bSKent Overstreet /* 10054efd50bSKent Overstreet * If the queue doesn't support SG gaps and adding this 10154efd50bSKent Overstreet * offset would create a gap, disallow it. 10254efd50bSKent Overstreet */ 1035014c311SJens Axboe if (bvprvp && bvec_gap_to_prev(q, bvprvp, bv.bv_offset)) 10454efd50bSKent Overstreet goto split; 10554efd50bSKent Overstreet 106d0e5fbb0SMing Lei if (sectors + (bv.bv_len >> 9) > max_sectors) { 107e36f6204SKeith Busch /* 108e36f6204SKeith Busch * Consider this a new segment if we're splitting in 109e36f6204SKeith Busch * the middle of this vector. 110e36f6204SKeith Busch */ 111e36f6204SKeith Busch if (nsegs < queue_max_segments(q) && 112d0e5fbb0SMing Lei sectors < max_sectors) { 113e36f6204SKeith Busch nsegs++; 114d0e5fbb0SMing Lei sectors = max_sectors; 115e36f6204SKeith Busch } 116d0e5fbb0SMing Lei if (sectors) 117e36f6204SKeith Busch goto split; 118d0e5fbb0SMing Lei /* Make this single bvec as the 1st segment */ 119e36f6204SKeith Busch } 120e36f6204SKeith Busch 1215014c311SJens Axboe if (bvprvp && blk_queue_cluster(q)) { 12254efd50bSKent Overstreet if (seg_size + bv.bv_len > queue_max_segment_size(q)) 12354efd50bSKent Overstreet goto new_segment; 1245014c311SJens Axboe if (!BIOVEC_PHYS_MERGEABLE(bvprvp, &bv)) 12554efd50bSKent Overstreet goto new_segment; 1265014c311SJens Axboe if (!BIOVEC_SEG_BOUNDARY(q, bvprvp, &bv)) 12754efd50bSKent Overstreet goto new_segment; 12854efd50bSKent Overstreet 12954efd50bSKent Overstreet seg_size += bv.bv_len; 13054efd50bSKent Overstreet bvprv = bv; 131578270bfSMing Lei bvprvp = &bvprv; 13252cc6eeaSMing Lei sectors += bv.bv_len >> 9; 133a88d32afSMing Lei 134a88d32afSMing Lei if (nsegs == 1 && seg_size > front_seg_size) 135a88d32afSMing Lei front_seg_size = seg_size; 13654efd50bSKent Overstreet continue; 13754efd50bSKent Overstreet } 13854efd50bSKent Overstreet new_segment: 13954efd50bSKent Overstreet if (nsegs == queue_max_segments(q)) 14054efd50bSKent Overstreet goto split; 14154efd50bSKent Overstreet 14254efd50bSKent Overstreet nsegs++; 14354efd50bSKent Overstreet bvprv = bv; 144578270bfSMing Lei bvprvp = &bvprv; 14554efd50bSKent Overstreet seg_size = bv.bv_len; 14652cc6eeaSMing Lei sectors += bv.bv_len >> 9; 14702e70742SMing Lei 14802e70742SMing Lei if (nsegs == 1 && seg_size > front_seg_size) 14902e70742SMing Lei front_seg_size = seg_size; 15054efd50bSKent Overstreet } 15154efd50bSKent Overstreet 15202e70742SMing Lei do_split = false; 15354efd50bSKent Overstreet split: 154bdced438SMing Lei *segs = nsegs; 15502e70742SMing Lei 15602e70742SMing Lei if (do_split) { 15702e70742SMing Lei new = bio_split(bio, sectors, GFP_NOIO, bs); 15802e70742SMing Lei if (new) 15902e70742SMing Lei bio = new; 16002e70742SMing Lei } 16102e70742SMing Lei 16202e70742SMing Lei bio->bi_seg_front_size = front_seg_size; 16302e70742SMing Lei if (seg_size > bio->bi_seg_back_size) 16402e70742SMing Lei bio->bi_seg_back_size = seg_size; 16502e70742SMing Lei 16602e70742SMing Lei return do_split ? new : NULL; 16754efd50bSKent Overstreet } 16854efd50bSKent Overstreet 16954efd50bSKent Overstreet void blk_queue_split(struct request_queue *q, struct bio **bio, 17054efd50bSKent Overstreet struct bio_set *bs) 17154efd50bSKent Overstreet { 172bdced438SMing Lei struct bio *split, *res; 173bdced438SMing Lei unsigned nsegs; 17454efd50bSKent Overstreet 175*7afafc8aSAdrian Hunter switch (bio_op(*bio)) { 176*7afafc8aSAdrian Hunter case REQ_OP_DISCARD: 177*7afafc8aSAdrian Hunter case REQ_OP_SECURE_ERASE: 178bdced438SMing Lei split = blk_bio_discard_split(q, *bio, bs, &nsegs); 179*7afafc8aSAdrian Hunter break; 180*7afafc8aSAdrian Hunter case REQ_OP_WRITE_SAME: 181bdced438SMing Lei split = blk_bio_write_same_split(q, *bio, bs, &nsegs); 182*7afafc8aSAdrian Hunter break; 183*7afafc8aSAdrian Hunter default: 184bdced438SMing Lei split = blk_bio_segment_split(q, *bio, q->bio_split, &nsegs); 185*7afafc8aSAdrian Hunter break; 186*7afafc8aSAdrian Hunter } 187bdced438SMing Lei 188bdced438SMing Lei /* physical segments can be figured out during splitting */ 189bdced438SMing Lei res = split ? split : *bio; 190bdced438SMing Lei res->bi_phys_segments = nsegs; 191bdced438SMing Lei bio_set_flag(res, BIO_SEG_VALID); 19254efd50bSKent Overstreet 19354efd50bSKent Overstreet if (split) { 1946ac45aebSMing Lei /* there isn't chance to merge the splitted bio */ 1951eff9d32SJens Axboe split->bi_opf |= REQ_NOMERGE; 1966ac45aebSMing Lei 19754efd50bSKent Overstreet bio_chain(split, *bio); 198cda22646SMike Krinkin trace_block_split(q, split, (*bio)->bi_iter.bi_sector); 19954efd50bSKent Overstreet generic_make_request(*bio); 20054efd50bSKent Overstreet *bio = split; 20154efd50bSKent Overstreet } 20254efd50bSKent Overstreet } 20354efd50bSKent Overstreet EXPORT_SYMBOL(blk_queue_split); 20454efd50bSKent Overstreet 2051e428079SJens Axboe static unsigned int __blk_recalc_rq_segments(struct request_queue *q, 20607388549SMing Lei struct bio *bio, 20707388549SMing Lei bool no_sg_merge) 208d6d48196SJens Axboe { 2097988613bSKent Overstreet struct bio_vec bv, bvprv = { NULL }; 21054efd50bSKent Overstreet int cluster, prev = 0; 2111e428079SJens Axboe unsigned int seg_size, nr_phys_segs; 21259247eaeSJens Axboe struct bio *fbio, *bbio; 2137988613bSKent Overstreet struct bvec_iter iter; 214d6d48196SJens Axboe 2151e428079SJens Axboe if (!bio) 2161e428079SJens Axboe return 0; 217d6d48196SJens Axboe 2185cb8850cSKent Overstreet /* 2195cb8850cSKent Overstreet * This should probably be returning 0, but blk_add_request_payload() 2205cb8850cSKent Overstreet * (Christoph!!!!) 2215cb8850cSKent Overstreet */ 222*7afafc8aSAdrian Hunter if (bio_op(bio) == REQ_OP_DISCARD || bio_op(bio) == REQ_OP_SECURE_ERASE) 2235cb8850cSKent Overstreet return 1; 2245cb8850cSKent Overstreet 22595fe6c1aSMike Christie if (bio_op(bio) == REQ_OP_WRITE_SAME) 2265cb8850cSKent Overstreet return 1; 2275cb8850cSKent Overstreet 2281e428079SJens Axboe fbio = bio; 229e692cb66SMartin K. Petersen cluster = blk_queue_cluster(q); 2305df97b91SMikulas Patocka seg_size = 0; 2312c8919deSAndi Kleen nr_phys_segs = 0; 2321e428079SJens Axboe for_each_bio(bio) { 2337988613bSKent Overstreet bio_for_each_segment(bv, bio, iter) { 234d6d48196SJens Axboe /* 23505f1dd53SJens Axboe * If SG merging is disabled, each bio vector is 23605f1dd53SJens Axboe * a segment 23705f1dd53SJens Axboe */ 23805f1dd53SJens Axboe if (no_sg_merge) 23905f1dd53SJens Axboe goto new_segment; 24005f1dd53SJens Axboe 24154efd50bSKent Overstreet if (prev && cluster) { 2427988613bSKent Overstreet if (seg_size + bv.bv_len 243ae03bf63SMartin K. Petersen > queue_max_segment_size(q)) 244d6d48196SJens Axboe goto new_segment; 2457988613bSKent Overstreet if (!BIOVEC_PHYS_MERGEABLE(&bvprv, &bv)) 246d6d48196SJens Axboe goto new_segment; 2477988613bSKent Overstreet if (!BIOVEC_SEG_BOUNDARY(q, &bvprv, &bv)) 248d6d48196SJens Axboe goto new_segment; 249d6d48196SJens Axboe 2507988613bSKent Overstreet seg_size += bv.bv_len; 251d6d48196SJens Axboe bvprv = bv; 252d6d48196SJens Axboe continue; 253d6d48196SJens Axboe } 254d6d48196SJens Axboe new_segment: 2551e428079SJens Axboe if (nr_phys_segs == 1 && seg_size > 2561e428079SJens Axboe fbio->bi_seg_front_size) 2571e428079SJens Axboe fbio->bi_seg_front_size = seg_size; 25886771427SFUJITA Tomonori 259d6d48196SJens Axboe nr_phys_segs++; 260d6d48196SJens Axboe bvprv = bv; 26154efd50bSKent Overstreet prev = 1; 2627988613bSKent Overstreet seg_size = bv.bv_len; 263d6d48196SJens Axboe } 26459247eaeSJens Axboe bbio = bio; 2651e428079SJens Axboe } 266d6d48196SJens Axboe 26759247eaeSJens Axboe if (nr_phys_segs == 1 && seg_size > fbio->bi_seg_front_size) 26859247eaeSJens Axboe fbio->bi_seg_front_size = seg_size; 26959247eaeSJens Axboe if (seg_size > bbio->bi_seg_back_size) 27059247eaeSJens Axboe bbio->bi_seg_back_size = seg_size; 2711e428079SJens Axboe 2721e428079SJens Axboe return nr_phys_segs; 2731e428079SJens Axboe } 2741e428079SJens Axboe 2751e428079SJens Axboe void blk_recalc_rq_segments(struct request *rq) 2761e428079SJens Axboe { 27707388549SMing Lei bool no_sg_merge = !!test_bit(QUEUE_FLAG_NO_SG_MERGE, 27807388549SMing Lei &rq->q->queue_flags); 27907388549SMing Lei 28007388549SMing Lei rq->nr_phys_segments = __blk_recalc_rq_segments(rq->q, rq->bio, 28107388549SMing Lei no_sg_merge); 282d6d48196SJens Axboe } 283d6d48196SJens Axboe 284d6d48196SJens Axboe void blk_recount_segments(struct request_queue *q, struct bio *bio) 285d6d48196SJens Axboe { 2867f60dcaaSMing Lei unsigned short seg_cnt; 287764f612cSMing Lei 2887f60dcaaSMing Lei /* estimate segment number by bi_vcnt for non-cloned bio */ 2897f60dcaaSMing Lei if (bio_flagged(bio, BIO_CLONED)) 2907f60dcaaSMing Lei seg_cnt = bio_segments(bio); 2917f60dcaaSMing Lei else 2927f60dcaaSMing Lei seg_cnt = bio->bi_vcnt; 2937f60dcaaSMing Lei 2947f60dcaaSMing Lei if (test_bit(QUEUE_FLAG_NO_SG_MERGE, &q->queue_flags) && 2957f60dcaaSMing Lei (seg_cnt < queue_max_segments(q))) 2967f60dcaaSMing Lei bio->bi_phys_segments = seg_cnt; 29705f1dd53SJens Axboe else { 298d6d48196SJens Axboe struct bio *nxt = bio->bi_next; 2991e428079SJens Axboe 300d6d48196SJens Axboe bio->bi_next = NULL; 3017f60dcaaSMing Lei bio->bi_phys_segments = __blk_recalc_rq_segments(q, bio, false); 302d6d48196SJens Axboe bio->bi_next = nxt; 30305f1dd53SJens Axboe } 30405f1dd53SJens Axboe 305b7c44ed9SJens Axboe bio_set_flag(bio, BIO_SEG_VALID); 306d6d48196SJens Axboe } 307d6d48196SJens Axboe EXPORT_SYMBOL(blk_recount_segments); 308d6d48196SJens Axboe 309d6d48196SJens Axboe static int blk_phys_contig_segment(struct request_queue *q, struct bio *bio, 310d6d48196SJens Axboe struct bio *nxt) 311d6d48196SJens Axboe { 3122b8221e1SKent Overstreet struct bio_vec end_bv = { NULL }, nxt_bv; 313f619d254SKent Overstreet 314e692cb66SMartin K. Petersen if (!blk_queue_cluster(q)) 315d6d48196SJens Axboe return 0; 316d6d48196SJens Axboe 31786771427SFUJITA Tomonori if (bio->bi_seg_back_size + nxt->bi_seg_front_size > 318ae03bf63SMartin K. Petersen queue_max_segment_size(q)) 319d6d48196SJens Axboe return 0; 320d6d48196SJens Axboe 321e17fc0a1SDavid Woodhouse if (!bio_has_data(bio)) 322e17fc0a1SDavid Woodhouse return 1; 323e17fc0a1SDavid Woodhouse 324e827091cSMing Lei bio_get_last_bvec(bio, &end_bv); 325e827091cSMing Lei bio_get_first_bvec(nxt, &nxt_bv); 326f619d254SKent Overstreet 327f619d254SKent Overstreet if (!BIOVEC_PHYS_MERGEABLE(&end_bv, &nxt_bv)) 328e17fc0a1SDavid Woodhouse return 0; 329e17fc0a1SDavid Woodhouse 330d6d48196SJens Axboe /* 331e17fc0a1SDavid Woodhouse * bio and nxt are contiguous in memory; check if the queue allows 332d6d48196SJens Axboe * these two to be merged into one 333d6d48196SJens Axboe */ 334f619d254SKent Overstreet if (BIOVEC_SEG_BOUNDARY(q, &end_bv, &nxt_bv)) 335d6d48196SJens Axboe return 1; 336d6d48196SJens Axboe 337d6d48196SJens Axboe return 0; 338d6d48196SJens Axboe } 339d6d48196SJens Axboe 3407988613bSKent Overstreet static inline void 341963ab9e5SAsias He __blk_segment_map_sg(struct request_queue *q, struct bio_vec *bvec, 3427988613bSKent Overstreet struct scatterlist *sglist, struct bio_vec *bvprv, 343963ab9e5SAsias He struct scatterlist **sg, int *nsegs, int *cluster) 344963ab9e5SAsias He { 345963ab9e5SAsias He 346963ab9e5SAsias He int nbytes = bvec->bv_len; 347963ab9e5SAsias He 3487988613bSKent Overstreet if (*sg && *cluster) { 349963ab9e5SAsias He if ((*sg)->length + nbytes > queue_max_segment_size(q)) 350963ab9e5SAsias He goto new_segment; 351963ab9e5SAsias He 3527988613bSKent Overstreet if (!BIOVEC_PHYS_MERGEABLE(bvprv, bvec)) 353963ab9e5SAsias He goto new_segment; 3547988613bSKent Overstreet if (!BIOVEC_SEG_BOUNDARY(q, bvprv, bvec)) 355963ab9e5SAsias He goto new_segment; 356963ab9e5SAsias He 357963ab9e5SAsias He (*sg)->length += nbytes; 358963ab9e5SAsias He } else { 359963ab9e5SAsias He new_segment: 360963ab9e5SAsias He if (!*sg) 361963ab9e5SAsias He *sg = sglist; 362963ab9e5SAsias He else { 363963ab9e5SAsias He /* 364963ab9e5SAsias He * If the driver previously mapped a shorter 365963ab9e5SAsias He * list, we could see a termination bit 366963ab9e5SAsias He * prematurely unless it fully inits the sg 367963ab9e5SAsias He * table on each mapping. We KNOW that there 368963ab9e5SAsias He * must be more entries here or the driver 369963ab9e5SAsias He * would be buggy, so force clear the 370963ab9e5SAsias He * termination bit to avoid doing a full 371963ab9e5SAsias He * sg_init_table() in drivers for each command. 372963ab9e5SAsias He */ 373c8164d89SPaolo Bonzini sg_unmark_end(*sg); 374963ab9e5SAsias He *sg = sg_next(*sg); 375963ab9e5SAsias He } 376963ab9e5SAsias He 377963ab9e5SAsias He sg_set_page(*sg, bvec->bv_page, nbytes, bvec->bv_offset); 378963ab9e5SAsias He (*nsegs)++; 379963ab9e5SAsias He } 3807988613bSKent Overstreet *bvprv = *bvec; 381963ab9e5SAsias He } 382963ab9e5SAsias He 3835cb8850cSKent Overstreet static int __blk_bios_map_sg(struct request_queue *q, struct bio *bio, 3845cb8850cSKent Overstreet struct scatterlist *sglist, 3855cb8850cSKent Overstreet struct scatterlist **sg) 3865cb8850cSKent Overstreet { 3875cb8850cSKent Overstreet struct bio_vec bvec, bvprv = { NULL }; 3885cb8850cSKent Overstreet struct bvec_iter iter; 3895cb8850cSKent Overstreet int nsegs, cluster; 3905cb8850cSKent Overstreet 3915cb8850cSKent Overstreet nsegs = 0; 3925cb8850cSKent Overstreet cluster = blk_queue_cluster(q); 3935cb8850cSKent Overstreet 394*7afafc8aSAdrian Hunter switch (bio_op(bio)) { 395*7afafc8aSAdrian Hunter case REQ_OP_DISCARD: 396*7afafc8aSAdrian Hunter case REQ_OP_SECURE_ERASE: 3975cb8850cSKent Overstreet /* 3985cb8850cSKent Overstreet * This is a hack - drivers should be neither modifying the 3995cb8850cSKent Overstreet * biovec, nor relying on bi_vcnt - but because of 4005cb8850cSKent Overstreet * blk_add_request_payload(), a discard bio may or may not have 4015cb8850cSKent Overstreet * a payload we need to set up here (thank you Christoph) and 4025cb8850cSKent Overstreet * bi_vcnt is really the only way of telling if we need to. 4035cb8850cSKent Overstreet */ 404*7afafc8aSAdrian Hunter if (!bio->bi_vcnt) 4055cb8850cSKent Overstreet return 0; 406*7afafc8aSAdrian Hunter /* Fall through */ 407*7afafc8aSAdrian Hunter case REQ_OP_WRITE_SAME: 4085cb8850cSKent Overstreet *sg = sglist; 4095cb8850cSKent Overstreet bvec = bio_iovec(bio); 4105cb8850cSKent Overstreet sg_set_page(*sg, bvec.bv_page, bvec.bv_len, bvec.bv_offset); 4115cb8850cSKent Overstreet return 1; 412*7afafc8aSAdrian Hunter default: 413*7afafc8aSAdrian Hunter break; 4145cb8850cSKent Overstreet } 4155cb8850cSKent Overstreet 4165cb8850cSKent Overstreet for_each_bio(bio) 4175cb8850cSKent Overstreet bio_for_each_segment(bvec, bio, iter) 4185cb8850cSKent Overstreet __blk_segment_map_sg(q, &bvec, sglist, &bvprv, sg, 4195cb8850cSKent Overstreet &nsegs, &cluster); 4205cb8850cSKent Overstreet 4215cb8850cSKent Overstreet return nsegs; 4225cb8850cSKent Overstreet } 4235cb8850cSKent Overstreet 424d6d48196SJens Axboe /* 425d6d48196SJens Axboe * map a request to scatterlist, return number of sg entries setup. Caller 426d6d48196SJens Axboe * must make sure sg can hold rq->nr_phys_segments entries 427d6d48196SJens Axboe */ 428d6d48196SJens Axboe int blk_rq_map_sg(struct request_queue *q, struct request *rq, 429d6d48196SJens Axboe struct scatterlist *sglist) 430d6d48196SJens Axboe { 4315cb8850cSKent Overstreet struct scatterlist *sg = NULL; 4325cb8850cSKent Overstreet int nsegs = 0; 433d6d48196SJens Axboe 4345cb8850cSKent Overstreet if (rq->bio) 4355cb8850cSKent Overstreet nsegs = __blk_bios_map_sg(q, rq->bio, sglist, &sg); 436f18573abSFUJITA Tomonori 437f18573abSFUJITA Tomonori if (unlikely(rq->cmd_flags & REQ_COPY_USER) && 4382e46e8b2STejun Heo (blk_rq_bytes(rq) & q->dma_pad_mask)) { 4392e46e8b2STejun Heo unsigned int pad_len = 4402e46e8b2STejun Heo (q->dma_pad_mask & ~blk_rq_bytes(rq)) + 1; 441f18573abSFUJITA Tomonori 442f18573abSFUJITA Tomonori sg->length += pad_len; 443f18573abSFUJITA Tomonori rq->extra_len += pad_len; 444f18573abSFUJITA Tomonori } 445f18573abSFUJITA Tomonori 4462fb98e84STejun Heo if (q->dma_drain_size && q->dma_drain_needed(rq)) { 447a8ebb056SMike Christie if (op_is_write(req_op(rq))) 448db0a2e00STejun Heo memset(q->dma_drain_buffer, 0, q->dma_drain_size); 449db0a2e00STejun Heo 450da81ed16SDan Williams sg_unmark_end(sg); 451d6d48196SJens Axboe sg = sg_next(sg); 452d6d48196SJens Axboe sg_set_page(sg, virt_to_page(q->dma_drain_buffer), 453d6d48196SJens Axboe q->dma_drain_size, 454d6d48196SJens Axboe ((unsigned long)q->dma_drain_buffer) & 455d6d48196SJens Axboe (PAGE_SIZE - 1)); 456d6d48196SJens Axboe nsegs++; 4577a85f889SFUJITA Tomonori rq->extra_len += q->dma_drain_size; 458d6d48196SJens Axboe } 459d6d48196SJens Axboe 460d6d48196SJens Axboe if (sg) 461d6d48196SJens Axboe sg_mark_end(sg); 462d6d48196SJens Axboe 46312e57f59SMing Lei /* 46412e57f59SMing Lei * Something must have been wrong if the figured number of 46512e57f59SMing Lei * segment is bigger than number of req's physical segments 46612e57f59SMing Lei */ 46712e57f59SMing Lei WARN_ON(nsegs > rq->nr_phys_segments); 46812e57f59SMing Lei 469d6d48196SJens Axboe return nsegs; 470d6d48196SJens Axboe } 471d6d48196SJens Axboe EXPORT_SYMBOL(blk_rq_map_sg); 472d6d48196SJens Axboe 473d6d48196SJens Axboe static inline int ll_new_hw_segment(struct request_queue *q, 474d6d48196SJens Axboe struct request *req, 475d6d48196SJens Axboe struct bio *bio) 476d6d48196SJens Axboe { 477d6d48196SJens Axboe int nr_phys_segs = bio_phys_segments(q, bio); 478d6d48196SJens Axboe 47913f05c8dSMartin K. Petersen if (req->nr_phys_segments + nr_phys_segs > queue_max_segments(q)) 48013f05c8dSMartin K. Petersen goto no_merge; 48113f05c8dSMartin K. Petersen 4824eaf99beSMartin K. Petersen if (blk_integrity_merge_bio(q, req, bio) == false) 48313f05c8dSMartin K. Petersen goto no_merge; 484d6d48196SJens Axboe 485d6d48196SJens Axboe /* 486d6d48196SJens Axboe * This will form the start of a new hw segment. Bump both 487d6d48196SJens Axboe * counters. 488d6d48196SJens Axboe */ 489d6d48196SJens Axboe req->nr_phys_segments += nr_phys_segs; 490d6d48196SJens Axboe return 1; 49113f05c8dSMartin K. Petersen 49213f05c8dSMartin K. Petersen no_merge: 49313f05c8dSMartin K. Petersen req->cmd_flags |= REQ_NOMERGE; 49413f05c8dSMartin K. Petersen if (req == q->last_merge) 49513f05c8dSMartin K. Petersen q->last_merge = NULL; 49613f05c8dSMartin K. Petersen return 0; 497d6d48196SJens Axboe } 498d6d48196SJens Axboe 499d6d48196SJens Axboe int ll_back_merge_fn(struct request_queue *q, struct request *req, 500d6d48196SJens Axboe struct bio *bio) 501d6d48196SJens Axboe { 5025e7c4274SJens Axboe if (req_gap_back_merge(req, bio)) 5035e7c4274SJens Axboe return 0; 5047f39add3SSagi Grimberg if (blk_integrity_rq(req) && 5057f39add3SSagi Grimberg integrity_req_gap_back_merge(req, bio)) 5067f39add3SSagi Grimberg return 0; 507f31dc1cdSMartin K. Petersen if (blk_rq_sectors(req) + bio_sectors(bio) > 50817007f39SDamien Le Moal blk_rq_get_max_sectors(req, blk_rq_pos(req))) { 509d6d48196SJens Axboe req->cmd_flags |= REQ_NOMERGE; 510d6d48196SJens Axboe if (req == q->last_merge) 511d6d48196SJens Axboe q->last_merge = NULL; 512d6d48196SJens Axboe return 0; 513d6d48196SJens Axboe } 5142cdf79caSJens Axboe if (!bio_flagged(req->biotail, BIO_SEG_VALID)) 515d6d48196SJens Axboe blk_recount_segments(q, req->biotail); 5162cdf79caSJens Axboe if (!bio_flagged(bio, BIO_SEG_VALID)) 517d6d48196SJens Axboe blk_recount_segments(q, bio); 518d6d48196SJens Axboe 519d6d48196SJens Axboe return ll_new_hw_segment(q, req, bio); 520d6d48196SJens Axboe } 521d6d48196SJens Axboe 522d6d48196SJens Axboe int ll_front_merge_fn(struct request_queue *q, struct request *req, 523d6d48196SJens Axboe struct bio *bio) 524d6d48196SJens Axboe { 5255e7c4274SJens Axboe 5265e7c4274SJens Axboe if (req_gap_front_merge(req, bio)) 5275e7c4274SJens Axboe return 0; 5287f39add3SSagi Grimberg if (blk_integrity_rq(req) && 5297f39add3SSagi Grimberg integrity_req_gap_front_merge(req, bio)) 5307f39add3SSagi Grimberg return 0; 531f31dc1cdSMartin K. Petersen if (blk_rq_sectors(req) + bio_sectors(bio) > 53217007f39SDamien Le Moal blk_rq_get_max_sectors(req, bio->bi_iter.bi_sector)) { 533d6d48196SJens Axboe req->cmd_flags |= REQ_NOMERGE; 534d6d48196SJens Axboe if (req == q->last_merge) 535d6d48196SJens Axboe q->last_merge = NULL; 536d6d48196SJens Axboe return 0; 537d6d48196SJens Axboe } 5382cdf79caSJens Axboe if (!bio_flagged(bio, BIO_SEG_VALID)) 539d6d48196SJens Axboe blk_recount_segments(q, bio); 5402cdf79caSJens Axboe if (!bio_flagged(req->bio, BIO_SEG_VALID)) 541d6d48196SJens Axboe blk_recount_segments(q, req->bio); 542d6d48196SJens Axboe 543d6d48196SJens Axboe return ll_new_hw_segment(q, req, bio); 544d6d48196SJens Axboe } 545d6d48196SJens Axboe 546e7e24500SJens Axboe /* 547e7e24500SJens Axboe * blk-mq uses req->special to carry normal driver per-request payload, it 548e7e24500SJens Axboe * does not indicate a prepared command that we cannot merge with. 549e7e24500SJens Axboe */ 550e7e24500SJens Axboe static bool req_no_special_merge(struct request *req) 551e7e24500SJens Axboe { 552e7e24500SJens Axboe struct request_queue *q = req->q; 553e7e24500SJens Axboe 554e7e24500SJens Axboe return !q->mq_ops && req->special; 555e7e24500SJens Axboe } 556e7e24500SJens Axboe 557d6d48196SJens Axboe static int ll_merge_requests_fn(struct request_queue *q, struct request *req, 558d6d48196SJens Axboe struct request *next) 559d6d48196SJens Axboe { 560d6d48196SJens Axboe int total_phys_segments; 56186771427SFUJITA Tomonori unsigned int seg_size = 56286771427SFUJITA Tomonori req->biotail->bi_seg_back_size + next->bio->bi_seg_front_size; 563d6d48196SJens Axboe 564d6d48196SJens Axboe /* 565d6d48196SJens Axboe * First check if the either of the requests are re-queued 566d6d48196SJens Axboe * requests. Can't merge them if they are. 567d6d48196SJens Axboe */ 568e7e24500SJens Axboe if (req_no_special_merge(req) || req_no_special_merge(next)) 569d6d48196SJens Axboe return 0; 570d6d48196SJens Axboe 5715e7c4274SJens Axboe if (req_gap_back_merge(req, next->bio)) 572854fbb9cSKeith Busch return 0; 573854fbb9cSKeith Busch 574d6d48196SJens Axboe /* 575d6d48196SJens Axboe * Will it become too large? 576d6d48196SJens Axboe */ 577f31dc1cdSMartin K. Petersen if ((blk_rq_sectors(req) + blk_rq_sectors(next)) > 57817007f39SDamien Le Moal blk_rq_get_max_sectors(req, blk_rq_pos(req))) 579d6d48196SJens Axboe return 0; 580d6d48196SJens Axboe 581d6d48196SJens Axboe total_phys_segments = req->nr_phys_segments + next->nr_phys_segments; 58286771427SFUJITA Tomonori if (blk_phys_contig_segment(q, req->biotail, next->bio)) { 58386771427SFUJITA Tomonori if (req->nr_phys_segments == 1) 58486771427SFUJITA Tomonori req->bio->bi_seg_front_size = seg_size; 58586771427SFUJITA Tomonori if (next->nr_phys_segments == 1) 58686771427SFUJITA Tomonori next->biotail->bi_seg_back_size = seg_size; 587d6d48196SJens Axboe total_phys_segments--; 58886771427SFUJITA Tomonori } 589d6d48196SJens Axboe 5908a78362cSMartin K. Petersen if (total_phys_segments > queue_max_segments(q)) 591d6d48196SJens Axboe return 0; 592d6d48196SJens Axboe 5934eaf99beSMartin K. Petersen if (blk_integrity_merge_rq(q, req, next) == false) 59413f05c8dSMartin K. Petersen return 0; 59513f05c8dSMartin K. Petersen 596d6d48196SJens Axboe /* Merge is OK... */ 597d6d48196SJens Axboe req->nr_phys_segments = total_phys_segments; 598d6d48196SJens Axboe return 1; 599d6d48196SJens Axboe } 600d6d48196SJens Axboe 60180a761fdSTejun Heo /** 60280a761fdSTejun Heo * blk_rq_set_mixed_merge - mark a request as mixed merge 60380a761fdSTejun Heo * @rq: request to mark as mixed merge 60480a761fdSTejun Heo * 60580a761fdSTejun Heo * Description: 60680a761fdSTejun Heo * @rq is about to be mixed merged. Make sure the attributes 60780a761fdSTejun Heo * which can be mixed are set in each bio and mark @rq as mixed 60880a761fdSTejun Heo * merged. 60980a761fdSTejun Heo */ 61080a761fdSTejun Heo void blk_rq_set_mixed_merge(struct request *rq) 61180a761fdSTejun Heo { 61280a761fdSTejun Heo unsigned int ff = rq->cmd_flags & REQ_FAILFAST_MASK; 61380a761fdSTejun Heo struct bio *bio; 61480a761fdSTejun Heo 61580a761fdSTejun Heo if (rq->cmd_flags & REQ_MIXED_MERGE) 61680a761fdSTejun Heo return; 61780a761fdSTejun Heo 61880a761fdSTejun Heo /* 61980a761fdSTejun Heo * @rq will no longer represent mixable attributes for all the 62080a761fdSTejun Heo * contained bios. It will just track those of the first one. 62180a761fdSTejun Heo * Distributes the attributs to each bio. 62280a761fdSTejun Heo */ 62380a761fdSTejun Heo for (bio = rq->bio; bio; bio = bio->bi_next) { 6241eff9d32SJens Axboe WARN_ON_ONCE((bio->bi_opf & REQ_FAILFAST_MASK) && 6251eff9d32SJens Axboe (bio->bi_opf & REQ_FAILFAST_MASK) != ff); 6261eff9d32SJens Axboe bio->bi_opf |= ff; 62780a761fdSTejun Heo } 62880a761fdSTejun Heo rq->cmd_flags |= REQ_MIXED_MERGE; 62980a761fdSTejun Heo } 63080a761fdSTejun Heo 63126308eabSJerome Marchand static void blk_account_io_merge(struct request *req) 63226308eabSJerome Marchand { 63326308eabSJerome Marchand if (blk_do_io_stat(req)) { 63426308eabSJerome Marchand struct hd_struct *part; 63526308eabSJerome Marchand int cpu; 63626308eabSJerome Marchand 63726308eabSJerome Marchand cpu = part_stat_lock(); 63809e099d4SJerome Marchand part = req->part; 63926308eabSJerome Marchand 64026308eabSJerome Marchand part_round_stats(cpu, part); 641316d315bSNikanth Karthikesan part_dec_in_flight(part, rq_data_dir(req)); 64226308eabSJerome Marchand 6436c23a968SJens Axboe hd_struct_put(part); 64426308eabSJerome Marchand part_stat_unlock(); 64526308eabSJerome Marchand } 64626308eabSJerome Marchand } 64726308eabSJerome Marchand 648d6d48196SJens Axboe /* 649d6d48196SJens Axboe * Has to be called with the request spinlock acquired 650d6d48196SJens Axboe */ 651d6d48196SJens Axboe static int attempt_merge(struct request_queue *q, struct request *req, 652d6d48196SJens Axboe struct request *next) 653d6d48196SJens Axboe { 654d6d48196SJens Axboe if (!rq_mergeable(req) || !rq_mergeable(next)) 655d6d48196SJens Axboe return 0; 656d6d48196SJens Axboe 657288dab8aSChristoph Hellwig if (req_op(req) != req_op(next)) 658f31dc1cdSMartin K. Petersen return 0; 659f31dc1cdSMartin K. Petersen 660d6d48196SJens Axboe /* 661d6d48196SJens Axboe * not contiguous 662d6d48196SJens Axboe */ 66383096ebfSTejun Heo if (blk_rq_pos(req) + blk_rq_sectors(req) != blk_rq_pos(next)) 664d6d48196SJens Axboe return 0; 665d6d48196SJens Axboe 666d6d48196SJens Axboe if (rq_data_dir(req) != rq_data_dir(next) 667d6d48196SJens Axboe || req->rq_disk != next->rq_disk 668e7e24500SJens Axboe || req_no_special_merge(next)) 669d6d48196SJens Axboe return 0; 670d6d48196SJens Axboe 6718fe0d473SMike Christie if (req_op(req) == REQ_OP_WRITE_SAME && 6724363ac7cSMartin K. Petersen !blk_write_same_mergeable(req->bio, next->bio)) 6734363ac7cSMartin K. Petersen return 0; 6744363ac7cSMartin K. Petersen 675d6d48196SJens Axboe /* 676d6d48196SJens Axboe * If we are allowed to merge, then append bio list 677d6d48196SJens Axboe * from next to rq and release next. merge_requests_fn 678d6d48196SJens Axboe * will have updated segment counts, update sector 679d6d48196SJens Axboe * counts here. 680d6d48196SJens Axboe */ 681d6d48196SJens Axboe if (!ll_merge_requests_fn(q, req, next)) 682d6d48196SJens Axboe return 0; 683d6d48196SJens Axboe 684d6d48196SJens Axboe /* 68580a761fdSTejun Heo * If failfast settings disagree or any of the two is already 68680a761fdSTejun Heo * a mixed merge, mark both as mixed before proceeding. This 68780a761fdSTejun Heo * makes sure that all involved bios have mixable attributes 68880a761fdSTejun Heo * set properly. 68980a761fdSTejun Heo */ 69080a761fdSTejun Heo if ((req->cmd_flags | next->cmd_flags) & REQ_MIXED_MERGE || 69180a761fdSTejun Heo (req->cmd_flags & REQ_FAILFAST_MASK) != 69280a761fdSTejun Heo (next->cmd_flags & REQ_FAILFAST_MASK)) { 69380a761fdSTejun Heo blk_rq_set_mixed_merge(req); 69480a761fdSTejun Heo blk_rq_set_mixed_merge(next); 69580a761fdSTejun Heo } 69680a761fdSTejun Heo 69780a761fdSTejun Heo /* 698d6d48196SJens Axboe * At this point we have either done a back merge 699d6d48196SJens Axboe * or front merge. We need the smaller start_time of 700d6d48196SJens Axboe * the merged requests to be the current request 701d6d48196SJens Axboe * for accounting purposes. 702d6d48196SJens Axboe */ 703d6d48196SJens Axboe if (time_after(req->start_time, next->start_time)) 704d6d48196SJens Axboe req->start_time = next->start_time; 705d6d48196SJens Axboe 706d6d48196SJens Axboe req->biotail->bi_next = next->bio; 707d6d48196SJens Axboe req->biotail = next->biotail; 708d6d48196SJens Axboe 709a2dec7b3STejun Heo req->__data_len += blk_rq_bytes(next); 710d6d48196SJens Axboe 711d6d48196SJens Axboe elv_merge_requests(q, req, next); 712d6d48196SJens Axboe 71342dad764SJerome Marchand /* 71442dad764SJerome Marchand * 'next' is going away, so update stats accordingly 71542dad764SJerome Marchand */ 71642dad764SJerome Marchand blk_account_io_merge(next); 717d6d48196SJens Axboe 718d6d48196SJens Axboe req->ioprio = ioprio_best(req->ioprio, next->ioprio); 719ab780f1eSJens Axboe if (blk_rq_cpu_valid(next)) 720ab780f1eSJens Axboe req->cpu = next->cpu; 721d6d48196SJens Axboe 7221cd96c24SBoaz Harrosh /* owner-ship of bio passed from next to req */ 7231cd96c24SBoaz Harrosh next->bio = NULL; 724d6d48196SJens Axboe __blk_put_request(q, next); 725d6d48196SJens Axboe return 1; 726d6d48196SJens Axboe } 727d6d48196SJens Axboe 728d6d48196SJens Axboe int attempt_back_merge(struct request_queue *q, struct request *rq) 729d6d48196SJens Axboe { 730d6d48196SJens Axboe struct request *next = elv_latter_request(q, rq); 731d6d48196SJens Axboe 732d6d48196SJens Axboe if (next) 733d6d48196SJens Axboe return attempt_merge(q, rq, next); 734d6d48196SJens Axboe 735d6d48196SJens Axboe return 0; 736d6d48196SJens Axboe } 737d6d48196SJens Axboe 738d6d48196SJens Axboe int attempt_front_merge(struct request_queue *q, struct request *rq) 739d6d48196SJens Axboe { 740d6d48196SJens Axboe struct request *prev = elv_former_request(q, rq); 741d6d48196SJens Axboe 742d6d48196SJens Axboe if (prev) 743d6d48196SJens Axboe return attempt_merge(q, prev, rq); 744d6d48196SJens Axboe 745d6d48196SJens Axboe return 0; 746d6d48196SJens Axboe } 7475e84ea3aSJens Axboe 7485e84ea3aSJens Axboe int blk_attempt_req_merge(struct request_queue *q, struct request *rq, 7495e84ea3aSJens Axboe struct request *next) 7505e84ea3aSJens Axboe { 75172ef799bSTahsin Erdogan struct elevator_queue *e = q->elevator; 75272ef799bSTahsin Erdogan 75372ef799bSTahsin Erdogan if (e->type->ops.elevator_allow_rq_merge_fn) 75472ef799bSTahsin Erdogan if (!e->type->ops.elevator_allow_rq_merge_fn(q, rq, next)) 75572ef799bSTahsin Erdogan return 0; 75672ef799bSTahsin Erdogan 7575e84ea3aSJens Axboe return attempt_merge(q, rq, next); 7585e84ea3aSJens Axboe } 759050c8ea8STejun Heo 760050c8ea8STejun Heo bool blk_rq_merge_ok(struct request *rq, struct bio *bio) 761050c8ea8STejun Heo { 762e2a60da7SMartin K. Petersen if (!rq_mergeable(rq) || !bio_mergeable(bio)) 763050c8ea8STejun Heo return false; 764050c8ea8STejun Heo 765288dab8aSChristoph Hellwig if (req_op(rq) != bio_op(bio)) 766f31dc1cdSMartin K. Petersen return false; 767f31dc1cdSMartin K. Petersen 768050c8ea8STejun Heo /* different data direction or already started, don't merge */ 769050c8ea8STejun Heo if (bio_data_dir(bio) != rq_data_dir(rq)) 770050c8ea8STejun Heo return false; 771050c8ea8STejun Heo 772050c8ea8STejun Heo /* must be same device and not a special request */ 773e7e24500SJens Axboe if (rq->rq_disk != bio->bi_bdev->bd_disk || req_no_special_merge(rq)) 774050c8ea8STejun Heo return false; 775050c8ea8STejun Heo 776050c8ea8STejun Heo /* only merge integrity protected bio into ditto rq */ 7774eaf99beSMartin K. Petersen if (blk_integrity_merge_bio(rq->q, rq, bio) == false) 778050c8ea8STejun Heo return false; 779050c8ea8STejun Heo 7804363ac7cSMartin K. Petersen /* must be using the same buffer */ 7818fe0d473SMike Christie if (req_op(rq) == REQ_OP_WRITE_SAME && 7824363ac7cSMartin K. Petersen !blk_write_same_mergeable(rq->bio, bio)) 7834363ac7cSMartin K. Petersen return false; 7844363ac7cSMartin K. Petersen 785050c8ea8STejun Heo return true; 786050c8ea8STejun Heo } 787050c8ea8STejun Heo 788050c8ea8STejun Heo int blk_try_merge(struct request *rq, struct bio *bio) 789050c8ea8STejun Heo { 7904f024f37SKent Overstreet if (blk_rq_pos(rq) + blk_rq_sectors(rq) == bio->bi_iter.bi_sector) 791050c8ea8STejun Heo return ELEVATOR_BACK_MERGE; 7924f024f37SKent Overstreet else if (blk_rq_pos(rq) - bio_sectors(bio) == bio->bi_iter.bi_sector) 793050c8ea8STejun Heo return ELEVATOR_FRONT_MERGE; 794050c8ea8STejun Heo return ELEVATOR_NO_MERGE; 795050c8ea8STejun Heo } 796