1d6d48196SJens Axboe /* 2d6d48196SJens Axboe * Functions related to segment and merge handling 3d6d48196SJens Axboe */ 4d6d48196SJens Axboe #include <linux/kernel.h> 5d6d48196SJens Axboe #include <linux/module.h> 6d6d48196SJens Axboe #include <linux/bio.h> 7d6d48196SJens Axboe #include <linux/blkdev.h> 8d6d48196SJens Axboe #include <linux/scatterlist.h> 9d6d48196SJens Axboe 10*cda22646SMike Krinkin #include <trace/events/block.h> 11*cda22646SMike Krinkin 12d6d48196SJens Axboe #include "blk.h" 13d6d48196SJens Axboe 1454efd50bSKent Overstreet static struct bio *blk_bio_discard_split(struct request_queue *q, 1554efd50bSKent Overstreet struct bio *bio, 16bdced438SMing Lei struct bio_set *bs, 17bdced438SMing Lei unsigned *nsegs) 1854efd50bSKent Overstreet { 1954efd50bSKent Overstreet unsigned int max_discard_sectors, granularity; 2054efd50bSKent Overstreet int alignment; 2154efd50bSKent Overstreet sector_t tmp; 2254efd50bSKent Overstreet unsigned split_sectors; 2354efd50bSKent Overstreet 24bdced438SMing Lei *nsegs = 1; 25bdced438SMing Lei 2654efd50bSKent Overstreet /* Zero-sector (unknown) and one-sector granularities are the same. */ 2754efd50bSKent Overstreet granularity = max(q->limits.discard_granularity >> 9, 1U); 2854efd50bSKent Overstreet 2954efd50bSKent Overstreet max_discard_sectors = min(q->limits.max_discard_sectors, UINT_MAX >> 9); 3054efd50bSKent Overstreet max_discard_sectors -= max_discard_sectors % granularity; 3154efd50bSKent Overstreet 3254efd50bSKent Overstreet if (unlikely(!max_discard_sectors)) { 3354efd50bSKent Overstreet /* XXX: warn */ 3454efd50bSKent Overstreet return NULL; 3554efd50bSKent Overstreet } 3654efd50bSKent Overstreet 3754efd50bSKent Overstreet if (bio_sectors(bio) <= max_discard_sectors) 3854efd50bSKent Overstreet return NULL; 3954efd50bSKent Overstreet 4054efd50bSKent Overstreet split_sectors = max_discard_sectors; 4154efd50bSKent Overstreet 4254efd50bSKent Overstreet /* 4354efd50bSKent Overstreet * If the next starting sector would be misaligned, stop the discard at 4454efd50bSKent Overstreet * the previous aligned sector. 4554efd50bSKent Overstreet */ 4654efd50bSKent Overstreet alignment = (q->limits.discard_alignment >> 9) % granularity; 4754efd50bSKent Overstreet 4854efd50bSKent Overstreet tmp = bio->bi_iter.bi_sector + split_sectors - alignment; 4954efd50bSKent Overstreet tmp = sector_div(tmp, granularity); 5054efd50bSKent Overstreet 5154efd50bSKent Overstreet if (split_sectors > tmp) 5254efd50bSKent Overstreet split_sectors -= tmp; 5354efd50bSKent Overstreet 5454efd50bSKent Overstreet return bio_split(bio, split_sectors, GFP_NOIO, bs); 5554efd50bSKent Overstreet } 5654efd50bSKent Overstreet 5754efd50bSKent Overstreet static struct bio *blk_bio_write_same_split(struct request_queue *q, 5854efd50bSKent Overstreet struct bio *bio, 59bdced438SMing Lei struct bio_set *bs, 60bdced438SMing Lei unsigned *nsegs) 6154efd50bSKent Overstreet { 62bdced438SMing Lei *nsegs = 1; 63bdced438SMing Lei 6454efd50bSKent Overstreet if (!q->limits.max_write_same_sectors) 6554efd50bSKent Overstreet return NULL; 6654efd50bSKent Overstreet 6754efd50bSKent Overstreet if (bio_sectors(bio) <= q->limits.max_write_same_sectors) 6854efd50bSKent Overstreet return NULL; 6954efd50bSKent Overstreet 7054efd50bSKent Overstreet return bio_split(bio, q->limits.max_write_same_sectors, GFP_NOIO, bs); 7154efd50bSKent Overstreet } 7254efd50bSKent Overstreet 7354efd50bSKent Overstreet static struct bio *blk_bio_segment_split(struct request_queue *q, 7454efd50bSKent Overstreet struct bio *bio, 75bdced438SMing Lei struct bio_set *bs, 76bdced438SMing Lei unsigned *segs) 7754efd50bSKent Overstreet { 785014c311SJens Axboe struct bio_vec bv, bvprv, *bvprvp = NULL; 7954efd50bSKent Overstreet struct bvec_iter iter; 808ae12666SKent Overstreet unsigned seg_size = 0, nsegs = 0, sectors = 0; 8102e70742SMing Lei unsigned front_seg_size = bio->bi_seg_front_size; 8202e70742SMing Lei bool do_split = true; 8302e70742SMing Lei struct bio *new = NULL; 8454efd50bSKent Overstreet 8554efd50bSKent Overstreet bio_for_each_segment(bv, bio, iter) { 8652cc6eeaSMing Lei if (sectors + (bv.bv_len >> 9) > queue_max_sectors(q)) 8754efd50bSKent Overstreet goto split; 8854efd50bSKent Overstreet 8954efd50bSKent Overstreet /* 9054efd50bSKent Overstreet * If the queue doesn't support SG gaps and adding this 9154efd50bSKent Overstreet * offset would create a gap, disallow it. 9254efd50bSKent Overstreet */ 935014c311SJens Axboe if (bvprvp && bvec_gap_to_prev(q, bvprvp, bv.bv_offset)) 9454efd50bSKent Overstreet goto split; 9554efd50bSKent Overstreet 965014c311SJens Axboe if (bvprvp && blk_queue_cluster(q)) { 9754efd50bSKent Overstreet if (seg_size + bv.bv_len > queue_max_segment_size(q)) 9854efd50bSKent Overstreet goto new_segment; 995014c311SJens Axboe if (!BIOVEC_PHYS_MERGEABLE(bvprvp, &bv)) 10054efd50bSKent Overstreet goto new_segment; 1015014c311SJens Axboe if (!BIOVEC_SEG_BOUNDARY(q, bvprvp, &bv)) 10254efd50bSKent Overstreet goto new_segment; 10354efd50bSKent Overstreet 10454efd50bSKent Overstreet seg_size += bv.bv_len; 10554efd50bSKent Overstreet bvprv = bv; 106578270bfSMing Lei bvprvp = &bvprv; 10752cc6eeaSMing Lei sectors += bv.bv_len >> 9; 10854efd50bSKent Overstreet continue; 10954efd50bSKent Overstreet } 11054efd50bSKent Overstreet new_segment: 11154efd50bSKent Overstreet if (nsegs == queue_max_segments(q)) 11254efd50bSKent Overstreet goto split; 11354efd50bSKent Overstreet 11454efd50bSKent Overstreet nsegs++; 11554efd50bSKent Overstreet bvprv = bv; 116578270bfSMing Lei bvprvp = &bvprv; 11754efd50bSKent Overstreet seg_size = bv.bv_len; 11852cc6eeaSMing Lei sectors += bv.bv_len >> 9; 11902e70742SMing Lei 12002e70742SMing Lei if (nsegs == 1 && seg_size > front_seg_size) 12102e70742SMing Lei front_seg_size = seg_size; 12254efd50bSKent Overstreet } 12354efd50bSKent Overstreet 12402e70742SMing Lei do_split = false; 12554efd50bSKent Overstreet split: 126bdced438SMing Lei *segs = nsegs; 12702e70742SMing Lei 12802e70742SMing Lei if (do_split) { 12902e70742SMing Lei new = bio_split(bio, sectors, GFP_NOIO, bs); 13002e70742SMing Lei if (new) 13102e70742SMing Lei bio = new; 13202e70742SMing Lei } 13302e70742SMing Lei 13402e70742SMing Lei bio->bi_seg_front_size = front_seg_size; 13502e70742SMing Lei if (seg_size > bio->bi_seg_back_size) 13602e70742SMing Lei bio->bi_seg_back_size = seg_size; 13702e70742SMing Lei 13802e70742SMing Lei return do_split ? new : NULL; 13954efd50bSKent Overstreet } 14054efd50bSKent Overstreet 14154efd50bSKent Overstreet void blk_queue_split(struct request_queue *q, struct bio **bio, 14254efd50bSKent Overstreet struct bio_set *bs) 14354efd50bSKent Overstreet { 144bdced438SMing Lei struct bio *split, *res; 145bdced438SMing Lei unsigned nsegs; 14654efd50bSKent Overstreet 14754efd50bSKent Overstreet if ((*bio)->bi_rw & REQ_DISCARD) 148bdced438SMing Lei split = blk_bio_discard_split(q, *bio, bs, &nsegs); 14954efd50bSKent Overstreet else if ((*bio)->bi_rw & REQ_WRITE_SAME) 150bdced438SMing Lei split = blk_bio_write_same_split(q, *bio, bs, &nsegs); 15154efd50bSKent Overstreet else 152bdced438SMing Lei split = blk_bio_segment_split(q, *bio, q->bio_split, &nsegs); 153bdced438SMing Lei 154bdced438SMing Lei /* physical segments can be figured out during splitting */ 155bdced438SMing Lei res = split ? split : *bio; 156bdced438SMing Lei res->bi_phys_segments = nsegs; 157bdced438SMing Lei bio_set_flag(res, BIO_SEG_VALID); 15854efd50bSKent Overstreet 15954efd50bSKent Overstreet if (split) { 1606ac45aebSMing Lei /* there isn't chance to merge the splitted bio */ 1616ac45aebSMing Lei split->bi_rw |= REQ_NOMERGE; 1626ac45aebSMing Lei 16354efd50bSKent Overstreet bio_chain(split, *bio); 164*cda22646SMike Krinkin trace_block_split(q, split, (*bio)->bi_iter.bi_sector); 16554efd50bSKent Overstreet generic_make_request(*bio); 16654efd50bSKent Overstreet *bio = split; 16754efd50bSKent Overstreet } 16854efd50bSKent Overstreet } 16954efd50bSKent Overstreet EXPORT_SYMBOL(blk_queue_split); 17054efd50bSKent Overstreet 1711e428079SJens Axboe static unsigned int __blk_recalc_rq_segments(struct request_queue *q, 17207388549SMing Lei struct bio *bio, 17307388549SMing Lei bool no_sg_merge) 174d6d48196SJens Axboe { 1757988613bSKent Overstreet struct bio_vec bv, bvprv = { NULL }; 17654efd50bSKent Overstreet int cluster, prev = 0; 1771e428079SJens Axboe unsigned int seg_size, nr_phys_segs; 17859247eaeSJens Axboe struct bio *fbio, *bbio; 1797988613bSKent Overstreet struct bvec_iter iter; 180d6d48196SJens Axboe 1811e428079SJens Axboe if (!bio) 1821e428079SJens Axboe return 0; 183d6d48196SJens Axboe 1845cb8850cSKent Overstreet /* 1855cb8850cSKent Overstreet * This should probably be returning 0, but blk_add_request_payload() 1865cb8850cSKent Overstreet * (Christoph!!!!) 1875cb8850cSKent Overstreet */ 1885cb8850cSKent Overstreet if (bio->bi_rw & REQ_DISCARD) 1895cb8850cSKent Overstreet return 1; 1905cb8850cSKent Overstreet 1915cb8850cSKent Overstreet if (bio->bi_rw & REQ_WRITE_SAME) 1925cb8850cSKent Overstreet return 1; 1935cb8850cSKent Overstreet 1941e428079SJens Axboe fbio = bio; 195e692cb66SMartin K. Petersen cluster = blk_queue_cluster(q); 1965df97b91SMikulas Patocka seg_size = 0; 1972c8919deSAndi Kleen nr_phys_segs = 0; 1981e428079SJens Axboe for_each_bio(bio) { 1997988613bSKent Overstreet bio_for_each_segment(bv, bio, iter) { 200d6d48196SJens Axboe /* 20105f1dd53SJens Axboe * If SG merging is disabled, each bio vector is 20205f1dd53SJens Axboe * a segment 20305f1dd53SJens Axboe */ 20405f1dd53SJens Axboe if (no_sg_merge) 20505f1dd53SJens Axboe goto new_segment; 20605f1dd53SJens Axboe 20754efd50bSKent Overstreet if (prev && cluster) { 2087988613bSKent Overstreet if (seg_size + bv.bv_len 209ae03bf63SMartin K. Petersen > queue_max_segment_size(q)) 210d6d48196SJens Axboe goto new_segment; 2117988613bSKent Overstreet if (!BIOVEC_PHYS_MERGEABLE(&bvprv, &bv)) 212d6d48196SJens Axboe goto new_segment; 2137988613bSKent Overstreet if (!BIOVEC_SEG_BOUNDARY(q, &bvprv, &bv)) 214d6d48196SJens Axboe goto new_segment; 215d6d48196SJens Axboe 2167988613bSKent Overstreet seg_size += bv.bv_len; 217d6d48196SJens Axboe bvprv = bv; 218d6d48196SJens Axboe continue; 219d6d48196SJens Axboe } 220d6d48196SJens Axboe new_segment: 2211e428079SJens Axboe if (nr_phys_segs == 1 && seg_size > 2221e428079SJens Axboe fbio->bi_seg_front_size) 2231e428079SJens Axboe fbio->bi_seg_front_size = seg_size; 22486771427SFUJITA Tomonori 225d6d48196SJens Axboe nr_phys_segs++; 226d6d48196SJens Axboe bvprv = bv; 22754efd50bSKent Overstreet prev = 1; 2287988613bSKent Overstreet seg_size = bv.bv_len; 229d6d48196SJens Axboe } 23059247eaeSJens Axboe bbio = bio; 2311e428079SJens Axboe } 232d6d48196SJens Axboe 23359247eaeSJens Axboe if (nr_phys_segs == 1 && seg_size > fbio->bi_seg_front_size) 23459247eaeSJens Axboe fbio->bi_seg_front_size = seg_size; 23559247eaeSJens Axboe if (seg_size > bbio->bi_seg_back_size) 23659247eaeSJens Axboe bbio->bi_seg_back_size = seg_size; 2371e428079SJens Axboe 2381e428079SJens Axboe return nr_phys_segs; 2391e428079SJens Axboe } 2401e428079SJens Axboe 2411e428079SJens Axboe void blk_recalc_rq_segments(struct request *rq) 2421e428079SJens Axboe { 24307388549SMing Lei bool no_sg_merge = !!test_bit(QUEUE_FLAG_NO_SG_MERGE, 24407388549SMing Lei &rq->q->queue_flags); 24507388549SMing Lei 24607388549SMing Lei rq->nr_phys_segments = __blk_recalc_rq_segments(rq->q, rq->bio, 24707388549SMing Lei no_sg_merge); 248d6d48196SJens Axboe } 249d6d48196SJens Axboe 250d6d48196SJens Axboe void blk_recount_segments(struct request_queue *q, struct bio *bio) 251d6d48196SJens Axboe { 2527f60dcaaSMing Lei unsigned short seg_cnt; 253764f612cSMing Lei 2547f60dcaaSMing Lei /* estimate segment number by bi_vcnt for non-cloned bio */ 2557f60dcaaSMing Lei if (bio_flagged(bio, BIO_CLONED)) 2567f60dcaaSMing Lei seg_cnt = bio_segments(bio); 2577f60dcaaSMing Lei else 2587f60dcaaSMing Lei seg_cnt = bio->bi_vcnt; 2597f60dcaaSMing Lei 2607f60dcaaSMing Lei if (test_bit(QUEUE_FLAG_NO_SG_MERGE, &q->queue_flags) && 2617f60dcaaSMing Lei (seg_cnt < queue_max_segments(q))) 2627f60dcaaSMing Lei bio->bi_phys_segments = seg_cnt; 26305f1dd53SJens Axboe else { 264d6d48196SJens Axboe struct bio *nxt = bio->bi_next; 2651e428079SJens Axboe 266d6d48196SJens Axboe bio->bi_next = NULL; 2677f60dcaaSMing Lei bio->bi_phys_segments = __blk_recalc_rq_segments(q, bio, false); 268d6d48196SJens Axboe bio->bi_next = nxt; 26905f1dd53SJens Axboe } 27005f1dd53SJens Axboe 271b7c44ed9SJens Axboe bio_set_flag(bio, BIO_SEG_VALID); 272d6d48196SJens Axboe } 273d6d48196SJens Axboe EXPORT_SYMBOL(blk_recount_segments); 274d6d48196SJens Axboe 275d6d48196SJens Axboe static int blk_phys_contig_segment(struct request_queue *q, struct bio *bio, 276d6d48196SJens Axboe struct bio *nxt) 277d6d48196SJens Axboe { 2782b8221e1SKent Overstreet struct bio_vec end_bv = { NULL }, nxt_bv; 279f619d254SKent Overstreet struct bvec_iter iter; 280f619d254SKent Overstreet 281e692cb66SMartin K. Petersen if (!blk_queue_cluster(q)) 282d6d48196SJens Axboe return 0; 283d6d48196SJens Axboe 28486771427SFUJITA Tomonori if (bio->bi_seg_back_size + nxt->bi_seg_front_size > 285ae03bf63SMartin K. Petersen queue_max_segment_size(q)) 286d6d48196SJens Axboe return 0; 287d6d48196SJens Axboe 288e17fc0a1SDavid Woodhouse if (!bio_has_data(bio)) 289e17fc0a1SDavid Woodhouse return 1; 290e17fc0a1SDavid Woodhouse 291f619d254SKent Overstreet bio_for_each_segment(end_bv, bio, iter) 292f619d254SKent Overstreet if (end_bv.bv_len == iter.bi_size) 293f619d254SKent Overstreet break; 294f619d254SKent Overstreet 295f619d254SKent Overstreet nxt_bv = bio_iovec(nxt); 296f619d254SKent Overstreet 297f619d254SKent Overstreet if (!BIOVEC_PHYS_MERGEABLE(&end_bv, &nxt_bv)) 298e17fc0a1SDavid Woodhouse return 0; 299e17fc0a1SDavid Woodhouse 300d6d48196SJens Axboe /* 301e17fc0a1SDavid Woodhouse * bio and nxt are contiguous in memory; check if the queue allows 302d6d48196SJens Axboe * these two to be merged into one 303d6d48196SJens Axboe */ 304f619d254SKent Overstreet if (BIOVEC_SEG_BOUNDARY(q, &end_bv, &nxt_bv)) 305d6d48196SJens Axboe return 1; 306d6d48196SJens Axboe 307d6d48196SJens Axboe return 0; 308d6d48196SJens Axboe } 309d6d48196SJens Axboe 3107988613bSKent Overstreet static inline void 311963ab9e5SAsias He __blk_segment_map_sg(struct request_queue *q, struct bio_vec *bvec, 3127988613bSKent Overstreet struct scatterlist *sglist, struct bio_vec *bvprv, 313963ab9e5SAsias He struct scatterlist **sg, int *nsegs, int *cluster) 314963ab9e5SAsias He { 315963ab9e5SAsias He 316963ab9e5SAsias He int nbytes = bvec->bv_len; 317963ab9e5SAsias He 3187988613bSKent Overstreet if (*sg && *cluster) { 319963ab9e5SAsias He if ((*sg)->length + nbytes > queue_max_segment_size(q)) 320963ab9e5SAsias He goto new_segment; 321963ab9e5SAsias He 3227988613bSKent Overstreet if (!BIOVEC_PHYS_MERGEABLE(bvprv, bvec)) 323963ab9e5SAsias He goto new_segment; 3247988613bSKent Overstreet if (!BIOVEC_SEG_BOUNDARY(q, bvprv, bvec)) 325963ab9e5SAsias He goto new_segment; 326963ab9e5SAsias He 327963ab9e5SAsias He (*sg)->length += nbytes; 328963ab9e5SAsias He } else { 329963ab9e5SAsias He new_segment: 330963ab9e5SAsias He if (!*sg) 331963ab9e5SAsias He *sg = sglist; 332963ab9e5SAsias He else { 333963ab9e5SAsias He /* 334963ab9e5SAsias He * If the driver previously mapped a shorter 335963ab9e5SAsias He * list, we could see a termination bit 336963ab9e5SAsias He * prematurely unless it fully inits the sg 337963ab9e5SAsias He * table on each mapping. We KNOW that there 338963ab9e5SAsias He * must be more entries here or the driver 339963ab9e5SAsias He * would be buggy, so force clear the 340963ab9e5SAsias He * termination bit to avoid doing a full 341963ab9e5SAsias He * sg_init_table() in drivers for each command. 342963ab9e5SAsias He */ 343c8164d89SPaolo Bonzini sg_unmark_end(*sg); 344963ab9e5SAsias He *sg = sg_next(*sg); 345963ab9e5SAsias He } 346963ab9e5SAsias He 347963ab9e5SAsias He sg_set_page(*sg, bvec->bv_page, nbytes, bvec->bv_offset); 348963ab9e5SAsias He (*nsegs)++; 349963ab9e5SAsias He } 3507988613bSKent Overstreet *bvprv = *bvec; 351963ab9e5SAsias He } 352963ab9e5SAsias He 3535cb8850cSKent Overstreet static int __blk_bios_map_sg(struct request_queue *q, struct bio *bio, 3545cb8850cSKent Overstreet struct scatterlist *sglist, 3555cb8850cSKent Overstreet struct scatterlist **sg) 3565cb8850cSKent Overstreet { 3575cb8850cSKent Overstreet struct bio_vec bvec, bvprv = { NULL }; 3585cb8850cSKent Overstreet struct bvec_iter iter; 3595cb8850cSKent Overstreet int nsegs, cluster; 3605cb8850cSKent Overstreet 3615cb8850cSKent Overstreet nsegs = 0; 3625cb8850cSKent Overstreet cluster = blk_queue_cluster(q); 3635cb8850cSKent Overstreet 3645cb8850cSKent Overstreet if (bio->bi_rw & REQ_DISCARD) { 3655cb8850cSKent Overstreet /* 3665cb8850cSKent Overstreet * This is a hack - drivers should be neither modifying the 3675cb8850cSKent Overstreet * biovec, nor relying on bi_vcnt - but because of 3685cb8850cSKent Overstreet * blk_add_request_payload(), a discard bio may or may not have 3695cb8850cSKent Overstreet * a payload we need to set up here (thank you Christoph) and 3705cb8850cSKent Overstreet * bi_vcnt is really the only way of telling if we need to. 3715cb8850cSKent Overstreet */ 3725cb8850cSKent Overstreet 3735cb8850cSKent Overstreet if (bio->bi_vcnt) 3745cb8850cSKent Overstreet goto single_segment; 3755cb8850cSKent Overstreet 3765cb8850cSKent Overstreet return 0; 3775cb8850cSKent Overstreet } 3785cb8850cSKent Overstreet 3795cb8850cSKent Overstreet if (bio->bi_rw & REQ_WRITE_SAME) { 3805cb8850cSKent Overstreet single_segment: 3815cb8850cSKent Overstreet *sg = sglist; 3825cb8850cSKent Overstreet bvec = bio_iovec(bio); 3835cb8850cSKent Overstreet sg_set_page(*sg, bvec.bv_page, bvec.bv_len, bvec.bv_offset); 3845cb8850cSKent Overstreet return 1; 3855cb8850cSKent Overstreet } 3865cb8850cSKent Overstreet 3875cb8850cSKent Overstreet for_each_bio(bio) 3885cb8850cSKent Overstreet bio_for_each_segment(bvec, bio, iter) 3895cb8850cSKent Overstreet __blk_segment_map_sg(q, &bvec, sglist, &bvprv, sg, 3905cb8850cSKent Overstreet &nsegs, &cluster); 3915cb8850cSKent Overstreet 3925cb8850cSKent Overstreet return nsegs; 3935cb8850cSKent Overstreet } 3945cb8850cSKent Overstreet 395d6d48196SJens Axboe /* 396d6d48196SJens Axboe * map a request to scatterlist, return number of sg entries setup. Caller 397d6d48196SJens Axboe * must make sure sg can hold rq->nr_phys_segments entries 398d6d48196SJens Axboe */ 399d6d48196SJens Axboe int blk_rq_map_sg(struct request_queue *q, struct request *rq, 400d6d48196SJens Axboe struct scatterlist *sglist) 401d6d48196SJens Axboe { 4025cb8850cSKent Overstreet struct scatterlist *sg = NULL; 4035cb8850cSKent Overstreet int nsegs = 0; 404d6d48196SJens Axboe 4055cb8850cSKent Overstreet if (rq->bio) 4065cb8850cSKent Overstreet nsegs = __blk_bios_map_sg(q, rq->bio, sglist, &sg); 407f18573abSFUJITA Tomonori 408f18573abSFUJITA Tomonori if (unlikely(rq->cmd_flags & REQ_COPY_USER) && 4092e46e8b2STejun Heo (blk_rq_bytes(rq) & q->dma_pad_mask)) { 4102e46e8b2STejun Heo unsigned int pad_len = 4112e46e8b2STejun Heo (q->dma_pad_mask & ~blk_rq_bytes(rq)) + 1; 412f18573abSFUJITA Tomonori 413f18573abSFUJITA Tomonori sg->length += pad_len; 414f18573abSFUJITA Tomonori rq->extra_len += pad_len; 415f18573abSFUJITA Tomonori } 416f18573abSFUJITA Tomonori 4172fb98e84STejun Heo if (q->dma_drain_size && q->dma_drain_needed(rq)) { 4187b6d91daSChristoph Hellwig if (rq->cmd_flags & REQ_WRITE) 419db0a2e00STejun Heo memset(q->dma_drain_buffer, 0, q->dma_drain_size); 420db0a2e00STejun Heo 421da81ed16SDan Williams sg_unmark_end(sg); 422d6d48196SJens Axboe sg = sg_next(sg); 423d6d48196SJens Axboe sg_set_page(sg, virt_to_page(q->dma_drain_buffer), 424d6d48196SJens Axboe q->dma_drain_size, 425d6d48196SJens Axboe ((unsigned long)q->dma_drain_buffer) & 426d6d48196SJens Axboe (PAGE_SIZE - 1)); 427d6d48196SJens Axboe nsegs++; 4287a85f889SFUJITA Tomonori rq->extra_len += q->dma_drain_size; 429d6d48196SJens Axboe } 430d6d48196SJens Axboe 431d6d48196SJens Axboe if (sg) 432d6d48196SJens Axboe sg_mark_end(sg); 433d6d48196SJens Axboe 43412e57f59SMing Lei /* 43512e57f59SMing Lei * Something must have been wrong if the figured number of 43612e57f59SMing Lei * segment is bigger than number of req's physical segments 43712e57f59SMing Lei */ 43812e57f59SMing Lei WARN_ON(nsegs > rq->nr_phys_segments); 43912e57f59SMing Lei 440d6d48196SJens Axboe return nsegs; 441d6d48196SJens Axboe } 442d6d48196SJens Axboe EXPORT_SYMBOL(blk_rq_map_sg); 443d6d48196SJens Axboe 444d6d48196SJens Axboe static inline int ll_new_hw_segment(struct request_queue *q, 445d6d48196SJens Axboe struct request *req, 446d6d48196SJens Axboe struct bio *bio) 447d6d48196SJens Axboe { 448d6d48196SJens Axboe int nr_phys_segs = bio_phys_segments(q, bio); 449d6d48196SJens Axboe 45013f05c8dSMartin K. Petersen if (req->nr_phys_segments + nr_phys_segs > queue_max_segments(q)) 45113f05c8dSMartin K. Petersen goto no_merge; 45213f05c8dSMartin K. Petersen 4534eaf99beSMartin K. Petersen if (blk_integrity_merge_bio(q, req, bio) == false) 45413f05c8dSMartin K. Petersen goto no_merge; 455d6d48196SJens Axboe 456d6d48196SJens Axboe /* 457d6d48196SJens Axboe * This will form the start of a new hw segment. Bump both 458d6d48196SJens Axboe * counters. 459d6d48196SJens Axboe */ 460d6d48196SJens Axboe req->nr_phys_segments += nr_phys_segs; 461d6d48196SJens Axboe return 1; 46213f05c8dSMartin K. Petersen 46313f05c8dSMartin K. Petersen no_merge: 46413f05c8dSMartin K. Petersen req->cmd_flags |= REQ_NOMERGE; 46513f05c8dSMartin K. Petersen if (req == q->last_merge) 46613f05c8dSMartin K. Petersen q->last_merge = NULL; 46713f05c8dSMartin K. Petersen return 0; 468d6d48196SJens Axboe } 469d6d48196SJens Axboe 470d6d48196SJens Axboe int ll_back_merge_fn(struct request_queue *q, struct request *req, 471d6d48196SJens Axboe struct bio *bio) 472d6d48196SJens Axboe { 4735e7c4274SJens Axboe if (req_gap_back_merge(req, bio)) 4745e7c4274SJens Axboe return 0; 4757f39add3SSagi Grimberg if (blk_integrity_rq(req) && 4767f39add3SSagi Grimberg integrity_req_gap_back_merge(req, bio)) 4777f39add3SSagi Grimberg return 0; 478f31dc1cdSMartin K. Petersen if (blk_rq_sectors(req) + bio_sectors(bio) > 479f31dc1cdSMartin K. Petersen blk_rq_get_max_sectors(req)) { 480d6d48196SJens Axboe req->cmd_flags |= REQ_NOMERGE; 481d6d48196SJens Axboe if (req == q->last_merge) 482d6d48196SJens Axboe q->last_merge = NULL; 483d6d48196SJens Axboe return 0; 484d6d48196SJens Axboe } 4852cdf79caSJens Axboe if (!bio_flagged(req->biotail, BIO_SEG_VALID)) 486d6d48196SJens Axboe blk_recount_segments(q, req->biotail); 4872cdf79caSJens Axboe if (!bio_flagged(bio, BIO_SEG_VALID)) 488d6d48196SJens Axboe blk_recount_segments(q, bio); 489d6d48196SJens Axboe 490d6d48196SJens Axboe return ll_new_hw_segment(q, req, bio); 491d6d48196SJens Axboe } 492d6d48196SJens Axboe 493d6d48196SJens Axboe int ll_front_merge_fn(struct request_queue *q, struct request *req, 494d6d48196SJens Axboe struct bio *bio) 495d6d48196SJens Axboe { 4965e7c4274SJens Axboe 4975e7c4274SJens Axboe if (req_gap_front_merge(req, bio)) 4985e7c4274SJens Axboe return 0; 4997f39add3SSagi Grimberg if (blk_integrity_rq(req) && 5007f39add3SSagi Grimberg integrity_req_gap_front_merge(req, bio)) 5017f39add3SSagi Grimberg return 0; 502f31dc1cdSMartin K. Petersen if (blk_rq_sectors(req) + bio_sectors(bio) > 503f31dc1cdSMartin K. Petersen blk_rq_get_max_sectors(req)) { 504d6d48196SJens Axboe req->cmd_flags |= REQ_NOMERGE; 505d6d48196SJens Axboe if (req == q->last_merge) 506d6d48196SJens Axboe q->last_merge = NULL; 507d6d48196SJens Axboe return 0; 508d6d48196SJens Axboe } 5092cdf79caSJens Axboe if (!bio_flagged(bio, BIO_SEG_VALID)) 510d6d48196SJens Axboe blk_recount_segments(q, bio); 5112cdf79caSJens Axboe if (!bio_flagged(req->bio, BIO_SEG_VALID)) 512d6d48196SJens Axboe blk_recount_segments(q, req->bio); 513d6d48196SJens Axboe 514d6d48196SJens Axboe return ll_new_hw_segment(q, req, bio); 515d6d48196SJens Axboe } 516d6d48196SJens Axboe 517e7e24500SJens Axboe /* 518e7e24500SJens Axboe * blk-mq uses req->special to carry normal driver per-request payload, it 519e7e24500SJens Axboe * does not indicate a prepared command that we cannot merge with. 520e7e24500SJens Axboe */ 521e7e24500SJens Axboe static bool req_no_special_merge(struct request *req) 522e7e24500SJens Axboe { 523e7e24500SJens Axboe struct request_queue *q = req->q; 524e7e24500SJens Axboe 525e7e24500SJens Axboe return !q->mq_ops && req->special; 526e7e24500SJens Axboe } 527e7e24500SJens Axboe 528d6d48196SJens Axboe static int ll_merge_requests_fn(struct request_queue *q, struct request *req, 529d6d48196SJens Axboe struct request *next) 530d6d48196SJens Axboe { 531d6d48196SJens Axboe int total_phys_segments; 53286771427SFUJITA Tomonori unsigned int seg_size = 53386771427SFUJITA Tomonori req->biotail->bi_seg_back_size + next->bio->bi_seg_front_size; 534d6d48196SJens Axboe 535d6d48196SJens Axboe /* 536d6d48196SJens Axboe * First check if the either of the requests are re-queued 537d6d48196SJens Axboe * requests. Can't merge them if they are. 538d6d48196SJens Axboe */ 539e7e24500SJens Axboe if (req_no_special_merge(req) || req_no_special_merge(next)) 540d6d48196SJens Axboe return 0; 541d6d48196SJens Axboe 5425e7c4274SJens Axboe if (req_gap_back_merge(req, next->bio)) 543854fbb9cSKeith Busch return 0; 544854fbb9cSKeith Busch 545d6d48196SJens Axboe /* 546d6d48196SJens Axboe * Will it become too large? 547d6d48196SJens Axboe */ 548f31dc1cdSMartin K. Petersen if ((blk_rq_sectors(req) + blk_rq_sectors(next)) > 549f31dc1cdSMartin K. Petersen blk_rq_get_max_sectors(req)) 550d6d48196SJens Axboe return 0; 551d6d48196SJens Axboe 552d6d48196SJens Axboe total_phys_segments = req->nr_phys_segments + next->nr_phys_segments; 55386771427SFUJITA Tomonori if (blk_phys_contig_segment(q, req->biotail, next->bio)) { 55486771427SFUJITA Tomonori if (req->nr_phys_segments == 1) 55586771427SFUJITA Tomonori req->bio->bi_seg_front_size = seg_size; 55686771427SFUJITA Tomonori if (next->nr_phys_segments == 1) 55786771427SFUJITA Tomonori next->biotail->bi_seg_back_size = seg_size; 558d6d48196SJens Axboe total_phys_segments--; 55986771427SFUJITA Tomonori } 560d6d48196SJens Axboe 5618a78362cSMartin K. Petersen if (total_phys_segments > queue_max_segments(q)) 562d6d48196SJens Axboe return 0; 563d6d48196SJens Axboe 5644eaf99beSMartin K. Petersen if (blk_integrity_merge_rq(q, req, next) == false) 56513f05c8dSMartin K. Petersen return 0; 56613f05c8dSMartin K. Petersen 567d6d48196SJens Axboe /* Merge is OK... */ 568d6d48196SJens Axboe req->nr_phys_segments = total_phys_segments; 569d6d48196SJens Axboe return 1; 570d6d48196SJens Axboe } 571d6d48196SJens Axboe 57280a761fdSTejun Heo /** 57380a761fdSTejun Heo * blk_rq_set_mixed_merge - mark a request as mixed merge 57480a761fdSTejun Heo * @rq: request to mark as mixed merge 57580a761fdSTejun Heo * 57680a761fdSTejun Heo * Description: 57780a761fdSTejun Heo * @rq is about to be mixed merged. Make sure the attributes 57880a761fdSTejun Heo * which can be mixed are set in each bio and mark @rq as mixed 57980a761fdSTejun Heo * merged. 58080a761fdSTejun Heo */ 58180a761fdSTejun Heo void blk_rq_set_mixed_merge(struct request *rq) 58280a761fdSTejun Heo { 58380a761fdSTejun Heo unsigned int ff = rq->cmd_flags & REQ_FAILFAST_MASK; 58480a761fdSTejun Heo struct bio *bio; 58580a761fdSTejun Heo 58680a761fdSTejun Heo if (rq->cmd_flags & REQ_MIXED_MERGE) 58780a761fdSTejun Heo return; 58880a761fdSTejun Heo 58980a761fdSTejun Heo /* 59080a761fdSTejun Heo * @rq will no longer represent mixable attributes for all the 59180a761fdSTejun Heo * contained bios. It will just track those of the first one. 59280a761fdSTejun Heo * Distributes the attributs to each bio. 59380a761fdSTejun Heo */ 59480a761fdSTejun Heo for (bio = rq->bio; bio; bio = bio->bi_next) { 59580a761fdSTejun Heo WARN_ON_ONCE((bio->bi_rw & REQ_FAILFAST_MASK) && 59680a761fdSTejun Heo (bio->bi_rw & REQ_FAILFAST_MASK) != ff); 59780a761fdSTejun Heo bio->bi_rw |= ff; 59880a761fdSTejun Heo } 59980a761fdSTejun Heo rq->cmd_flags |= REQ_MIXED_MERGE; 60080a761fdSTejun Heo } 60180a761fdSTejun Heo 60226308eabSJerome Marchand static void blk_account_io_merge(struct request *req) 60326308eabSJerome Marchand { 60426308eabSJerome Marchand if (blk_do_io_stat(req)) { 60526308eabSJerome Marchand struct hd_struct *part; 60626308eabSJerome Marchand int cpu; 60726308eabSJerome Marchand 60826308eabSJerome Marchand cpu = part_stat_lock(); 60909e099d4SJerome Marchand part = req->part; 61026308eabSJerome Marchand 61126308eabSJerome Marchand part_round_stats(cpu, part); 612316d315bSNikanth Karthikesan part_dec_in_flight(part, rq_data_dir(req)); 61326308eabSJerome Marchand 6146c23a968SJens Axboe hd_struct_put(part); 61526308eabSJerome Marchand part_stat_unlock(); 61626308eabSJerome Marchand } 61726308eabSJerome Marchand } 61826308eabSJerome Marchand 619d6d48196SJens Axboe /* 620d6d48196SJens Axboe * Has to be called with the request spinlock acquired 621d6d48196SJens Axboe */ 622d6d48196SJens Axboe static int attempt_merge(struct request_queue *q, struct request *req, 623d6d48196SJens Axboe struct request *next) 624d6d48196SJens Axboe { 625d6d48196SJens Axboe if (!rq_mergeable(req) || !rq_mergeable(next)) 626d6d48196SJens Axboe return 0; 627d6d48196SJens Axboe 628f31dc1cdSMartin K. Petersen if (!blk_check_merge_flags(req->cmd_flags, next->cmd_flags)) 629f31dc1cdSMartin K. Petersen return 0; 630f31dc1cdSMartin K. Petersen 631d6d48196SJens Axboe /* 632d6d48196SJens Axboe * not contiguous 633d6d48196SJens Axboe */ 63483096ebfSTejun Heo if (blk_rq_pos(req) + blk_rq_sectors(req) != blk_rq_pos(next)) 635d6d48196SJens Axboe return 0; 636d6d48196SJens Axboe 637d6d48196SJens Axboe if (rq_data_dir(req) != rq_data_dir(next) 638d6d48196SJens Axboe || req->rq_disk != next->rq_disk 639e7e24500SJens Axboe || req_no_special_merge(next)) 640d6d48196SJens Axboe return 0; 641d6d48196SJens Axboe 6424363ac7cSMartin K. Petersen if (req->cmd_flags & REQ_WRITE_SAME && 6434363ac7cSMartin K. Petersen !blk_write_same_mergeable(req->bio, next->bio)) 6444363ac7cSMartin K. Petersen return 0; 6454363ac7cSMartin K. Petersen 646d6d48196SJens Axboe /* 647d6d48196SJens Axboe * If we are allowed to merge, then append bio list 648d6d48196SJens Axboe * from next to rq and release next. merge_requests_fn 649d6d48196SJens Axboe * will have updated segment counts, update sector 650d6d48196SJens Axboe * counts here. 651d6d48196SJens Axboe */ 652d6d48196SJens Axboe if (!ll_merge_requests_fn(q, req, next)) 653d6d48196SJens Axboe return 0; 654d6d48196SJens Axboe 655d6d48196SJens Axboe /* 65680a761fdSTejun Heo * If failfast settings disagree or any of the two is already 65780a761fdSTejun Heo * a mixed merge, mark both as mixed before proceeding. This 65880a761fdSTejun Heo * makes sure that all involved bios have mixable attributes 65980a761fdSTejun Heo * set properly. 66080a761fdSTejun Heo */ 66180a761fdSTejun Heo if ((req->cmd_flags | next->cmd_flags) & REQ_MIXED_MERGE || 66280a761fdSTejun Heo (req->cmd_flags & REQ_FAILFAST_MASK) != 66380a761fdSTejun Heo (next->cmd_flags & REQ_FAILFAST_MASK)) { 66480a761fdSTejun Heo blk_rq_set_mixed_merge(req); 66580a761fdSTejun Heo blk_rq_set_mixed_merge(next); 66680a761fdSTejun Heo } 66780a761fdSTejun Heo 66880a761fdSTejun Heo /* 669d6d48196SJens Axboe * At this point we have either done a back merge 670d6d48196SJens Axboe * or front merge. We need the smaller start_time of 671d6d48196SJens Axboe * the merged requests to be the current request 672d6d48196SJens Axboe * for accounting purposes. 673d6d48196SJens Axboe */ 674d6d48196SJens Axboe if (time_after(req->start_time, next->start_time)) 675d6d48196SJens Axboe req->start_time = next->start_time; 676d6d48196SJens Axboe 677d6d48196SJens Axboe req->biotail->bi_next = next->bio; 678d6d48196SJens Axboe req->biotail = next->biotail; 679d6d48196SJens Axboe 680a2dec7b3STejun Heo req->__data_len += blk_rq_bytes(next); 681d6d48196SJens Axboe 682d6d48196SJens Axboe elv_merge_requests(q, req, next); 683d6d48196SJens Axboe 68442dad764SJerome Marchand /* 68542dad764SJerome Marchand * 'next' is going away, so update stats accordingly 68642dad764SJerome Marchand */ 68742dad764SJerome Marchand blk_account_io_merge(next); 688d6d48196SJens Axboe 689d6d48196SJens Axboe req->ioprio = ioprio_best(req->ioprio, next->ioprio); 690ab780f1eSJens Axboe if (blk_rq_cpu_valid(next)) 691ab780f1eSJens Axboe req->cpu = next->cpu; 692d6d48196SJens Axboe 6931cd96c24SBoaz Harrosh /* owner-ship of bio passed from next to req */ 6941cd96c24SBoaz Harrosh next->bio = NULL; 695d6d48196SJens Axboe __blk_put_request(q, next); 696d6d48196SJens Axboe return 1; 697d6d48196SJens Axboe } 698d6d48196SJens Axboe 699d6d48196SJens Axboe int attempt_back_merge(struct request_queue *q, struct request *rq) 700d6d48196SJens Axboe { 701d6d48196SJens Axboe struct request *next = elv_latter_request(q, rq); 702d6d48196SJens Axboe 703d6d48196SJens Axboe if (next) 704d6d48196SJens Axboe return attempt_merge(q, rq, next); 705d6d48196SJens Axboe 706d6d48196SJens Axboe return 0; 707d6d48196SJens Axboe } 708d6d48196SJens Axboe 709d6d48196SJens Axboe int attempt_front_merge(struct request_queue *q, struct request *rq) 710d6d48196SJens Axboe { 711d6d48196SJens Axboe struct request *prev = elv_former_request(q, rq); 712d6d48196SJens Axboe 713d6d48196SJens Axboe if (prev) 714d6d48196SJens Axboe return attempt_merge(q, prev, rq); 715d6d48196SJens Axboe 716d6d48196SJens Axboe return 0; 717d6d48196SJens Axboe } 7185e84ea3aSJens Axboe 7195e84ea3aSJens Axboe int blk_attempt_req_merge(struct request_queue *q, struct request *rq, 7205e84ea3aSJens Axboe struct request *next) 7215e84ea3aSJens Axboe { 7225e84ea3aSJens Axboe return attempt_merge(q, rq, next); 7235e84ea3aSJens Axboe } 724050c8ea8STejun Heo 725050c8ea8STejun Heo bool blk_rq_merge_ok(struct request *rq, struct bio *bio) 726050c8ea8STejun Heo { 727e2a60da7SMartin K. Petersen if (!rq_mergeable(rq) || !bio_mergeable(bio)) 728050c8ea8STejun Heo return false; 729050c8ea8STejun Heo 730f31dc1cdSMartin K. Petersen if (!blk_check_merge_flags(rq->cmd_flags, bio->bi_rw)) 731f31dc1cdSMartin K. Petersen return false; 732f31dc1cdSMartin K. Petersen 733050c8ea8STejun Heo /* different data direction or already started, don't merge */ 734050c8ea8STejun Heo if (bio_data_dir(bio) != rq_data_dir(rq)) 735050c8ea8STejun Heo return false; 736050c8ea8STejun Heo 737050c8ea8STejun Heo /* must be same device and not a special request */ 738e7e24500SJens Axboe if (rq->rq_disk != bio->bi_bdev->bd_disk || req_no_special_merge(rq)) 739050c8ea8STejun Heo return false; 740050c8ea8STejun Heo 741050c8ea8STejun Heo /* only merge integrity protected bio into ditto rq */ 7424eaf99beSMartin K. Petersen if (blk_integrity_merge_bio(rq->q, rq, bio) == false) 743050c8ea8STejun Heo return false; 744050c8ea8STejun Heo 7454363ac7cSMartin K. Petersen /* must be using the same buffer */ 7464363ac7cSMartin K. Petersen if (rq->cmd_flags & REQ_WRITE_SAME && 7474363ac7cSMartin K. Petersen !blk_write_same_mergeable(rq->bio, bio)) 7484363ac7cSMartin K. Petersen return false; 7494363ac7cSMartin K. Petersen 750050c8ea8STejun Heo return true; 751050c8ea8STejun Heo } 752050c8ea8STejun Heo 753050c8ea8STejun Heo int blk_try_merge(struct request *rq, struct bio *bio) 754050c8ea8STejun Heo { 7554f024f37SKent Overstreet if (blk_rq_pos(rq) + blk_rq_sectors(rq) == bio->bi_iter.bi_sector) 756050c8ea8STejun Heo return ELEVATOR_BACK_MERGE; 7574f024f37SKent Overstreet else if (blk_rq_pos(rq) - bio_sectors(bio) == bio->bi_iter.bi_sector) 758050c8ea8STejun Heo return ELEVATOR_FRONT_MERGE; 759050c8ea8STejun Heo return ELEVATOR_NO_MERGE; 760050c8ea8STejun Heo } 761