1d6d48196SJens Axboe /* 2d6d48196SJens Axboe * Functions related to segment and merge handling 3d6d48196SJens Axboe */ 4d6d48196SJens Axboe #include <linux/kernel.h> 5d6d48196SJens Axboe #include <linux/module.h> 6d6d48196SJens Axboe #include <linux/bio.h> 7d6d48196SJens Axboe #include <linux/blkdev.h> 8d6d48196SJens Axboe #include <linux/scatterlist.h> 9d6d48196SJens Axboe 10d6d48196SJens Axboe #include "blk.h" 11d6d48196SJens Axboe 121e428079SJens Axboe static unsigned int __blk_recalc_rq_segments(struct request_queue *q, 1359247eaeSJens Axboe struct bio *bio) 14d6d48196SJens Axboe { 15d6d48196SJens Axboe unsigned int phys_size; 16d6d48196SJens Axboe struct bio_vec *bv, *bvprv = NULL; 171e428079SJens Axboe int cluster, i, high, highprv = 1; 181e428079SJens Axboe unsigned int seg_size, nr_phys_segs; 1959247eaeSJens Axboe struct bio *fbio, *bbio; 20d6d48196SJens Axboe 211e428079SJens Axboe if (!bio) 221e428079SJens Axboe return 0; 23d6d48196SJens Axboe 241e428079SJens Axboe fbio = bio; 2575ad23bcSNick Piggin cluster = test_bit(QUEUE_FLAG_CLUSTER, &q->queue_flags); 265df97b91SMikulas Patocka seg_size = 0; 275df97b91SMikulas Patocka phys_size = nr_phys_segs = 0; 281e428079SJens Axboe for_each_bio(bio) { 291e428079SJens Axboe bio_for_each_segment(bv, bio, i) { 30d6d48196SJens Axboe /* 311e428079SJens Axboe * the trick here is making sure that a high page is 321e428079SJens Axboe * never considered part of another segment, since that 331e428079SJens Axboe * might change with the bounce page. 34d6d48196SJens Axboe */ 35d6d48196SJens Axboe high = page_to_pfn(bv->bv_page) > q->bounce_pfn; 36d6d48196SJens Axboe if (high || highprv) 37b8b3e16cSMikulas Patocka goto new_segment; 38d6d48196SJens Axboe if (cluster) { 39d6d48196SJens Axboe if (seg_size + bv->bv_len > q->max_segment_size) 40d6d48196SJens Axboe goto new_segment; 41d6d48196SJens Axboe if (!BIOVEC_PHYS_MERGEABLE(bvprv, bv)) 42d6d48196SJens Axboe goto new_segment; 43d6d48196SJens Axboe if (!BIOVEC_SEG_BOUNDARY(q, bvprv, bv)) 44d6d48196SJens Axboe goto new_segment; 45d6d48196SJens Axboe 46d6d48196SJens Axboe seg_size += bv->bv_len; 47d6d48196SJens Axboe bvprv = bv; 48d6d48196SJens Axboe continue; 49d6d48196SJens Axboe } 50d6d48196SJens Axboe new_segment: 511e428079SJens Axboe if (nr_phys_segs == 1 && seg_size > 521e428079SJens Axboe fbio->bi_seg_front_size) 531e428079SJens Axboe fbio->bi_seg_front_size = seg_size; 5486771427SFUJITA Tomonori 55d6d48196SJens Axboe nr_phys_segs++; 56d6d48196SJens Axboe bvprv = bv; 57d6d48196SJens Axboe seg_size = bv->bv_len; 58d6d48196SJens Axboe highprv = high; 59d6d48196SJens Axboe } 6059247eaeSJens Axboe bbio = bio; 611e428079SJens Axboe } 62d6d48196SJens Axboe 6359247eaeSJens Axboe if (nr_phys_segs == 1 && seg_size > fbio->bi_seg_front_size) 6459247eaeSJens Axboe fbio->bi_seg_front_size = seg_size; 6559247eaeSJens Axboe if (seg_size > bbio->bi_seg_back_size) 6659247eaeSJens Axboe bbio->bi_seg_back_size = seg_size; 671e428079SJens Axboe 681e428079SJens Axboe return nr_phys_segs; 691e428079SJens Axboe } 701e428079SJens Axboe 711e428079SJens Axboe void blk_recalc_rq_segments(struct request *rq) 721e428079SJens Axboe { 7359247eaeSJens Axboe rq->nr_phys_segments = __blk_recalc_rq_segments(rq->q, rq->bio); 74d6d48196SJens Axboe } 75d6d48196SJens Axboe 76d6d48196SJens Axboe void blk_recount_segments(struct request_queue *q, struct bio *bio) 77d6d48196SJens Axboe { 78d6d48196SJens Axboe struct bio *nxt = bio->bi_next; 791e428079SJens Axboe 80d6d48196SJens Axboe bio->bi_next = NULL; 8159247eaeSJens Axboe bio->bi_phys_segments = __blk_recalc_rq_segments(q, bio); 82d6d48196SJens Axboe bio->bi_next = nxt; 83d6d48196SJens Axboe bio->bi_flags |= (1 << BIO_SEG_VALID); 84d6d48196SJens Axboe } 85d6d48196SJens Axboe EXPORT_SYMBOL(blk_recount_segments); 86d6d48196SJens Axboe 87d6d48196SJens Axboe static int blk_phys_contig_segment(struct request_queue *q, struct bio *bio, 88d6d48196SJens Axboe struct bio *nxt) 89d6d48196SJens Axboe { 9075ad23bcSNick Piggin if (!test_bit(QUEUE_FLAG_CLUSTER, &q->queue_flags)) 91d6d48196SJens Axboe return 0; 92d6d48196SJens Axboe 9386771427SFUJITA Tomonori if (bio->bi_seg_back_size + nxt->bi_seg_front_size > 9486771427SFUJITA Tomonori q->max_segment_size) 95d6d48196SJens Axboe return 0; 96d6d48196SJens Axboe 97e17fc0a1SDavid Woodhouse if (!bio_has_data(bio)) 98e17fc0a1SDavid Woodhouse return 1; 99e17fc0a1SDavid Woodhouse 100e17fc0a1SDavid Woodhouse if (!BIOVEC_PHYS_MERGEABLE(__BVEC_END(bio), __BVEC_START(nxt))) 101e17fc0a1SDavid Woodhouse return 0; 102e17fc0a1SDavid Woodhouse 103d6d48196SJens Axboe /* 104e17fc0a1SDavid Woodhouse * bio and nxt are contiguous in memory; check if the queue allows 105d6d48196SJens Axboe * these two to be merged into one 106d6d48196SJens Axboe */ 107d6d48196SJens Axboe if (BIO_SEG_BOUNDARY(q, bio, nxt)) 108d6d48196SJens Axboe return 1; 109d6d48196SJens Axboe 110d6d48196SJens Axboe return 0; 111d6d48196SJens Axboe } 112d6d48196SJens Axboe 113d6d48196SJens Axboe /* 114d6d48196SJens Axboe * map a request to scatterlist, return number of sg entries setup. Caller 115d6d48196SJens Axboe * must make sure sg can hold rq->nr_phys_segments entries 116d6d48196SJens Axboe */ 117d6d48196SJens Axboe int blk_rq_map_sg(struct request_queue *q, struct request *rq, 118d6d48196SJens Axboe struct scatterlist *sglist) 119d6d48196SJens Axboe { 120d6d48196SJens Axboe struct bio_vec *bvec, *bvprv; 121d6d48196SJens Axboe struct req_iterator iter; 122d6d48196SJens Axboe struct scatterlist *sg; 123d6d48196SJens Axboe int nsegs, cluster; 124d6d48196SJens Axboe 125d6d48196SJens Axboe nsegs = 0; 12675ad23bcSNick Piggin cluster = test_bit(QUEUE_FLAG_CLUSTER, &q->queue_flags); 127d6d48196SJens Axboe 128d6d48196SJens Axboe /* 129d6d48196SJens Axboe * for each bio in rq 130d6d48196SJens Axboe */ 131d6d48196SJens Axboe bvprv = NULL; 132d6d48196SJens Axboe sg = NULL; 133d6d48196SJens Axboe rq_for_each_segment(bvec, rq, iter) { 134d6d48196SJens Axboe int nbytes = bvec->bv_len; 135d6d48196SJens Axboe 136d6d48196SJens Axboe if (bvprv && cluster) { 137d6d48196SJens Axboe if (sg->length + nbytes > q->max_segment_size) 138d6d48196SJens Axboe goto new_segment; 139d6d48196SJens Axboe 140d6d48196SJens Axboe if (!BIOVEC_PHYS_MERGEABLE(bvprv, bvec)) 141d6d48196SJens Axboe goto new_segment; 142d6d48196SJens Axboe if (!BIOVEC_SEG_BOUNDARY(q, bvprv, bvec)) 143d6d48196SJens Axboe goto new_segment; 144d6d48196SJens Axboe 145d6d48196SJens Axboe sg->length += nbytes; 146d6d48196SJens Axboe } else { 147d6d48196SJens Axboe new_segment: 148d6d48196SJens Axboe if (!sg) 149d6d48196SJens Axboe sg = sglist; 150d6d48196SJens Axboe else { 151d6d48196SJens Axboe /* 152d6d48196SJens Axboe * If the driver previously mapped a shorter 153d6d48196SJens Axboe * list, we could see a termination bit 154d6d48196SJens Axboe * prematurely unless it fully inits the sg 155d6d48196SJens Axboe * table on each mapping. We KNOW that there 156d6d48196SJens Axboe * must be more entries here or the driver 157d6d48196SJens Axboe * would be buggy, so force clear the 158d6d48196SJens Axboe * termination bit to avoid doing a full 159d6d48196SJens Axboe * sg_init_table() in drivers for each command. 160d6d48196SJens Axboe */ 161d6d48196SJens Axboe sg->page_link &= ~0x02; 162d6d48196SJens Axboe sg = sg_next(sg); 163d6d48196SJens Axboe } 164d6d48196SJens Axboe 165d6d48196SJens Axboe sg_set_page(sg, bvec->bv_page, nbytes, bvec->bv_offset); 166d6d48196SJens Axboe nsegs++; 167d6d48196SJens Axboe } 168d6d48196SJens Axboe bvprv = bvec; 169d6d48196SJens Axboe } /* segments in rq */ 170d6d48196SJens Axboe 171f18573abSFUJITA Tomonori 172f18573abSFUJITA Tomonori if (unlikely(rq->cmd_flags & REQ_COPY_USER) && 1732e46e8b2STejun Heo (blk_rq_bytes(rq) & q->dma_pad_mask)) { 1742e46e8b2STejun Heo unsigned int pad_len = 1752e46e8b2STejun Heo (q->dma_pad_mask & ~blk_rq_bytes(rq)) + 1; 176f18573abSFUJITA Tomonori 177f18573abSFUJITA Tomonori sg->length += pad_len; 178f18573abSFUJITA Tomonori rq->extra_len += pad_len; 179f18573abSFUJITA Tomonori } 180f18573abSFUJITA Tomonori 1812fb98e84STejun Heo if (q->dma_drain_size && q->dma_drain_needed(rq)) { 182db0a2e00STejun Heo if (rq->cmd_flags & REQ_RW) 183db0a2e00STejun Heo memset(q->dma_drain_buffer, 0, q->dma_drain_size); 184db0a2e00STejun Heo 185d6d48196SJens Axboe sg->page_link &= ~0x02; 186d6d48196SJens Axboe sg = sg_next(sg); 187d6d48196SJens Axboe sg_set_page(sg, virt_to_page(q->dma_drain_buffer), 188d6d48196SJens Axboe q->dma_drain_size, 189d6d48196SJens Axboe ((unsigned long)q->dma_drain_buffer) & 190d6d48196SJens Axboe (PAGE_SIZE - 1)); 191d6d48196SJens Axboe nsegs++; 1927a85f889SFUJITA Tomonori rq->extra_len += q->dma_drain_size; 193d6d48196SJens Axboe } 194d6d48196SJens Axboe 195d6d48196SJens Axboe if (sg) 196d6d48196SJens Axboe sg_mark_end(sg); 197d6d48196SJens Axboe 198d6d48196SJens Axboe return nsegs; 199d6d48196SJens Axboe } 200d6d48196SJens Axboe EXPORT_SYMBOL(blk_rq_map_sg); 201d6d48196SJens Axboe 202d6d48196SJens Axboe static inline int ll_new_hw_segment(struct request_queue *q, 203d6d48196SJens Axboe struct request *req, 204d6d48196SJens Axboe struct bio *bio) 205d6d48196SJens Axboe { 206d6d48196SJens Axboe int nr_phys_segs = bio_phys_segments(q, bio); 207d6d48196SJens Axboe 2085df97b91SMikulas Patocka if (req->nr_phys_segments + nr_phys_segs > q->max_hw_segments 209d6d48196SJens Axboe || req->nr_phys_segments + nr_phys_segs > q->max_phys_segments) { 210d6d48196SJens Axboe req->cmd_flags |= REQ_NOMERGE; 211d6d48196SJens Axboe if (req == q->last_merge) 212d6d48196SJens Axboe q->last_merge = NULL; 213d6d48196SJens Axboe return 0; 214d6d48196SJens Axboe } 215d6d48196SJens Axboe 216d6d48196SJens Axboe /* 217d6d48196SJens Axboe * This will form the start of a new hw segment. Bump both 218d6d48196SJens Axboe * counters. 219d6d48196SJens Axboe */ 220d6d48196SJens Axboe req->nr_phys_segments += nr_phys_segs; 221d6d48196SJens Axboe return 1; 222d6d48196SJens Axboe } 223d6d48196SJens Axboe 224d6d48196SJens Axboe int ll_back_merge_fn(struct request_queue *q, struct request *req, 225d6d48196SJens Axboe struct bio *bio) 226d6d48196SJens Axboe { 227d6d48196SJens Axboe unsigned short max_sectors; 228d6d48196SJens Axboe 229d6d48196SJens Axboe if (unlikely(blk_pc_request(req))) 230d6d48196SJens Axboe max_sectors = q->max_hw_sectors; 231d6d48196SJens Axboe else 232d6d48196SJens Axboe max_sectors = q->max_sectors; 233d6d48196SJens Axboe 23483096ebfSTejun Heo if (blk_rq_sectors(req) + bio_sectors(bio) > max_sectors) { 235d6d48196SJens Axboe req->cmd_flags |= REQ_NOMERGE; 236d6d48196SJens Axboe if (req == q->last_merge) 237d6d48196SJens Axboe q->last_merge = NULL; 238d6d48196SJens Axboe return 0; 239d6d48196SJens Axboe } 2402cdf79caSJens Axboe if (!bio_flagged(req->biotail, BIO_SEG_VALID)) 241d6d48196SJens Axboe blk_recount_segments(q, req->biotail); 2422cdf79caSJens Axboe if (!bio_flagged(bio, BIO_SEG_VALID)) 243d6d48196SJens Axboe blk_recount_segments(q, bio); 244d6d48196SJens Axboe 245d6d48196SJens Axboe return ll_new_hw_segment(q, req, bio); 246d6d48196SJens Axboe } 247d6d48196SJens Axboe 248d6d48196SJens Axboe int ll_front_merge_fn(struct request_queue *q, struct request *req, 249d6d48196SJens Axboe struct bio *bio) 250d6d48196SJens Axboe { 251d6d48196SJens Axboe unsigned short max_sectors; 252d6d48196SJens Axboe 253d6d48196SJens Axboe if (unlikely(blk_pc_request(req))) 254d6d48196SJens Axboe max_sectors = q->max_hw_sectors; 255d6d48196SJens Axboe else 256d6d48196SJens Axboe max_sectors = q->max_sectors; 257d6d48196SJens Axboe 258d6d48196SJens Axboe 25983096ebfSTejun Heo if (blk_rq_sectors(req) + bio_sectors(bio) > max_sectors) { 260d6d48196SJens Axboe req->cmd_flags |= REQ_NOMERGE; 261d6d48196SJens Axboe if (req == q->last_merge) 262d6d48196SJens Axboe q->last_merge = NULL; 263d6d48196SJens Axboe return 0; 264d6d48196SJens Axboe } 2652cdf79caSJens Axboe if (!bio_flagged(bio, BIO_SEG_VALID)) 266d6d48196SJens Axboe blk_recount_segments(q, bio); 2672cdf79caSJens Axboe if (!bio_flagged(req->bio, BIO_SEG_VALID)) 268d6d48196SJens Axboe blk_recount_segments(q, req->bio); 269d6d48196SJens Axboe 270d6d48196SJens Axboe return ll_new_hw_segment(q, req, bio); 271d6d48196SJens Axboe } 272d6d48196SJens Axboe 273d6d48196SJens Axboe static int ll_merge_requests_fn(struct request_queue *q, struct request *req, 274d6d48196SJens Axboe struct request *next) 275d6d48196SJens Axboe { 276d6d48196SJens Axboe int total_phys_segments; 27786771427SFUJITA Tomonori unsigned int seg_size = 27886771427SFUJITA Tomonori req->biotail->bi_seg_back_size + next->bio->bi_seg_front_size; 279d6d48196SJens Axboe 280d6d48196SJens Axboe /* 281d6d48196SJens Axboe * First check if the either of the requests are re-queued 282d6d48196SJens Axboe * requests. Can't merge them if they are. 283d6d48196SJens Axboe */ 284d6d48196SJens Axboe if (req->special || next->special) 285d6d48196SJens Axboe return 0; 286d6d48196SJens Axboe 287d6d48196SJens Axboe /* 288d6d48196SJens Axboe * Will it become too large? 289d6d48196SJens Axboe */ 29083096ebfSTejun Heo if ((blk_rq_sectors(req) + blk_rq_sectors(next)) > q->max_sectors) 291d6d48196SJens Axboe return 0; 292d6d48196SJens Axboe 293d6d48196SJens Axboe total_phys_segments = req->nr_phys_segments + next->nr_phys_segments; 29486771427SFUJITA Tomonori if (blk_phys_contig_segment(q, req->biotail, next->bio)) { 29586771427SFUJITA Tomonori if (req->nr_phys_segments == 1) 29686771427SFUJITA Tomonori req->bio->bi_seg_front_size = seg_size; 29786771427SFUJITA Tomonori if (next->nr_phys_segments == 1) 29886771427SFUJITA Tomonori next->biotail->bi_seg_back_size = seg_size; 299d6d48196SJens Axboe total_phys_segments--; 30086771427SFUJITA Tomonori } 301d6d48196SJens Axboe 302d6d48196SJens Axboe if (total_phys_segments > q->max_phys_segments) 303d6d48196SJens Axboe return 0; 304d6d48196SJens Axboe 3055df97b91SMikulas Patocka if (total_phys_segments > q->max_hw_segments) 306d6d48196SJens Axboe return 0; 307d6d48196SJens Axboe 308d6d48196SJens Axboe /* Merge is OK... */ 309d6d48196SJens Axboe req->nr_phys_segments = total_phys_segments; 310d6d48196SJens Axboe return 1; 311d6d48196SJens Axboe } 312d6d48196SJens Axboe 31326308eabSJerome Marchand static void blk_account_io_merge(struct request *req) 31426308eabSJerome Marchand { 31526308eabSJerome Marchand if (blk_do_io_stat(req)) { 31626308eabSJerome Marchand struct hd_struct *part; 31726308eabSJerome Marchand int cpu; 31826308eabSJerome Marchand 31926308eabSJerome Marchand cpu = part_stat_lock(); 32083096ebfSTejun Heo part = disk_map_sector_rcu(req->rq_disk, blk_rq_pos(req)); 32126308eabSJerome Marchand 32226308eabSJerome Marchand part_round_stats(cpu, part); 32326308eabSJerome Marchand part_dec_in_flight(part); 32426308eabSJerome Marchand 32526308eabSJerome Marchand part_stat_unlock(); 32626308eabSJerome Marchand } 32726308eabSJerome Marchand } 32826308eabSJerome Marchand 329d6d48196SJens Axboe /* 330d6d48196SJens Axboe * Has to be called with the request spinlock acquired 331d6d48196SJens Axboe */ 332d6d48196SJens Axboe static int attempt_merge(struct request_queue *q, struct request *req, 333d6d48196SJens Axboe struct request *next) 334d6d48196SJens Axboe { 335d6d48196SJens Axboe if (!rq_mergeable(req) || !rq_mergeable(next)) 336d6d48196SJens Axboe return 0; 337d6d48196SJens Axboe 338d6d48196SJens Axboe /* 339d6d48196SJens Axboe * not contiguous 340d6d48196SJens Axboe */ 34183096ebfSTejun Heo if (blk_rq_pos(req) + blk_rq_sectors(req) != blk_rq_pos(next)) 342d6d48196SJens Axboe return 0; 343d6d48196SJens Axboe 344d6d48196SJens Axboe if (rq_data_dir(req) != rq_data_dir(next) 345d6d48196SJens Axboe || req->rq_disk != next->rq_disk 346d6d48196SJens Axboe || next->special) 347d6d48196SJens Axboe return 0; 348d6d48196SJens Axboe 3497ba1ba12SMartin K. Petersen if (blk_integrity_rq(req) != blk_integrity_rq(next)) 3507ba1ba12SMartin K. Petersen return 0; 3517ba1ba12SMartin K. Petersen 352d6d48196SJens Axboe /* 353d6d48196SJens Axboe * If we are allowed to merge, then append bio list 354d6d48196SJens Axboe * from next to rq and release next. merge_requests_fn 355d6d48196SJens Axboe * will have updated segment counts, update sector 356d6d48196SJens Axboe * counts here. 357d6d48196SJens Axboe */ 358d6d48196SJens Axboe if (!ll_merge_requests_fn(q, req, next)) 359d6d48196SJens Axboe return 0; 360d6d48196SJens Axboe 361d6d48196SJens Axboe /* 362d6d48196SJens Axboe * At this point we have either done a back merge 363d6d48196SJens Axboe * or front merge. We need the smaller start_time of 364d6d48196SJens Axboe * the merged requests to be the current request 365d6d48196SJens Axboe * for accounting purposes. 366d6d48196SJens Axboe */ 367d6d48196SJens Axboe if (time_after(req->start_time, next->start_time)) 368d6d48196SJens Axboe req->start_time = next->start_time; 369d6d48196SJens Axboe 370d6d48196SJens Axboe req->biotail->bi_next = next->bio; 371d6d48196SJens Axboe req->biotail = next->biotail; 372d6d48196SJens Axboe 373*a2dec7b3STejun Heo req->__data_len += blk_rq_bytes(next); 374d6d48196SJens Axboe 375d6d48196SJens Axboe elv_merge_requests(q, req, next); 376d6d48196SJens Axboe 37742dad764SJerome Marchand /* 37842dad764SJerome Marchand * 'next' is going away, so update stats accordingly 37942dad764SJerome Marchand */ 38042dad764SJerome Marchand blk_account_io_merge(next); 381d6d48196SJens Axboe 382d6d48196SJens Axboe req->ioprio = ioprio_best(req->ioprio, next->ioprio); 383ab780f1eSJens Axboe if (blk_rq_cpu_valid(next)) 384ab780f1eSJens Axboe req->cpu = next->cpu; 385d6d48196SJens Axboe 3861cd96c24SBoaz Harrosh /* owner-ship of bio passed from next to req */ 3871cd96c24SBoaz Harrosh next->bio = NULL; 388d6d48196SJens Axboe __blk_put_request(q, next); 389d6d48196SJens Axboe return 1; 390d6d48196SJens Axboe } 391d6d48196SJens Axboe 392d6d48196SJens Axboe int attempt_back_merge(struct request_queue *q, struct request *rq) 393d6d48196SJens Axboe { 394d6d48196SJens Axboe struct request *next = elv_latter_request(q, rq); 395d6d48196SJens Axboe 396d6d48196SJens Axboe if (next) 397d6d48196SJens Axboe return attempt_merge(q, rq, next); 398d6d48196SJens Axboe 399d6d48196SJens Axboe return 0; 400d6d48196SJens Axboe } 401d6d48196SJens Axboe 402d6d48196SJens Axboe int attempt_front_merge(struct request_queue *q, struct request *rq) 403d6d48196SJens Axboe { 404d6d48196SJens Axboe struct request *prev = elv_former_request(q, rq); 405d6d48196SJens Axboe 406d6d48196SJens Axboe if (prev) 407d6d48196SJens Axboe return attempt_merge(q, prev, rq); 408d6d48196SJens Axboe 409d6d48196SJens Axboe return 0; 410d6d48196SJens Axboe } 411