186db1e29SJens Axboe /* 286db1e29SJens Axboe * Functions related to mapping data to requests 386db1e29SJens Axboe */ 486db1e29SJens Axboe #include <linux/kernel.h> 586db1e29SJens Axboe #include <linux/module.h> 686db1e29SJens Axboe #include <linux/bio.h> 786db1e29SJens Axboe #include <linux/blkdev.h> 8*afdc1a78SFUJITA Tomonori #include <scsi/sg.h> /* for struct sg_iovec */ 986db1e29SJens Axboe 1086db1e29SJens Axboe #include "blk.h" 1186db1e29SJens Axboe 1286db1e29SJens Axboe int blk_rq_append_bio(struct request_queue *q, struct request *rq, 1386db1e29SJens Axboe struct bio *bio) 1486db1e29SJens Axboe { 1586db1e29SJens Axboe if (!rq->bio) 1686db1e29SJens Axboe blk_rq_bio_prep(q, rq, bio); 1786db1e29SJens Axboe else if (!ll_back_merge_fn(q, rq, bio)) 1886db1e29SJens Axboe return -EINVAL; 1986db1e29SJens Axboe else { 2086db1e29SJens Axboe rq->biotail->bi_next = bio; 2186db1e29SJens Axboe rq->biotail = bio; 2286db1e29SJens Axboe 2386db1e29SJens Axboe rq->data_len += bio->bi_size; 2486db1e29SJens Axboe } 2586db1e29SJens Axboe return 0; 2686db1e29SJens Axboe } 2786db1e29SJens Axboe EXPORT_SYMBOL(blk_rq_append_bio); 2886db1e29SJens Axboe 2986db1e29SJens Axboe static int __blk_rq_unmap_user(struct bio *bio) 3086db1e29SJens Axboe { 3186db1e29SJens Axboe int ret = 0; 3286db1e29SJens Axboe 3386db1e29SJens Axboe if (bio) { 3486db1e29SJens Axboe if (bio_flagged(bio, BIO_USER_MAPPED)) 3586db1e29SJens Axboe bio_unmap_user(bio); 3686db1e29SJens Axboe else 3786db1e29SJens Axboe ret = bio_uncopy_user(bio); 3886db1e29SJens Axboe } 3986db1e29SJens Axboe 4086db1e29SJens Axboe return ret; 4186db1e29SJens Axboe } 4286db1e29SJens Axboe 4386db1e29SJens Axboe static int __blk_rq_map_user(struct request_queue *q, struct request *rq, 4486db1e29SJens Axboe void __user *ubuf, unsigned int len) 4586db1e29SJens Axboe { 4686db1e29SJens Axboe unsigned long uaddr; 47e3790c7dSTejun Heo unsigned int alignment; 4886db1e29SJens Axboe struct bio *bio, *orig_bio; 4986db1e29SJens Axboe int reading, ret; 5086db1e29SJens Axboe 5186db1e29SJens Axboe reading = rq_data_dir(rq) == READ; 5286db1e29SJens Axboe 5386db1e29SJens Axboe /* 5486db1e29SJens Axboe * if alignment requirement is satisfied, map in user pages for 5586db1e29SJens Axboe * direct dma. else, set up kernel bounce buffers 5686db1e29SJens Axboe */ 5786db1e29SJens Axboe uaddr = (unsigned long) ubuf; 58e3790c7dSTejun Heo alignment = queue_dma_alignment(q) | q->dma_pad_mask; 59e3790c7dSTejun Heo if (!(uaddr & alignment) && !(len & alignment)) 6086db1e29SJens Axboe bio = bio_map_user(q, NULL, uaddr, len, reading); 6186db1e29SJens Axboe else 6286db1e29SJens Axboe bio = bio_copy_user(q, uaddr, len, reading); 6386db1e29SJens Axboe 6486db1e29SJens Axboe if (IS_ERR(bio)) 6586db1e29SJens Axboe return PTR_ERR(bio); 6686db1e29SJens Axboe 6786db1e29SJens Axboe orig_bio = bio; 6886db1e29SJens Axboe blk_queue_bounce(q, &bio); 6986db1e29SJens Axboe 7086db1e29SJens Axboe /* 7186db1e29SJens Axboe * We link the bounce buffer in and could have to traverse it 7286db1e29SJens Axboe * later so we have to get a ref to prevent it from being freed 7386db1e29SJens Axboe */ 7486db1e29SJens Axboe bio_get(bio); 7586db1e29SJens Axboe 7686db1e29SJens Axboe ret = blk_rq_append_bio(q, rq, bio); 7786db1e29SJens Axboe if (!ret) 7886db1e29SJens Axboe return bio->bi_size; 7986db1e29SJens Axboe 8086db1e29SJens Axboe /* if it was boucned we must call the end io function */ 8186db1e29SJens Axboe bio_endio(bio, 0); 8286db1e29SJens Axboe __blk_rq_unmap_user(orig_bio); 8386db1e29SJens Axboe bio_put(bio); 8486db1e29SJens Axboe return ret; 8586db1e29SJens Axboe } 8686db1e29SJens Axboe 8786db1e29SJens Axboe /** 8886db1e29SJens Axboe * blk_rq_map_user - map user data to a request, for REQ_BLOCK_PC usage 8986db1e29SJens Axboe * @q: request queue where request should be inserted 9086db1e29SJens Axboe * @rq: request structure to fill 9186db1e29SJens Axboe * @ubuf: the user buffer 9286db1e29SJens Axboe * @len: length of user data 9386db1e29SJens Axboe * 9486db1e29SJens Axboe * Description: 9586db1e29SJens Axboe * Data will be mapped directly for zero copy io, if possible. Otherwise 9686db1e29SJens Axboe * a kernel bounce buffer is used. 9786db1e29SJens Axboe * 9886db1e29SJens Axboe * A matching blk_rq_unmap_user() must be issued at the end of io, while 9986db1e29SJens Axboe * still in process context. 10086db1e29SJens Axboe * 10186db1e29SJens Axboe * Note: The mapped bio may need to be bounced through blk_queue_bounce() 10286db1e29SJens Axboe * before being submitted to the device, as pages mapped may be out of 10386db1e29SJens Axboe * reach. It's the callers responsibility to make sure this happens. The 10486db1e29SJens Axboe * original bio must be passed back in to blk_rq_unmap_user() for proper 10586db1e29SJens Axboe * unmapping. 10686db1e29SJens Axboe */ 10786db1e29SJens Axboe int blk_rq_map_user(struct request_queue *q, struct request *rq, 10886db1e29SJens Axboe void __user *ubuf, unsigned long len) 10986db1e29SJens Axboe { 11086db1e29SJens Axboe unsigned long bytes_read = 0; 11186db1e29SJens Axboe struct bio *bio = NULL; 11286db1e29SJens Axboe int ret; 11386db1e29SJens Axboe 11486db1e29SJens Axboe if (len > (q->max_hw_sectors << 9)) 11586db1e29SJens Axboe return -EINVAL; 11686db1e29SJens Axboe if (!len || !ubuf) 11786db1e29SJens Axboe return -EINVAL; 11886db1e29SJens Axboe 11986db1e29SJens Axboe while (bytes_read != len) { 12086db1e29SJens Axboe unsigned long map_len, end, start; 12186db1e29SJens Axboe 12286db1e29SJens Axboe map_len = min_t(unsigned long, len - bytes_read, BIO_MAX_SIZE); 12386db1e29SJens Axboe end = ((unsigned long)ubuf + map_len + PAGE_SIZE - 1) 12486db1e29SJens Axboe >> PAGE_SHIFT; 12586db1e29SJens Axboe start = (unsigned long)ubuf >> PAGE_SHIFT; 12686db1e29SJens Axboe 12786db1e29SJens Axboe /* 12886db1e29SJens Axboe * A bad offset could cause us to require BIO_MAX_PAGES + 1 12986db1e29SJens Axboe * pages. If this happens we just lower the requested 13086db1e29SJens Axboe * mapping len by a page so that we can fit 13186db1e29SJens Axboe */ 13286db1e29SJens Axboe if (end - start > BIO_MAX_PAGES) 13386db1e29SJens Axboe map_len -= PAGE_SIZE; 13486db1e29SJens Axboe 13586db1e29SJens Axboe ret = __blk_rq_map_user(q, rq, ubuf, map_len); 13686db1e29SJens Axboe if (ret < 0) 13786db1e29SJens Axboe goto unmap_rq; 13886db1e29SJens Axboe if (!bio) 13986db1e29SJens Axboe bio = rq->bio; 14086db1e29SJens Axboe bytes_read += ret; 14186db1e29SJens Axboe ubuf += ret; 14286db1e29SJens Axboe } 14386db1e29SJens Axboe 14440b01b9bSTejun Heo /* 14540b01b9bSTejun Heo * __blk_rq_map_user() copies the buffers if starting address 146e3790c7dSTejun Heo * or length isn't aligned to dma_pad_mask. As the copied 147e3790c7dSTejun Heo * buffer is always page aligned, we know that there's enough 148e3790c7dSTejun Heo * room for padding. Extend the last bio and update 149e3790c7dSTejun Heo * rq->data_len accordingly. 15040b01b9bSTejun Heo * 15140b01b9bSTejun Heo * On unmap, bio_uncopy_user() will use unmodified 15240b01b9bSTejun Heo * bio_map_data pointed to by bio->bi_private. 15340b01b9bSTejun Heo */ 154e3790c7dSTejun Heo if (len & q->dma_pad_mask) { 155e3790c7dSTejun Heo unsigned int pad_len = (q->dma_pad_mask & ~len) + 1; 15656d94a37SHarvey Harrison struct bio *tail = rq->biotail; 157e3790c7dSTejun Heo 15856d94a37SHarvey Harrison tail->bi_io_vec[tail->bi_vcnt - 1].bv_len += pad_len; 15956d94a37SHarvey Harrison tail->bi_size += pad_len; 16040b01b9bSTejun Heo 1617a85f889SFUJITA Tomonori rq->extra_len += pad_len; 16240b01b9bSTejun Heo } 16340b01b9bSTejun Heo 16486db1e29SJens Axboe rq->buffer = rq->data = NULL; 16586db1e29SJens Axboe return 0; 16686db1e29SJens Axboe unmap_rq: 16786db1e29SJens Axboe blk_rq_unmap_user(bio); 16884e9e03cSJens Axboe rq->bio = NULL; 16986db1e29SJens Axboe return ret; 17086db1e29SJens Axboe } 17186db1e29SJens Axboe EXPORT_SYMBOL(blk_rq_map_user); 17286db1e29SJens Axboe 17386db1e29SJens Axboe /** 17486db1e29SJens Axboe * blk_rq_map_user_iov - map user data to a request, for REQ_BLOCK_PC usage 17586db1e29SJens Axboe * @q: request queue where request should be inserted 17686db1e29SJens Axboe * @rq: request to map data to 17786db1e29SJens Axboe * @iov: pointer to the iovec 17886db1e29SJens Axboe * @iov_count: number of elements in the iovec 17986db1e29SJens Axboe * @len: I/O byte count 18086db1e29SJens Axboe * 18186db1e29SJens Axboe * Description: 18286db1e29SJens Axboe * Data will be mapped directly for zero copy io, if possible. Otherwise 18386db1e29SJens Axboe * a kernel bounce buffer is used. 18486db1e29SJens Axboe * 18586db1e29SJens Axboe * A matching blk_rq_unmap_user() must be issued at the end of io, while 18686db1e29SJens Axboe * still in process context. 18786db1e29SJens Axboe * 18886db1e29SJens Axboe * Note: The mapped bio may need to be bounced through blk_queue_bounce() 18986db1e29SJens Axboe * before being submitted to the device, as pages mapped may be out of 19086db1e29SJens Axboe * reach. It's the callers responsibility to make sure this happens. The 19186db1e29SJens Axboe * original bio must be passed back in to blk_rq_unmap_user() for proper 19286db1e29SJens Axboe * unmapping. 19386db1e29SJens Axboe */ 19486db1e29SJens Axboe int blk_rq_map_user_iov(struct request_queue *q, struct request *rq, 19586db1e29SJens Axboe struct sg_iovec *iov, int iov_count, unsigned int len) 19686db1e29SJens Axboe { 19786db1e29SJens Axboe struct bio *bio; 198*afdc1a78SFUJITA Tomonori int i, read = rq_data_dir(rq) == READ; 199*afdc1a78SFUJITA Tomonori int unaligned = 0; 20086db1e29SJens Axboe 20186db1e29SJens Axboe if (!iov || iov_count <= 0) 20286db1e29SJens Axboe return -EINVAL; 20386db1e29SJens Axboe 204*afdc1a78SFUJITA Tomonori for (i = 0; i < iov_count; i++) { 205*afdc1a78SFUJITA Tomonori unsigned long uaddr = (unsigned long)iov[i].iov_base; 206*afdc1a78SFUJITA Tomonori 207*afdc1a78SFUJITA Tomonori if (uaddr & queue_dma_alignment(q)) { 208*afdc1a78SFUJITA Tomonori unaligned = 1; 209*afdc1a78SFUJITA Tomonori break; 210*afdc1a78SFUJITA Tomonori } 211*afdc1a78SFUJITA Tomonori } 212*afdc1a78SFUJITA Tomonori 213*afdc1a78SFUJITA Tomonori if (unaligned || (q->dma_pad_mask & len)) 214*afdc1a78SFUJITA Tomonori bio = bio_copy_user_iov(q, iov, iov_count, read); 215*afdc1a78SFUJITA Tomonori else 216*afdc1a78SFUJITA Tomonori bio = bio_map_user_iov(q, NULL, iov, iov_count, read); 217*afdc1a78SFUJITA Tomonori 21886db1e29SJens Axboe if (IS_ERR(bio)) 21986db1e29SJens Axboe return PTR_ERR(bio); 22086db1e29SJens Axboe 22186db1e29SJens Axboe if (bio->bi_size != len) { 22286db1e29SJens Axboe bio_endio(bio, 0); 22386db1e29SJens Axboe bio_unmap_user(bio); 22486db1e29SJens Axboe return -EINVAL; 22586db1e29SJens Axboe } 22686db1e29SJens Axboe 22786db1e29SJens Axboe bio_get(bio); 22886db1e29SJens Axboe blk_rq_bio_prep(q, rq, bio); 22986db1e29SJens Axboe rq->buffer = rq->data = NULL; 23086db1e29SJens Axboe return 0; 23186db1e29SJens Axboe } 23286db1e29SJens Axboe 23386db1e29SJens Axboe /** 23486db1e29SJens Axboe * blk_rq_unmap_user - unmap a request with user data 23586db1e29SJens Axboe * @bio: start of bio list 23686db1e29SJens Axboe * 23786db1e29SJens Axboe * Description: 23886db1e29SJens Axboe * Unmap a rq previously mapped by blk_rq_map_user(). The caller must 23986db1e29SJens Axboe * supply the original rq->bio from the blk_rq_map_user() return, since 24086db1e29SJens Axboe * the io completion may have changed rq->bio. 24186db1e29SJens Axboe */ 24286db1e29SJens Axboe int blk_rq_unmap_user(struct bio *bio) 24386db1e29SJens Axboe { 24486db1e29SJens Axboe struct bio *mapped_bio; 24586db1e29SJens Axboe int ret = 0, ret2; 24686db1e29SJens Axboe 24786db1e29SJens Axboe while (bio) { 24886db1e29SJens Axboe mapped_bio = bio; 24986db1e29SJens Axboe if (unlikely(bio_flagged(bio, BIO_BOUNCED))) 25086db1e29SJens Axboe mapped_bio = bio->bi_private; 25186db1e29SJens Axboe 25286db1e29SJens Axboe ret2 = __blk_rq_unmap_user(mapped_bio); 25386db1e29SJens Axboe if (ret2 && !ret) 25486db1e29SJens Axboe ret = ret2; 25586db1e29SJens Axboe 25686db1e29SJens Axboe mapped_bio = bio; 25786db1e29SJens Axboe bio = bio->bi_next; 25886db1e29SJens Axboe bio_put(mapped_bio); 25986db1e29SJens Axboe } 26086db1e29SJens Axboe 26186db1e29SJens Axboe return ret; 26286db1e29SJens Axboe } 26386db1e29SJens Axboe EXPORT_SYMBOL(blk_rq_unmap_user); 26486db1e29SJens Axboe 26586db1e29SJens Axboe /** 26686db1e29SJens Axboe * blk_rq_map_kern - map kernel data to a request, for REQ_BLOCK_PC usage 26786db1e29SJens Axboe * @q: request queue where request should be inserted 26886db1e29SJens Axboe * @rq: request to fill 26986db1e29SJens Axboe * @kbuf: the kernel buffer 27086db1e29SJens Axboe * @len: length of user data 27186db1e29SJens Axboe * @gfp_mask: memory allocation flags 27286db1e29SJens Axboe */ 27386db1e29SJens Axboe int blk_rq_map_kern(struct request_queue *q, struct request *rq, void *kbuf, 27486db1e29SJens Axboe unsigned int len, gfp_t gfp_mask) 27586db1e29SJens Axboe { 27686db1e29SJens Axboe struct bio *bio; 27786db1e29SJens Axboe 27886db1e29SJens Axboe if (len > (q->max_hw_sectors << 9)) 27986db1e29SJens Axboe return -EINVAL; 28086db1e29SJens Axboe if (!len || !kbuf) 28186db1e29SJens Axboe return -EINVAL; 28286db1e29SJens Axboe 28386db1e29SJens Axboe bio = bio_map_kern(q, kbuf, len, gfp_mask); 28486db1e29SJens Axboe if (IS_ERR(bio)) 28586db1e29SJens Axboe return PTR_ERR(bio); 28686db1e29SJens Axboe 28786db1e29SJens Axboe if (rq_data_dir(rq) == WRITE) 28886db1e29SJens Axboe bio->bi_rw |= (1 << BIO_RW); 28986db1e29SJens Axboe 29086db1e29SJens Axboe blk_rq_bio_prep(q, rq, bio); 29186db1e29SJens Axboe blk_queue_bounce(q, &rq->bio); 29286db1e29SJens Axboe rq->buffer = rq->data = NULL; 29386db1e29SJens Axboe return 0; 29486db1e29SJens Axboe } 29586db1e29SJens Axboe EXPORT_SYMBOL(blk_rq_map_kern); 296