1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0 20a19e61eSDong Jia Shi /* 30a19e61eSDong Jia Shi * channel program interfaces 40a19e61eSDong Jia Shi * 50a19e61eSDong Jia Shi * Copyright IBM Corp. 2017 60a19e61eSDong Jia Shi * 70a19e61eSDong Jia Shi * Author(s): Dong Jia Shi <bjsdjshi@linux.vnet.ibm.com> 80a19e61eSDong Jia Shi * Xiao Feng Ren <renxiaof@linux.vnet.ibm.com> 90a19e61eSDong Jia Shi */ 100a19e61eSDong Jia Shi 11725b94d7SJared Rossi #include <linux/ratelimit.h> 120a19e61eSDong Jia Shi #include <linux/mm.h> 130a19e61eSDong Jia Shi #include <linux/slab.h> 14c2863febSNicolin Chen #include <linux/highmem.h> 150a19e61eSDong Jia Shi #include <linux/iommu.h> 160a19e61eSDong Jia Shi #include <linux/vfio.h> 170a19e61eSDong Jia Shi #include <asm/idals.h> 180a19e61eSDong Jia Shi 190a19e61eSDong Jia Shi #include "vfio_ccw_cp.h" 200a587956SJason Gunthorpe #include "vfio_ccw_private.h" 210a19e61eSDong Jia Shi 2213314605SNicolin Chen struct page_array { 2313314605SNicolin Chen /* Array that stores pages need to pin. */ 2413314605SNicolin Chen dma_addr_t *pa_iova; 2534a255e6SNicolin Chen /* Array that receives the pinned pages. */ 2634a255e6SNicolin Chen struct page **pa_page; 275c1cfb1cSDong Jia Shi /* Number of pages pinned from @pa_iova. */ 280a19e61eSDong Jia Shi int pa_nr; 290a19e61eSDong Jia Shi }; 300a19e61eSDong Jia Shi 310a19e61eSDong Jia Shi struct ccwchain { 320a19e61eSDong Jia Shi struct list_head next; 330a19e61eSDong Jia Shi struct ccw1 *ch_ccw; 340a19e61eSDong Jia Shi /* Guest physical address of the current chain. */ 350a19e61eSDong Jia Shi u64 ch_iova; 360a19e61eSDong Jia Shi /* Count of the valid ccws in chain. */ 370a19e61eSDong Jia Shi int ch_len; 380a19e61eSDong Jia Shi /* Pinned PAGEs for the original data. */ 3913314605SNicolin Chen struct page_array *ch_pa; 400a19e61eSDong Jia Shi }; 410a19e61eSDong Jia Shi 420a19e61eSDong Jia Shi /* 4313314605SNicolin Chen * page_array_alloc() - alloc memory for page array 4413314605SNicolin Chen * @pa: page_array on which to perform the operation 4562a97a56SEric Farman * @len: number of pages that should be pinned from @iova 460a19e61eSDong Jia Shi * 4713314605SNicolin Chen * Attempt to allocate memory for page array. 480a19e61eSDong Jia Shi * 4913314605SNicolin Chen * Usage of page_array: 5013314605SNicolin Chen * We expect (pa_nr == 0) and (pa_iova == NULL), any field in 515c1cfb1cSDong Jia Shi * this structure will be filled in by this function. 520a19e61eSDong Jia Shi * 530a19e61eSDong Jia Shi * Returns: 5413314605SNicolin Chen * 0 if page array is allocated 5513314605SNicolin Chen * -EINVAL if pa->pa_nr is not initially zero, or pa->pa_iova is not NULL 56e4f3f18bSEric Farman * -ENOMEM if alloc failed 570a19e61eSDong Jia Shi */ 5861783394SEric Farman static int page_array_alloc(struct page_array *pa, unsigned int len) 590a19e61eSDong Jia Shi { 6013314605SNicolin Chen if (pa->pa_nr || pa->pa_iova) 610a19e61eSDong Jia Shi return -EINVAL; 620a19e61eSDong Jia Shi 6362a97a56SEric Farman if (len == 0) 640a19e61eSDong Jia Shi return -EINVAL; 650a19e61eSDong Jia Shi 6662a97a56SEric Farman pa->pa_nr = len; 6762a97a56SEric Farman 6862a97a56SEric Farman pa->pa_iova = kcalloc(len, sizeof(*pa->pa_iova), GFP_KERNEL); 6962a97a56SEric Farman if (!pa->pa_iova) 7062a97a56SEric Farman return -ENOMEM; 7162a97a56SEric Farman 7262a97a56SEric Farman pa->pa_page = kcalloc(len, sizeof(*pa->pa_page), GFP_KERNEL); 7362a97a56SEric Farman if (!pa->pa_page) { 7462a97a56SEric Farman kfree(pa->pa_iova); 750a19e61eSDong Jia Shi return -ENOMEM; 76c1ab6926SFarhan Ali } 770a19e61eSDong Jia Shi 78e4f3f18bSEric Farman return 0; 79e4f3f18bSEric Farman } 80e4f3f18bSEric Farman 81e4f3f18bSEric Farman /* 8213314605SNicolin Chen * page_array_unpin() - Unpin user pages in memory 8313314605SNicolin Chen * @pa: page_array on which to perform the operation 84cfedb3d5SNicolin Chen * @vdev: the vfio device to perform the operation 85cfedb3d5SNicolin Chen * @pa_nr: number of user pages to unpin 86cfedb3d5SNicolin Chen * 87cfedb3d5SNicolin Chen * Only unpin if any pages were pinned to begin with, i.e. pa_nr > 0, 88cfedb3d5SNicolin Chen * otherwise only clear pa->pa_nr 89cfedb3d5SNicolin Chen */ 9013314605SNicolin Chen static void page_array_unpin(struct page_array *pa, 91cfedb3d5SNicolin Chen struct vfio_device *vdev, int pa_nr) 92cfedb3d5SNicolin Chen { 93cfedb3d5SNicolin Chen int unpinned = 0, npage = 1; 94cfedb3d5SNicolin Chen 95cfedb3d5SNicolin Chen while (unpinned < pa_nr) { 9613314605SNicolin Chen dma_addr_t *first = &pa->pa_iova[unpinned]; 9713314605SNicolin Chen dma_addr_t *last = &first[npage]; 98cfedb3d5SNicolin Chen 99cfedb3d5SNicolin Chen if (unpinned + npage < pa_nr && 10013314605SNicolin Chen *first + npage * PAGE_SIZE == *last) { 101cfedb3d5SNicolin Chen npage++; 102cfedb3d5SNicolin Chen continue; 103cfedb3d5SNicolin Chen } 104cfedb3d5SNicolin Chen 10513314605SNicolin Chen vfio_unpin_pages(vdev, *first, npage); 106cfedb3d5SNicolin Chen unpinned += npage; 107cfedb3d5SNicolin Chen npage = 1; 108cfedb3d5SNicolin Chen } 109cfedb3d5SNicolin Chen 110cfedb3d5SNicolin Chen pa->pa_nr = 0; 111cfedb3d5SNicolin Chen } 112cfedb3d5SNicolin Chen 113cfedb3d5SNicolin Chen /* 11413314605SNicolin Chen * page_array_pin() - Pin user pages in memory 11513314605SNicolin Chen * @pa: page_array on which to perform the operation 1168a54e238SEric Farman * @vdev: the vfio device to perform pin operations 117e4f3f18bSEric Farman * 118e4f3f18bSEric Farman * Returns number of pages pinned upon success. 119e4f3f18bSEric Farman * If the pin request partially succeeds, or fails completely, 120e4f3f18bSEric Farman * all pages are left unpinned and a negative error value is returned. 121e4f3f18bSEric Farman */ 12213314605SNicolin Chen static int page_array_pin(struct page_array *pa, struct vfio_device *vdev) 123e4f3f18bSEric Farman { 124cfedb3d5SNicolin Chen int pinned = 0, npage = 1; 125e4f3f18bSEric Farman int ret = 0; 126e4f3f18bSEric Farman 127cfedb3d5SNicolin Chen while (pinned < pa->pa_nr) { 12813314605SNicolin Chen dma_addr_t *first = &pa->pa_iova[pinned]; 12913314605SNicolin Chen dma_addr_t *last = &first[npage]; 1305c1cfb1cSDong Jia Shi 131cfedb3d5SNicolin Chen if (pinned + npage < pa->pa_nr && 13213314605SNicolin Chen *first + npage * PAGE_SIZE == *last) { 133cfedb3d5SNicolin Chen npage++; 134cfedb3d5SNicolin Chen continue; 135cfedb3d5SNicolin Chen } 136cfedb3d5SNicolin Chen 13713314605SNicolin Chen ret = vfio_pin_pages(vdev, *first, npage, 138cfedb3d5SNicolin Chen IOMMU_READ | IOMMU_WRITE, 13934a255e6SNicolin Chen &pa->pa_page[pinned]); 1405c1cfb1cSDong Jia Shi if (ret < 0) { 1415c1cfb1cSDong Jia Shi goto err_out; 142cfedb3d5SNicolin Chen } else if (ret > 0 && ret != npage) { 143cfedb3d5SNicolin Chen pinned += ret; 1440a19e61eSDong Jia Shi ret = -EINVAL; 1455c1cfb1cSDong Jia Shi goto err_out; 1465c1cfb1cSDong Jia Shi } 147cfedb3d5SNicolin Chen pinned += npage; 148cfedb3d5SNicolin Chen npage = 1; 149cfedb3d5SNicolin Chen } 1500a19e61eSDong Jia Shi 1510a19e61eSDong Jia Shi return ret; 1525c1cfb1cSDong Jia Shi 1535c1cfb1cSDong Jia Shi err_out: 15413314605SNicolin Chen page_array_unpin(pa, vdev, pinned); 1555c1cfb1cSDong Jia Shi return ret; 1565c1cfb1cSDong Jia Shi } 1575c1cfb1cSDong Jia Shi 1585c1cfb1cSDong Jia Shi /* Unpin the pages before releasing the memory. */ 15913314605SNicolin Chen static void page_array_unpin_free(struct page_array *pa, struct vfio_device *vdev) 1605c1cfb1cSDong Jia Shi { 16113314605SNicolin Chen page_array_unpin(pa, vdev, pa->pa_nr); 16262a97a56SEric Farman kfree(pa->pa_page); 16313314605SNicolin Chen kfree(pa->pa_iova); 1640a19e61eSDong Jia Shi } 1650a19e61eSDong Jia Shi 1665a4fe7c4SEric Farman static bool page_array_iova_pinned(struct page_array *pa, u64 iova, u64 length) 1670a19e61eSDong Jia Shi { 1685a4fe7c4SEric Farman u64 iova_pfn_start = iova >> PAGE_SHIFT; 1695a4fe7c4SEric Farman u64 iova_pfn_end = (iova + length - 1) >> PAGE_SHIFT; 1705a4fe7c4SEric Farman u64 pfn; 1710a19e61eSDong Jia Shi int i; 1720a19e61eSDong Jia Shi 1735a4fe7c4SEric Farman for (i = 0; i < pa->pa_nr; i++) { 1745a4fe7c4SEric Farman pfn = pa->pa_iova[i] >> PAGE_SHIFT; 1755a4fe7c4SEric Farman if (pfn >= iova_pfn_start && pfn <= iova_pfn_end) 1760a19e61eSDong Jia Shi return true; 1775a4fe7c4SEric Farman } 1780a19e61eSDong Jia Shi 1790a19e61eSDong Jia Shi return false; 1800a19e61eSDong Jia Shi } 18113314605SNicolin Chen /* Create the list of IDAL words for a page_array. */ 18213314605SNicolin Chen static inline void page_array_idal_create_words(struct page_array *pa, 1830a19e61eSDong Jia Shi unsigned long *idaws) 1840a19e61eSDong Jia Shi { 185e7eaf91bSEric Farman int i; 1860a19e61eSDong Jia Shi 1870a19e61eSDong Jia Shi /* 1880a19e61eSDong Jia Shi * Idal words (execept the first one) rely on the memory being 4k 1890a19e61eSDong Jia Shi * aligned. If a user virtual address is 4K aligned, then it's 1900a19e61eSDong Jia Shi * corresponding kernel physical address will also be 4K aligned. Thus 1910a19e61eSDong Jia Shi * there will be no problem here to simply use the phys to create an 1920a19e61eSDong Jia Shi * idaw. 1930a19e61eSDong Jia Shi */ 194e7eaf91bSEric Farman 19561f3a16bSEric Farman for (i = 0; i < pa->pa_nr; i++) { 19634a255e6SNicolin Chen idaws[i] = page_to_phys(pa->pa_page[i]); 1978aabf0edSEric Farman 19861f3a16bSEric Farman /* Incorporate any offset from each starting address */ 19961f3a16bSEric Farman idaws[i] += pa->pa_iova[i] & (PAGE_SIZE - 1); 20061f3a16bSEric Farman } 2010a19e61eSDong Jia Shi } 2020a19e61eSDong Jia Shi 203dbd66558SCornelia Huck static void convert_ccw0_to_ccw1(struct ccw1 *source, unsigned long len) 2047f8e89a8SEric Farman { 2057f8e89a8SEric Farman struct ccw0 ccw0; 2067f8e89a8SEric Farman struct ccw1 *pccw1 = source; 2077f8e89a8SEric Farman int i; 2087f8e89a8SEric Farman 2097f8e89a8SEric Farman for (i = 0; i < len; i++) { 2107f8e89a8SEric Farman ccw0 = *(struct ccw0 *)pccw1; 2117f8e89a8SEric Farman if ((pccw1->cmd_code & 0x0f) == CCW_CMD_TIC) { 2127f8e89a8SEric Farman pccw1->cmd_code = CCW_CMD_TIC; 2137f8e89a8SEric Farman pccw1->flags = 0; 2147f8e89a8SEric Farman pccw1->count = 0; 2157f8e89a8SEric Farman } else { 2167f8e89a8SEric Farman pccw1->cmd_code = ccw0.cmd_code; 2177f8e89a8SEric Farman pccw1->flags = ccw0.flags; 2187f8e89a8SEric Farman pccw1->count = ccw0.count; 2197f8e89a8SEric Farman } 2207f8e89a8SEric Farman pccw1->cda = ccw0.cda; 2217f8e89a8SEric Farman pccw1++; 2227f8e89a8SEric Farman } 2237f8e89a8SEric Farman } 2240a19e61eSDong Jia Shi 225*1b676fe3SEric Farman #define idal_is_2k(_cp) (!(_cp)->orb.cmd.c64 || (_cp)->orb.cmd.i2k) 226*1b676fe3SEric Farman 2270a19e61eSDong Jia Shi /* 2280a19e61eSDong Jia Shi * Helpers to operate ccwchain. 2290a19e61eSDong Jia Shi */ 2305d87fbf7SEric Farman #define ccw_is_read(_ccw) (((_ccw)->cmd_code & 0x03) == 0x02) 2315d87fbf7SEric Farman #define ccw_is_read_backward(_ccw) (((_ccw)->cmd_code & 0x0F) == 0x0C) 2325d87fbf7SEric Farman #define ccw_is_sense(_ccw) (((_ccw)->cmd_code & 0x0F) == CCW_CMD_BASIC_SENSE) 2335d87fbf7SEric Farman 2340a19e61eSDong Jia Shi #define ccw_is_noop(_ccw) ((_ccw)->cmd_code == CCW_CMD_NOOP) 2350a19e61eSDong Jia Shi 2360a19e61eSDong Jia Shi #define ccw_is_tic(_ccw) ((_ccw)->cmd_code == CCW_CMD_TIC) 2370a19e61eSDong Jia Shi 2380a19e61eSDong Jia Shi #define ccw_is_idal(_ccw) ((_ccw)->flags & CCW_FLAG_IDA) 2395d87fbf7SEric Farman #define ccw_is_skip(_ccw) ((_ccw)->flags & CCW_FLAG_SKIP) 2400a19e61eSDong Jia Shi 2410a19e61eSDong Jia Shi #define ccw_is_chain(_ccw) ((_ccw)->flags & (CCW_FLAG_CC | CCW_FLAG_DC)) 2420a19e61eSDong Jia Shi 24348bd0eeeSEric Farman /* 2445d87fbf7SEric Farman * ccw_does_data_transfer() 2455d87fbf7SEric Farman * 2465d87fbf7SEric Farman * Determine whether a CCW will move any data, such that the guest pages 2475d87fbf7SEric Farman * would need to be pinned before performing the I/O. 2485d87fbf7SEric Farman * 2495d87fbf7SEric Farman * Returns 1 if yes, 0 if no. 2505d87fbf7SEric Farman */ 2515d87fbf7SEric Farman static inline int ccw_does_data_transfer(struct ccw1 *ccw) 2525d87fbf7SEric Farman { 253453eac31SEric Farman /* If the count field is zero, then no data will be transferred */ 254453eac31SEric Farman if (ccw->count == 0) 255453eac31SEric Farman return 0; 256453eac31SEric Farman 2579b6e57e5SEric Farman /* If the command is a NOP, then no data will be transferred */ 2589b6e57e5SEric Farman if (ccw_is_noop(ccw)) 2599b6e57e5SEric Farman return 0; 2609b6e57e5SEric Farman 2615d87fbf7SEric Farman /* If the skip flag is off, then data will be transferred */ 2625d87fbf7SEric Farman if (!ccw_is_skip(ccw)) 2635d87fbf7SEric Farman return 1; 2645d87fbf7SEric Farman 2655d87fbf7SEric Farman /* 2665d87fbf7SEric Farman * If the skip flag is on, it is only meaningful if the command 2675d87fbf7SEric Farman * code is a read, read backward, sense, or sense ID. In those 2685d87fbf7SEric Farman * cases, no data will be transferred. 2695d87fbf7SEric Farman */ 2705d87fbf7SEric Farman if (ccw_is_read(ccw) || ccw_is_read_backward(ccw)) 2715d87fbf7SEric Farman return 0; 2725d87fbf7SEric Farman 2735d87fbf7SEric Farman if (ccw_is_sense(ccw)) 2745d87fbf7SEric Farman return 0; 2755d87fbf7SEric Farman 2765d87fbf7SEric Farman /* The skip flag is on, but it is ignored for this command code. */ 2775d87fbf7SEric Farman return 1; 2785d87fbf7SEric Farman } 2795d87fbf7SEric Farman 2805d87fbf7SEric Farman /* 28148bd0eeeSEric Farman * is_cpa_within_range() 28248bd0eeeSEric Farman * 28348bd0eeeSEric Farman * @cpa: channel program address being questioned 28448bd0eeeSEric Farman * @head: address of the beginning of a CCW chain 28548bd0eeeSEric Farman * @len: number of CCWs within the chain 28648bd0eeeSEric Farman * 28748bd0eeeSEric Farman * Determine whether the address of a CCW (whether a new chain, 28848bd0eeeSEric Farman * or the target of a TIC) falls within a range (including the end points). 28948bd0eeeSEric Farman * 29048bd0eeeSEric Farman * Returns 1 if yes, 0 if no. 29148bd0eeeSEric Farman */ 29248bd0eeeSEric Farman static inline int is_cpa_within_range(u32 cpa, u32 head, int len) 29348bd0eeeSEric Farman { 29448bd0eeeSEric Farman u32 tail = head + (len - 1) * sizeof(struct ccw1); 29548bd0eeeSEric Farman 29648bd0eeeSEric Farman return (head <= cpa && cpa <= tail); 29748bd0eeeSEric Farman } 29848bd0eeeSEric Farman 29948bd0eeeSEric Farman static inline int is_tic_within_range(struct ccw1 *ccw, u32 head, int len) 30048bd0eeeSEric Farman { 30148bd0eeeSEric Farman if (!ccw_is_tic(ccw)) 30248bd0eeeSEric Farman return 0; 30348bd0eeeSEric Farman 30448bd0eeeSEric Farman return is_cpa_within_range(ccw->cda, head, len); 30548bd0eeeSEric Farman } 30648bd0eeeSEric Farman 3070a19e61eSDong Jia Shi static struct ccwchain *ccwchain_alloc(struct channel_program *cp, int len) 3080a19e61eSDong Jia Shi { 3090a19e61eSDong Jia Shi struct ccwchain *chain; 3100a19e61eSDong Jia Shi 3114b946d65SEric Farman chain = kzalloc(sizeof(*chain), GFP_KERNEL); 3120a19e61eSDong Jia Shi if (!chain) 3130a19e61eSDong Jia Shi return NULL; 3140a19e61eSDong Jia Shi 3154b946d65SEric Farman chain->ch_ccw = kcalloc(len, sizeof(*chain->ch_ccw), GFP_DMA | GFP_KERNEL); 3164b946d65SEric Farman if (!chain->ch_ccw) 3174b946d65SEric Farman goto out_err; 3180a19e61eSDong Jia Shi 3194b946d65SEric Farman chain->ch_pa = kcalloc(len, sizeof(*chain->ch_pa), GFP_KERNEL); 3204b946d65SEric Farman if (!chain->ch_pa) 3214b946d65SEric Farman goto out_err; 3220a19e61eSDong Jia Shi 3230a19e61eSDong Jia Shi list_add_tail(&chain->next, &cp->ccwchain_list); 3240a19e61eSDong Jia Shi 3250a19e61eSDong Jia Shi return chain; 3264b946d65SEric Farman 3274b946d65SEric Farman out_err: 3284b946d65SEric Farman kfree(chain->ch_ccw); 3294b946d65SEric Farman kfree(chain); 3304b946d65SEric Farman return NULL; 3310a19e61eSDong Jia Shi } 3320a19e61eSDong Jia Shi 3330a19e61eSDong Jia Shi static void ccwchain_free(struct ccwchain *chain) 3340a19e61eSDong Jia Shi { 3350a19e61eSDong Jia Shi list_del(&chain->next); 3364b946d65SEric Farman kfree(chain->ch_pa); 3374b946d65SEric Farman kfree(chain->ch_ccw); 3380a19e61eSDong Jia Shi kfree(chain); 3390a19e61eSDong Jia Shi } 3400a19e61eSDong Jia Shi 3410a19e61eSDong Jia Shi /* Free resource for a ccw that allocated memory for its cda. */ 3420a19e61eSDong Jia Shi static void ccwchain_cda_free(struct ccwchain *chain, int idx) 3430a19e61eSDong Jia Shi { 3444b946d65SEric Farman struct ccw1 *ccw = &chain->ch_ccw[idx]; 3450a19e61eSDong Jia Shi 3469b6e57e5SEric Farman if (ccw_is_tic(ccw)) 347408358b5SJason J. Herne return; 3480a19e61eSDong Jia Shi 3495de2322dSEric Farman kfree(phys_to_virt(ccw->cda)); 3500a19e61eSDong Jia Shi } 3510a19e61eSDong Jia Shi 3520a19e61eSDong Jia Shi /** 3530a19e61eSDong Jia Shi * ccwchain_calc_length - calculate the length of the ccw chain. 3540a19e61eSDong Jia Shi * @iova: guest physical address of the target ccw chain 3550a19e61eSDong Jia Shi * @cp: channel_program on which to perform the operation 3560a19e61eSDong Jia Shi * 3570a19e61eSDong Jia Shi * This is the chain length not considering any TICs. 3580a19e61eSDong Jia Shi * You need to do a new round for each TIC target. 3590a19e61eSDong Jia Shi * 360fb9e7880SHalil Pasic * The program is also validated for absence of not yet supported 361fb9e7880SHalil Pasic * indirect data addressing scenarios. 362fb9e7880SHalil Pasic * 3630a19e61eSDong Jia Shi * Returns: the length of the ccw chain or -errno. 3640a19e61eSDong Jia Shi */ 3650a19e61eSDong Jia Shi static int ccwchain_calc_length(u64 iova, struct channel_program *cp) 3660a19e61eSDong Jia Shi { 3671d897e47SEric Farman struct ccw1 *ccw = cp->guest_cp; 368ded563f3SEric Farman int cnt = 0; 3690a19e61eSDong Jia Shi 3700a19e61eSDong Jia Shi do { 3710a19e61eSDong Jia Shi cnt++; 3720a19e61eSDong Jia Shi 373fb9e7880SHalil Pasic /* 374fb9e7880SHalil Pasic * As we don't want to fail direct addressing even if the 375fb9e7880SHalil Pasic * orb specified one of the unsupported formats, we defer 376fb9e7880SHalil Pasic * checking for IDAWs in unsupported formats to here. 377fb9e7880SHalil Pasic */ 3781d897e47SEric Farman if ((!cp->orb.cmd.c64 || cp->orb.cmd.i2k) && ccw_is_idal(ccw)) 379fb9e7880SHalil Pasic return -EOPNOTSUPP; 380fb9e7880SHalil Pasic 38148bd0eeeSEric Farman /* 38248bd0eeeSEric Farman * We want to keep counting if the current CCW has the 38348bd0eeeSEric Farman * command-chaining flag enabled, or if it is a TIC CCW 38448bd0eeeSEric Farman * that loops back into the current chain. The latter 38548bd0eeeSEric Farman * is used for device orientation, where the CCW PRIOR to 38648bd0eeeSEric Farman * the TIC can either jump to the TIC or a CCW immediately 38748bd0eeeSEric Farman * after the TIC, depending on the results of its operation. 38848bd0eeeSEric Farman */ 38948bd0eeeSEric Farman if (!ccw_is_chain(ccw) && !is_tic_within_range(ccw, iova, cnt)) 3900a19e61eSDong Jia Shi break; 3910a19e61eSDong Jia Shi 3920a19e61eSDong Jia Shi ccw++; 3930a19e61eSDong Jia Shi } while (cnt < CCWCHAIN_LEN_MAX + 1); 3940a19e61eSDong Jia Shi 3950a19e61eSDong Jia Shi if (cnt == CCWCHAIN_LEN_MAX + 1) 3960a19e61eSDong Jia Shi cnt = -EINVAL; 3970a19e61eSDong Jia Shi 3980a19e61eSDong Jia Shi return cnt; 3990a19e61eSDong Jia Shi } 4000a19e61eSDong Jia Shi 4010a19e61eSDong Jia Shi static int tic_target_chain_exists(struct ccw1 *tic, struct channel_program *cp) 4020a19e61eSDong Jia Shi { 4030a19e61eSDong Jia Shi struct ccwchain *chain; 4042904337fSEric Farman u32 ccw_head; 4050a19e61eSDong Jia Shi 4060a19e61eSDong Jia Shi list_for_each_entry(chain, &cp->ccwchain_list, next) { 4070a19e61eSDong Jia Shi ccw_head = chain->ch_iova; 4082904337fSEric Farman if (is_cpa_within_range(tic->cda, ccw_head, chain->ch_len)) 4090a19e61eSDong Jia Shi return 1; 4100a19e61eSDong Jia Shi } 4110a19e61eSDong Jia Shi 4120a19e61eSDong Jia Shi return 0; 4130a19e61eSDong Jia Shi } 4140a19e61eSDong Jia Shi 4150a19e61eSDong Jia Shi static int ccwchain_loop_tic(struct ccwchain *chain, 4160a19e61eSDong Jia Shi struct channel_program *cp); 4170a19e61eSDong Jia Shi 418363fe5f7SEric Farman static int ccwchain_handle_ccw(u32 cda, struct channel_program *cp) 4190a19e61eSDong Jia Shi { 4200a587956SJason Gunthorpe struct vfio_device *vdev = 4210a587956SJason Gunthorpe &container_of(cp, struct vfio_ccw_private, cp)->vdev; 4220a19e61eSDong Jia Shi struct ccwchain *chain; 4238b515be5SFarhan Ali int len, ret; 4240a19e61eSDong Jia Shi 425ded563f3SEric Farman /* Copy 2K (the most we support today) of possible CCWs */ 426c5e8083fSEric Farman ret = vfio_dma_rw(vdev, cda, cp->guest_cp, CCWCHAIN_LEN_MAX * sizeof(struct ccw1), false); 427c5e8083fSEric Farman if (ret) 428c5e8083fSEric Farman return ret; 429ded563f3SEric Farman 4307f8e89a8SEric Farman /* Convert any Format-0 CCWs to Format-1 */ 4317f8e89a8SEric Farman if (!cp->orb.cmd.fmt) 432c382cbc6SEric Farman convert_ccw0_to_ccw1(cp->guest_cp, CCWCHAIN_LEN_MAX); 4337f8e89a8SEric Farman 434ded563f3SEric Farman /* Count the CCWs in the current chain */ 435363fe5f7SEric Farman len = ccwchain_calc_length(cda, cp); 4360a19e61eSDong Jia Shi if (len < 0) 4370a19e61eSDong Jia Shi return len; 4380a19e61eSDong Jia Shi 4390a19e61eSDong Jia Shi /* Need alloc a new chain for this one. */ 4400a19e61eSDong Jia Shi chain = ccwchain_alloc(cp, len); 4410a19e61eSDong Jia Shi if (!chain) 4420a19e61eSDong Jia Shi return -ENOMEM; 4434b946d65SEric Farman 4444b946d65SEric Farman chain->ch_len = len; 445363fe5f7SEric Farman chain->ch_iova = cda; 4460a19e61eSDong Jia Shi 44762465902SEric Farman /* Copy the actual CCWs into the new chain */ 44862465902SEric Farman memcpy(chain->ch_ccw, cp->guest_cp, len * sizeof(struct ccw1)); 4490a19e61eSDong Jia Shi 4500a19e61eSDong Jia Shi /* Loop for tics on this new chain. */ 4518b515be5SFarhan Ali ret = ccwchain_loop_tic(chain, cp); 4528b515be5SFarhan Ali 4538b515be5SFarhan Ali if (ret) 4548b515be5SFarhan Ali ccwchain_free(chain); 4558b515be5SFarhan Ali 4568b515be5SFarhan Ali return ret; 4570a19e61eSDong Jia Shi } 4580a19e61eSDong Jia Shi 4590a19e61eSDong Jia Shi /* Loop for TICs. */ 4600a19e61eSDong Jia Shi static int ccwchain_loop_tic(struct ccwchain *chain, struct channel_program *cp) 4610a19e61eSDong Jia Shi { 4620a19e61eSDong Jia Shi struct ccw1 *tic; 4630a19e61eSDong Jia Shi int i, ret; 4640a19e61eSDong Jia Shi 4650a19e61eSDong Jia Shi for (i = 0; i < chain->ch_len; i++) { 4664b946d65SEric Farman tic = &chain->ch_ccw[i]; 4670a19e61eSDong Jia Shi 4680a19e61eSDong Jia Shi if (!ccw_is_tic(tic)) 4690a19e61eSDong Jia Shi continue; 4700a19e61eSDong Jia Shi 471e64bd689SEric Farman /* May transfer to an existing chain. */ 472e64bd689SEric Farman if (tic_target_chain_exists(tic, cp)) 473e64bd689SEric Farman continue; 474e64bd689SEric Farman 475363fe5f7SEric Farman /* Build a ccwchain for the next segment */ 476363fe5f7SEric Farman ret = ccwchain_handle_ccw(tic->cda, cp); 4770a19e61eSDong Jia Shi if (ret) 4780a19e61eSDong Jia Shi return ret; 4790a19e61eSDong Jia Shi } 4800a19e61eSDong Jia Shi 4810a19e61eSDong Jia Shi return 0; 4820a19e61eSDong Jia Shi } 4830a19e61eSDong Jia Shi 484a4c60404SEric Farman static int ccwchain_fetch_tic(struct ccw1 *ccw, 4850a19e61eSDong Jia Shi struct channel_program *cp) 4860a19e61eSDong Jia Shi { 4870a19e61eSDong Jia Shi struct ccwchain *iter; 4882904337fSEric Farman u32 ccw_head; 4890a19e61eSDong Jia Shi 4900a19e61eSDong Jia Shi list_for_each_entry(iter, &cp->ccwchain_list, next) { 4910a19e61eSDong Jia Shi ccw_head = iter->ch_iova; 4922904337fSEric Farman if (is_cpa_within_range(ccw->cda, ccw_head, iter->ch_len)) { 493c389377cSJason J. Herne ccw->cda = (__u32) (addr_t) (((char *)iter->ch_ccw) + 4940a19e61eSDong Jia Shi (ccw->cda - ccw_head)); 4950a19e61eSDong Jia Shi return 0; 4960a19e61eSDong Jia Shi } 4970a19e61eSDong Jia Shi } 4980a19e61eSDong Jia Shi 4990a19e61eSDong Jia Shi return -EFAULT; 5000a19e61eSDong Jia Shi } 5010a19e61eSDong Jia Shi 50261f3a16bSEric Farman static unsigned long *get_guest_idal(struct ccw1 *ccw, 50361f3a16bSEric Farman struct channel_program *cp, 50461f3a16bSEric Farman int idaw_nr) 50561f3a16bSEric Farman { 50661f3a16bSEric Farman struct vfio_device *vdev = 50761f3a16bSEric Farman &container_of(cp, struct vfio_ccw_private, cp)->vdev; 50861f3a16bSEric Farman unsigned long *idaws; 509*1b676fe3SEric Farman unsigned int *idaws_f1; 51061f3a16bSEric Farman int idal_len = idaw_nr * sizeof(*idaws); 511*1b676fe3SEric Farman int idaw_size = idal_is_2k(cp) ? PAGE_SIZE / 2 : PAGE_SIZE; 51261f3a16bSEric Farman int idaw_mask = ~(idaw_size - 1); 51361f3a16bSEric Farman int i, ret; 51461f3a16bSEric Farman 51561f3a16bSEric Farman idaws = kcalloc(idaw_nr, sizeof(*idaws), GFP_DMA | GFP_KERNEL); 51661f3a16bSEric Farman if (!idaws) 51761f3a16bSEric Farman return ERR_PTR(-ENOMEM); 51861f3a16bSEric Farman 51961f3a16bSEric Farman if (ccw_is_idal(ccw)) { 52061f3a16bSEric Farman /* Copy IDAL from guest */ 52161f3a16bSEric Farman ret = vfio_dma_rw(vdev, ccw->cda, idaws, idal_len, false); 52261f3a16bSEric Farman if (ret) { 52361f3a16bSEric Farman kfree(idaws); 52461f3a16bSEric Farman return ERR_PTR(ret); 52561f3a16bSEric Farman } 52661f3a16bSEric Farman } else { 52761f3a16bSEric Farman /* Fabricate an IDAL based off CCW data address */ 52861f3a16bSEric Farman if (cp->orb.cmd.c64) { 52961f3a16bSEric Farman idaws[0] = ccw->cda; 53061f3a16bSEric Farman for (i = 1; i < idaw_nr; i++) 53161f3a16bSEric Farman idaws[i] = (idaws[i - 1] + idaw_size) & idaw_mask; 53261f3a16bSEric Farman } else { 533*1b676fe3SEric Farman idaws_f1 = (unsigned int *)idaws; 534*1b676fe3SEric Farman idaws_f1[0] = ccw->cda; 535*1b676fe3SEric Farman for (i = 1; i < idaw_nr; i++) 536*1b676fe3SEric Farman idaws_f1[i] = (idaws_f1[i - 1] + idaw_size) & idaw_mask; 53761f3a16bSEric Farman } 53861f3a16bSEric Farman } 53961f3a16bSEric Farman 54061f3a16bSEric Farman return idaws; 54161f3a16bSEric Farman } 54261f3a16bSEric Farman 543b21f9cb1SEric Farman /* 544b21f9cb1SEric Farman * ccw_count_idaws() - Calculate the number of IDAWs needed to transfer 545b21f9cb1SEric Farman * a specified amount of data 546b21f9cb1SEric Farman * 547b21f9cb1SEric Farman * @ccw: The Channel Command Word being translated 548b21f9cb1SEric Farman * @cp: Channel Program being processed 5496a6dc14aSEric Farman * 5506a6dc14aSEric Farman * The ORB is examined, since it specifies what IDAWs could actually be 5516a6dc14aSEric Farman * used by any CCW in the channel program, regardless of whether or not 5526a6dc14aSEric Farman * the CCW actually does. An ORB that does not specify Format-2-IDAW 5536a6dc14aSEric Farman * Control could still contain a CCW with an IDAL, which would be 5546a6dc14aSEric Farman * Format-1 and thus only move 2K with each IDAW. Thus all CCWs within 5556a6dc14aSEric Farman * the channel program must follow the same size requirements. 556b21f9cb1SEric Farman */ 557b21f9cb1SEric Farman static int ccw_count_idaws(struct ccw1 *ccw, 5580a19e61eSDong Jia Shi struct channel_program *cp) 5590a19e61eSDong Jia Shi { 5600a587956SJason Gunthorpe struct vfio_device *vdev = 5610a587956SJason Gunthorpe &container_of(cp, struct vfio_ccw_private, cp)->vdev; 56201aa26c6SEric Farman u64 iova; 563667e5dbaSEric Farman int size = cp->orb.cmd.c64 ? sizeof(u64) : sizeof(u32); 5646238f921SDong Jia Shi int ret; 565453eac31SEric Farman int bytes = 1; 5660a19e61eSDong Jia Shi 567e8573b39SEric Farman if (ccw->count) 568453eac31SEric Farman bytes = ccw->count; 569e8573b39SEric Farman 57001aa26c6SEric Farman if (ccw_is_idal(ccw)) { 571667e5dbaSEric Farman /* Read first IDAW to check its starting address. */ 572667e5dbaSEric Farman /* All subsequent IDAWs will be 2K- or 4K-aligned. */ 573667e5dbaSEric Farman ret = vfio_dma_rw(vdev, ccw->cda, &iova, size, false); 57401aa26c6SEric Farman if (ret) 57501aa26c6SEric Farman return ret; 576667e5dbaSEric Farman 577667e5dbaSEric Farman /* 578667e5dbaSEric Farman * Format-1 IDAWs only occupy the first 32 bits, 579667e5dbaSEric Farman * and bit 0 is always off. 580667e5dbaSEric Farman */ 581667e5dbaSEric Farman if (!cp->orb.cmd.c64) 582667e5dbaSEric Farman iova = iova >> 32; 58301aa26c6SEric Farman } else { 58401aa26c6SEric Farman iova = ccw->cda; 58501aa26c6SEric Farman } 586b21f9cb1SEric Farman 5876a6dc14aSEric Farman /* Format-1 IDAWs operate on 2K each */ 5886a6dc14aSEric Farman if (!cp->orb.cmd.c64) 5896a6dc14aSEric Farman return idal_2k_nr_words((void *)iova, bytes); 5906a6dc14aSEric Farman 5916a6dc14aSEric Farman /* Using the 2K variant of Format-2 IDAWs? */ 5926a6dc14aSEric Farman if (cp->orb.cmd.i2k) 5936a6dc14aSEric Farman return idal_2k_nr_words((void *)iova, bytes); 5946a6dc14aSEric Farman 5956a6dc14aSEric Farman /* The 'usual' case is 4K Format-2 IDAWs */ 596b21f9cb1SEric Farman return idal_nr_words((void *)iova, bytes); 597b21f9cb1SEric Farman } 598b21f9cb1SEric Farman 599b21f9cb1SEric Farman static int ccwchain_fetch_ccw(struct ccw1 *ccw, 600b21f9cb1SEric Farman struct page_array *pa, 601b21f9cb1SEric Farman struct channel_program *cp) 602b21f9cb1SEric Farman { 603b21f9cb1SEric Farman struct vfio_device *vdev = 604b21f9cb1SEric Farman &container_of(cp, struct vfio_ccw_private, cp)->vdev; 605b21f9cb1SEric Farman unsigned long *idaws; 606*1b676fe3SEric Farman unsigned int *idaws_f1; 607b21f9cb1SEric Farman int ret; 60861f3a16bSEric Farman int idaw_nr; 609b21f9cb1SEric Farman int i; 610b21f9cb1SEric Farman 611b21f9cb1SEric Farman /* Calculate size of IDAL */ 612b21f9cb1SEric Farman idaw_nr = ccw_count_idaws(ccw, cp); 613b21f9cb1SEric Farman if (idaw_nr < 0) 614b21f9cb1SEric Farman return idaw_nr; 615b21f9cb1SEric Farman 616e8573b39SEric Farman /* Allocate an IDAL from host storage */ 61761f3a16bSEric Farman idaws = get_guest_idal(ccw, cp, idaw_nr); 61861f3a16bSEric Farman if (IS_ERR(idaws)) { 61961f3a16bSEric Farman ret = PTR_ERR(idaws); 620e8573b39SEric Farman goto out_init; 6214cebc5d6SDong Jia Shi } 6224cebc5d6SDong Jia Shi 6230a19e61eSDong Jia Shi /* 62413314605SNicolin Chen * Allocate an array of pages to pin/translate. 62501aa26c6SEric Farman * The number of pages is actually the count of the idaws 62601aa26c6SEric Farman * required for the data transfer, since we only only support 62701aa26c6SEric Farman * 4K IDAWs today. 6280a19e61eSDong Jia Shi */ 62961783394SEric Farman ret = page_array_alloc(pa, idaw_nr); 630e4f3f18bSEric Farman if (ret < 0) 631e8573b39SEric Farman goto out_free_idaws; 632e4f3f18bSEric Farman 63301aa26c6SEric Farman /* 63413314605SNicolin Chen * Copy guest IDAWs into page_array, in case the memory they 63501aa26c6SEric Farman * occupy is not contiguous. 63601aa26c6SEric Farman */ 637*1b676fe3SEric Farman idaws_f1 = (unsigned int *)idaws; 63861f3a16bSEric Farman for (i = 0; i < idaw_nr; i++) { 63961f3a16bSEric Farman if (cp->orb.cmd.c64) 64013314605SNicolin Chen pa->pa_iova[i] = idaws[i]; 641*1b676fe3SEric Farman else 642*1b676fe3SEric Farman pa->pa_iova[i] = idaws_f1[i]; 64301aa26c6SEric Farman } 64401aa26c6SEric Farman 6455d87fbf7SEric Farman if (ccw_does_data_transfer(ccw)) { 64613314605SNicolin Chen ret = page_array_pin(pa, vdev); 6476238f921SDong Jia Shi if (ret < 0) 648806212f9SEric Farman goto out_unpin; 6495d87fbf7SEric Farman } else { 650e7eaf91bSEric Farman pa->pa_nr = 0; 6515d87fbf7SEric Farman } 6520a19e61eSDong Jia Shi 6530a19e61eSDong Jia Shi ccw->cda = (__u32) virt_to_phys(idaws); 6540a19e61eSDong Jia Shi ccw->flags |= CCW_FLAG_IDA; 6550a19e61eSDong Jia Shi 65613314605SNicolin Chen /* Populate the IDAL with pinned/translated addresses from page */ 65713314605SNicolin Chen page_array_idal_create_words(pa, idaws); 6580a19e61eSDong Jia Shi 6590a19e61eSDong Jia Shi return 0; 6606238f921SDong Jia Shi 6616238f921SDong Jia Shi out_unpin: 66213314605SNicolin Chen page_array_unpin_free(pa, vdev); 663e8573b39SEric Farman out_free_idaws: 664e8573b39SEric Farman kfree(idaws); 6656238f921SDong Jia Shi out_init: 6666238f921SDong Jia Shi ccw->cda = 0; 6676238f921SDong Jia Shi return ret; 6680a19e61eSDong Jia Shi } 6690a19e61eSDong Jia Shi 6700a19e61eSDong Jia Shi /* 6710a19e61eSDong Jia Shi * Fetch one ccw. 6720a19e61eSDong Jia Shi * To reduce memory copy, we'll pin the cda page in memory, 6730a19e61eSDong Jia Shi * and to get rid of the cda 2G limitiaion of ccw1, we'll translate 6740a19e61eSDong Jia Shi * direct ccws to idal ccws. 6750a19e61eSDong Jia Shi */ 676a4c60404SEric Farman static int ccwchain_fetch_one(struct ccw1 *ccw, 677a4c60404SEric Farman struct page_array *pa, 6780a19e61eSDong Jia Shi struct channel_program *cp) 679a4c60404SEric Farman 6800a19e61eSDong Jia Shi { 6810a19e61eSDong Jia Shi if (ccw_is_tic(ccw)) 682a4c60404SEric Farman return ccwchain_fetch_tic(ccw, cp); 6830a19e61eSDong Jia Shi 684a4c60404SEric Farman return ccwchain_fetch_ccw(ccw, pa, cp); 6850a19e61eSDong Jia Shi } 6860a19e61eSDong Jia Shi 6870a19e61eSDong Jia Shi /** 6880a19e61eSDong Jia Shi * cp_init() - allocate ccwchains for a channel program. 6890a19e61eSDong Jia Shi * @cp: channel_program on which to perform the operation 6900a19e61eSDong Jia Shi * @orb: control block for the channel program from the guest 6910a19e61eSDong Jia Shi * 6920a19e61eSDong Jia Shi * This creates one or more ccwchain(s), and copies the raw data of 6930a19e61eSDong Jia Shi * the target channel program from @orb->cmd.iova to the new ccwchain(s). 6940a19e61eSDong Jia Shi * 6950a19e61eSDong Jia Shi * Limitations: 696725b94d7SJared Rossi * 1. Supports idal(c64) ccw chaining. 697725b94d7SJared Rossi * 2. Supports 4k idaw. 6980a19e61eSDong Jia Shi * 6990a19e61eSDong Jia Shi * Returns: 7000a19e61eSDong Jia Shi * %0 on success and a negative error value on failure. 7010a19e61eSDong Jia Shi */ 7020a587956SJason Gunthorpe int cp_init(struct channel_program *cp, union orb *orb) 7030a19e61eSDong Jia Shi { 7040a587956SJason Gunthorpe struct vfio_device *vdev = 7050a587956SJason Gunthorpe &container_of(cp, struct vfio_ccw_private, cp)->vdev; 706725b94d7SJared Rossi /* custom ratelimit used to avoid flood during guest IPL */ 707725b94d7SJared Rossi static DEFINE_RATELIMIT_STATE(ratelimit_state, 5 * HZ, 1); 70899afcb05SEric Farman int ret; 7090a19e61eSDong Jia Shi 710c6c82e0cSEric Farman /* this is an error in the caller */ 711c6c82e0cSEric Farman if (cp->initialized) 712c6c82e0cSEric Farman return -EBUSY; 713c6c82e0cSEric Farman 7140a19e61eSDong Jia Shi /* 715725b94d7SJared Rossi * We only support prefetching the channel program. We assume all channel 716725b94d7SJared Rossi * programs executed by supported guests likewise support prefetching. 717725b94d7SJared Rossi * Executing a channel program that does not specify prefetching will 718725b94d7SJared Rossi * typically not cause an error, but a warning is issued to help identify 719725b94d7SJared Rossi * the problem if something does break. 7200a19e61eSDong Jia Shi */ 721725b94d7SJared Rossi if (!orb->cmd.pfch && __ratelimit(&ratelimit_state)) 7220a587956SJason Gunthorpe dev_warn( 7230a587956SJason Gunthorpe vdev->dev, 7240a587956SJason Gunthorpe "Prefetching channel program even though prefetch not specified in ORB"); 7250a19e61eSDong Jia Shi 7260a19e61eSDong Jia Shi INIT_LIST_HEAD(&cp->ccwchain_list); 7270a19e61eSDong Jia Shi memcpy(&cp->orb, orb, sizeof(*orb)); 7280a19e61eSDong Jia Shi 72999afcb05SEric Farman /* Build a ccwchain for the first CCW segment */ 73099afcb05SEric Farman ret = ccwchain_handle_ccw(orb->cmd.cpa, cp); 73199afcb05SEric Farman 732254cb663SEric Farman if (!ret) 733c9f597a4SFarhan Ali cp->initialized = true; 734c9f597a4SFarhan Ali 7350a19e61eSDong Jia Shi return ret; 7360a19e61eSDong Jia Shi } 7370a19e61eSDong Jia Shi 7380a19e61eSDong Jia Shi 7390a19e61eSDong Jia Shi /** 7400a19e61eSDong Jia Shi * cp_free() - free resources for channel program. 7410a19e61eSDong Jia Shi * @cp: channel_program on which to perform the operation 7420a19e61eSDong Jia Shi * 7430a19e61eSDong Jia Shi * This unpins the memory pages and frees the memory space occupied by 7440a19e61eSDong Jia Shi * @cp, which must have been returned by a previous call to cp_init(). 7450a19e61eSDong Jia Shi * Otherwise, undefined behavior occurs. 7460a19e61eSDong Jia Shi */ 7470a19e61eSDong Jia Shi void cp_free(struct channel_program *cp) 7480a19e61eSDong Jia Shi { 7490a587956SJason Gunthorpe struct vfio_device *vdev = 7500a587956SJason Gunthorpe &container_of(cp, struct vfio_ccw_private, cp)->vdev; 751812271b9SEric Farman struct ccwchain *chain, *temp; 752812271b9SEric Farman int i; 753812271b9SEric Farman 754812271b9SEric Farman if (!cp->initialized) 755812271b9SEric Farman return; 756812271b9SEric Farman 757812271b9SEric Farman cp->initialized = false; 758812271b9SEric Farman list_for_each_entry_safe(chain, temp, &cp->ccwchain_list, next) { 759812271b9SEric Farman for (i = 0; i < chain->ch_len; i++) { 7604b946d65SEric Farman page_array_unpin_free(&chain->ch_pa[i], vdev); 761812271b9SEric Farman ccwchain_cda_free(chain, i); 762812271b9SEric Farman } 763812271b9SEric Farman ccwchain_free(chain); 764812271b9SEric Farman } 7650a19e61eSDong Jia Shi } 7660a19e61eSDong Jia Shi 7670a19e61eSDong Jia Shi /** 7680a19e61eSDong Jia Shi * cp_prefetch() - translate a guest physical address channel program to 7690a19e61eSDong Jia Shi * a real-device runnable channel program. 7700a19e61eSDong Jia Shi * @cp: channel_program on which to perform the operation 7710a19e61eSDong Jia Shi * 7720a19e61eSDong Jia Shi * This function translates the guest-physical-address channel program 7730a19e61eSDong Jia Shi * and stores the result to ccwchain list. @cp must have been 7740a19e61eSDong Jia Shi * initialized by a previous call with cp_init(). Otherwise, undefined 7750a19e61eSDong Jia Shi * behavior occurs. 776d66a7355SHalil Pasic * For each chain composing the channel program: 777d66a7355SHalil Pasic * - On entry ch_len holds the count of CCWs to be translated. 778d66a7355SHalil Pasic * - On exit ch_len is adjusted to the count of successfully translated CCWs. 779d66a7355SHalil Pasic * This allows cp_free to find in ch_len the count of CCWs to free in a chain. 7800a19e61eSDong Jia Shi * 7810a19e61eSDong Jia Shi * The S/390 CCW Translation APIS (prefixed by 'cp_') are introduced 7820a19e61eSDong Jia Shi * as helpers to do ccw chain translation inside the kernel. Basically 7830a19e61eSDong Jia Shi * they accept a channel program issued by a virtual machine, and 7840a19e61eSDong Jia Shi * translate the channel program to a real-device runnable channel 7850a19e61eSDong Jia Shi * program. 7860a19e61eSDong Jia Shi * 7870a19e61eSDong Jia Shi * These APIs will copy the ccws into kernel-space buffers, and update 7880a19e61eSDong Jia Shi * the guest phsical addresses with their corresponding host physical 7890a19e61eSDong Jia Shi * addresses. Then channel I/O device drivers could issue the 7900a19e61eSDong Jia Shi * translated channel program to real devices to perform an I/O 7910a19e61eSDong Jia Shi * operation. 7920a19e61eSDong Jia Shi * 7930a19e61eSDong Jia Shi * These interfaces are designed to support translation only for 7940a19e61eSDong Jia Shi * channel programs, which are generated and formatted by a 7950a19e61eSDong Jia Shi * guest. Thus this will make it possible for things like VFIO to 7960a19e61eSDong Jia Shi * leverage the interfaces to passthrough a channel I/O mediated 7970a19e61eSDong Jia Shi * device in QEMU. 7980a19e61eSDong Jia Shi * 7990a19e61eSDong Jia Shi * We support direct ccw chaining by translating them to idal ccws. 8000a19e61eSDong Jia Shi * 8010a19e61eSDong Jia Shi * Returns: 8020a19e61eSDong Jia Shi * %0 on success and a negative error value on failure. 8030a19e61eSDong Jia Shi */ 8040a19e61eSDong Jia Shi int cp_prefetch(struct channel_program *cp) 8050a19e61eSDong Jia Shi { 8060a19e61eSDong Jia Shi struct ccwchain *chain; 807a4c60404SEric Farman struct ccw1 *ccw; 808a4c60404SEric Farman struct page_array *pa; 8090a19e61eSDong Jia Shi int len, idx, ret; 8100a19e61eSDong Jia Shi 81171189f26SCornelia Huck /* this is an error in the caller */ 81271189f26SCornelia Huck if (!cp->initialized) 81371189f26SCornelia Huck return -EINVAL; 81471189f26SCornelia Huck 8150a19e61eSDong Jia Shi list_for_each_entry(chain, &cp->ccwchain_list, next) { 8160a19e61eSDong Jia Shi len = chain->ch_len; 8170a19e61eSDong Jia Shi for (idx = 0; idx < len; idx++) { 8184b946d65SEric Farman ccw = &chain->ch_ccw[idx]; 8194b946d65SEric Farman pa = &chain->ch_pa[idx]; 820a4c60404SEric Farman 821a4c60404SEric Farman ret = ccwchain_fetch_one(ccw, pa, cp); 8220a19e61eSDong Jia Shi if (ret) 823d66a7355SHalil Pasic goto out_err; 8240a19e61eSDong Jia Shi } 8250a19e61eSDong Jia Shi } 8260a19e61eSDong Jia Shi 8270a19e61eSDong Jia Shi return 0; 828d66a7355SHalil Pasic out_err: 829d66a7355SHalil Pasic /* Only cleanup the chain elements that were actually translated. */ 830d66a7355SHalil Pasic chain->ch_len = idx; 831d66a7355SHalil Pasic list_for_each_entry_continue(chain, &cp->ccwchain_list, next) { 832d66a7355SHalil Pasic chain->ch_len = 0; 833d66a7355SHalil Pasic } 834d66a7355SHalil Pasic return ret; 8350a19e61eSDong Jia Shi } 8360a19e61eSDong Jia Shi 8370a19e61eSDong Jia Shi /** 8380a19e61eSDong Jia Shi * cp_get_orb() - get the orb of the channel program 8390a19e61eSDong Jia Shi * @cp: channel_program on which to perform the operation 8409fbed59fSEric Farman * @sch: subchannel the operation will be performed against 8410a19e61eSDong Jia Shi * 8420a19e61eSDong Jia Shi * This function returns the address of the updated orb of the channel 8430a19e61eSDong Jia Shi * program. Channel I/O device drivers could use this orb to issue a 8440a19e61eSDong Jia Shi * ssch. 8450a19e61eSDong Jia Shi */ 8469fbed59fSEric Farman union orb *cp_get_orb(struct channel_program *cp, struct subchannel *sch) 8470a19e61eSDong Jia Shi { 8480a19e61eSDong Jia Shi union orb *orb; 8490a19e61eSDong Jia Shi struct ccwchain *chain; 8500a19e61eSDong Jia Shi struct ccw1 *cpa; 8510a19e61eSDong Jia Shi 85271189f26SCornelia Huck /* this is an error in the caller */ 85371189f26SCornelia Huck if (!cp->initialized) 85471189f26SCornelia Huck return NULL; 85571189f26SCornelia Huck 8560a19e61eSDong Jia Shi orb = &cp->orb; 8570a19e61eSDong Jia Shi 8589fbed59fSEric Farman orb->cmd.intparm = (u32)virt_to_phys(sch); 8590a19e61eSDong Jia Shi orb->cmd.fmt = 1; 8600a19e61eSDong Jia Shi 861254cb663SEric Farman /* 862254cb663SEric Farman * Everything built by vfio-ccw is a Format-2 IDAL. 863*1b676fe3SEric Farman * If the input was a Format-1 IDAL, indicate that 864*1b676fe3SEric Farman * 2K Format-2 IDAWs were created here. 865254cb663SEric Farman */ 866*1b676fe3SEric Farman if (!orb->cmd.c64) 867*1b676fe3SEric Farman orb->cmd.i2k = 1; 868254cb663SEric Farman orb->cmd.c64 = 1; 869254cb663SEric Farman 8700a19e61eSDong Jia Shi if (orb->cmd.lpm == 0) 8719fbed59fSEric Farman orb->cmd.lpm = sch->lpm; 8720a19e61eSDong Jia Shi 8730a19e61eSDong Jia Shi chain = list_first_entry(&cp->ccwchain_list, struct ccwchain, next); 8740a19e61eSDong Jia Shi cpa = chain->ch_ccw; 8755de2322dSEric Farman orb->cmd.cpa = (__u32)virt_to_phys(cpa); 8760a19e61eSDong Jia Shi 8770a19e61eSDong Jia Shi return orb; 8780a19e61eSDong Jia Shi } 8790a19e61eSDong Jia Shi 8800a19e61eSDong Jia Shi /** 8810a19e61eSDong Jia Shi * cp_update_scsw() - update scsw for a channel program. 8820a19e61eSDong Jia Shi * @cp: channel_program on which to perform the operation 8830a19e61eSDong Jia Shi * @scsw: I/O results of the channel program and also the target to be 8840a19e61eSDong Jia Shi * updated 8850a19e61eSDong Jia Shi * 8860a19e61eSDong Jia Shi * @scsw contains the I/O results of the channel program that pointed 8870a19e61eSDong Jia Shi * to by @cp. However what @scsw->cpa stores is a host physical 8880a19e61eSDong Jia Shi * address, which is meaningless for the guest, which is waiting for 8890a19e61eSDong Jia Shi * the I/O results. 8900a19e61eSDong Jia Shi * 8910a19e61eSDong Jia Shi * This function updates @scsw->cpa to its coressponding guest physical 8920a19e61eSDong Jia Shi * address. 8930a19e61eSDong Jia Shi */ 8940a19e61eSDong Jia Shi void cp_update_scsw(struct channel_program *cp, union scsw *scsw) 8950a19e61eSDong Jia Shi { 8960a19e61eSDong Jia Shi struct ccwchain *chain; 8970a19e61eSDong Jia Shi u32 cpa = scsw->cmd.cpa; 8982904337fSEric Farman u32 ccw_head; 8990a19e61eSDong Jia Shi 90071189f26SCornelia Huck if (!cp->initialized) 90171189f26SCornelia Huck return; 90271189f26SCornelia Huck 9030a19e61eSDong Jia Shi /* 9040a19e61eSDong Jia Shi * LATER: 9050a19e61eSDong Jia Shi * For now, only update the cmd.cpa part. We may need to deal with 9060a19e61eSDong Jia Shi * other portions of the schib as well, even if we don't return them 9070a19e61eSDong Jia Shi * in the ioctl directly. Path status changes etc. 9080a19e61eSDong Jia Shi */ 9090a19e61eSDong Jia Shi list_for_each_entry(chain, &cp->ccwchain_list, next) { 9100a19e61eSDong Jia Shi ccw_head = (u32)(u64)chain->ch_ccw; 91115f0eb3dSEric Farman /* 91215f0eb3dSEric Farman * On successful execution, cpa points just beyond the end 91315f0eb3dSEric Farman * of the chain. 91415f0eb3dSEric Farman */ 91515f0eb3dSEric Farman if (is_cpa_within_range(cpa, ccw_head, chain->ch_len + 1)) { 9160a19e61eSDong Jia Shi /* 9170a19e61eSDong Jia Shi * (cpa - ccw_head) is the offset value of the host 9180a19e61eSDong Jia Shi * physical ccw to its chain head. 9190a19e61eSDong Jia Shi * Adding this value to the guest physical ccw chain 9200a19e61eSDong Jia Shi * head gets us the guest cpa. 9210a19e61eSDong Jia Shi */ 9220a19e61eSDong Jia Shi cpa = chain->ch_iova + (cpa - ccw_head); 9230a19e61eSDong Jia Shi break; 9240a19e61eSDong Jia Shi } 9250a19e61eSDong Jia Shi } 9260a19e61eSDong Jia Shi 9270a19e61eSDong Jia Shi scsw->cmd.cpa = cpa; 9280a19e61eSDong Jia Shi } 9290a19e61eSDong Jia Shi 9300a19e61eSDong Jia Shi /** 9310a19e61eSDong Jia Shi * cp_iova_pinned() - check if an iova is pinned for a ccw chain. 932364e3f90SSebastian Ott * @cp: channel_program on which to perform the operation 9330a19e61eSDong Jia Shi * @iova: the iova to check 9345a4fe7c4SEric Farman * @length: the length to check from @iova 9350a19e61eSDong Jia Shi * 9360a19e61eSDong Jia Shi * If the @iova is currently pinned for the ccw chain, return true; 9370a19e61eSDong Jia Shi * else return false. 9380a19e61eSDong Jia Shi */ 9395a4fe7c4SEric Farman bool cp_iova_pinned(struct channel_program *cp, u64 iova, u64 length) 9400a19e61eSDong Jia Shi { 9410a19e61eSDong Jia Shi struct ccwchain *chain; 9420a19e61eSDong Jia Shi int i; 9430a19e61eSDong Jia Shi 94471189f26SCornelia Huck if (!cp->initialized) 94571189f26SCornelia Huck return false; 94671189f26SCornelia Huck 9470a19e61eSDong Jia Shi list_for_each_entry(chain, &cp->ccwchain_list, next) { 9480a19e61eSDong Jia Shi for (i = 0; i < chain->ch_len; i++) 9494b946d65SEric Farman if (page_array_iova_pinned(&chain->ch_pa[i], iova, length)) 9500a19e61eSDong Jia Shi return true; 9510a19e61eSDong Jia Shi } 9520a19e61eSDong Jia Shi 9530a19e61eSDong Jia Shi return false; 9540a19e61eSDong Jia Shi } 955