11dcac3e1SXiao Feng Ren /* 21dcac3e1SXiao Feng Ren * vfio based subchannel assignment support 31dcac3e1SXiao Feng Ren * 41dcac3e1SXiao Feng Ren * Copyright 2017 IBM Corp. 51dcac3e1SXiao Feng Ren * Author(s): Dong Jia Shi <bjsdjshi@linux.vnet.ibm.com> 61dcac3e1SXiao Feng Ren * Xiao Feng Ren <renxiaof@linux.vnet.ibm.com> 71dcac3e1SXiao Feng Ren * Pierre Morel <pmorel@linux.vnet.ibm.com> 81dcac3e1SXiao Feng Ren * 91dcac3e1SXiao Feng Ren * This work is licensed under the terms of the GNU GPL, version 2 or (at 1008b824aaSCornelia Huck * your option) any later version. See the COPYING file in the top-level 111dcac3e1SXiao Feng Ren * directory. 121dcac3e1SXiao Feng Ren */ 131dcac3e1SXiao Feng Ren 14e9808d09SPhilippe Mathieu-Daudé #include "qemu/osdep.h" 151dcac3e1SXiao Feng Ren #include <linux/vfio.h> 16c14e706cSDong Jia Shi #include <linux/vfio_ccw.h> 171dcac3e1SXiao Feng Ren #include <sys/ioctl.h> 181dcac3e1SXiao Feng Ren 191dcac3e1SXiao Feng Ren #include "qapi/error.h" 201dcac3e1SXiao Feng Ren #include "hw/sysbus.h" 211dcac3e1SXiao Feng Ren #include "hw/vfio/vfio.h" 221dcac3e1SXiao Feng Ren #include "hw/vfio/vfio-common.h" 231dcac3e1SXiao Feng Ren #include "hw/s390x/s390-ccw.h" 241dcac3e1SXiao Feng Ren #include "hw/s390x/ccw-device.h" 25d791937fSPhilippe Mathieu-Daudé #include "exec/address-spaces.h" 264886b3e9SDong Jia Shi #include "qemu/error-report.h" 271dcac3e1SXiao Feng Ren 281dcac3e1SXiao Feng Ren #define TYPE_VFIO_CCW "vfio-ccw" 291dcac3e1SXiao Feng Ren typedef struct VFIOCCWDevice { 301dcac3e1SXiao Feng Ren S390CCWDevice cdev; 311dcac3e1SXiao Feng Ren VFIODevice vdev; 32c14e706cSDong Jia Shi uint64_t io_region_size; 33c14e706cSDong Jia Shi uint64_t io_region_offset; 34c14e706cSDong Jia Shi struct ccw_io_region *io_region; 354886b3e9SDong Jia Shi EventNotifier io_notifier; 369a51c9eeSHalil Pasic bool force_orb_pfch; 379a51c9eeSHalil Pasic bool warned_orb_pfch; 381dcac3e1SXiao Feng Ren } VFIOCCWDevice; 391dcac3e1SXiao Feng Ren 409a51c9eeSHalil Pasic static inline void warn_once_pfch(VFIOCCWDevice *vcdev, SubchDev *sch, 419a51c9eeSHalil Pasic const char *msg) 429a51c9eeSHalil Pasic { 43c55510b7SCornelia Huck warn_report_once_cond(&vcdev->warned_orb_pfch, 44c55510b7SCornelia Huck "vfio-ccw (devno %x.%x.%04x): %s", 459a51c9eeSHalil Pasic sch->cssid, sch->ssid, sch->devno, msg); 469a51c9eeSHalil Pasic } 479a51c9eeSHalil Pasic 481dcac3e1SXiao Feng Ren static void vfio_ccw_compute_needs_reset(VFIODevice *vdev) 491dcac3e1SXiao Feng Ren { 501dcac3e1SXiao Feng Ren vdev->needs_reset = false; 511dcac3e1SXiao Feng Ren } 521dcac3e1SXiao Feng Ren 531dcac3e1SXiao Feng Ren /* 541dcac3e1SXiao Feng Ren * We don't need vfio_hot_reset_multi and vfio_eoi operations for 551dcac3e1SXiao Feng Ren * vfio_ccw device now. 561dcac3e1SXiao Feng Ren */ 571dcac3e1SXiao Feng Ren struct VFIODeviceOps vfio_ccw_ops = { 581dcac3e1SXiao Feng Ren .vfio_compute_needs_reset = vfio_ccw_compute_needs_reset, 591dcac3e1SXiao Feng Ren }; 601dcac3e1SXiao Feng Ren 6166dc50f7SHalil Pasic static IOInstEnding vfio_ccw_handle_request(SubchDev *sch) 628ca2b376SXiao Feng Ren { 6366dc50f7SHalil Pasic S390CCWDevice *cdev = sch->driver_data; 648ca2b376SXiao Feng Ren VFIOCCWDevice *vcdev = DO_UPCAST(VFIOCCWDevice, cdev, cdev); 658ca2b376SXiao Feng Ren struct ccw_io_region *region = vcdev->io_region; 668ca2b376SXiao Feng Ren int ret; 678ca2b376SXiao Feng Ren 689a51c9eeSHalil Pasic if (!(sch->orb.ctrl0 & ORB_CTRL0_MASK_PFCH)) { 699a51c9eeSHalil Pasic if (!(vcdev->force_orb_pfch)) { 709a51c9eeSHalil Pasic warn_once_pfch(vcdev, sch, "requires PFCH flag set"); 719a51c9eeSHalil Pasic sch_gen_unit_exception(sch); 729a51c9eeSHalil Pasic css_inject_io_interrupt(sch); 739a51c9eeSHalil Pasic return IOINST_CC_EXPECTED; 749a51c9eeSHalil Pasic } else { 759a51c9eeSHalil Pasic sch->orb.ctrl0 |= ORB_CTRL0_MASK_PFCH; 769a51c9eeSHalil Pasic warn_once_pfch(vcdev, sch, "PFCH flag forced"); 779a51c9eeSHalil Pasic } 789a51c9eeSHalil Pasic } 799a51c9eeSHalil Pasic 808ca2b376SXiao Feng Ren QEMU_BUILD_BUG_ON(sizeof(region->orb_area) != sizeof(ORB)); 818ca2b376SXiao Feng Ren QEMU_BUILD_BUG_ON(sizeof(region->scsw_area) != sizeof(SCSW)); 828ca2b376SXiao Feng Ren QEMU_BUILD_BUG_ON(sizeof(region->irb_area) != sizeof(IRB)); 838ca2b376SXiao Feng Ren 848ca2b376SXiao Feng Ren memset(region, 0, sizeof(*region)); 858ca2b376SXiao Feng Ren 8666dc50f7SHalil Pasic memcpy(region->orb_area, &sch->orb, sizeof(ORB)); 8766dc50f7SHalil Pasic memcpy(region->scsw_area, &sch->curr_status.scsw, sizeof(SCSW)); 888ca2b376SXiao Feng Ren 898ca2b376SXiao Feng Ren again: 908ca2b376SXiao Feng Ren ret = pwrite(vcdev->vdev.fd, region, 918ca2b376SXiao Feng Ren vcdev->io_region_size, vcdev->io_region_offset); 928ca2b376SXiao Feng Ren if (ret != vcdev->io_region_size) { 938ca2b376SXiao Feng Ren if (errno == EAGAIN) { 948ca2b376SXiao Feng Ren goto again; 958ca2b376SXiao Feng Ren } 968ca2b376SXiao Feng Ren error_report("vfio-ccw: wirte I/O region failed with errno=%d", errno); 9766dc50f7SHalil Pasic ret = -errno; 9866dc50f7SHalil Pasic } else { 9966dc50f7SHalil Pasic ret = region->ret_code; 1008ca2b376SXiao Feng Ren } 10166dc50f7SHalil Pasic switch (ret) { 10266dc50f7SHalil Pasic case 0: 10366dc50f7SHalil Pasic return IOINST_CC_EXPECTED; 10466dc50f7SHalil Pasic case -EBUSY: 10566dc50f7SHalil Pasic return IOINST_CC_BUSY; 10666dc50f7SHalil Pasic case -ENODEV: 10766dc50f7SHalil Pasic case -EACCES: 10866dc50f7SHalil Pasic return IOINST_CC_NOT_OPERATIONAL; 10966dc50f7SHalil Pasic case -EFAULT: 11066dc50f7SHalil Pasic default: 11166dc50f7SHalil Pasic sch_gen_unit_exception(sch); 11266dc50f7SHalil Pasic css_inject_io_interrupt(sch); 11366dc50f7SHalil Pasic return IOINST_CC_EXPECTED; 11466dc50f7SHalil Pasic } 1158ca2b376SXiao Feng Ren } 1168ca2b376SXiao Feng Ren 1171dcac3e1SXiao Feng Ren static void vfio_ccw_reset(DeviceState *dev) 1181dcac3e1SXiao Feng Ren { 1191dcac3e1SXiao Feng Ren CcwDevice *ccw_dev = DO_UPCAST(CcwDevice, parent_obj, dev); 1201dcac3e1SXiao Feng Ren S390CCWDevice *cdev = DO_UPCAST(S390CCWDevice, parent_obj, ccw_dev); 1211dcac3e1SXiao Feng Ren VFIOCCWDevice *vcdev = DO_UPCAST(VFIOCCWDevice, cdev, cdev); 1221dcac3e1SXiao Feng Ren 1231dcac3e1SXiao Feng Ren ioctl(vcdev->vdev.fd, VFIO_DEVICE_RESET); 1241dcac3e1SXiao Feng Ren } 1251dcac3e1SXiao Feng Ren 1264886b3e9SDong Jia Shi static void vfio_ccw_io_notifier_handler(void *opaque) 1274886b3e9SDong Jia Shi { 1284886b3e9SDong Jia Shi VFIOCCWDevice *vcdev = opaque; 1298ca2b376SXiao Feng Ren struct ccw_io_region *region = vcdev->io_region; 1308ca2b376SXiao Feng Ren S390CCWDevice *cdev = S390_CCW_DEVICE(vcdev); 1318ca2b376SXiao Feng Ren CcwDevice *ccw_dev = CCW_DEVICE(cdev); 1328ca2b376SXiao Feng Ren SubchDev *sch = ccw_dev->sch; 133*e1d0b372SDaniel P. Berrangé SCHIB *schib = &sch->curr_status; 134*e1d0b372SDaniel P. Berrangé SCSW s; 1358ca2b376SXiao Feng Ren IRB irb; 1368ca2b376SXiao Feng Ren int size; 1374886b3e9SDong Jia Shi 1384886b3e9SDong Jia Shi if (!event_notifier_test_and_clear(&vcdev->io_notifier)) { 1394886b3e9SDong Jia Shi return; 1404886b3e9SDong Jia Shi } 1418ca2b376SXiao Feng Ren 1428ca2b376SXiao Feng Ren size = pread(vcdev->vdev.fd, region, vcdev->io_region_size, 1438ca2b376SXiao Feng Ren vcdev->io_region_offset); 1448ca2b376SXiao Feng Ren if (size == -1) { 1458ca2b376SXiao Feng Ren switch (errno) { 1468ca2b376SXiao Feng Ren case ENODEV: 1478ca2b376SXiao Feng Ren /* Generate a deferred cc 3 condition. */ 148*e1d0b372SDaniel P. Berrangé schib->scsw.flags |= SCSW_FLAGS_MASK_CC; 149*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl &= ~SCSW_CTRL_MASK_STCTL; 150*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl |= (SCSW_STCTL_ALERT | SCSW_STCTL_STATUS_PEND); 1518ca2b376SXiao Feng Ren goto read_err; 1528ca2b376SXiao Feng Ren case EFAULT: 1538ca2b376SXiao Feng Ren /* Memory problem, generate channel data check. */ 154*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl &= ~SCSW_ACTL_START_PEND; 155*e1d0b372SDaniel P. Berrangé schib->scsw.cstat = SCSW_CSTAT_DATA_CHECK; 156*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl &= ~SCSW_CTRL_MASK_STCTL; 157*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl |= SCSW_STCTL_PRIMARY | SCSW_STCTL_SECONDARY | 1588ca2b376SXiao Feng Ren SCSW_STCTL_ALERT | SCSW_STCTL_STATUS_PEND; 1598ca2b376SXiao Feng Ren goto read_err; 1608ca2b376SXiao Feng Ren default: 1618ca2b376SXiao Feng Ren /* Error, generate channel program check. */ 162*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl &= ~SCSW_ACTL_START_PEND; 163*e1d0b372SDaniel P. Berrangé schib->scsw.cstat = SCSW_CSTAT_PROG_CHECK; 164*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl &= ~SCSW_CTRL_MASK_STCTL; 165*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl |= SCSW_STCTL_PRIMARY | SCSW_STCTL_SECONDARY | 1668ca2b376SXiao Feng Ren SCSW_STCTL_ALERT | SCSW_STCTL_STATUS_PEND; 1678ca2b376SXiao Feng Ren goto read_err; 1688ca2b376SXiao Feng Ren } 1698ca2b376SXiao Feng Ren } else if (size != vcdev->io_region_size) { 1708ca2b376SXiao Feng Ren /* Information transfer error, generate channel-control check. */ 171*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl &= ~SCSW_ACTL_START_PEND; 172*e1d0b372SDaniel P. Berrangé schib->scsw.cstat = SCSW_CSTAT_CHN_CTRL_CHK; 173*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl &= ~SCSW_CTRL_MASK_STCTL; 174*e1d0b372SDaniel P. Berrangé schib->scsw.ctrl |= SCSW_STCTL_PRIMARY | SCSW_STCTL_SECONDARY | 1758ca2b376SXiao Feng Ren SCSW_STCTL_ALERT | SCSW_STCTL_STATUS_PEND; 1768ca2b376SXiao Feng Ren goto read_err; 1778ca2b376SXiao Feng Ren } 1788ca2b376SXiao Feng Ren 1798ca2b376SXiao Feng Ren memcpy(&irb, region->irb_area, sizeof(IRB)); 1808ca2b376SXiao Feng Ren 1818ca2b376SXiao Feng Ren /* Update control block via irb. */ 182*e1d0b372SDaniel P. Berrangé s = schib->scsw; 183*e1d0b372SDaniel P. Berrangé copy_scsw_to_guest(&s, &irb.scsw); 184*e1d0b372SDaniel P. Berrangé schib->scsw = s; 1858ca2b376SXiao Feng Ren 186334e7685SDong Jia Shi /* If a uint check is pending, copy sense data. */ 187*e1d0b372SDaniel P. Berrangé if ((schib->scsw.dstat & SCSW_DSTAT_UNIT_CHECK) && 188*e1d0b372SDaniel P. Berrangé (schib->pmcw.chars & PMCW_CHARS_MASK_CSENSE)) { 189334e7685SDong Jia Shi memcpy(sch->sense_data, irb.ecw, sizeof(irb.ecw)); 190334e7685SDong Jia Shi } 191334e7685SDong Jia Shi 1928ca2b376SXiao Feng Ren read_err: 1938ca2b376SXiao Feng Ren css_inject_io_interrupt(sch); 1944886b3e9SDong Jia Shi } 1954886b3e9SDong Jia Shi 1964886b3e9SDong Jia Shi static void vfio_ccw_register_io_notifier(VFIOCCWDevice *vcdev, Error **errp) 1974886b3e9SDong Jia Shi { 1984886b3e9SDong Jia Shi VFIODevice *vdev = &vcdev->vdev; 1994886b3e9SDong Jia Shi struct vfio_irq_info *irq_info; 2004886b3e9SDong Jia Shi struct vfio_irq_set *irq_set; 2014886b3e9SDong Jia Shi size_t argsz; 2024886b3e9SDong Jia Shi int32_t *pfd; 2034886b3e9SDong Jia Shi 2044886b3e9SDong Jia Shi if (vdev->num_irqs < VFIO_CCW_IO_IRQ_INDEX + 1) { 2054886b3e9SDong Jia Shi error_setg(errp, "vfio: unexpected number of io irqs %u", 2064886b3e9SDong Jia Shi vdev->num_irqs); 2074886b3e9SDong Jia Shi return; 2084886b3e9SDong Jia Shi } 2094886b3e9SDong Jia Shi 21028e22d4bSJing Zhang argsz = sizeof(*irq_info); 2114886b3e9SDong Jia Shi irq_info = g_malloc0(argsz); 2124886b3e9SDong Jia Shi irq_info->index = VFIO_CCW_IO_IRQ_INDEX; 2134886b3e9SDong Jia Shi irq_info->argsz = argsz; 2144886b3e9SDong Jia Shi if (ioctl(vdev->fd, VFIO_DEVICE_GET_IRQ_INFO, 2154886b3e9SDong Jia Shi irq_info) < 0 || irq_info->count < 1) { 2164886b3e9SDong Jia Shi error_setg_errno(errp, errno, "vfio: Error getting irq info"); 2174886b3e9SDong Jia Shi goto out_free_info; 2184886b3e9SDong Jia Shi } 2194886b3e9SDong Jia Shi 2204886b3e9SDong Jia Shi if (event_notifier_init(&vcdev->io_notifier, 0)) { 2214886b3e9SDong Jia Shi error_setg_errno(errp, errno, 2224886b3e9SDong Jia Shi "vfio: Unable to init event notifier for IO"); 2234886b3e9SDong Jia Shi goto out_free_info; 2244886b3e9SDong Jia Shi } 2254886b3e9SDong Jia Shi 2264886b3e9SDong Jia Shi argsz = sizeof(*irq_set) + sizeof(*pfd); 2274886b3e9SDong Jia Shi irq_set = g_malloc0(argsz); 2284886b3e9SDong Jia Shi irq_set->argsz = argsz; 2294886b3e9SDong Jia Shi irq_set->flags = VFIO_IRQ_SET_DATA_EVENTFD | 2304886b3e9SDong Jia Shi VFIO_IRQ_SET_ACTION_TRIGGER; 2314886b3e9SDong Jia Shi irq_set->index = VFIO_CCW_IO_IRQ_INDEX; 2324886b3e9SDong Jia Shi irq_set->start = 0; 2334886b3e9SDong Jia Shi irq_set->count = 1; 2344886b3e9SDong Jia Shi pfd = (int32_t *) &irq_set->data; 2354886b3e9SDong Jia Shi 2364886b3e9SDong Jia Shi *pfd = event_notifier_get_fd(&vcdev->io_notifier); 2374886b3e9SDong Jia Shi qemu_set_fd_handler(*pfd, vfio_ccw_io_notifier_handler, NULL, vcdev); 2384886b3e9SDong Jia Shi if (ioctl(vdev->fd, VFIO_DEVICE_SET_IRQS, irq_set)) { 2394886b3e9SDong Jia Shi error_setg(errp, "vfio: Failed to set up io notification"); 2404886b3e9SDong Jia Shi qemu_set_fd_handler(*pfd, NULL, NULL, vcdev); 2414886b3e9SDong Jia Shi event_notifier_cleanup(&vcdev->io_notifier); 2424886b3e9SDong Jia Shi } 2434886b3e9SDong Jia Shi 2444886b3e9SDong Jia Shi g_free(irq_set); 2454886b3e9SDong Jia Shi 2464886b3e9SDong Jia Shi out_free_info: 2474886b3e9SDong Jia Shi g_free(irq_info); 2484886b3e9SDong Jia Shi } 2494886b3e9SDong Jia Shi 2504886b3e9SDong Jia Shi static void vfio_ccw_unregister_io_notifier(VFIOCCWDevice *vcdev) 2514886b3e9SDong Jia Shi { 2524886b3e9SDong Jia Shi struct vfio_irq_set *irq_set; 2534886b3e9SDong Jia Shi size_t argsz; 2544886b3e9SDong Jia Shi int32_t *pfd; 2554886b3e9SDong Jia Shi 2564886b3e9SDong Jia Shi argsz = sizeof(*irq_set) + sizeof(*pfd); 2574886b3e9SDong Jia Shi irq_set = g_malloc0(argsz); 2584886b3e9SDong Jia Shi irq_set->argsz = argsz; 2594886b3e9SDong Jia Shi irq_set->flags = VFIO_IRQ_SET_DATA_EVENTFD | 2604886b3e9SDong Jia Shi VFIO_IRQ_SET_ACTION_TRIGGER; 2614886b3e9SDong Jia Shi irq_set->index = VFIO_CCW_IO_IRQ_INDEX; 2624886b3e9SDong Jia Shi irq_set->start = 0; 2634886b3e9SDong Jia Shi irq_set->count = 1; 2644886b3e9SDong Jia Shi pfd = (int32_t *) &irq_set->data; 2654886b3e9SDong Jia Shi *pfd = -1; 2664886b3e9SDong Jia Shi 2674886b3e9SDong Jia Shi if (ioctl(vcdev->vdev.fd, VFIO_DEVICE_SET_IRQS, irq_set)) { 2684886b3e9SDong Jia Shi error_report("vfio: Failed to de-assign device io fd: %m"); 2694886b3e9SDong Jia Shi } 2704886b3e9SDong Jia Shi 2714886b3e9SDong Jia Shi qemu_set_fd_handler(event_notifier_get_fd(&vcdev->io_notifier), 2724886b3e9SDong Jia Shi NULL, NULL, vcdev); 2734886b3e9SDong Jia Shi event_notifier_cleanup(&vcdev->io_notifier); 2744886b3e9SDong Jia Shi 2754886b3e9SDong Jia Shi g_free(irq_set); 2764886b3e9SDong Jia Shi } 2774886b3e9SDong Jia Shi 278c14e706cSDong Jia Shi static void vfio_ccw_get_region(VFIOCCWDevice *vcdev, Error **errp) 279c14e706cSDong Jia Shi { 280c14e706cSDong Jia Shi VFIODevice *vdev = &vcdev->vdev; 281c14e706cSDong Jia Shi struct vfio_region_info *info; 282c14e706cSDong Jia Shi int ret; 283c14e706cSDong Jia Shi 284c14e706cSDong Jia Shi /* Sanity check device */ 285c14e706cSDong Jia Shi if (!(vdev->flags & VFIO_DEVICE_FLAGS_CCW)) { 286c14e706cSDong Jia Shi error_setg(errp, "vfio: Um, this isn't a vfio-ccw device"); 287c14e706cSDong Jia Shi return; 288c14e706cSDong Jia Shi } 289c14e706cSDong Jia Shi 290c14e706cSDong Jia Shi if (vdev->num_regions < VFIO_CCW_CONFIG_REGION_INDEX + 1) { 291c14e706cSDong Jia Shi error_setg(errp, "vfio: Unexpected number of the I/O region %u", 292c14e706cSDong Jia Shi vdev->num_regions); 293c14e706cSDong Jia Shi return; 294c14e706cSDong Jia Shi } 295c14e706cSDong Jia Shi 296c14e706cSDong Jia Shi ret = vfio_get_region_info(vdev, VFIO_CCW_CONFIG_REGION_INDEX, &info); 297c14e706cSDong Jia Shi if (ret) { 298c14e706cSDong Jia Shi error_setg_errno(errp, -ret, "vfio: Error getting config info"); 299c14e706cSDong Jia Shi return; 300c14e706cSDong Jia Shi } 301c14e706cSDong Jia Shi 302c14e706cSDong Jia Shi vcdev->io_region_size = info->size; 303c14e706cSDong Jia Shi if (sizeof(*vcdev->io_region) != vcdev->io_region_size) { 304c14e706cSDong Jia Shi error_setg(errp, "vfio: Unexpected size of the I/O region"); 305c14e706cSDong Jia Shi g_free(info); 306c14e706cSDong Jia Shi return; 307c14e706cSDong Jia Shi } 308c14e706cSDong Jia Shi 309c14e706cSDong Jia Shi vcdev->io_region_offset = info->offset; 310c14e706cSDong Jia Shi vcdev->io_region = g_malloc0(info->size); 311c14e706cSDong Jia Shi 312c14e706cSDong Jia Shi g_free(info); 313c14e706cSDong Jia Shi } 314c14e706cSDong Jia Shi 315c14e706cSDong Jia Shi static void vfio_ccw_put_region(VFIOCCWDevice *vcdev) 316c14e706cSDong Jia Shi { 317c14e706cSDong Jia Shi g_free(vcdev->io_region); 318c14e706cSDong Jia Shi } 319c14e706cSDong Jia Shi 320c96f2c2aSGreg Kurz static void vfio_ccw_put_device(VFIOCCWDevice *vcdev) 3211dcac3e1SXiao Feng Ren { 3221dcac3e1SXiao Feng Ren g_free(vcdev->vdev.name); 3231dcac3e1SXiao Feng Ren vfio_put_base_device(&vcdev->vdev); 3241dcac3e1SXiao Feng Ren } 3251dcac3e1SXiao Feng Ren 326c96f2c2aSGreg Kurz static void vfio_ccw_get_device(VFIOGroup *group, VFIOCCWDevice *vcdev, 327c96f2c2aSGreg Kurz Error **errp) 328c96f2c2aSGreg Kurz { 329c96f2c2aSGreg Kurz char *name = g_strdup_printf("%x.%x.%04x", vcdev->cdev.hostid.cssid, 330c96f2c2aSGreg Kurz vcdev->cdev.hostid.ssid, 331c96f2c2aSGreg Kurz vcdev->cdev.hostid.devid); 332c96f2c2aSGreg Kurz VFIODevice *vbasedev; 333c96f2c2aSGreg Kurz 334c96f2c2aSGreg Kurz QLIST_FOREACH(vbasedev, &group->device_list, next) { 335c96f2c2aSGreg Kurz if (strcmp(vbasedev->name, name) == 0) { 336c96f2c2aSGreg Kurz error_setg(errp, "vfio: subchannel %s has already been attached", 337c96f2c2aSGreg Kurz name); 338c96f2c2aSGreg Kurz goto out_err; 339c96f2c2aSGreg Kurz } 340c96f2c2aSGreg Kurz } 341c96f2c2aSGreg Kurz 342238e9172SAlex Williamson /* 343238e9172SAlex Williamson * All vfio-ccw devices are believed to operate in a way compatible with 344238e9172SAlex Williamson * memory ballooning, ie. pages pinned in the host are in the current 345238e9172SAlex Williamson * working set of the guest driver and therefore never overlap with pages 346238e9172SAlex Williamson * available to the guest balloon driver. This needs to be set before 347238e9172SAlex Williamson * vfio_get_device() for vfio common to handle the balloon inhibitor. 348238e9172SAlex Williamson */ 349238e9172SAlex Williamson vcdev->vdev.balloon_allowed = true; 350238e9172SAlex Williamson 351c96f2c2aSGreg Kurz if (vfio_get_device(group, vcdev->cdev.mdevid, &vcdev->vdev, errp)) { 352c96f2c2aSGreg Kurz goto out_err; 353c96f2c2aSGreg Kurz } 354c96f2c2aSGreg Kurz 355c96f2c2aSGreg Kurz vcdev->vdev.ops = &vfio_ccw_ops; 356c96f2c2aSGreg Kurz vcdev->vdev.type = VFIO_DEVICE_TYPE_CCW; 357c96f2c2aSGreg Kurz vcdev->vdev.name = name; 358c96f2c2aSGreg Kurz vcdev->vdev.dev = &vcdev->cdev.parent_obj.parent_obj; 359c96f2c2aSGreg Kurz 360c96f2c2aSGreg Kurz return; 361c96f2c2aSGreg Kurz 362c96f2c2aSGreg Kurz out_err: 363c96f2c2aSGreg Kurz g_free(name); 364c96f2c2aSGreg Kurz } 365c96f2c2aSGreg Kurz 3661dcac3e1SXiao Feng Ren static VFIOGroup *vfio_ccw_get_group(S390CCWDevice *cdev, Error **errp) 3671dcac3e1SXiao Feng Ren { 3681dcac3e1SXiao Feng Ren char *tmp, group_path[PATH_MAX]; 3691dcac3e1SXiao Feng Ren ssize_t len; 3701dcac3e1SXiao Feng Ren int groupid; 3711dcac3e1SXiao Feng Ren 3721dcac3e1SXiao Feng Ren tmp = g_strdup_printf("/sys/bus/css/devices/%x.%x.%04x/%s/iommu_group", 3731dcac3e1SXiao Feng Ren cdev->hostid.cssid, cdev->hostid.ssid, 3741dcac3e1SXiao Feng Ren cdev->hostid.devid, cdev->mdevid); 3751dcac3e1SXiao Feng Ren len = readlink(tmp, group_path, sizeof(group_path)); 3761dcac3e1SXiao Feng Ren g_free(tmp); 3771dcac3e1SXiao Feng Ren 3781dcac3e1SXiao Feng Ren if (len <= 0 || len >= sizeof(group_path)) { 3791dcac3e1SXiao Feng Ren error_setg(errp, "vfio: no iommu_group found"); 3801dcac3e1SXiao Feng Ren return NULL; 3811dcac3e1SXiao Feng Ren } 3821dcac3e1SXiao Feng Ren 3831dcac3e1SXiao Feng Ren group_path[len] = 0; 3841dcac3e1SXiao Feng Ren 3851dcac3e1SXiao Feng Ren if (sscanf(basename(group_path), "%d", &groupid) != 1) { 3861dcac3e1SXiao Feng Ren error_setg(errp, "vfio: failed to read %s", group_path); 3871dcac3e1SXiao Feng Ren return NULL; 3881dcac3e1SXiao Feng Ren } 3891dcac3e1SXiao Feng Ren 3901dcac3e1SXiao Feng Ren return vfio_get_group(groupid, &address_space_memory, errp); 3911dcac3e1SXiao Feng Ren } 3921dcac3e1SXiao Feng Ren 3931dcac3e1SXiao Feng Ren static void vfio_ccw_realize(DeviceState *dev, Error **errp) 3941dcac3e1SXiao Feng Ren { 3951dcac3e1SXiao Feng Ren VFIOGroup *group; 3961dcac3e1SXiao Feng Ren CcwDevice *ccw_dev = DO_UPCAST(CcwDevice, parent_obj, dev); 3971dcac3e1SXiao Feng Ren S390CCWDevice *cdev = DO_UPCAST(S390CCWDevice, parent_obj, ccw_dev); 3981dcac3e1SXiao Feng Ren VFIOCCWDevice *vcdev = DO_UPCAST(VFIOCCWDevice, cdev, cdev); 3991dcac3e1SXiao Feng Ren S390CCWDeviceClass *cdc = S390_CCW_DEVICE_GET_CLASS(cdev); 4001dcac3e1SXiao Feng Ren Error *err = NULL; 4011dcac3e1SXiao Feng Ren 4021dcac3e1SXiao Feng Ren /* Call the class init function for subchannel. */ 4031dcac3e1SXiao Feng Ren if (cdc->realize) { 4041dcac3e1SXiao Feng Ren cdc->realize(cdev, vcdev->vdev.sysfsdev, &err); 4051dcac3e1SXiao Feng Ren if (err) { 4061dcac3e1SXiao Feng Ren goto out_err_propagate; 4071dcac3e1SXiao Feng Ren } 4081dcac3e1SXiao Feng Ren } 4091dcac3e1SXiao Feng Ren 4101dcac3e1SXiao Feng Ren group = vfio_ccw_get_group(cdev, &err); 4111dcac3e1SXiao Feng Ren if (!group) { 4121dcac3e1SXiao Feng Ren goto out_group_err; 4131dcac3e1SXiao Feng Ren } 4141dcac3e1SXiao Feng Ren 415c96f2c2aSGreg Kurz vfio_ccw_get_device(group, vcdev, &err); 416c96f2c2aSGreg Kurz if (err) { 4171dcac3e1SXiao Feng Ren goto out_device_err; 4181dcac3e1SXiao Feng Ren } 4191dcac3e1SXiao Feng Ren 420c14e706cSDong Jia Shi vfio_ccw_get_region(vcdev, &err); 421c14e706cSDong Jia Shi if (err) { 422c14e706cSDong Jia Shi goto out_region_err; 423c14e706cSDong Jia Shi } 424c14e706cSDong Jia Shi 4254886b3e9SDong Jia Shi vfio_ccw_register_io_notifier(vcdev, &err); 4264886b3e9SDong Jia Shi if (err) { 4274886b3e9SDong Jia Shi goto out_notifier_err; 4284886b3e9SDong Jia Shi } 4294886b3e9SDong Jia Shi 4301dcac3e1SXiao Feng Ren return; 4311dcac3e1SXiao Feng Ren 4324886b3e9SDong Jia Shi out_notifier_err: 4334886b3e9SDong Jia Shi vfio_ccw_put_region(vcdev); 434c14e706cSDong Jia Shi out_region_err: 435c96f2c2aSGreg Kurz vfio_ccw_put_device(vcdev); 4361dcac3e1SXiao Feng Ren out_device_err: 4371dcac3e1SXiao Feng Ren vfio_put_group(group); 4381dcac3e1SXiao Feng Ren out_group_err: 4391dcac3e1SXiao Feng Ren if (cdc->unrealize) { 4401dcac3e1SXiao Feng Ren cdc->unrealize(cdev, NULL); 4411dcac3e1SXiao Feng Ren } 4421dcac3e1SXiao Feng Ren out_err_propagate: 4431dcac3e1SXiao Feng Ren error_propagate(errp, err); 4441dcac3e1SXiao Feng Ren } 4451dcac3e1SXiao Feng Ren 4461dcac3e1SXiao Feng Ren static void vfio_ccw_unrealize(DeviceState *dev, Error **errp) 4471dcac3e1SXiao Feng Ren { 4481dcac3e1SXiao Feng Ren CcwDevice *ccw_dev = DO_UPCAST(CcwDevice, parent_obj, dev); 4491dcac3e1SXiao Feng Ren S390CCWDevice *cdev = DO_UPCAST(S390CCWDevice, parent_obj, ccw_dev); 4501dcac3e1SXiao Feng Ren VFIOCCWDevice *vcdev = DO_UPCAST(VFIOCCWDevice, cdev, cdev); 4511dcac3e1SXiao Feng Ren S390CCWDeviceClass *cdc = S390_CCW_DEVICE_GET_CLASS(cdev); 4521dcac3e1SXiao Feng Ren VFIOGroup *group = vcdev->vdev.group; 4531dcac3e1SXiao Feng Ren 4544886b3e9SDong Jia Shi vfio_ccw_unregister_io_notifier(vcdev); 455c14e706cSDong Jia Shi vfio_ccw_put_region(vcdev); 456c96f2c2aSGreg Kurz vfio_ccw_put_device(vcdev); 4571dcac3e1SXiao Feng Ren vfio_put_group(group); 4581dcac3e1SXiao Feng Ren 4591dcac3e1SXiao Feng Ren if (cdc->unrealize) { 4601dcac3e1SXiao Feng Ren cdc->unrealize(cdev, errp); 4611dcac3e1SXiao Feng Ren } 4621dcac3e1SXiao Feng Ren } 4631dcac3e1SXiao Feng Ren 4641dcac3e1SXiao Feng Ren static Property vfio_ccw_properties[] = { 4651dcac3e1SXiao Feng Ren DEFINE_PROP_STRING("sysfsdev", VFIOCCWDevice, vdev.sysfsdev), 4669a51c9eeSHalil Pasic DEFINE_PROP_BOOL("force-orb-pfch", VFIOCCWDevice, force_orb_pfch, false), 4671dcac3e1SXiao Feng Ren DEFINE_PROP_END_OF_LIST(), 4681dcac3e1SXiao Feng Ren }; 4691dcac3e1SXiao Feng Ren 4701dcac3e1SXiao Feng Ren static const VMStateDescription vfio_ccw_vmstate = { 4711dcac3e1SXiao Feng Ren .name = TYPE_VFIO_CCW, 4721dcac3e1SXiao Feng Ren .unmigratable = 1, 4731dcac3e1SXiao Feng Ren }; 4741dcac3e1SXiao Feng Ren 4751dcac3e1SXiao Feng Ren static void vfio_ccw_class_init(ObjectClass *klass, void *data) 4761dcac3e1SXiao Feng Ren { 4771dcac3e1SXiao Feng Ren DeviceClass *dc = DEVICE_CLASS(klass); 4788ca2b376SXiao Feng Ren S390CCWDeviceClass *cdc = S390_CCW_DEVICE_CLASS(klass); 4791dcac3e1SXiao Feng Ren 4801dcac3e1SXiao Feng Ren dc->props = vfio_ccw_properties; 4811dcac3e1SXiao Feng Ren dc->vmsd = &vfio_ccw_vmstate; 4821dcac3e1SXiao Feng Ren dc->desc = "VFIO-based subchannel assignment"; 483bd2aef10SCornelia Huck set_bit(DEVICE_CATEGORY_MISC, dc->categories); 4841dcac3e1SXiao Feng Ren dc->realize = vfio_ccw_realize; 4851dcac3e1SXiao Feng Ren dc->unrealize = vfio_ccw_unrealize; 4861dcac3e1SXiao Feng Ren dc->reset = vfio_ccw_reset; 4878ca2b376SXiao Feng Ren 4888ca2b376SXiao Feng Ren cdc->handle_request = vfio_ccw_handle_request; 4891dcac3e1SXiao Feng Ren } 4901dcac3e1SXiao Feng Ren 4911dcac3e1SXiao Feng Ren static const TypeInfo vfio_ccw_info = { 4921dcac3e1SXiao Feng Ren .name = TYPE_VFIO_CCW, 4931dcac3e1SXiao Feng Ren .parent = TYPE_S390_CCW, 4941dcac3e1SXiao Feng Ren .instance_size = sizeof(VFIOCCWDevice), 4951dcac3e1SXiao Feng Ren .class_init = vfio_ccw_class_init, 4961dcac3e1SXiao Feng Ren }; 4971dcac3e1SXiao Feng Ren 4981dcac3e1SXiao Feng Ren static void register_vfio_ccw_type(void) 4991dcac3e1SXiao Feng Ren { 5001dcac3e1SXiao Feng Ren type_register_static(&vfio_ccw_info); 5011dcac3e1SXiao Feng Ren } 5021dcac3e1SXiao Feng Ren 5031dcac3e1SXiao Feng Ren type_init(register_vfio_ccw_type) 504