// SPDX-License-Identifier: GPL-2.0-only
/*
 * VFIO PCI interrupt handling
 *
 * Copyright (C) 2012 Red Hat, Inc.  All rights reserved.
 *     Author: Alex Williamson <alex.williamson@redhat.com>
 *
 * Derived from original vfio:
 * Copyright 2010 Cisco Systems, Inc.  All rights reserved.
 * Author: Tom Lyon, pugs@cisco.com
 */
1289e1f7d4SAlex Williamson 
1389e1f7d4SAlex Williamson #include <linux/device.h>
1489e1f7d4SAlex Williamson #include <linux/interrupt.h>
1589e1f7d4SAlex Williamson #include <linux/eventfd.h>
16b8f02af0SGavin Shan #include <linux/msi.h>
1789e1f7d4SAlex Williamson #include <linux/pci.h>
1889e1f7d4SAlex Williamson #include <linux/file.h>
1989e1f7d4SAlex Williamson #include <linux/vfio.h>
2089e1f7d4SAlex Williamson #include <linux/wait.h>
2125e9789dSArnd Bergmann #include <linux/slab.h>
2289e1f7d4SAlex Williamson 
23e34a0425SJason Gunthorpe #include "vfio_pci_priv.h"
24e34a0425SJason Gunthorpe 
25e34a0425SJason Gunthorpe struct vfio_pci_irq_ctx {
26e34a0425SJason Gunthorpe 	struct eventfd_ctx	*trigger;
27e34a0425SJason Gunthorpe 	struct virqfd		*unmask;
28e34a0425SJason Gunthorpe 	struct virqfd		*mask;
29e34a0425SJason Gunthorpe 	char			*name;
30e34a0425SJason Gunthorpe 	bool			masked;
31e34a0425SJason Gunthorpe 	struct irq_bypass_producer	producer;
32e34a0425SJason Gunthorpe };
3389e1f7d4SAlex Williamson 
irq_is(struct vfio_pci_core_device * vdev,int type)34c462a8c5SJason Gunthorpe static bool irq_is(struct vfio_pci_core_device *vdev, int type)
35c462a8c5SJason Gunthorpe {
36c462a8c5SJason Gunthorpe 	return vdev->irq_type == type;
37c462a8c5SJason Gunthorpe }
38c462a8c5SJason Gunthorpe 
is_intx(struct vfio_pci_core_device * vdev)39c462a8c5SJason Gunthorpe static bool is_intx(struct vfio_pci_core_device *vdev)
40c462a8c5SJason Gunthorpe {
41c462a8c5SJason Gunthorpe 	return vdev->irq_type == VFIO_PCI_INTX_IRQ_INDEX;
42c462a8c5SJason Gunthorpe }
43c462a8c5SJason Gunthorpe 
is_irq_none(struct vfio_pci_core_device * vdev)44c462a8c5SJason Gunthorpe static bool is_irq_none(struct vfio_pci_core_device *vdev)
45c462a8c5SJason Gunthorpe {
46c462a8c5SJason Gunthorpe 	return !(vdev->irq_type == VFIO_PCI_INTX_IRQ_INDEX ||
47c462a8c5SJason Gunthorpe 		 vdev->irq_type == VFIO_PCI_MSI_IRQ_INDEX ||
48c462a8c5SJason Gunthorpe 		 vdev->irq_type == VFIO_PCI_MSIX_IRQ_INDEX);
49c462a8c5SJason Gunthorpe }
50c462a8c5SJason Gunthorpe 
51d977e0f7SReinette Chatre static
vfio_irq_ctx_get(struct vfio_pci_core_device * vdev,unsigned long index)52d977e0f7SReinette Chatre struct vfio_pci_irq_ctx *vfio_irq_ctx_get(struct vfio_pci_core_device *vdev,
53d977e0f7SReinette Chatre 					  unsigned long index)
54d977e0f7SReinette Chatre {
55b156e48fSReinette Chatre 	return xa_load(&vdev->ctx, index);
56b156e48fSReinette Chatre }
57b156e48fSReinette Chatre 
vfio_irq_ctx_free(struct vfio_pci_core_device * vdev,struct vfio_pci_irq_ctx * ctx,unsigned long index)58b156e48fSReinette Chatre static void vfio_irq_ctx_free(struct vfio_pci_core_device *vdev,
59b156e48fSReinette Chatre 			      struct vfio_pci_irq_ctx *ctx, unsigned long index)
60b156e48fSReinette Chatre {
61b156e48fSReinette Chatre 	xa_erase(&vdev->ctx, index);
62b156e48fSReinette Chatre 	kfree(ctx);
63b156e48fSReinette Chatre }
64b156e48fSReinette Chatre 
65b156e48fSReinette Chatre static struct vfio_pci_irq_ctx *
vfio_irq_ctx_alloc(struct vfio_pci_core_device * vdev,unsigned long index)66b156e48fSReinette Chatre vfio_irq_ctx_alloc(struct vfio_pci_core_device *vdev, unsigned long index)
67b156e48fSReinette Chatre {
68b156e48fSReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
69b156e48fSReinette Chatre 	int ret;
70b156e48fSReinette Chatre 
71b156e48fSReinette Chatre 	ctx = kzalloc(sizeof(*ctx), GFP_KERNEL_ACCOUNT);
72b156e48fSReinette Chatre 	if (!ctx)
73d977e0f7SReinette Chatre 		return NULL;
74b156e48fSReinette Chatre 
75b156e48fSReinette Chatre 	ret = xa_insert(&vdev->ctx, index, ctx, GFP_KERNEL_ACCOUNT);
76b156e48fSReinette Chatre 	if (ret) {
77b156e48fSReinette Chatre 		kfree(ctx);
78b156e48fSReinette Chatre 		return NULL;
79d977e0f7SReinette Chatre 	}
80d977e0f7SReinette Chatre 
81b156e48fSReinette Chatre 	return ctx;
82d977e0f7SReinette Chatre }
83d977e0f7SReinette Chatre 
8489e1f7d4SAlex Williamson /*
8589e1f7d4SAlex Williamson  * INTx
8689e1f7d4SAlex Williamson  */
vfio_send_intx_eventfd(void * opaque,void * unused)8709bbcb88SAntonios Motakis static void vfio_send_intx_eventfd(void *opaque, void *unused)
8889e1f7d4SAlex Williamson {
8953647510SMax Gurtovoy 	struct vfio_pci_core_device *vdev = opaque;
9009bbcb88SAntonios Motakis 
91d977e0f7SReinette Chatre 	if (likely(is_intx(vdev) && !vdev->virq_disabled)) {
92d977e0f7SReinette Chatre 		struct vfio_pci_irq_ctx *ctx;
9369276a55SAlex Williamson 		struct eventfd_ctx *trigger;
94d977e0f7SReinette Chatre 
95d977e0f7SReinette Chatre 		ctx = vfio_irq_ctx_get(vdev, 0);
96d977e0f7SReinette Chatre 		if (WARN_ON_ONCE(!ctx))
97d977e0f7SReinette Chatre 			return;
9869276a55SAlex Williamson 
9969276a55SAlex Williamson 		trigger = READ_ONCE(ctx->trigger);
10069276a55SAlex Williamson 		if (likely(trigger))
10169276a55SAlex Williamson 			eventfd_signal(trigger, 1);
102d977e0f7SReinette Chatre 	}
10389e1f7d4SAlex Williamson }
10489e1f7d4SAlex Williamson 
1054813724cSAbhishek Sahu /* Returns true if the INTx vfio_pci_irq_ctx.masked value is changed. */
__vfio_pci_intx_mask(struct vfio_pci_core_device * vdev)10604a4a017SAlex Williamson static bool __vfio_pci_intx_mask(struct vfio_pci_core_device *vdev)
10789e1f7d4SAlex Williamson {
10889e1f7d4SAlex Williamson 	struct pci_dev *pdev = vdev->pdev;
109d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
11089e1f7d4SAlex Williamson 	unsigned long flags;
1114813724cSAbhishek Sahu 	bool masked_changed = false;
11289e1f7d4SAlex Williamson 
11304a4a017SAlex Williamson 	lockdep_assert_held(&vdev->igate);
11404a4a017SAlex Williamson 
11589e1f7d4SAlex Williamson 	spin_lock_irqsave(&vdev->irqlock, flags);
11689e1f7d4SAlex Williamson 
11789e1f7d4SAlex Williamson 	/*
11889e1f7d4SAlex Williamson 	 * Masking can come from interrupt, ioctl, or config space
11989e1f7d4SAlex Williamson 	 * via INTx disable.  The latter means this can get called
12089e1f7d4SAlex Williamson 	 * even when not using intx delivery.  In this case, just
12189e1f7d4SAlex Williamson 	 * try to have the physical bit follow the virtual bit.
12289e1f7d4SAlex Williamson 	 */
12389e1f7d4SAlex Williamson 	if (unlikely(!is_intx(vdev))) {
12489e1f7d4SAlex Williamson 		if (vdev->pci_2_3)
12589e1f7d4SAlex Williamson 			pci_intx(pdev, 0);
126d977e0f7SReinette Chatre 		goto out_unlock;
127d977e0f7SReinette Chatre 	}
128d977e0f7SReinette Chatre 
129d977e0f7SReinette Chatre 	ctx = vfio_irq_ctx_get(vdev, 0);
130d977e0f7SReinette Chatre 	if (WARN_ON_ONCE(!ctx))
131d977e0f7SReinette Chatre 		goto out_unlock;
132d977e0f7SReinette Chatre 
133d977e0f7SReinette Chatre 	if (!ctx->masked) {
13489e1f7d4SAlex Williamson 		/*
13589e1f7d4SAlex Williamson 		 * Can't use check_and_mask here because we always want to
13689e1f7d4SAlex Williamson 		 * mask, not just when something is pending.
13789e1f7d4SAlex Williamson 		 */
13889e1f7d4SAlex Williamson 		if (vdev->pci_2_3)
13989e1f7d4SAlex Williamson 			pci_intx(pdev, 0);
14089e1f7d4SAlex Williamson 		else
14189e1f7d4SAlex Williamson 			disable_irq_nosync(pdev->irq);
14289e1f7d4SAlex Williamson 
143d977e0f7SReinette Chatre 		ctx->masked = true;
1444813724cSAbhishek Sahu 		masked_changed = true;
14589e1f7d4SAlex Williamson 	}
14689e1f7d4SAlex Williamson 
147d977e0f7SReinette Chatre out_unlock:
14889e1f7d4SAlex Williamson 	spin_unlock_irqrestore(&vdev->irqlock, flags);
1494813724cSAbhishek Sahu 	return masked_changed;
15089e1f7d4SAlex Williamson }
15189e1f7d4SAlex Williamson 
vfio_pci_intx_mask(struct vfio_pci_core_device * vdev)15204a4a017SAlex Williamson bool vfio_pci_intx_mask(struct vfio_pci_core_device *vdev)
15304a4a017SAlex Williamson {
15404a4a017SAlex Williamson 	bool mask_changed;
15504a4a017SAlex Williamson 
15604a4a017SAlex Williamson 	mutex_lock(&vdev->igate);
15704a4a017SAlex Williamson 	mask_changed = __vfio_pci_intx_mask(vdev);
15804a4a017SAlex Williamson 	mutex_unlock(&vdev->igate);
15904a4a017SAlex Williamson 
16004a4a017SAlex Williamson 	return mask_changed;
16104a4a017SAlex Williamson }
16204a4a017SAlex Williamson 
16389e1f7d4SAlex Williamson /*
16489e1f7d4SAlex Williamson  * If this is triggered by an eventfd, we can't call eventfd_signal
16589e1f7d4SAlex Williamson  * or else we'll deadlock on the eventfd wait queue.  Return >0 when
16689e1f7d4SAlex Williamson  * a signal is necessary, which can then be handled via a work queue
16789e1f7d4SAlex Williamson  * or directly depending on the caller.
16889e1f7d4SAlex Williamson  */
vfio_pci_intx_unmask_handler(void * opaque,void * unused)16909bbcb88SAntonios Motakis static int vfio_pci_intx_unmask_handler(void *opaque, void *unused)
17089e1f7d4SAlex Williamson {
17153647510SMax Gurtovoy 	struct vfio_pci_core_device *vdev = opaque;
17289e1f7d4SAlex Williamson 	struct pci_dev *pdev = vdev->pdev;
173d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
17489e1f7d4SAlex Williamson 	unsigned long flags;
17589e1f7d4SAlex Williamson 	int ret = 0;
17689e1f7d4SAlex Williamson 
17789e1f7d4SAlex Williamson 	spin_lock_irqsave(&vdev->irqlock, flags);
17889e1f7d4SAlex Williamson 
17989e1f7d4SAlex Williamson 	/*
18089e1f7d4SAlex Williamson 	 * Unmasking comes from ioctl or config, so again, have the
18189e1f7d4SAlex Williamson 	 * physical bit follow the virtual even when not using INTx.
18289e1f7d4SAlex Williamson 	 */
18389e1f7d4SAlex Williamson 	if (unlikely(!is_intx(vdev))) {
18489e1f7d4SAlex Williamson 		if (vdev->pci_2_3)
18589e1f7d4SAlex Williamson 			pci_intx(pdev, 1);
186d977e0f7SReinette Chatre 		goto out_unlock;
187d977e0f7SReinette Chatre 	}
188d977e0f7SReinette Chatre 
189d977e0f7SReinette Chatre 	ctx = vfio_irq_ctx_get(vdev, 0);
190d977e0f7SReinette Chatre 	if (WARN_ON_ONCE(!ctx))
191d977e0f7SReinette Chatre 		goto out_unlock;
192d977e0f7SReinette Chatre 
193d977e0f7SReinette Chatre 	if (ctx->masked && !vdev->virq_disabled) {
19489e1f7d4SAlex Williamson 		/*
19589e1f7d4SAlex Williamson 		 * A pending interrupt here would immediately trigger,
19689e1f7d4SAlex Williamson 		 * but we can avoid that overhead by just re-sending
19789e1f7d4SAlex Williamson 		 * the interrupt to the user.
19889e1f7d4SAlex Williamson 		 */
19989e1f7d4SAlex Williamson 		if (vdev->pci_2_3) {
20089e1f7d4SAlex Williamson 			if (!pci_check_and_unmask_intx(pdev))
20189e1f7d4SAlex Williamson 				ret = 1;
20289e1f7d4SAlex Williamson 		} else
20389e1f7d4SAlex Williamson 			enable_irq(pdev->irq);
20489e1f7d4SAlex Williamson 
205d977e0f7SReinette Chatre 		ctx->masked = (ret > 0);
20689e1f7d4SAlex Williamson 	}
20789e1f7d4SAlex Williamson 
208d977e0f7SReinette Chatre out_unlock:
20989e1f7d4SAlex Williamson 	spin_unlock_irqrestore(&vdev->irqlock, flags);
21089e1f7d4SAlex Williamson 
21189e1f7d4SAlex Williamson 	return ret;
21289e1f7d4SAlex Williamson }
21389e1f7d4SAlex Williamson 
__vfio_pci_intx_unmask(struct vfio_pci_core_device * vdev)21404a4a017SAlex Williamson static void __vfio_pci_intx_unmask(struct vfio_pci_core_device *vdev)
21589e1f7d4SAlex Williamson {
21604a4a017SAlex Williamson 	lockdep_assert_held(&vdev->igate);
21704a4a017SAlex Williamson 
21889e1f7d4SAlex Williamson 	if (vfio_pci_intx_unmask_handler(vdev, NULL) > 0)
21989e1f7d4SAlex Williamson 		vfio_send_intx_eventfd(vdev, NULL);
22089e1f7d4SAlex Williamson }
22189e1f7d4SAlex Williamson 
vfio_pci_intx_unmask(struct vfio_pci_core_device * vdev)22204a4a017SAlex Williamson void vfio_pci_intx_unmask(struct vfio_pci_core_device *vdev)
22304a4a017SAlex Williamson {
22404a4a017SAlex Williamson 	mutex_lock(&vdev->igate);
22504a4a017SAlex Williamson 	__vfio_pci_intx_unmask(vdev);
22604a4a017SAlex Williamson 	mutex_unlock(&vdev->igate);
22704a4a017SAlex Williamson }
22804a4a017SAlex Williamson 
vfio_intx_handler(int irq,void * dev_id)22989e1f7d4SAlex Williamson static irqreturn_t vfio_intx_handler(int irq, void *dev_id)
23089e1f7d4SAlex Williamson {
23153647510SMax Gurtovoy 	struct vfio_pci_core_device *vdev = dev_id;
232d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
23389e1f7d4SAlex Williamson 	unsigned long flags;
23489e1f7d4SAlex Williamson 	int ret = IRQ_NONE;
23589e1f7d4SAlex Williamson 
236d977e0f7SReinette Chatre 	ctx = vfio_irq_ctx_get(vdev, 0);
237d977e0f7SReinette Chatre 	if (WARN_ON_ONCE(!ctx))
238d977e0f7SReinette Chatre 		return ret;
239d977e0f7SReinette Chatre 
24089e1f7d4SAlex Williamson 	spin_lock_irqsave(&vdev->irqlock, flags);
24189e1f7d4SAlex Williamson 
24289e1f7d4SAlex Williamson 	if (!vdev->pci_2_3) {
24389e1f7d4SAlex Williamson 		disable_irq_nosync(vdev->pdev->irq);
244d977e0f7SReinette Chatre 		ctx->masked = true;
24589e1f7d4SAlex Williamson 		ret = IRQ_HANDLED;
246d977e0f7SReinette Chatre 	} else if (!ctx->masked &&  /* may be shared */
24789e1f7d4SAlex Williamson 		   pci_check_and_mask_intx(vdev->pdev)) {
248d977e0f7SReinette Chatre 		ctx->masked = true;
24989e1f7d4SAlex Williamson 		ret = IRQ_HANDLED;
25089e1f7d4SAlex Williamson 	}
25189e1f7d4SAlex Williamson 
25289e1f7d4SAlex Williamson 	spin_unlock_irqrestore(&vdev->irqlock, flags);
25389e1f7d4SAlex Williamson 
25489e1f7d4SAlex Williamson 	if (ret == IRQ_HANDLED)
25589e1f7d4SAlex Williamson 		vfio_send_intx_eventfd(vdev, NULL);
25689e1f7d4SAlex Williamson 
25789e1f7d4SAlex Williamson 	return ret;
25889e1f7d4SAlex Williamson }
25989e1f7d4SAlex Williamson 
vfio_intx_enable(struct vfio_pci_core_device * vdev,struct eventfd_ctx * trigger)26069276a55SAlex Williamson static int vfio_intx_enable(struct vfio_pci_core_device *vdev,
26169276a55SAlex Williamson 			    struct eventfd_ctx *trigger)
26289e1f7d4SAlex Williamson {
26369276a55SAlex Williamson 	struct pci_dev *pdev = vdev->pdev;
264d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
26569276a55SAlex Williamson 	unsigned long irqflags;
26669276a55SAlex Williamson 	char *name;
26769276a55SAlex Williamson 	int ret;
268d977e0f7SReinette Chatre 
26989e1f7d4SAlex Williamson 	if (!is_irq_none(vdev))
27089e1f7d4SAlex Williamson 		return -EINVAL;
27189e1f7d4SAlex Williamson 
27269276a55SAlex Williamson 	if (!pdev->irq)
27389e1f7d4SAlex Williamson 		return -ENODEV;
27489e1f7d4SAlex Williamson 
27569276a55SAlex Williamson 	name = kasprintf(GFP_KERNEL_ACCOUNT, "vfio-intx(%s)", pci_name(pdev));
27669276a55SAlex Williamson 	if (!name)
27769276a55SAlex Williamson 		return -ENOMEM;
27869276a55SAlex Williamson 
279b156e48fSReinette Chatre 	ctx = vfio_irq_ctx_alloc(vdev, 0);
2800bd22a49SYe Bin 	if (!ctx) {
2810bd22a49SYe Bin 		kfree(name);
282b156e48fSReinette Chatre 		return -ENOMEM;
2830bd22a49SYe Bin 	}
28489e1f7d4SAlex Williamson 
28569276a55SAlex Williamson 	ctx->name = name;
28669276a55SAlex Williamson 	ctx->trigger = trigger;
28769276a55SAlex Williamson 
288899649b7SAlex Williamson 	/*
28969276a55SAlex Williamson 	 * Fill the initial masked state based on virq_disabled.  After
29069276a55SAlex Williamson 	 * enable, changing the DisINTx bit in vconfig directly changes INTx
29169276a55SAlex Williamson 	 * masking.  igate prevents races during setup, once running masked
29269276a55SAlex Williamson 	 * is protected via irqlock.
29369276a55SAlex Williamson 	 *
29469276a55SAlex Williamson 	 * Devices supporting DisINTx also reflect the current mask state in
29569276a55SAlex Williamson 	 * the physical DisINTx bit, which is not affected during IRQ setup.
29669276a55SAlex Williamson 	 *
29769276a55SAlex Williamson 	 * Devices without DisINTx support require an exclusive interrupt.
29869276a55SAlex Williamson 	 * IRQ masking is performed at the IRQ chip.  Again, igate protects
29969276a55SAlex Williamson 	 * against races during setup and IRQ handlers and irqfds are not
30069276a55SAlex Williamson 	 * yet active, therefore masked is stable and can be used to
30169276a55SAlex Williamson 	 * conditionally auto-enable the IRQ.
30269276a55SAlex Williamson 	 *
30369276a55SAlex Williamson 	 * irq_type must be stable while the IRQ handler is registered,
30469276a55SAlex Williamson 	 * therefore it must be set before request_irq().
305899649b7SAlex Williamson 	 */
306d977e0f7SReinette Chatre 	ctx->masked = vdev->virq_disabled;
30769276a55SAlex Williamson 	if (vdev->pci_2_3) {
30869276a55SAlex Williamson 		pci_intx(pdev, !ctx->masked);
30969276a55SAlex Williamson 		irqflags = IRQF_SHARED;
31069276a55SAlex Williamson 	} else {
31169276a55SAlex Williamson 		irqflags = ctx->masked ? IRQF_NO_AUTOEN : 0;
31269276a55SAlex Williamson 	}
313899649b7SAlex Williamson 
31489e1f7d4SAlex Williamson 	vdev->irq_type = VFIO_PCI_INTX_IRQ_INDEX;
31589e1f7d4SAlex Williamson 
31669276a55SAlex Williamson 	ret = request_irq(pdev->irq, vfio_intx_handler,
31769276a55SAlex Williamson 			  irqflags, ctx->name, vdev);
31869276a55SAlex Williamson 	if (ret) {
31969276a55SAlex Williamson 		vdev->irq_type = VFIO_PCI_NUM_IRQS;
32069276a55SAlex Williamson 		kfree(name);
32169276a55SAlex Williamson 		vfio_irq_ctx_free(vdev, ctx, 0);
32269276a55SAlex Williamson 		return ret;
32369276a55SAlex Williamson 	}
32469276a55SAlex Williamson 
32589e1f7d4SAlex Williamson 	return 0;
32689e1f7d4SAlex Williamson }
32789e1f7d4SAlex Williamson 
vfio_intx_set_signal(struct vfio_pci_core_device * vdev,struct eventfd_ctx * trigger)32869276a55SAlex Williamson static int vfio_intx_set_signal(struct vfio_pci_core_device *vdev,
32969276a55SAlex Williamson 				struct eventfd_ctx *trigger)
33089e1f7d4SAlex Williamson {
33189e1f7d4SAlex Williamson 	struct pci_dev *pdev = vdev->pdev;
332d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
33369276a55SAlex Williamson 	struct eventfd_ctx *old;
33489e1f7d4SAlex Williamson 
335d977e0f7SReinette Chatre 	ctx = vfio_irq_ctx_get(vdev, 0);
336d977e0f7SReinette Chatre 	if (WARN_ON_ONCE(!ctx))
337d977e0f7SReinette Chatre 		return -EINVAL;
338d977e0f7SReinette Chatre 
33969276a55SAlex Williamson 	old = ctx->trigger;
34069276a55SAlex Williamson 
34169276a55SAlex Williamson 	WRITE_ONCE(ctx->trigger, trigger);
34269276a55SAlex Williamson 
34369276a55SAlex Williamson 	/* Releasing an old ctx requires synchronizing in-flight users */
34469276a55SAlex Williamson 	if (old) {
34569276a55SAlex Williamson 		synchronize_irq(pdev->irq);
34669276a55SAlex Williamson 		vfio_virqfd_flush_thread(&ctx->unmask);
34769276a55SAlex Williamson 		eventfd_ctx_put(old);
34889e1f7d4SAlex Williamson 	}
34989e1f7d4SAlex Williamson 
35089e1f7d4SAlex Williamson 	return 0;
35189e1f7d4SAlex Williamson }
35289e1f7d4SAlex Williamson 
vfio_intx_disable(struct vfio_pci_core_device * vdev)35353647510SMax Gurtovoy static void vfio_intx_disable(struct vfio_pci_core_device *vdev)
35489e1f7d4SAlex Williamson {
35569276a55SAlex Williamson 	struct pci_dev *pdev = vdev->pdev;
356d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
357d977e0f7SReinette Chatre 
358d977e0f7SReinette Chatre 	ctx = vfio_irq_ctx_get(vdev, 0);
359d977e0f7SReinette Chatre 	WARN_ON_ONCE(!ctx);
360d977e0f7SReinette Chatre 	if (ctx) {
361d977e0f7SReinette Chatre 		vfio_virqfd_disable(&ctx->unmask);
362d977e0f7SReinette Chatre 		vfio_virqfd_disable(&ctx->mask);
36369276a55SAlex Williamson 		free_irq(pdev->irq, vdev);
36469276a55SAlex Williamson 		if (ctx->trigger)
36569276a55SAlex Williamson 			eventfd_ctx_put(ctx->trigger);
36669276a55SAlex Williamson 		kfree(ctx->name);
367b156e48fSReinette Chatre 		vfio_irq_ctx_free(vdev, ctx, 0);
36889e1f7d4SAlex Williamson 	}
36969276a55SAlex Williamson 	vdev->irq_type = VFIO_PCI_NUM_IRQS;
37069276a55SAlex Williamson }
37189e1f7d4SAlex Williamson 
37289e1f7d4SAlex Williamson /*
37389e1f7d4SAlex Williamson  * MSI/MSI-X
37489e1f7d4SAlex Williamson  */
vfio_msihandler(int irq,void * arg)37589e1f7d4SAlex Williamson static irqreturn_t vfio_msihandler(int irq, void *arg)
37689e1f7d4SAlex Williamson {
37789e1f7d4SAlex Williamson 	struct eventfd_ctx *trigger = arg;
37889e1f7d4SAlex Williamson 
37989e1f7d4SAlex Williamson 	eventfd_signal(trigger, 1);
38089e1f7d4SAlex Williamson 	return IRQ_HANDLED;
38189e1f7d4SAlex Williamson }
38289e1f7d4SAlex Williamson 
vfio_msi_enable(struct vfio_pci_core_device * vdev,int nvec,bool msix)38353647510SMax Gurtovoy static int vfio_msi_enable(struct vfio_pci_core_device *vdev, int nvec, bool msix)
38489e1f7d4SAlex Williamson {
38589e1f7d4SAlex Williamson 	struct pci_dev *pdev = vdev->pdev;
38661771468SChristoph Hellwig 	unsigned int flag = msix ? PCI_IRQ_MSIX : PCI_IRQ_MSI;
38789e1f7d4SAlex Williamson 	int ret;
388abafbc55SAlex Williamson 	u16 cmd;
38989e1f7d4SAlex Williamson 
39089e1f7d4SAlex Williamson 	if (!is_irq_none(vdev))
39189e1f7d4SAlex Williamson 		return -EINVAL;
39289e1f7d4SAlex Williamson 
39361771468SChristoph Hellwig 	/* return the number of supported vectors if we can't get all: */
394abafbc55SAlex Williamson 	cmd = vfio_pci_memory_lock_and_enable(vdev);
39561771468SChristoph Hellwig 	ret = pci_alloc_irq_vectors(pdev, 1, nvec, flag);
39694cccde6SAlexander Gordeev 	if (ret < nvec) {
39794cccde6SAlexander Gordeev 		if (ret > 0)
39861771468SChristoph Hellwig 			pci_free_irq_vectors(pdev);
399abafbc55SAlex Williamson 		vfio_pci_memory_unlock_and_restore(vdev, cmd);
40089e1f7d4SAlex Williamson 		return ret;
40189e1f7d4SAlex Williamson 	}
402abafbc55SAlex Williamson 	vfio_pci_memory_unlock_and_restore(vdev, cmd);
40389e1f7d4SAlex Williamson 
40489e1f7d4SAlex Williamson 	vdev->irq_type = msix ? VFIO_PCI_MSIX_IRQ_INDEX :
40589e1f7d4SAlex Williamson 				VFIO_PCI_MSI_IRQ_INDEX;
40689e1f7d4SAlex Williamson 
40789e1f7d4SAlex Williamson 	if (!msix) {
40889e1f7d4SAlex Williamson 		/*
40989e1f7d4SAlex Williamson 		 * Compute the virtual hardware field for max msi vectors -
41089e1f7d4SAlex Williamson 		 * it is the log base 2 of the number of vectors.
41189e1f7d4SAlex Williamson 		 */
41289e1f7d4SAlex Williamson 		vdev->msi_qmax = fls(nvec * 2 - 1) - 1;
41389e1f7d4SAlex Williamson 	}
41489e1f7d4SAlex Williamson 
41589e1f7d4SAlex Williamson 	return 0;
41689e1f7d4SAlex Williamson }
41789e1f7d4SAlex Williamson 
418e4163438SReinette Chatre /*
419e4163438SReinette Chatre  * vfio_msi_alloc_irq() returns the Linux IRQ number of an MSI or MSI-X device
420e4163438SReinette Chatre  * interrupt vector. If a Linux IRQ number is not available then a new
421e4163438SReinette Chatre  * interrupt is allocated if dynamic MSI-X is supported.
422e4163438SReinette Chatre  *
423e4163438SReinette Chatre  * Where is vfio_msi_free_irq()? Allocated interrupts are maintained,
424e4163438SReinette Chatre  * essentially forming a cache that subsequent allocations can draw from.
425e4163438SReinette Chatre  * Interrupts are freed using pci_free_irq_vectors() when MSI/MSI-X is
426e4163438SReinette Chatre  * disabled.
427e4163438SReinette Chatre  */
vfio_msi_alloc_irq(struct vfio_pci_core_device * vdev,unsigned int vector,bool msix)428e4163438SReinette Chatre static int vfio_msi_alloc_irq(struct vfio_pci_core_device *vdev,
429e4163438SReinette Chatre 			      unsigned int vector, bool msix)
430e4163438SReinette Chatre {
431e4163438SReinette Chatre 	struct pci_dev *pdev = vdev->pdev;
432e4163438SReinette Chatre 	struct msi_map map;
433e4163438SReinette Chatre 	int irq;
434e4163438SReinette Chatre 	u16 cmd;
435e4163438SReinette Chatre 
436e4163438SReinette Chatre 	irq = pci_irq_vector(pdev, vector);
437e4163438SReinette Chatre 	if (WARN_ON_ONCE(irq == 0))
438e4163438SReinette Chatre 		return -EINVAL;
439e4163438SReinette Chatre 	if (irq > 0 || !msix || !vdev->has_dyn_msix)
440e4163438SReinette Chatre 		return irq;
441e4163438SReinette Chatre 
442e4163438SReinette Chatre 	cmd = vfio_pci_memory_lock_and_enable(vdev);
443e4163438SReinette Chatre 	map = pci_msix_alloc_irq_at(pdev, vector, NULL);
444e4163438SReinette Chatre 	vfio_pci_memory_unlock_and_restore(vdev, cmd);
445e4163438SReinette Chatre 
446e4163438SReinette Chatre 	return map.index < 0 ? map.index : map.virq;
447e4163438SReinette Chatre }
448e4163438SReinette Chatre 
vfio_msi_set_vector_signal(struct vfio_pci_core_device * vdev,unsigned int vector,int fd,bool msix)44953647510SMax Gurtovoy static int vfio_msi_set_vector_signal(struct vfio_pci_core_device *vdev,
4506578ed85SReinette Chatre 				      unsigned int vector, int fd, bool msix)
45189e1f7d4SAlex Williamson {
45289e1f7d4SAlex Williamson 	struct pci_dev *pdev = vdev->pdev;
453d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
45489e1f7d4SAlex Williamson 	struct eventfd_ctx *trigger;
455e4163438SReinette Chatre 	int irq = -EINVAL, ret;
456abafbc55SAlex Williamson 	u16 cmd;
45789e1f7d4SAlex Williamson 
458b156e48fSReinette Chatre 	ctx = vfio_irq_ctx_get(vdev, vector);
459b156e48fSReinette Chatre 
460b156e48fSReinette Chatre 	if (ctx) {
461d977e0f7SReinette Chatre 		irq_bypass_unregister_producer(&ctx->producer);
462e4163438SReinette Chatre 		irq = pci_irq_vector(pdev, vector);
463abafbc55SAlex Williamson 		cmd = vfio_pci_memory_lock_and_enable(vdev);
464d977e0f7SReinette Chatre 		free_irq(irq, ctx->trigger);
465abafbc55SAlex Williamson 		vfio_pci_memory_unlock_and_restore(vdev, cmd);
466e4163438SReinette Chatre 		/* Interrupt stays allocated, will be freed at MSI-X disable. */
467d977e0f7SReinette Chatre 		kfree(ctx->name);
468d977e0f7SReinette Chatre 		eventfd_ctx_put(ctx->trigger);
469b156e48fSReinette Chatre 		vfio_irq_ctx_free(vdev, ctx, vector);
47089e1f7d4SAlex Williamson 	}
47189e1f7d4SAlex Williamson 
47289e1f7d4SAlex Williamson 	if (fd < 0)
47389e1f7d4SAlex Williamson 		return 0;
47489e1f7d4SAlex Williamson 
475e4163438SReinette Chatre 	if (irq == -EINVAL) {
476e4163438SReinette Chatre 		/* Interrupt stays allocated, will be freed at MSI-X disable. */
477e4163438SReinette Chatre 		irq = vfio_msi_alloc_irq(vdev, vector, msix);
478e4163438SReinette Chatre 		if (irq < 0)
479e4163438SReinette Chatre 			return irq;
480e4163438SReinette Chatre 	}
481e4163438SReinette Chatre 
482b156e48fSReinette Chatre 	ctx = vfio_irq_ctx_alloc(vdev, vector);
483b156e48fSReinette Chatre 	if (!ctx)
484b156e48fSReinette Chatre 		return -ENOMEM;
485b156e48fSReinette Chatre 
486d977e0f7SReinette Chatre 	ctx->name = kasprintf(GFP_KERNEL_ACCOUNT, "vfio-msi%s[%d](%s)",
487d977e0f7SReinette Chatre 			      msix ? "x" : "", vector, pci_name(pdev));
488b156e48fSReinette Chatre 	if (!ctx->name) {
489b156e48fSReinette Chatre 		ret = -ENOMEM;
490b156e48fSReinette Chatre 		goto out_free_ctx;
491b156e48fSReinette Chatre 	}
49289e1f7d4SAlex Williamson 
49389e1f7d4SAlex Williamson 	trigger = eventfd_ctx_fdget(fd);
49489e1f7d4SAlex Williamson 	if (IS_ERR(trigger)) {
49588503365SReinette Chatre 		ret = PTR_ERR(trigger);
49688503365SReinette Chatre 		goto out_free_name;
49789e1f7d4SAlex Williamson 	}
49889e1f7d4SAlex Williamson 
499b8f02af0SGavin Shan 	/*
5009387cf59SReinette Chatre 	 * If the vector was previously allocated, refresh the on-device
5019387cf59SReinette Chatre 	 * message data before enabling in case it had been cleared or
5029387cf59SReinette Chatre 	 * corrupted (e.g. due to backdoor resets) since writing.
503b8f02af0SGavin Shan 	 */
504abafbc55SAlex Williamson 	cmd = vfio_pci_memory_lock_and_enable(vdev);
505b8f02af0SGavin Shan 	if (msix) {
506b8f02af0SGavin Shan 		struct msi_msg msg;
507b8f02af0SGavin Shan 
508b8f02af0SGavin Shan 		get_cached_msi_msg(irq, &msg);
50983a18912SJiang Liu 		pci_write_msi_msg(irq, &msg);
510b8f02af0SGavin Shan 	}
511b8f02af0SGavin Shan 
512d977e0f7SReinette Chatre 	ret = request_irq(irq, vfio_msihandler, 0, ctx->name, trigger);
513abafbc55SAlex Williamson 	vfio_pci_memory_unlock_and_restore(vdev, cmd);
51488503365SReinette Chatre 	if (ret)
51588503365SReinette Chatre 		goto out_put_eventfd_ctx;
51689e1f7d4SAlex Williamson 
517d977e0f7SReinette Chatre 	ctx->producer.token = trigger;
518d977e0f7SReinette Chatre 	ctx->producer.irq = irq;
519d977e0f7SReinette Chatre 	ret = irq_bypass_register_producer(&ctx->producer);
520852b1beeSAlex Williamson 	if (unlikely(ret)) {
5216d7425f1SFeng Wu 		dev_info(&pdev->dev,
5226d7425f1SFeng Wu 		"irq bypass producer (token %p) registration fails: %d\n",
523d977e0f7SReinette Chatre 		ctx->producer.token, ret);
5246d7425f1SFeng Wu 
525d977e0f7SReinette Chatre 		ctx->producer.token = NULL;
526852b1beeSAlex Williamson 	}
527d977e0f7SReinette Chatre 	ctx->trigger = trigger;
52889e1f7d4SAlex Williamson 
52989e1f7d4SAlex Williamson 	return 0;
53088503365SReinette Chatre 
53188503365SReinette Chatre out_put_eventfd_ctx:
53288503365SReinette Chatre 	eventfd_ctx_put(trigger);
53388503365SReinette Chatre out_free_name:
53488503365SReinette Chatre 	kfree(ctx->name);
535b156e48fSReinette Chatre out_free_ctx:
536b156e48fSReinette Chatre 	vfio_irq_ctx_free(vdev, ctx, vector);
53788503365SReinette Chatre 	return ret;
53889e1f7d4SAlex Williamson }
53989e1f7d4SAlex Williamson 
/*
 * Apply vfio_msi_set_vector_signal() to @count consecutive vectors
 * beginning at @start.  fds[i] is the eventfd for vector @start + i; a
 * NULL @fds removes the trigger from every vector in the range.
 *
 * On the first failure, every vector from @start up to and including
 * the one that failed has its trigger removed and the error is returned.
 * Returns 0 when all vectors were processed successfully.
 */
static int vfio_msi_set_block(struct vfio_pci_core_device *vdev, unsigned start,
			      unsigned count, int32_t *fds, bool msix)
{
	unsigned int n, vec;
	int err = 0;

	for (n = 0, vec = start; n < count && !err; n++, vec++) {
		int fd = fds ? fds[n] : -1;

		err = vfio_msi_set_vector_signal(vdev, vec, fd, msix);
	}

	if (!err)
		return 0;

	/* vec is one past the failing vector here; undo the whole range. */
	for (n = start; n < vec; n++)
		vfio_msi_set_vector_signal(vdev, n, -1, msix);

	return err;
}
55889e1f7d4SAlex Williamson 
vfio_msi_disable(struct vfio_pci_core_device * vdev,bool msix)55953647510SMax Gurtovoy static void vfio_msi_disable(struct vfio_pci_core_device *vdev, bool msix)
56089e1f7d4SAlex Williamson {
56189e1f7d4SAlex Williamson 	struct pci_dev *pdev = vdev->pdev;
562d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
563b156e48fSReinette Chatre 	unsigned long i;
564abafbc55SAlex Williamson 	u16 cmd;
56589e1f7d4SAlex Williamson 
566b156e48fSReinette Chatre 	xa_for_each(&vdev->ctx, i, ctx) {
567d977e0f7SReinette Chatre 		vfio_virqfd_disable(&ctx->unmask);
568d977e0f7SReinette Chatre 		vfio_virqfd_disable(&ctx->mask);
569a65f35cfSReinette Chatre 		vfio_msi_set_vector_signal(vdev, i, -1, msix);
57089e1f7d4SAlex Williamson 	}
57189e1f7d4SAlex Williamson 
572abafbc55SAlex Williamson 	cmd = vfio_pci_memory_lock_and_enable(vdev);
57361771468SChristoph Hellwig 	pci_free_irq_vectors(pdev);
574abafbc55SAlex Williamson 	vfio_pci_memory_unlock_and_restore(vdev, cmd);
57589e1f7d4SAlex Williamson 
576c93a97eeSAlex Williamson 	/*
577c93a97eeSAlex Williamson 	 * Both disable paths above use pci_intx_for_msi() to clear DisINTx
578c93a97eeSAlex Williamson 	 * via their shutdown paths.  Restore for NoINTx devices.
579c93a97eeSAlex Williamson 	 */
580c93a97eeSAlex Williamson 	if (vdev->nointx)
581c93a97eeSAlex Williamson 		pci_intx(pdev, 0);
582c93a97eeSAlex Williamson 
58389e1f7d4SAlex Williamson 	vdev->irq_type = VFIO_PCI_NUM_IRQS;
58489e1f7d4SAlex Williamson }
58589e1f7d4SAlex Williamson 
58689e1f7d4SAlex Williamson /*
58789e1f7d4SAlex Williamson  * IOCTL support
58889e1f7d4SAlex Williamson  */
vfio_pci_set_intx_unmask(struct vfio_pci_core_device * vdev,unsigned index,unsigned start,unsigned count,uint32_t flags,void * data)58953647510SMax Gurtovoy static int vfio_pci_set_intx_unmask(struct vfio_pci_core_device *vdev,
59089e1f7d4SAlex Williamson 				    unsigned index, unsigned start,
59189e1f7d4SAlex Williamson 				    unsigned count, uint32_t flags, void *data)
59289e1f7d4SAlex Williamson {
59389e1f7d4SAlex Williamson 	if (!is_intx(vdev) || start != 0 || count != 1)
59489e1f7d4SAlex Williamson 		return -EINVAL;
59589e1f7d4SAlex Williamson 
59689e1f7d4SAlex Williamson 	if (flags & VFIO_IRQ_SET_DATA_NONE) {
59704a4a017SAlex Williamson 		__vfio_pci_intx_unmask(vdev);
59889e1f7d4SAlex Williamson 	} else if (flags & VFIO_IRQ_SET_DATA_BOOL) {
59989e1f7d4SAlex Williamson 		uint8_t unmask = *(uint8_t *)data;
60089e1f7d4SAlex Williamson 		if (unmask)
60104a4a017SAlex Williamson 			__vfio_pci_intx_unmask(vdev);
60289e1f7d4SAlex Williamson 	} else if (flags & VFIO_IRQ_SET_DATA_EVENTFD) {
603d977e0f7SReinette Chatre 		struct vfio_pci_irq_ctx *ctx = vfio_irq_ctx_get(vdev, 0);
60489e1f7d4SAlex Williamson 		int32_t fd = *(int32_t *)data;
605d977e0f7SReinette Chatre 
606d977e0f7SReinette Chatre 		if (WARN_ON_ONCE(!ctx))
607d977e0f7SReinette Chatre 			return -EINVAL;
60889e1f7d4SAlex Williamson 		if (fd >= 0)
60909bbcb88SAntonios Motakis 			return vfio_virqfd_enable((void *) vdev,
610bdc5e102SAntonios Motakis 						  vfio_pci_intx_unmask_handler,
61189e1f7d4SAlex Williamson 						  vfio_send_intx_eventfd, NULL,
612d977e0f7SReinette Chatre 						  &ctx->unmask, fd);
61389e1f7d4SAlex Williamson 
614d977e0f7SReinette Chatre 		vfio_virqfd_disable(&ctx->unmask);
61589e1f7d4SAlex Williamson 	}
61689e1f7d4SAlex Williamson 
61789e1f7d4SAlex Williamson 	return 0;
61889e1f7d4SAlex Williamson }
61989e1f7d4SAlex Williamson 
vfio_pci_set_intx_mask(struct vfio_pci_core_device * vdev,unsigned index,unsigned start,unsigned count,uint32_t flags,void * data)62053647510SMax Gurtovoy static int vfio_pci_set_intx_mask(struct vfio_pci_core_device *vdev,
62189e1f7d4SAlex Williamson 				  unsigned index, unsigned start,
62289e1f7d4SAlex Williamson 				  unsigned count, uint32_t flags, void *data)
62389e1f7d4SAlex Williamson {
62489e1f7d4SAlex Williamson 	if (!is_intx(vdev) || start != 0 || count != 1)
62589e1f7d4SAlex Williamson 		return -EINVAL;
62689e1f7d4SAlex Williamson 
62789e1f7d4SAlex Williamson 	if (flags & VFIO_IRQ_SET_DATA_NONE) {
62804a4a017SAlex Williamson 		__vfio_pci_intx_mask(vdev);
62989e1f7d4SAlex Williamson 	} else if (flags & VFIO_IRQ_SET_DATA_BOOL) {
63089e1f7d4SAlex Williamson 		uint8_t mask = *(uint8_t *)data;
63189e1f7d4SAlex Williamson 		if (mask)
63204a4a017SAlex Williamson 			__vfio_pci_intx_mask(vdev);
63389e1f7d4SAlex Williamson 	} else if (flags & VFIO_IRQ_SET_DATA_EVENTFD) {
63489e1f7d4SAlex Williamson 		return -ENOTTY; /* XXX implement me */
63589e1f7d4SAlex Williamson 	}
63689e1f7d4SAlex Williamson 
63789e1f7d4SAlex Williamson 	return 0;
63889e1f7d4SAlex Williamson }
63989e1f7d4SAlex Williamson 
vfio_pci_set_intx_trigger(struct vfio_pci_core_device * vdev,unsigned index,unsigned start,unsigned count,uint32_t flags,void * data)64053647510SMax Gurtovoy static int vfio_pci_set_intx_trigger(struct vfio_pci_core_device *vdev,
64189e1f7d4SAlex Williamson 				     unsigned index, unsigned start,
64289e1f7d4SAlex Williamson 				     unsigned count, uint32_t flags, void *data)
64389e1f7d4SAlex Williamson {
64489e1f7d4SAlex Williamson 	if (is_intx(vdev) && !count && (flags & VFIO_IRQ_SET_DATA_NONE)) {
64589e1f7d4SAlex Williamson 		vfio_intx_disable(vdev);
64689e1f7d4SAlex Williamson 		return 0;
64789e1f7d4SAlex Williamson 	}
64889e1f7d4SAlex Williamson 
64989e1f7d4SAlex Williamson 	if (!(is_intx(vdev) || is_irq_none(vdev)) || start != 0 || count != 1)
65089e1f7d4SAlex Williamson 		return -EINVAL;
65189e1f7d4SAlex Williamson 
65289e1f7d4SAlex Williamson 	if (flags & VFIO_IRQ_SET_DATA_EVENTFD) {
65369276a55SAlex Williamson 		struct eventfd_ctx *trigger = NULL;
65489e1f7d4SAlex Williamson 		int32_t fd = *(int32_t *)data;
65589e1f7d4SAlex Williamson 		int ret;
65689e1f7d4SAlex Williamson 
65769276a55SAlex Williamson 		if (fd >= 0) {
65869276a55SAlex Williamson 			trigger = eventfd_ctx_fdget(fd);
65969276a55SAlex Williamson 			if (IS_ERR(trigger))
66069276a55SAlex Williamson 				return PTR_ERR(trigger);
66169276a55SAlex Williamson 		}
66269276a55SAlex Williamson 
66389e1f7d4SAlex Williamson 		if (is_intx(vdev))
66469276a55SAlex Williamson 			ret = vfio_intx_set_signal(vdev, trigger);
66569276a55SAlex Williamson 		else
66669276a55SAlex Williamson 			ret = vfio_intx_enable(vdev, trigger);
66789e1f7d4SAlex Williamson 
66869276a55SAlex Williamson 		if (ret && trigger)
66969276a55SAlex Williamson 			eventfd_ctx_put(trigger);
67089e1f7d4SAlex Williamson 
67189e1f7d4SAlex Williamson 		return ret;
67289e1f7d4SAlex Williamson 	}
67389e1f7d4SAlex Williamson 
67489e1f7d4SAlex Williamson 	if (!is_intx(vdev))
67589e1f7d4SAlex Williamson 		return -EINVAL;
67689e1f7d4SAlex Williamson 
67789e1f7d4SAlex Williamson 	if (flags & VFIO_IRQ_SET_DATA_NONE) {
67889e1f7d4SAlex Williamson 		vfio_send_intx_eventfd(vdev, NULL);
67989e1f7d4SAlex Williamson 	} else if (flags & VFIO_IRQ_SET_DATA_BOOL) {
68089e1f7d4SAlex Williamson 		uint8_t trigger = *(uint8_t *)data;
68189e1f7d4SAlex Williamson 		if (trigger)
68289e1f7d4SAlex Williamson 			vfio_send_intx_eventfd(vdev, NULL);
68389e1f7d4SAlex Williamson 	}
68489e1f7d4SAlex Williamson 	return 0;
68589e1f7d4SAlex Williamson }
68689e1f7d4SAlex Williamson 
vfio_pci_set_msi_trigger(struct vfio_pci_core_device * vdev,unsigned index,unsigned start,unsigned count,uint32_t flags,void * data)68753647510SMax Gurtovoy static int vfio_pci_set_msi_trigger(struct vfio_pci_core_device *vdev,
68889e1f7d4SAlex Williamson 				    unsigned index, unsigned start,
68989e1f7d4SAlex Williamson 				    unsigned count, uint32_t flags, void *data)
69089e1f7d4SAlex Williamson {
691d977e0f7SReinette Chatre 	struct vfio_pci_irq_ctx *ctx;
6926578ed85SReinette Chatre 	unsigned int i;
69389e1f7d4SAlex Williamson 	bool msix = (index == VFIO_PCI_MSIX_IRQ_INDEX) ? true : false;
69489e1f7d4SAlex Williamson 
69589e1f7d4SAlex Williamson 	if (irq_is(vdev, index) && !count && (flags & VFIO_IRQ_SET_DATA_NONE)) {
69689e1f7d4SAlex Williamson 		vfio_msi_disable(vdev, msix);
69789e1f7d4SAlex Williamson 		return 0;
69889e1f7d4SAlex Williamson 	}
69989e1f7d4SAlex Williamson 
70089e1f7d4SAlex Williamson 	if (!(irq_is(vdev, index) || is_irq_none(vdev)))
70189e1f7d4SAlex Williamson 		return -EINVAL;
70289e1f7d4SAlex Williamson 
70389e1f7d4SAlex Williamson 	if (flags & VFIO_IRQ_SET_DATA_EVENTFD) {
70489e1f7d4SAlex Williamson 		int32_t *fds = data;
70589e1f7d4SAlex Williamson 		int ret;
70689e1f7d4SAlex Williamson 
70789e1f7d4SAlex Williamson 		if (vdev->irq_type == index)
70889e1f7d4SAlex Williamson 			return vfio_msi_set_block(vdev, start, count,
70989e1f7d4SAlex Williamson 						  fds, msix);
71089e1f7d4SAlex Williamson 
71189e1f7d4SAlex Williamson 		ret = vfio_msi_enable(vdev, start + count, msix);
71289e1f7d4SAlex Williamson 		if (ret)
71389e1f7d4SAlex Williamson 			return ret;
71489e1f7d4SAlex Williamson 
71589e1f7d4SAlex Williamson 		ret = vfio_msi_set_block(vdev, start, count, fds, msix);
71689e1f7d4SAlex Williamson 		if (ret)
71789e1f7d4SAlex Williamson 			vfio_msi_disable(vdev, msix);
71889e1f7d4SAlex Williamson 
71989e1f7d4SAlex Williamson 		return ret;
72089e1f7d4SAlex Williamson 	}
72189e1f7d4SAlex Williamson 
72263972f63SReinette Chatre 	if (!irq_is(vdev, index))
72389e1f7d4SAlex Williamson 		return -EINVAL;
72489e1f7d4SAlex Williamson 
72589e1f7d4SAlex Williamson 	for (i = start; i < start + count; i++) {
726d977e0f7SReinette Chatre 		ctx = vfio_irq_ctx_get(vdev, i);
727b156e48fSReinette Chatre 		if (!ctx)
72889e1f7d4SAlex Williamson 			continue;
72989e1f7d4SAlex Williamson 		if (flags & VFIO_IRQ_SET_DATA_NONE) {
730d977e0f7SReinette Chatre 			eventfd_signal(ctx->trigger, 1);
73189e1f7d4SAlex Williamson 		} else if (flags & VFIO_IRQ_SET_DATA_BOOL) {
73289e1f7d4SAlex Williamson 			uint8_t *bools = data;
73389e1f7d4SAlex Williamson 			if (bools[i - start])
734d977e0f7SReinette Chatre 				eventfd_signal(ctx->trigger, 1);
73589e1f7d4SAlex Williamson 		}
73689e1f7d4SAlex Williamson 	}
73789e1f7d4SAlex Williamson 	return 0;
73889e1f7d4SAlex Williamson }
73989e1f7d4SAlex Williamson 
vfio_pci_set_ctx_trigger_single(struct eventfd_ctx ** ctx,unsigned int count,uint32_t flags,void * data)740cac80d6eSAlex Williamson static int vfio_pci_set_ctx_trigger_single(struct eventfd_ctx **ctx,
741c8952a70SAlex Williamson 					   unsigned int count, uint32_t flags,
742c8952a70SAlex Williamson 					   void *data)
743dad9f897SVijay Mohan Pandarathil {
744dad9f897SVijay Mohan Pandarathil 	/* DATA_NONE/DATA_BOOL enables loopback testing */
745dad9f897SVijay Mohan Pandarathil 	if (flags & VFIO_IRQ_SET_DATA_NONE) {
746c8952a70SAlex Williamson 		if (*ctx) {
747c8952a70SAlex Williamson 			if (count) {
748cac80d6eSAlex Williamson 				eventfd_signal(*ctx, 1);
749c8952a70SAlex Williamson 			} else {
750c8952a70SAlex Williamson 				eventfd_ctx_put(*ctx);
751c8952a70SAlex Williamson 				*ctx = NULL;
752c8952a70SAlex Williamson 			}
753dad9f897SVijay Mohan Pandarathil 			return 0;
754dad9f897SVijay Mohan Pandarathil 		}
755c8952a70SAlex Williamson 	} else if (flags & VFIO_IRQ_SET_DATA_BOOL) {
756c8952a70SAlex Williamson 		uint8_t trigger;
757dad9f897SVijay Mohan Pandarathil 
758c8952a70SAlex Williamson 		if (!count)
759c8952a70SAlex Williamson 			return -EINVAL;
760c8952a70SAlex Williamson 
761c8952a70SAlex Williamson 		trigger = *(uint8_t *)data;
762c8952a70SAlex Williamson 		if (trigger && *ctx)
763c8952a70SAlex Williamson 			eventfd_signal(*ctx, 1);
764c8952a70SAlex Williamson 
765c8952a70SAlex Williamson 		return 0;
766c8952a70SAlex Williamson 	} else if (flags & VFIO_IRQ_SET_DATA_EVENTFD) {
767c8952a70SAlex Williamson 		int32_t fd;
768c8952a70SAlex Williamson 
769c8952a70SAlex Williamson 		if (!count)
770c8952a70SAlex Williamson 			return -EINVAL;
771c8952a70SAlex Williamson 
772c8952a70SAlex Williamson 		fd = *(int32_t *)data;
773dad9f897SVijay Mohan Pandarathil 		if (fd == -1) {
774cac80d6eSAlex Williamson 			if (*ctx)
775cac80d6eSAlex Williamson 				eventfd_ctx_put(*ctx);
776cac80d6eSAlex Williamson 			*ctx = NULL;
777dad9f897SVijay Mohan Pandarathil 		} else if (fd >= 0) {
778dad9f897SVijay Mohan Pandarathil 			struct eventfd_ctx *efdctx;
779c8952a70SAlex Williamson 
780dad9f897SVijay Mohan Pandarathil 			efdctx = eventfd_ctx_fdget(fd);
781dad9f897SVijay Mohan Pandarathil 			if (IS_ERR(efdctx))
782dad9f897SVijay Mohan Pandarathil 				return PTR_ERR(efdctx);
783c8952a70SAlex Williamson 
784cac80d6eSAlex Williamson 			if (*ctx)
785cac80d6eSAlex Williamson 				eventfd_ctx_put(*ctx);
786c8952a70SAlex Williamson 
787cac80d6eSAlex Williamson 			*ctx = efdctx;
788c8952a70SAlex Williamson 		}
789dad9f897SVijay Mohan Pandarathil 		return 0;
790c8952a70SAlex Williamson 	}
791c8952a70SAlex Williamson 
792dad9f897SVijay Mohan Pandarathil 	return -EINVAL;
793dad9f897SVijay Mohan Pandarathil }
794cac80d6eSAlex Williamson 
vfio_pci_set_err_trigger(struct vfio_pci_core_device * vdev,unsigned index,unsigned start,unsigned count,uint32_t flags,void * data)79553647510SMax Gurtovoy static int vfio_pci_set_err_trigger(struct vfio_pci_core_device *vdev,
796cac80d6eSAlex Williamson 				    unsigned index, unsigned start,
797cac80d6eSAlex Williamson 				    unsigned count, uint32_t flags, void *data)
798cac80d6eSAlex Williamson {
799c8952a70SAlex Williamson 	if (index != VFIO_PCI_ERR_IRQ_INDEX || start != 0 || count > 1)
800cac80d6eSAlex Williamson 		return -EINVAL;
801cac80d6eSAlex Williamson 
802c8952a70SAlex Williamson 	return vfio_pci_set_ctx_trigger_single(&vdev->err_trigger,
803c8952a70SAlex Williamson 					       count, flags, data);
804cac80d6eSAlex Williamson }
805cac80d6eSAlex Williamson 
vfio_pci_set_req_trigger(struct vfio_pci_core_device * vdev,unsigned index,unsigned start,unsigned count,uint32_t flags,void * data)80653647510SMax Gurtovoy static int vfio_pci_set_req_trigger(struct vfio_pci_core_device *vdev,
8076140a8f5SAlex Williamson 				    unsigned index, unsigned start,
8086140a8f5SAlex Williamson 				    unsigned count, uint32_t flags, void *data)
8096140a8f5SAlex Williamson {
810c8952a70SAlex Williamson 	if (index != VFIO_PCI_REQ_IRQ_INDEX || start != 0 || count > 1)
8116140a8f5SAlex Williamson 		return -EINVAL;
8126140a8f5SAlex Williamson 
813c8952a70SAlex Williamson 	return vfio_pci_set_ctx_trigger_single(&vdev->req_trigger,
814c8952a70SAlex Williamson 					       count, flags, data);
8156140a8f5SAlex Williamson }
8166140a8f5SAlex Williamson 
vfio_pci_set_irqs_ioctl(struct vfio_pci_core_device * vdev,uint32_t flags,unsigned index,unsigned start,unsigned count,void * data)81753647510SMax Gurtovoy int vfio_pci_set_irqs_ioctl(struct vfio_pci_core_device *vdev, uint32_t flags,
81889e1f7d4SAlex Williamson 			    unsigned index, unsigned start, unsigned count,
81989e1f7d4SAlex Williamson 			    void *data)
82089e1f7d4SAlex Williamson {
82153647510SMax Gurtovoy 	int (*func)(struct vfio_pci_core_device *vdev, unsigned index,
82289e1f7d4SAlex Williamson 		    unsigned start, unsigned count, uint32_t flags,
82389e1f7d4SAlex Williamson 		    void *data) = NULL;
82489e1f7d4SAlex Williamson 
82589e1f7d4SAlex Williamson 	switch (index) {
82689e1f7d4SAlex Williamson 	case VFIO_PCI_INTX_IRQ_INDEX:
82789e1f7d4SAlex Williamson 		switch (flags & VFIO_IRQ_SET_ACTION_TYPE_MASK) {
82889e1f7d4SAlex Williamson 		case VFIO_IRQ_SET_ACTION_MASK:
82989e1f7d4SAlex Williamson 			func = vfio_pci_set_intx_mask;
83089e1f7d4SAlex Williamson 			break;
83189e1f7d4SAlex Williamson 		case VFIO_IRQ_SET_ACTION_UNMASK:
83289e1f7d4SAlex Williamson 			func = vfio_pci_set_intx_unmask;
83389e1f7d4SAlex Williamson 			break;
83489e1f7d4SAlex Williamson 		case VFIO_IRQ_SET_ACTION_TRIGGER:
83589e1f7d4SAlex Williamson 			func = vfio_pci_set_intx_trigger;
83689e1f7d4SAlex Williamson 			break;
83789e1f7d4SAlex Williamson 		}
83889e1f7d4SAlex Williamson 		break;
83989e1f7d4SAlex Williamson 	case VFIO_PCI_MSI_IRQ_INDEX:
84089e1f7d4SAlex Williamson 	case VFIO_PCI_MSIX_IRQ_INDEX:
84189e1f7d4SAlex Williamson 		switch (flags & VFIO_IRQ_SET_ACTION_TYPE_MASK) {
84289e1f7d4SAlex Williamson 		case VFIO_IRQ_SET_ACTION_MASK:
84389e1f7d4SAlex Williamson 		case VFIO_IRQ_SET_ACTION_UNMASK:
84489e1f7d4SAlex Williamson 			/* XXX Need masking support exported */
84589e1f7d4SAlex Williamson 			break;
84689e1f7d4SAlex Williamson 		case VFIO_IRQ_SET_ACTION_TRIGGER:
84789e1f7d4SAlex Williamson 			func = vfio_pci_set_msi_trigger;
84889e1f7d4SAlex Williamson 			break;
84989e1f7d4SAlex Williamson 		}
85089e1f7d4SAlex Williamson 		break;
851dad9f897SVijay Mohan Pandarathil 	case VFIO_PCI_ERR_IRQ_INDEX:
852dad9f897SVijay Mohan Pandarathil 		switch (flags & VFIO_IRQ_SET_ACTION_TYPE_MASK) {
853dad9f897SVijay Mohan Pandarathil 		case VFIO_IRQ_SET_ACTION_TRIGGER:
854dad9f897SVijay Mohan Pandarathil 			if (pci_is_pcie(vdev->pdev))
855dad9f897SVijay Mohan Pandarathil 				func = vfio_pci_set_err_trigger;
856dad9f897SVijay Mohan Pandarathil 			break;
857dad9f897SVijay Mohan Pandarathil 		}
858ec76f400SAlexey Kardashevskiy 		break;
8596140a8f5SAlex Williamson 	case VFIO_PCI_REQ_IRQ_INDEX:
8606140a8f5SAlex Williamson 		switch (flags & VFIO_IRQ_SET_ACTION_TYPE_MASK) {
8616140a8f5SAlex Williamson 		case VFIO_IRQ_SET_ACTION_TRIGGER:
8626140a8f5SAlex Williamson 			func = vfio_pci_set_req_trigger;
8636140a8f5SAlex Williamson 			break;
8646140a8f5SAlex Williamson 		}
865ec76f400SAlexey Kardashevskiy 		break;
86689e1f7d4SAlex Williamson 	}
86789e1f7d4SAlex Williamson 
86889e1f7d4SAlex Williamson 	if (!func)
86989e1f7d4SAlex Williamson 		return -ENOTTY;
87089e1f7d4SAlex Williamson 
87189e1f7d4SAlex Williamson 	return func(vdev, index, start, count, flags, data);
87289e1f7d4SAlex Williamson }
873