1*351e1581SHaiyang Zhang // SPDX-License-Identifier: GPL-2.0-only 2*351e1581SHaiyang Zhang /* Copyright (c) 2019, Microsoft Corporation. 3*351e1581SHaiyang Zhang * 4*351e1581SHaiyang Zhang * Author: 5*351e1581SHaiyang Zhang * Haiyang Zhang <haiyangz@microsoft.com> 6*351e1581SHaiyang Zhang */ 7*351e1581SHaiyang Zhang 8*351e1581SHaiyang Zhang #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 9*351e1581SHaiyang Zhang 10*351e1581SHaiyang Zhang #include <linux/netdevice.h> 11*351e1581SHaiyang Zhang #include <linux/etherdevice.h> 12*351e1581SHaiyang Zhang #include <linux/ethtool.h> 13*351e1581SHaiyang Zhang #include <linux/bpf.h> 14*351e1581SHaiyang Zhang #include <linux/bpf_trace.h> 15*351e1581SHaiyang Zhang #include <linux/kernel.h> 16*351e1581SHaiyang Zhang #include <net/xdp.h> 17*351e1581SHaiyang Zhang 18*351e1581SHaiyang Zhang #include <linux/mutex.h> 19*351e1581SHaiyang Zhang #include <linux/rtnetlink.h> 20*351e1581SHaiyang Zhang 21*351e1581SHaiyang Zhang #include "hyperv_net.h" 22*351e1581SHaiyang Zhang 23*351e1581SHaiyang Zhang u32 netvsc_run_xdp(struct net_device *ndev, struct netvsc_channel *nvchan, 24*351e1581SHaiyang Zhang struct xdp_buff *xdp) 25*351e1581SHaiyang Zhang { 26*351e1581SHaiyang Zhang void *data = nvchan->rsc.data[0]; 27*351e1581SHaiyang Zhang u32 len = nvchan->rsc.len[0]; 28*351e1581SHaiyang Zhang struct page *page = NULL; 29*351e1581SHaiyang Zhang struct bpf_prog *prog; 30*351e1581SHaiyang Zhang u32 act = XDP_PASS; 31*351e1581SHaiyang Zhang 32*351e1581SHaiyang Zhang xdp->data_hard_start = NULL; 33*351e1581SHaiyang Zhang 34*351e1581SHaiyang Zhang rcu_read_lock(); 35*351e1581SHaiyang Zhang prog = rcu_dereference(nvchan->bpf_prog); 36*351e1581SHaiyang Zhang 37*351e1581SHaiyang Zhang if (!prog) 38*351e1581SHaiyang Zhang goto out; 39*351e1581SHaiyang Zhang 40*351e1581SHaiyang Zhang /* allocate page buffer for data */ 41*351e1581SHaiyang Zhang page = alloc_page(GFP_ATOMIC); 42*351e1581SHaiyang Zhang if (!page) { 43*351e1581SHaiyang Zhang act = XDP_DROP; 44*351e1581SHaiyang Zhang goto out; 45*351e1581SHaiyang Zhang } 46*351e1581SHaiyang Zhang 47*351e1581SHaiyang Zhang xdp->data_hard_start = page_address(page); 48*351e1581SHaiyang Zhang xdp->data = xdp->data_hard_start + NETVSC_XDP_HDRM; 49*351e1581SHaiyang Zhang xdp_set_data_meta_invalid(xdp); 50*351e1581SHaiyang Zhang xdp->data_end = xdp->data + len; 51*351e1581SHaiyang Zhang xdp->rxq = &nvchan->xdp_rxq; 52*351e1581SHaiyang Zhang xdp->handle = 0; 53*351e1581SHaiyang Zhang 54*351e1581SHaiyang Zhang memcpy(xdp->data, data, len); 55*351e1581SHaiyang Zhang 56*351e1581SHaiyang Zhang act = bpf_prog_run_xdp(prog, xdp); 57*351e1581SHaiyang Zhang 58*351e1581SHaiyang Zhang switch (act) { 59*351e1581SHaiyang Zhang case XDP_PASS: 60*351e1581SHaiyang Zhang case XDP_TX: 61*351e1581SHaiyang Zhang case XDP_DROP: 62*351e1581SHaiyang Zhang break; 63*351e1581SHaiyang Zhang 64*351e1581SHaiyang Zhang case XDP_ABORTED: 65*351e1581SHaiyang Zhang trace_xdp_exception(ndev, prog, act); 66*351e1581SHaiyang Zhang break; 67*351e1581SHaiyang Zhang 68*351e1581SHaiyang Zhang default: 69*351e1581SHaiyang Zhang bpf_warn_invalid_xdp_action(act); 70*351e1581SHaiyang Zhang } 71*351e1581SHaiyang Zhang 72*351e1581SHaiyang Zhang out: 73*351e1581SHaiyang Zhang rcu_read_unlock(); 74*351e1581SHaiyang Zhang 75*351e1581SHaiyang Zhang if (page && act != XDP_PASS && act != XDP_TX) { 76*351e1581SHaiyang Zhang __free_page(page); 77*351e1581SHaiyang Zhang xdp->data_hard_start = NULL; 78*351e1581SHaiyang Zhang } 79*351e1581SHaiyang Zhang 80*351e1581SHaiyang Zhang return act; 81*351e1581SHaiyang Zhang } 82*351e1581SHaiyang Zhang 83*351e1581SHaiyang Zhang unsigned int netvsc_xdp_fraglen(unsigned int len) 84*351e1581SHaiyang Zhang { 85*351e1581SHaiyang Zhang return SKB_DATA_ALIGN(len) + 86*351e1581SHaiyang Zhang SKB_DATA_ALIGN(sizeof(struct skb_shared_info)); 87*351e1581SHaiyang Zhang } 88*351e1581SHaiyang Zhang 89*351e1581SHaiyang Zhang struct bpf_prog *netvsc_xdp_get(struct netvsc_device *nvdev) 90*351e1581SHaiyang Zhang { 91*351e1581SHaiyang Zhang return rtnl_dereference(nvdev->chan_table[0].bpf_prog); 92*351e1581SHaiyang Zhang } 93*351e1581SHaiyang Zhang 94*351e1581SHaiyang Zhang int netvsc_xdp_set(struct net_device *dev, struct bpf_prog *prog, 95*351e1581SHaiyang Zhang struct netlink_ext_ack *extack, 96*351e1581SHaiyang Zhang struct netvsc_device *nvdev) 97*351e1581SHaiyang Zhang { 98*351e1581SHaiyang Zhang struct bpf_prog *old_prog; 99*351e1581SHaiyang Zhang int buf_max, i; 100*351e1581SHaiyang Zhang 101*351e1581SHaiyang Zhang old_prog = netvsc_xdp_get(nvdev); 102*351e1581SHaiyang Zhang 103*351e1581SHaiyang Zhang if (!old_prog && !prog) 104*351e1581SHaiyang Zhang return 0; 105*351e1581SHaiyang Zhang 106*351e1581SHaiyang Zhang buf_max = NETVSC_XDP_HDRM + netvsc_xdp_fraglen(dev->mtu + ETH_HLEN); 107*351e1581SHaiyang Zhang if (prog && buf_max > PAGE_SIZE) { 108*351e1581SHaiyang Zhang netdev_err(dev, "XDP: mtu:%u too large, buf_max:%u\n", 109*351e1581SHaiyang Zhang dev->mtu, buf_max); 110*351e1581SHaiyang Zhang NL_SET_ERR_MSG_MOD(extack, "XDP: mtu too large"); 111*351e1581SHaiyang Zhang 112*351e1581SHaiyang Zhang return -EOPNOTSUPP; 113*351e1581SHaiyang Zhang } 114*351e1581SHaiyang Zhang 115*351e1581SHaiyang Zhang if (prog && (dev->features & NETIF_F_LRO)) { 116*351e1581SHaiyang Zhang netdev_err(dev, "XDP: not support LRO\n"); 117*351e1581SHaiyang Zhang NL_SET_ERR_MSG_MOD(extack, "XDP: not support LRO"); 118*351e1581SHaiyang Zhang 119*351e1581SHaiyang Zhang return -EOPNOTSUPP; 120*351e1581SHaiyang Zhang } 121*351e1581SHaiyang Zhang 122*351e1581SHaiyang Zhang if (prog) 123*351e1581SHaiyang Zhang bpf_prog_add(prog, nvdev->num_chn); 124*351e1581SHaiyang Zhang 125*351e1581SHaiyang Zhang for (i = 0; i < nvdev->num_chn; i++) 126*351e1581SHaiyang Zhang rcu_assign_pointer(nvdev->chan_table[i].bpf_prog, prog); 127*351e1581SHaiyang Zhang 128*351e1581SHaiyang Zhang if (old_prog) 129*351e1581SHaiyang Zhang for (i = 0; i < nvdev->num_chn; i++) 130*351e1581SHaiyang Zhang bpf_prog_put(old_prog); 131*351e1581SHaiyang Zhang 132*351e1581SHaiyang Zhang return 0; 133*351e1581SHaiyang Zhang } 134*351e1581SHaiyang Zhang 135*351e1581SHaiyang Zhang int netvsc_vf_setxdp(struct net_device *vf_netdev, struct bpf_prog *prog) 136*351e1581SHaiyang Zhang { 137*351e1581SHaiyang Zhang struct netdev_bpf xdp; 138*351e1581SHaiyang Zhang bpf_op_t ndo_bpf; 139*351e1581SHaiyang Zhang 140*351e1581SHaiyang Zhang ASSERT_RTNL(); 141*351e1581SHaiyang Zhang 142*351e1581SHaiyang Zhang if (!vf_netdev) 143*351e1581SHaiyang Zhang return 0; 144*351e1581SHaiyang Zhang 145*351e1581SHaiyang Zhang ndo_bpf = vf_netdev->netdev_ops->ndo_bpf; 146*351e1581SHaiyang Zhang if (!ndo_bpf) 147*351e1581SHaiyang Zhang return 0; 148*351e1581SHaiyang Zhang 149*351e1581SHaiyang Zhang memset(&xdp, 0, sizeof(xdp)); 150*351e1581SHaiyang Zhang 151*351e1581SHaiyang Zhang xdp.command = XDP_SETUP_PROG; 152*351e1581SHaiyang Zhang xdp.prog = prog; 153*351e1581SHaiyang Zhang 154*351e1581SHaiyang Zhang return ndo_bpf(vf_netdev, &xdp); 155*351e1581SHaiyang Zhang } 156*351e1581SHaiyang Zhang 157*351e1581SHaiyang Zhang static u32 netvsc_xdp_query(struct netvsc_device *nvdev) 158*351e1581SHaiyang Zhang { 159*351e1581SHaiyang Zhang struct bpf_prog *prog = netvsc_xdp_get(nvdev); 160*351e1581SHaiyang Zhang 161*351e1581SHaiyang Zhang if (prog) 162*351e1581SHaiyang Zhang return prog->aux->id; 163*351e1581SHaiyang Zhang 164*351e1581SHaiyang Zhang return 0; 165*351e1581SHaiyang Zhang } 166*351e1581SHaiyang Zhang 167*351e1581SHaiyang Zhang int netvsc_bpf(struct net_device *dev, struct netdev_bpf *bpf) 168*351e1581SHaiyang Zhang { 169*351e1581SHaiyang Zhang struct net_device_context *ndevctx = netdev_priv(dev); 170*351e1581SHaiyang Zhang struct netvsc_device *nvdev = rtnl_dereference(ndevctx->nvdev); 171*351e1581SHaiyang Zhang struct net_device *vf_netdev = rtnl_dereference(ndevctx->vf_netdev); 172*351e1581SHaiyang Zhang struct netlink_ext_ack *extack = bpf->extack; 173*351e1581SHaiyang Zhang int ret; 174*351e1581SHaiyang Zhang 175*351e1581SHaiyang Zhang if (!nvdev || nvdev->destroy) { 176*351e1581SHaiyang Zhang if (bpf->command == XDP_QUERY_PROG) { 177*351e1581SHaiyang Zhang bpf->prog_id = 0; 178*351e1581SHaiyang Zhang return 0; /* Query must always succeed */ 179*351e1581SHaiyang Zhang } else { 180*351e1581SHaiyang Zhang return -ENODEV; 181*351e1581SHaiyang Zhang } 182*351e1581SHaiyang Zhang } 183*351e1581SHaiyang Zhang 184*351e1581SHaiyang Zhang switch (bpf->command) { 185*351e1581SHaiyang Zhang case XDP_SETUP_PROG: 186*351e1581SHaiyang Zhang ret = netvsc_xdp_set(dev, bpf->prog, extack, nvdev); 187*351e1581SHaiyang Zhang 188*351e1581SHaiyang Zhang if (ret) 189*351e1581SHaiyang Zhang return ret; 190*351e1581SHaiyang Zhang 191*351e1581SHaiyang Zhang ret = netvsc_vf_setxdp(vf_netdev, bpf->prog); 192*351e1581SHaiyang Zhang 193*351e1581SHaiyang Zhang if (ret) { 194*351e1581SHaiyang Zhang netdev_err(dev, "vf_setxdp failed:%d\n", ret); 195*351e1581SHaiyang Zhang NL_SET_ERR_MSG_MOD(extack, "vf_setxdp failed"); 196*351e1581SHaiyang Zhang 197*351e1581SHaiyang Zhang netvsc_xdp_set(dev, NULL, extack, nvdev); 198*351e1581SHaiyang Zhang } 199*351e1581SHaiyang Zhang 200*351e1581SHaiyang Zhang return ret; 201*351e1581SHaiyang Zhang 202*351e1581SHaiyang Zhang case XDP_QUERY_PROG: 203*351e1581SHaiyang Zhang bpf->prog_id = netvsc_xdp_query(nvdev); 204*351e1581SHaiyang Zhang return 0; 205*351e1581SHaiyang Zhang 206*351e1581SHaiyang Zhang default: 207*351e1581SHaiyang Zhang return -EINVAL; 208*351e1581SHaiyang Zhang } 209*351e1581SHaiyang Zhang } 210