xref: /openbmc/linux/drivers/net/hyperv/netvsc.c (revision a56fe611)
// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (c) 2009, Microsoft Corporation.
 *
 * Authors:
 *   Haiyang Zhang <haiyangz@microsoft.com>
 *   Hank Janssen  <hjanssen@microsoft.com>
 */
995fa0405SHaiyang Zhang #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
1095fa0405SHaiyang Zhang 
1195fa0405SHaiyang Zhang #include <linux/kernel.h>
1295fa0405SHaiyang Zhang #include <linux/sched.h>
1395fa0405SHaiyang Zhang #include <linux/wait.h>
1495fa0405SHaiyang Zhang #include <linux/mm.h>
1595fa0405SHaiyang Zhang #include <linux/delay.h>
1695fa0405SHaiyang Zhang #include <linux/io.h>
1795fa0405SHaiyang Zhang #include <linux/slab.h>
1895fa0405SHaiyang Zhang #include <linux/netdevice.h>
19f157e78dSHaiyang Zhang #include <linux/if_ether.h>
20d6472302SStephen Rothwell #include <linux/vmalloc.h>
219749fed5Sstephen hemminger #include <linux/rtnetlink.h>
2243bf99ceSstephen hemminger #include <linux/prefetch.h>
231cb9d3b6SHaiyang Zhang #include <linux/filter.h>
249749fed5Sstephen hemminger 
25c25aaf81SKY Srinivasan #include <asm/sync_bitops.h>
2696854bbdSAndrea Parri (Microsoft) #include <asm/mshyperv.h>
2795fa0405SHaiyang Zhang 
2895fa0405SHaiyang Zhang #include "hyperv_net.h"
29ec966381SStephen Hemminger #include "netvsc_trace.h"
3095fa0405SHaiyang Zhang 
3184bf9cefSKY Srinivasan /*
3284bf9cefSKY Srinivasan  * Switch the data path from the synthetic interface to the VF
3384bf9cefSKY Srinivasan  * interface.
3484bf9cefSKY Srinivasan  */
netvsc_switch_datapath(struct net_device * ndev,bool vf)35d0922bf7SHaiyang Zhang int netvsc_switch_datapath(struct net_device *ndev, bool vf)
3684bf9cefSKY Srinivasan {
373d541ac5SVitaly Kuznetsov 	struct net_device_context *net_device_ctx = netdev_priv(ndev);
383d541ac5SVitaly Kuznetsov 	struct hv_device *dev = net_device_ctx->device_ctx;
3979e8cbe7Sstephen hemminger 	struct netvsc_device *nv_dev = rtnl_dereference(net_device_ctx->nvdev);
400a1275caSVitaly Kuznetsov 	struct nvsp_message *init_pkt = &nv_dev->channel_init_pkt;
41d0922bf7SHaiyang Zhang 	int ret, retry = 0;
4284bf9cefSKY Srinivasan 
438b31f8c9SLong Li 	/* Block sending traffic to VF if it's about to be gone */
448b31f8c9SLong Li 	if (!vf)
458b31f8c9SLong Li 		net_device_ctx->data_path_is_vf = vf;
468b31f8c9SLong Li 
4784bf9cefSKY Srinivasan 	memset(init_pkt, 0, sizeof(struct nvsp_message));
4884bf9cefSKY Srinivasan 	init_pkt->hdr.msg_type = NVSP_MSG4_TYPE_SWITCH_DATA_PATH;
4984bf9cefSKY Srinivasan 	if (vf)
5084bf9cefSKY Srinivasan 		init_pkt->msg.v4_msg.active_dp.active_datapath =
5184bf9cefSKY Srinivasan 			NVSP_DATAPATH_VF;
5284bf9cefSKY Srinivasan 	else
5384bf9cefSKY Srinivasan 		init_pkt->msg.v4_msg.active_dp.active_datapath =
5484bf9cefSKY Srinivasan 			NVSP_DATAPATH_SYNTHETIC;
5584bf9cefSKY Srinivasan 
56d0922bf7SHaiyang Zhang again:
57ec966381SStephen Hemminger 	trace_nvsp_send(ndev, init_pkt);
58ec966381SStephen Hemminger 
59d0922bf7SHaiyang Zhang 	ret = vmbus_sendpacket(dev->channel, init_pkt,
6084bf9cefSKY Srinivasan 			       sizeof(struct nvsp_message),
61d0922bf7SHaiyang Zhang 			       (unsigned long)init_pkt, VM_PKT_DATA_INBAND,
628b31f8c9SLong Li 			       VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED);
63d0922bf7SHaiyang Zhang 
64d0922bf7SHaiyang Zhang 	/* If failed to switch to/from VF, let data_path_is_vf stay false,
65d0922bf7SHaiyang Zhang 	 * so we use synthetic path to send data.
66d0922bf7SHaiyang Zhang 	 */
67d0922bf7SHaiyang Zhang 	if (ret) {
68d0922bf7SHaiyang Zhang 		if (ret != -EAGAIN) {
69d0922bf7SHaiyang Zhang 			netdev_err(ndev,
70d0922bf7SHaiyang Zhang 				   "Unable to send sw datapath msg, err: %d\n",
71d0922bf7SHaiyang Zhang 				   ret);
72d0922bf7SHaiyang Zhang 			return ret;
73d0922bf7SHaiyang Zhang 		}
74d0922bf7SHaiyang Zhang 
75d0922bf7SHaiyang Zhang 		if (retry++ < RETRY_MAX) {
76d0922bf7SHaiyang Zhang 			usleep_range(RETRY_US_LO, RETRY_US_HI);
77d0922bf7SHaiyang Zhang 			goto again;
78d0922bf7SHaiyang Zhang 		} else {
79d0922bf7SHaiyang Zhang 			netdev_err(
80d0922bf7SHaiyang Zhang 				ndev,
81d0922bf7SHaiyang Zhang 				"Retry failed to send sw datapath msg, err: %d\n",
82d0922bf7SHaiyang Zhang 				ret);
83d0922bf7SHaiyang Zhang 			return ret;
84d0922bf7SHaiyang Zhang 		}
85d0922bf7SHaiyang Zhang 	}
86d0922bf7SHaiyang Zhang 
878b31f8c9SLong Li 	wait_for_completion(&nv_dev->channel_init_wait);
888b31f8c9SLong Li 	net_device_ctx->data_path_is_vf = vf;
89d0922bf7SHaiyang Zhang 
90d0922bf7SHaiyang Zhang 	return 0;
9184bf9cefSKY Srinivasan }
9284bf9cefSKY Srinivasan 
933ffe64f1SStephen Hemminger /* Worker to setup sub channels on initial setup
943ffe64f1SStephen Hemminger  * Initial hotplug event occurs in softirq context
953ffe64f1SStephen Hemminger  * and can't wait for channels.
963ffe64f1SStephen Hemminger  */
netvsc_subchan_work(struct work_struct * w)973ffe64f1SStephen Hemminger static void netvsc_subchan_work(struct work_struct *w)
983ffe64f1SStephen Hemminger {
993ffe64f1SStephen Hemminger 	struct netvsc_device *nvdev =
1003ffe64f1SStephen Hemminger 		container_of(w, struct netvsc_device, subchan_work);
1013ffe64f1SStephen Hemminger 	struct rndis_device *rdev;
1023ffe64f1SStephen Hemminger 	int i, ret;
1033ffe64f1SStephen Hemminger 
1043ffe64f1SStephen Hemminger 	/* Avoid deadlock with device removal already under RTNL */
1053ffe64f1SStephen Hemminger 	if (!rtnl_trylock()) {
1063ffe64f1SStephen Hemminger 		schedule_work(w);
1073ffe64f1SStephen Hemminger 		return;
1083ffe64f1SStephen Hemminger 	}
1093ffe64f1SStephen Hemminger 
1103ffe64f1SStephen Hemminger 	rdev = nvdev->extension;
1113ffe64f1SStephen Hemminger 	if (rdev) {
11217d91256SHaiyang Zhang 		ret = rndis_set_subchannel(rdev->ndev, nvdev, NULL);
1133ffe64f1SStephen Hemminger 		if (ret == 0) {
1143ffe64f1SStephen Hemminger 			netif_device_attach(rdev->ndev);
1153ffe64f1SStephen Hemminger 		} else {
1163ffe64f1SStephen Hemminger 			/* fallback to only primary channel */
1173ffe64f1SStephen Hemminger 			for (i = 1; i < nvdev->num_chn; i++)
1183ffe64f1SStephen Hemminger 				netif_napi_del(&nvdev->chan_table[i].napi);
1193ffe64f1SStephen Hemminger 
1203ffe64f1SStephen Hemminger 			nvdev->max_chn = 1;
1213ffe64f1SStephen Hemminger 			nvdev->num_chn = 1;
1223ffe64f1SStephen Hemminger 		}
1233ffe64f1SStephen Hemminger 	}
1243ffe64f1SStephen Hemminger 
1253ffe64f1SStephen Hemminger 	rtnl_unlock();
1263ffe64f1SStephen Hemminger }
1273ffe64f1SStephen Hemminger 
alloc_net_device(void)12888098834SVitaly Kuznetsov static struct netvsc_device *alloc_net_device(void)
12995fa0405SHaiyang Zhang {
13095fa0405SHaiyang Zhang 	struct netvsc_device *net_device;
13195fa0405SHaiyang Zhang 
13295fa0405SHaiyang Zhang 	net_device = kzalloc(sizeof(struct netvsc_device), GFP_KERNEL);
13395fa0405SHaiyang Zhang 	if (!net_device)
13495fa0405SHaiyang Zhang 		return NULL;
13595fa0405SHaiyang Zhang 
136dc5cd894SHaiyang Zhang 	init_waitqueue_head(&net_device->wait_drain);
13795fa0405SHaiyang Zhang 	net_device->destroy = false;
138f6f13c12SHaiyang Zhang 	net_device->tx_disable = true;
1390da6edbdSStephen Hemminger 
1407c3877f2SHaiyang Zhang 	net_device->max_pkt = RNDIS_MAX_PKT_DEFAULT;
1417c3877f2SHaiyang Zhang 	net_device->pkt_align = RNDIS_PKT_ALIGN_DEFAULT;
1428b532797Sstephen hemminger 
143fd612602SStephen Hemminger 	init_completion(&net_device->channel_init_wait);
144732e4985Sstephen hemminger 	init_waitqueue_head(&net_device->subchan_open);
1453ffe64f1SStephen Hemminger 	INIT_WORK(&net_device->subchan_work, netvsc_subchan_work);
1467c3877f2SHaiyang Zhang 
14795fa0405SHaiyang Zhang 	return net_device;
14895fa0405SHaiyang Zhang }
14995fa0405SHaiyang Zhang 
free_netvsc_device(struct rcu_head * head)150545a8e79Sstephen hemminger static void free_netvsc_device(struct rcu_head *head)
151f90251c8SHaiyang Zhang {
152545a8e79Sstephen hemminger 	struct netvsc_device *nvdev
153545a8e79Sstephen hemminger 		= container_of(head, struct netvsc_device, rcu);
154c0b558e5SHaiyang Zhang 	int i;
155c0b558e5SHaiyang Zhang 
15602400fceSStephen Hemminger 	kfree(nvdev->extension);
157a56fe611SRick Edgecombe 
158a56fe611SRick Edgecombe 	if (!nvdev->recv_buf_gpadl_handle.decrypted)
15902400fceSStephen Hemminger 		vfree(nvdev->recv_buf);
160a56fe611SRick Edgecombe 	if (!nvdev->send_buf_gpadl_handle.decrypted)
16102400fceSStephen Hemminger 		vfree(nvdev->send_buf);
162e9268a94SChristophe JAILLET 	bitmap_free(nvdev->send_section_map);
16302400fceSStephen Hemminger 
164351e1581SHaiyang Zhang 	for (i = 0; i < VRSS_CHANNEL_MAX; i++) {
165351e1581SHaiyang Zhang 		xdp_rxq_info_unreg(&nvdev->chan_table[i].xdp_rxq);
1660ba35fe9SAndrea Parri (Microsoft) 		kfree(nvdev->chan_table[i].recv_buf);
1677426b1a5Sstephen hemminger 		vfree(nvdev->chan_table[i].mrc.slots);
168351e1581SHaiyang Zhang 	}
169c0b558e5SHaiyang Zhang 
170f90251c8SHaiyang Zhang 	kfree(nvdev);
171f90251c8SHaiyang Zhang }
172f90251c8SHaiyang Zhang 
free_netvsc_device_rcu(struct netvsc_device * nvdev)173545a8e79Sstephen hemminger static void free_netvsc_device_rcu(struct netvsc_device *nvdev)
174545a8e79Sstephen hemminger {
175545a8e79Sstephen hemminger 	call_rcu(&nvdev->rcu, free_netvsc_device);
176545a8e79Sstephen hemminger }
17746b4f7f5Sstephen hemminger 
netvsc_revoke_recv_buf(struct hv_device * device,struct netvsc_device * net_device,struct net_device * ndev)1787992894cSMohammed Gamal static void netvsc_revoke_recv_buf(struct hv_device *device,
1793f076effSMohammed Gamal 				   struct netvsc_device *net_device,
1803f076effSMohammed Gamal 				   struct net_device *ndev)
18195fa0405SHaiyang Zhang {
1827992894cSMohammed Gamal 	struct nvsp_message *revoke_packet;
1837a2a0a84SStephen Hemminger 	int ret;
18495fa0405SHaiyang Zhang 
18595fa0405SHaiyang Zhang 	/*
18695fa0405SHaiyang Zhang 	 * If we got a section count, it means we received a
18795fa0405SHaiyang Zhang 	 * SendReceiveBufferComplete msg (ie sent
18895fa0405SHaiyang Zhang 	 * NvspMessage1TypeSendReceiveBuffer msg) therefore, we need
18995fa0405SHaiyang Zhang 	 * to send a revoke msg here
19095fa0405SHaiyang Zhang 	 */
19195fa0405SHaiyang Zhang 	if (net_device->recv_section_cnt) {
19295fa0405SHaiyang Zhang 		/* Send the revoke receive buffer */
19395fa0405SHaiyang Zhang 		revoke_packet = &net_device->revoke_packet;
19495fa0405SHaiyang Zhang 		memset(revoke_packet, 0, sizeof(struct nvsp_message));
19595fa0405SHaiyang Zhang 
19695fa0405SHaiyang Zhang 		revoke_packet->hdr.msg_type =
19795fa0405SHaiyang Zhang 			NVSP_MSG1_TYPE_REVOKE_RECV_BUF;
19895fa0405SHaiyang Zhang 		revoke_packet->msg.v1_msg.
19995fa0405SHaiyang Zhang 		revoke_recv_buf.id = NETVSC_RECEIVE_BUFFER_ID;
20095fa0405SHaiyang Zhang 
201ec966381SStephen Hemminger 		trace_nvsp_send(ndev, revoke_packet);
202ec966381SStephen Hemminger 
2033d541ac5SVitaly Kuznetsov 		ret = vmbus_sendpacket(device->channel,
20495fa0405SHaiyang Zhang 				       revoke_packet,
20595fa0405SHaiyang Zhang 				       sizeof(struct nvsp_message),
2064d18fcc9SAndres Beltran 				       VMBUS_RQST_ID_NO_RESPONSE,
20795fa0405SHaiyang Zhang 				       VM_PKT_DATA_INBAND, 0);
20873e64fa4SK. Y. Srinivasan 		/* If the failure is because the channel is rescinded;
20973e64fa4SK. Y. Srinivasan 		 * ignore the failure since we cannot send on a rescinded
21073e64fa4SK. Y. Srinivasan 		 * channel. This would allow us to properly cleanup
21173e64fa4SK. Y. Srinivasan 		 * even when the channel is rescinded.
21273e64fa4SK. Y. Srinivasan 		 */
21373e64fa4SK. Y. Srinivasan 		if (device->channel->rescind)
21473e64fa4SK. Y. Srinivasan 			ret = 0;
21595fa0405SHaiyang Zhang 		/*
21695fa0405SHaiyang Zhang 		 * If we failed here, we might as well return and
21795fa0405SHaiyang Zhang 		 * have a leak rather than continue and a bugchk
21895fa0405SHaiyang Zhang 		 */
21995fa0405SHaiyang Zhang 		if (ret != 0) {
22095fa0405SHaiyang Zhang 			netdev_err(ndev, "unable to send "
22195fa0405SHaiyang Zhang 				"revoke receive buffer to netvsp\n");
2227a2a0a84SStephen Hemminger 			return;
22395fa0405SHaiyang Zhang 		}
2248b532797Sstephen hemminger 		net_device->recv_section_cnt = 0;
22595fa0405SHaiyang Zhang 	}
2267992894cSMohammed Gamal }
2277992894cSMohammed Gamal 
netvsc_revoke_send_buf(struct hv_device * device,struct netvsc_device * net_device,struct net_device * ndev)2287992894cSMohammed Gamal static void netvsc_revoke_send_buf(struct hv_device *device,
2293f076effSMohammed Gamal 				   struct netvsc_device *net_device,
2303f076effSMohammed Gamal 				   struct net_device *ndev)
2317992894cSMohammed Gamal {
2327992894cSMohammed Gamal 	struct nvsp_message *revoke_packet;
2337992894cSMohammed Gamal 	int ret;
23495fa0405SHaiyang Zhang 
235c25aaf81SKY Srinivasan 	/* Deal with the send buffer we may have setup.
236c25aaf81SKY Srinivasan 	 * If we got a  send section size, it means we received a
237c51ed182SHaiyang Zhang 	 * NVSP_MSG1_TYPE_SEND_SEND_BUF_COMPLETE msg (ie sent
238c51ed182SHaiyang Zhang 	 * NVSP_MSG1_TYPE_SEND_SEND_BUF msg) therefore, we need
239c25aaf81SKY Srinivasan 	 * to send a revoke msg here
240c25aaf81SKY Srinivasan 	 */
2418b532797Sstephen hemminger 	if (net_device->send_section_cnt) {
242c25aaf81SKY Srinivasan 		/* Send the revoke receive buffer */
243c25aaf81SKY Srinivasan 		revoke_packet = &net_device->revoke_packet;
244c25aaf81SKY Srinivasan 		memset(revoke_packet, 0, sizeof(struct nvsp_message));
245c25aaf81SKY Srinivasan 
246c25aaf81SKY Srinivasan 		revoke_packet->hdr.msg_type =
247c25aaf81SKY Srinivasan 			NVSP_MSG1_TYPE_REVOKE_SEND_BUF;
248c51ed182SHaiyang Zhang 		revoke_packet->msg.v1_msg.revoke_send_buf.id =
249c51ed182SHaiyang Zhang 			NETVSC_SEND_BUFFER_ID;
250c25aaf81SKY Srinivasan 
251ec966381SStephen Hemminger 		trace_nvsp_send(ndev, revoke_packet);
252ec966381SStephen Hemminger 
2533d541ac5SVitaly Kuznetsov 		ret = vmbus_sendpacket(device->channel,
254c25aaf81SKY Srinivasan 				       revoke_packet,
255c25aaf81SKY Srinivasan 				       sizeof(struct nvsp_message),
2564d18fcc9SAndres Beltran 				       VMBUS_RQST_ID_NO_RESPONSE,
257c25aaf81SKY Srinivasan 				       VM_PKT_DATA_INBAND, 0);
25873e64fa4SK. Y. Srinivasan 
25973e64fa4SK. Y. Srinivasan 		/* If the failure is because the channel is rescinded;
26073e64fa4SK. Y. Srinivasan 		 * ignore the failure since we cannot send on a rescinded
26173e64fa4SK. Y. Srinivasan 		 * channel. This would allow us to properly cleanup
26273e64fa4SK. Y. Srinivasan 		 * even when the channel is rescinded.
26373e64fa4SK. Y. Srinivasan 		 */
26473e64fa4SK. Y. Srinivasan 		if (device->channel->rescind)
26573e64fa4SK. Y. Srinivasan 			ret = 0;
26673e64fa4SK. Y. Srinivasan 
267c25aaf81SKY Srinivasan 		/* If we failed here, we might as well return and
268c25aaf81SKY Srinivasan 		 * have a leak rather than continue and a bugchk
269c25aaf81SKY Srinivasan 		 */
270c25aaf81SKY Srinivasan 		if (ret != 0) {
271c25aaf81SKY Srinivasan 			netdev_err(ndev, "unable to send "
272c25aaf81SKY Srinivasan 				   "revoke send buffer to netvsp\n");
2737a2a0a84SStephen Hemminger 			return;
274c25aaf81SKY Srinivasan 		}
2758b532797Sstephen hemminger 		net_device->send_section_cnt = 0;
276c25aaf81SKY Srinivasan 	}
2770cf73780SVitaly Kuznetsov }
2780cf73780SVitaly Kuznetsov 
netvsc_teardown_recv_gpadl(struct hv_device * device,struct netvsc_device * net_device,struct net_device * ndev)2797992894cSMohammed Gamal static void netvsc_teardown_recv_gpadl(struct hv_device *device,
2803f076effSMohammed Gamal 				       struct netvsc_device *net_device,
2813f076effSMohammed Gamal 				       struct net_device *ndev)
2820cf73780SVitaly Kuznetsov {
2830cf73780SVitaly Kuznetsov 	int ret;
2840cf73780SVitaly Kuznetsov 
285d4dccf35STianyu Lan 	if (net_device->recv_buf_gpadl_handle.gpadl_handle) {
2860cf73780SVitaly Kuznetsov 		ret = vmbus_teardown_gpadl(device->channel,
287d4dccf35STianyu Lan 					   &net_device->recv_buf_gpadl_handle);
2880cf73780SVitaly Kuznetsov 
2890cf73780SVitaly Kuznetsov 		/* If we failed here, we might as well return and have a leak
2900cf73780SVitaly Kuznetsov 		 * rather than continue and a bugchk
2910cf73780SVitaly Kuznetsov 		 */
2920cf73780SVitaly Kuznetsov 		if (ret != 0) {
2930cf73780SVitaly Kuznetsov 			netdev_err(ndev,
2940cf73780SVitaly Kuznetsov 				   "unable to teardown receive buffer's gpadl\n");
2950cf73780SVitaly Kuznetsov 			return;
2960cf73780SVitaly Kuznetsov 		}
2970cf73780SVitaly Kuznetsov 	}
2987992894cSMohammed Gamal }
2997992894cSMohammed Gamal 
netvsc_teardown_send_gpadl(struct hv_device * device,struct netvsc_device * net_device,struct net_device * ndev)3007992894cSMohammed Gamal static void netvsc_teardown_send_gpadl(struct hv_device *device,
3013f076effSMohammed Gamal 				       struct netvsc_device *net_device,
3023f076effSMohammed Gamal 				       struct net_device *ndev)
3037992894cSMohammed Gamal {
3047992894cSMohammed Gamal 	int ret;
3050cf73780SVitaly Kuznetsov 
306d4dccf35STianyu Lan 	if (net_device->send_buf_gpadl_handle.gpadl_handle) {
3073d541ac5SVitaly Kuznetsov 		ret = vmbus_teardown_gpadl(device->channel,
308d4dccf35STianyu Lan 					   &net_device->send_buf_gpadl_handle);
309c25aaf81SKY Srinivasan 
310c25aaf81SKY Srinivasan 		/* If we failed here, we might as well return and have a leak
311c25aaf81SKY Srinivasan 		 * rather than continue and a bugchk
312c25aaf81SKY Srinivasan 		 */
313c25aaf81SKY Srinivasan 		if (ret != 0) {
314c25aaf81SKY Srinivasan 			netdev_err(ndev,
315c25aaf81SKY Srinivasan 				   "unable to teardown send buffer's gpadl\n");
3167a2a0a84SStephen Hemminger 			return;
317c25aaf81SKY Srinivasan 		}
318c25aaf81SKY Srinivasan 	}
31995fa0405SHaiyang Zhang }
32095fa0405SHaiyang Zhang 
/* Allocate the receive completion slots for one channel.
 *
 * @net_device: netvsc device; recv_completion_cnt gives the slot count
 * @q_idx:      index into chan_table of the channel to set up
 *
 * The zeroed array is first requested on the NUMA node of the channel's
 * target CPU; if that fails, the allocation is retried on any node.
 *
 * Returns 0 on success or -ENOMEM if both allocations fail.
 */
int netvsc_alloc_recv_comp_ring(struct netvsc_device *net_device, u32 q_idx)
{
	struct netvsc_channel *nvchan = &net_device->chan_table[q_idx];
	size_t bytes = net_device->recv_completion_cnt *
		       sizeof(struct recv_comp_data);
	void *slots;

	slots = vzalloc_node(bytes, cpu_to_node(nvchan->channel->target_cpu));
	if (!slots)
		slots = vzalloc(bytes);	/* node-local failed, try any node */

	nvchan->mrc.slots = slots;
	if (!slots)
		return -ENOMEM;

	return 0;
}
3347426b1a5Sstephen hemminger 
netvsc_init_buf(struct hv_device * device,struct netvsc_device * net_device,const struct netvsc_device_info * device_info)33595790837Sstephen hemminger static int netvsc_init_buf(struct hv_device *device,
3368b532797Sstephen hemminger 			   struct netvsc_device *net_device,
3378b532797Sstephen hemminger 			   const struct netvsc_device_info *device_info)
33895fa0405SHaiyang Zhang {
3397426b1a5Sstephen hemminger 	struct nvsp_1_message_send_receive_buffer_complete *resp;
34095833370Sstephen hemminger 	struct net_device *ndev = hv_get_drvdata(device);
34195833370Sstephen hemminger 	struct nvsp_message *init_packet;
3428b532797Sstephen hemminger 	unsigned int buf_size;
3430102eeedSAndrea Parri (Microsoft) 	int i, ret = 0;
34495fa0405SHaiyang Zhang 
3458b532797Sstephen hemminger 	/* Get receive buffer area. */
3460ab09befSAlex Ng 	buf_size = device_info->recv_sections * device_info->recv_section_size;
3478b532797Sstephen hemminger 	buf_size = roundup(buf_size, PAGE_SIZE);
3488b532797Sstephen hemminger 
34911b2b653SHaiyang Zhang 	/* Legacy hosts only allow smaller receive buffer */
35011b2b653SHaiyang Zhang 	if (net_device->nvsp_version <= NVSP_PROTOCOL_VERSION_2)
35111b2b653SHaiyang Zhang 		buf_size = min_t(unsigned int, buf_size,
35211b2b653SHaiyang Zhang 				 NETVSC_RECEIVE_BUFFER_SIZE_LEGACY);
35311b2b653SHaiyang Zhang 
3548b532797Sstephen hemminger 	net_device->recv_buf = vzalloc(buf_size);
35595fa0405SHaiyang Zhang 	if (!net_device->recv_buf) {
3568b532797Sstephen hemminger 		netdev_err(ndev,
3578b532797Sstephen hemminger 			   "unable to allocate receive buffer of size %u\n",
3588b532797Sstephen hemminger 			   buf_size);
35995fa0405SHaiyang Zhang 		ret = -ENOMEM;
36095fa0405SHaiyang Zhang 		goto cleanup;
36195fa0405SHaiyang Zhang 	}
36295fa0405SHaiyang Zhang 
363c5d24bddSHaiyang Zhang 	net_device->recv_buf_size = buf_size;
364c5d24bddSHaiyang Zhang 
36595fa0405SHaiyang Zhang 	/*
36695fa0405SHaiyang Zhang 	 * Establish the gpadl handle for this buffer on this
36795fa0405SHaiyang Zhang 	 * channel.  Note: This call uses the vmbus connection rather
36895fa0405SHaiyang Zhang 	 * than the channel to establish the gpadl handle.
36995fa0405SHaiyang Zhang 	 */
37095fa0405SHaiyang Zhang 	ret = vmbus_establish_gpadl(device->channel, net_device->recv_buf,
3718b532797Sstephen hemminger 				    buf_size,
37295fa0405SHaiyang Zhang 				    &net_device->recv_buf_gpadl_handle);
37395fa0405SHaiyang Zhang 	if (ret != 0) {
37495fa0405SHaiyang Zhang 		netdev_err(ndev,
37595fa0405SHaiyang Zhang 			"unable to establish receive buffer's gpadl\n");
37695fa0405SHaiyang Zhang 		goto cleanup;
37795fa0405SHaiyang Zhang 	}
37895fa0405SHaiyang Zhang 
37995fa0405SHaiyang Zhang 	/* Notify the NetVsp of the gpadl handle */
38095fa0405SHaiyang Zhang 	init_packet = &net_device->channel_init_pkt;
38195fa0405SHaiyang Zhang 	memset(init_packet, 0, sizeof(struct nvsp_message));
38295fa0405SHaiyang Zhang 	init_packet->hdr.msg_type = NVSP_MSG1_TYPE_SEND_RECV_BUF;
38395fa0405SHaiyang Zhang 	init_packet->msg.v1_msg.send_recv_buf.
384d4dccf35STianyu Lan 		gpadl_handle = net_device->recv_buf_gpadl_handle.gpadl_handle;
38595fa0405SHaiyang Zhang 	init_packet->msg.v1_msg.
38695fa0405SHaiyang Zhang 		send_recv_buf.id = NETVSC_RECEIVE_BUFFER_ID;
38795fa0405SHaiyang Zhang 
388ec966381SStephen Hemminger 	trace_nvsp_send(ndev, init_packet);
389ec966381SStephen Hemminger 
39095fa0405SHaiyang Zhang 	/* Send the gpadl notification request */
39195fa0405SHaiyang Zhang 	ret = vmbus_sendpacket(device->channel, init_packet,
39295fa0405SHaiyang Zhang 			       sizeof(struct nvsp_message),
39395fa0405SHaiyang Zhang 			       (unsigned long)init_packet,
39495fa0405SHaiyang Zhang 			       VM_PKT_DATA_INBAND,
39595fa0405SHaiyang Zhang 			       VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED);
39695fa0405SHaiyang Zhang 	if (ret != 0) {
39795fa0405SHaiyang Zhang 		netdev_err(ndev,
39895fa0405SHaiyang Zhang 			"unable to send receive buffer's gpadl to netvsp\n");
39995fa0405SHaiyang Zhang 		goto cleanup;
40095fa0405SHaiyang Zhang 	}
40195fa0405SHaiyang Zhang 
4025362855aSVitaly Kuznetsov 	wait_for_completion(&net_device->channel_init_wait);
40395fa0405SHaiyang Zhang 
40495fa0405SHaiyang Zhang 	/* Check the response */
4057426b1a5Sstephen hemminger 	resp = &init_packet->msg.v1_msg.send_recv_buf_complete;
4067426b1a5Sstephen hemminger 	if (resp->status != NVSP_STAT_SUCCESS) {
4077426b1a5Sstephen hemminger 		netdev_err(ndev,
4087426b1a5Sstephen hemminger 			   "Unable to complete receive buffer initialization with NetVsp - status %d\n",
4097426b1a5Sstephen hemminger 			   resp->status);
41095fa0405SHaiyang Zhang 		ret = -EINVAL;
41195fa0405SHaiyang Zhang 		goto cleanup;
41295fa0405SHaiyang Zhang 	}
41395fa0405SHaiyang Zhang 
41495fa0405SHaiyang Zhang 	/* Parse the response */
4157426b1a5Sstephen hemminger 	netdev_dbg(ndev, "Receive sections: %u sub_allocs: size %u count: %u\n",
4167426b1a5Sstephen hemminger 		   resp->num_sections, resp->sections[0].sub_alloc_size,
4177426b1a5Sstephen hemminger 		   resp->sections[0].num_sub_allocs);
41895fa0405SHaiyang Zhang 
4198b532797Sstephen hemminger 	/* There should only be one section for the entire receive buffer */
4208b532797Sstephen hemminger 	if (resp->num_sections != 1 || resp->sections[0].offset != 0) {
42195fa0405SHaiyang Zhang 		ret = -EINVAL;
42295fa0405SHaiyang Zhang 		goto cleanup;
42395fa0405SHaiyang Zhang 	}
42495fa0405SHaiyang Zhang 
4258b532797Sstephen hemminger 	net_device->recv_section_size = resp->sections[0].sub_alloc_size;
4268b532797Sstephen hemminger 	net_device->recv_section_cnt = resp->sections[0].num_sub_allocs;
4278b532797Sstephen hemminger 
42844144185SAndres Beltran 	/* Ensure buffer will not overflow */
42944144185SAndres Beltran 	if (net_device->recv_section_size < NETVSC_MTU_MIN || (u64)net_device->recv_section_size *
43044144185SAndres Beltran 	    (u64)net_device->recv_section_cnt > (u64)buf_size) {
43144144185SAndres Beltran 		netdev_err(ndev, "invalid recv_section_size %u\n",
43244144185SAndres Beltran 			   net_device->recv_section_size);
43344144185SAndres Beltran 		ret = -EINVAL;
43444144185SAndres Beltran 		goto cleanup;
43544144185SAndres Beltran 	}
43644144185SAndres Beltran 
4370102eeedSAndrea Parri (Microsoft) 	for (i = 0; i < VRSS_CHANNEL_MAX; i++) {
4380102eeedSAndrea Parri (Microsoft) 		struct netvsc_channel *nvchan = &net_device->chan_table[i];
4390102eeedSAndrea Parri (Microsoft) 
4400102eeedSAndrea Parri (Microsoft) 		nvchan->recv_buf = kzalloc(net_device->recv_section_size, GFP_KERNEL);
4410102eeedSAndrea Parri (Microsoft) 		if (nvchan->recv_buf == NULL) {
4420102eeedSAndrea Parri (Microsoft) 			ret = -ENOMEM;
4430102eeedSAndrea Parri (Microsoft) 			goto cleanup;
4440102eeedSAndrea Parri (Microsoft) 		}
4450102eeedSAndrea Parri (Microsoft) 	}
4460102eeedSAndrea Parri (Microsoft) 
447f87238d3SHaiyang Zhang 	/* Setup receive completion ring.
448f87238d3SHaiyang Zhang 	 * Add 1 to the recv_section_cnt because at least one entry in a
449f87238d3SHaiyang Zhang 	 * ring buffer has to be empty.
450f87238d3SHaiyang Zhang 	 */
451f87238d3SHaiyang Zhang 	net_device->recv_completion_cnt = net_device->recv_section_cnt + 1;
4527426b1a5Sstephen hemminger 	ret = netvsc_alloc_recv_comp_ring(net_device, 0);
4537426b1a5Sstephen hemminger 	if (ret)
4547426b1a5Sstephen hemminger 		goto cleanup;
4557426b1a5Sstephen hemminger 
4567426b1a5Sstephen hemminger 	/* Now setup the send buffer. */
4570ab09befSAlex Ng 	buf_size = device_info->send_sections * device_info->send_section_size;
4588b532797Sstephen hemminger 	buf_size = round_up(buf_size, PAGE_SIZE);
4598b532797Sstephen hemminger 
4608b532797Sstephen hemminger 	net_device->send_buf = vzalloc(buf_size);
461c25aaf81SKY Srinivasan 	if (!net_device->send_buf) {
4628b532797Sstephen hemminger 		netdev_err(ndev, "unable to allocate send buffer of size %u\n",
4638b532797Sstephen hemminger 			   buf_size);
464c25aaf81SKY Srinivasan 		ret = -ENOMEM;
465c25aaf81SKY Srinivasan 		goto cleanup;
466c25aaf81SKY Srinivasan 	}
467d4dccf35STianyu Lan 	net_device->send_buf_size = buf_size;
468c25aaf81SKY Srinivasan 
469c25aaf81SKY Srinivasan 	/* Establish the gpadl handle for this buffer on this
470c25aaf81SKY Srinivasan 	 * channel.  Note: This call uses the vmbus connection rather
471c25aaf81SKY Srinivasan 	 * than the channel to establish the gpadl handle.
472c25aaf81SKY Srinivasan 	 */
473c25aaf81SKY Srinivasan 	ret = vmbus_establish_gpadl(device->channel, net_device->send_buf,
4748b532797Sstephen hemminger 				    buf_size,
475c25aaf81SKY Srinivasan 				    &net_device->send_buf_gpadl_handle);
476c25aaf81SKY Srinivasan 	if (ret != 0) {
477c25aaf81SKY Srinivasan 		netdev_err(ndev,
478c25aaf81SKY Srinivasan 			   "unable to establish send buffer's gpadl\n");
479c25aaf81SKY Srinivasan 		goto cleanup;
480c25aaf81SKY Srinivasan 	}
481c25aaf81SKY Srinivasan 
482c25aaf81SKY Srinivasan 	/* Notify the NetVsp of the gpadl handle */
483c25aaf81SKY Srinivasan 	init_packet = &net_device->channel_init_pkt;
484c25aaf81SKY Srinivasan 	memset(init_packet, 0, sizeof(struct nvsp_message));
485c25aaf81SKY Srinivasan 	init_packet->hdr.msg_type = NVSP_MSG1_TYPE_SEND_SEND_BUF;
486c51ed182SHaiyang Zhang 	init_packet->msg.v1_msg.send_send_buf.gpadl_handle =
487d4dccf35STianyu Lan 		net_device->send_buf_gpadl_handle.gpadl_handle;
488c51ed182SHaiyang Zhang 	init_packet->msg.v1_msg.send_send_buf.id = NETVSC_SEND_BUFFER_ID;
489c25aaf81SKY Srinivasan 
490ec966381SStephen Hemminger 	trace_nvsp_send(ndev, init_packet);
491ec966381SStephen Hemminger 
492c25aaf81SKY Srinivasan 	/* Send the gpadl notification request */
493c25aaf81SKY Srinivasan 	ret = vmbus_sendpacket(device->channel, init_packet,
494c25aaf81SKY Srinivasan 			       sizeof(struct nvsp_message),
495c25aaf81SKY Srinivasan 			       (unsigned long)init_packet,
496c25aaf81SKY Srinivasan 			       VM_PKT_DATA_INBAND,
497c25aaf81SKY Srinivasan 			       VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED);
498c25aaf81SKY Srinivasan 	if (ret != 0) {
499c25aaf81SKY Srinivasan 		netdev_err(ndev,
500c25aaf81SKY Srinivasan 			   "unable to send send buffer's gpadl to netvsp\n");
501c25aaf81SKY Srinivasan 		goto cleanup;
502c25aaf81SKY Srinivasan 	}
503c25aaf81SKY Srinivasan 
5045362855aSVitaly Kuznetsov 	wait_for_completion(&net_device->channel_init_wait);
505c25aaf81SKY Srinivasan 
506c25aaf81SKY Srinivasan 	/* Check the response */
507c25aaf81SKY Srinivasan 	if (init_packet->msg.v1_msg.
508c25aaf81SKY Srinivasan 	    send_send_buf_complete.status != NVSP_STAT_SUCCESS) {
509c25aaf81SKY Srinivasan 		netdev_err(ndev, "Unable to complete send buffer "
510c25aaf81SKY Srinivasan 			   "initialization with NetVsp - status %d\n",
511c25aaf81SKY Srinivasan 			   init_packet->msg.v1_msg.
512c51ed182SHaiyang Zhang 			   send_send_buf_complete.status);
513c25aaf81SKY Srinivasan 		ret = -EINVAL;
514c25aaf81SKY Srinivasan 		goto cleanup;
515c25aaf81SKY Srinivasan 	}
516c25aaf81SKY Srinivasan 
517c25aaf81SKY Srinivasan 	/* Parse the response */
518c25aaf81SKY Srinivasan 	net_device->send_section_size = init_packet->msg.
519c25aaf81SKY Srinivasan 				v1_msg.send_send_buf_complete.section_size;
52044144185SAndres Beltran 	if (net_device->send_section_size < NETVSC_MTU_MIN) {
52144144185SAndres Beltran 		netdev_err(ndev, "invalid send_section_size %u\n",
52244144185SAndres Beltran 			   net_device->send_section_size);
52344144185SAndres Beltran 		ret = -EINVAL;
52444144185SAndres Beltran 		goto cleanup;
52544144185SAndres Beltran 	}
526c25aaf81SKY Srinivasan 
5278b532797Sstephen hemminger 	/* Section count is simply the size divided by the section size. */
5288b532797Sstephen hemminger 	net_device->send_section_cnt = buf_size / net_device->send_section_size;
529c25aaf81SKY Srinivasan 
53093ba2222SVitaly Kuznetsov 	netdev_dbg(ndev, "Send section size: %d, Section count:%d\n",
531c25aaf81SKY Srinivasan 		   net_device->send_section_size, net_device->send_section_cnt);
532c25aaf81SKY Srinivasan 
533c25aaf81SKY Srinivasan 	/* Setup state for managing the send buffer. */
534e9268a94SChristophe JAILLET 	net_device->send_section_map = bitmap_zalloc(net_device->send_section_cnt,
535e9268a94SChristophe JAILLET 						     GFP_KERNEL);
536e9268a94SChristophe JAILLET 	if (!net_device->send_section_map) {
537dd1d3f8fSWei Yongjun 		ret = -ENOMEM;
538c25aaf81SKY Srinivasan 		goto cleanup;
539dd1d3f8fSWei Yongjun 	}
540c25aaf81SKY Srinivasan 
54195fa0405SHaiyang Zhang 	goto exit;
54295fa0405SHaiyang Zhang 
54395fa0405SHaiyang Zhang cleanup:
5443f076effSMohammed Gamal 	netvsc_revoke_recv_buf(device, net_device, ndev);
5453f076effSMohammed Gamal 	netvsc_revoke_send_buf(device, net_device, ndev);
5463f076effSMohammed Gamal 	netvsc_teardown_recv_gpadl(device, net_device, ndev);
5473f076effSMohammed Gamal 	netvsc_teardown_send_gpadl(device, net_device, ndev);
54895fa0405SHaiyang Zhang 
54995fa0405SHaiyang Zhang exit:
55095fa0405SHaiyang Zhang 	return ret;
55195fa0405SHaiyang Zhang }
55295fa0405SHaiyang Zhang 
553f157e78dSHaiyang Zhang /* Negotiate NVSP protocol version */
negotiate_nvsp_ver(struct hv_device * device,struct netvsc_device * net_device,struct nvsp_message * init_packet,u32 nvsp_ver)554f157e78dSHaiyang Zhang static int negotiate_nvsp_ver(struct hv_device *device,
555f157e78dSHaiyang Zhang 			      struct netvsc_device *net_device,
556f157e78dSHaiyang Zhang 			      struct nvsp_message *init_packet,
557f157e78dSHaiyang Zhang 			      u32 nvsp_ver)
55895fa0405SHaiyang Zhang {
5590a1275caSVitaly Kuznetsov 	struct net_device *ndev = hv_get_drvdata(device);
5607390fe9cSNicholas Mc Guire 	int ret;
561f157e78dSHaiyang Zhang 
562f157e78dSHaiyang Zhang 	memset(init_packet, 0, sizeof(struct nvsp_message));
563f157e78dSHaiyang Zhang 	init_packet->hdr.msg_type = NVSP_MSG_TYPE_INIT;
564f157e78dSHaiyang Zhang 	init_packet->msg.init_msg.init.min_protocol_ver = nvsp_ver;
565f157e78dSHaiyang Zhang 	init_packet->msg.init_msg.init.max_protocol_ver = nvsp_ver;
566ec966381SStephen Hemminger 	trace_nvsp_send(ndev, init_packet);
567ec966381SStephen Hemminger 
568f157e78dSHaiyang Zhang 	/* Send the init request */
569f157e78dSHaiyang Zhang 	ret = vmbus_sendpacket(device->channel, init_packet,
570f157e78dSHaiyang Zhang 			       sizeof(struct nvsp_message),
571f157e78dSHaiyang Zhang 			       (unsigned long)init_packet,
572f157e78dSHaiyang Zhang 			       VM_PKT_DATA_INBAND,
573f157e78dSHaiyang Zhang 			       VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED);
574f157e78dSHaiyang Zhang 
575f157e78dSHaiyang Zhang 	if (ret != 0)
576f157e78dSHaiyang Zhang 		return ret;
577f157e78dSHaiyang Zhang 
5785362855aSVitaly Kuznetsov 	wait_for_completion(&net_device->channel_init_wait);
579f157e78dSHaiyang Zhang 
580f157e78dSHaiyang Zhang 	if (init_packet->msg.init_msg.init_complete.status !=
581f157e78dSHaiyang Zhang 	    NVSP_STAT_SUCCESS)
582f157e78dSHaiyang Zhang 		return -EINVAL;
583f157e78dSHaiyang Zhang 
584a1eabb01SHaiyang Zhang 	if (nvsp_ver == NVSP_PROTOCOL_VERSION_1)
585f157e78dSHaiyang Zhang 		return 0;
586f157e78dSHaiyang Zhang 
58771790a27SHaiyang Zhang 	/* NVSPv2 or later: Send NDIS config */
588f157e78dSHaiyang Zhang 	memset(init_packet, 0, sizeof(struct nvsp_message));
589f157e78dSHaiyang Zhang 	init_packet->hdr.msg_type = NVSP_MSG2_TYPE_SEND_NDIS_CONFIG;
5900a1275caSVitaly Kuznetsov 	init_packet->msg.v2_msg.send_ndis_config.mtu = ndev->mtu + ETH_HLEN;
5911f5f3a75SHaiyang Zhang 	init_packet->msg.v2_msg.send_ndis_config.capability.ieee8021q = 1;
592f157e78dSHaiyang Zhang 
5937f5d5af0SHaiyang Zhang 	if (nvsp_ver >= NVSP_PROTOCOL_VERSION_5) {
59496854bbdSAndrea Parri (Microsoft) 		if (hv_is_isolation_supported())
59596854bbdSAndrea Parri (Microsoft) 			netdev_info(ndev, "SR-IOV not advertised by guests on the host supporting isolation\n");
59696854bbdSAndrea Parri (Microsoft) 		else
59771790a27SHaiyang Zhang 			init_packet->msg.v2_msg.send_ndis_config.capability.sriov = 1;
59871790a27SHaiyang Zhang 
5997f5d5af0SHaiyang Zhang 		/* Teaming bit is needed to receive link speed updates */
6007f5d5af0SHaiyang Zhang 		init_packet->msg.v2_msg.send_ndis_config.capability.teaming = 1;
6017f5d5af0SHaiyang Zhang 	}
6027f5d5af0SHaiyang Zhang 
603c8e4eff4SHaiyang Zhang 	if (nvsp_ver >= NVSP_PROTOCOL_VERSION_61)
604c8e4eff4SHaiyang Zhang 		init_packet->msg.v2_msg.send_ndis_config.capability.rsc = 1;
605c8e4eff4SHaiyang Zhang 
606ec966381SStephen Hemminger 	trace_nvsp_send(ndev, init_packet);
607ec966381SStephen Hemminger 
608f157e78dSHaiyang Zhang 	ret = vmbus_sendpacket(device->channel, init_packet,
609f157e78dSHaiyang Zhang 				sizeof(struct nvsp_message),
6104d18fcc9SAndres Beltran 				VMBUS_RQST_ID_NO_RESPONSE,
611f157e78dSHaiyang Zhang 				VM_PKT_DATA_INBAND, 0);
612f157e78dSHaiyang Zhang 
613f157e78dSHaiyang Zhang 	return ret;
614f157e78dSHaiyang Zhang }
615f157e78dSHaiyang Zhang 
netvsc_connect_vsp(struct hv_device * device,struct netvsc_device * net_device,const struct netvsc_device_info * device_info)61695790837Sstephen hemminger static int netvsc_connect_vsp(struct hv_device *device,
6178b532797Sstephen hemminger 			      struct netvsc_device *net_device,
6188b532797Sstephen hemminger 			      const struct netvsc_device_info *device_info)
619f157e78dSHaiyang Zhang {
620ec966381SStephen Hemminger 	struct net_device *ndev = hv_get_drvdata(device);
6211b17ca04SColin Ian King 	static const u32 ver_list[] = {
622e5a78fadSStephen Hemminger 		NVSP_PROTOCOL_VERSION_1, NVSP_PROTOCOL_VERSION_2,
6230dcec221SHaiyang Zhang 		NVSP_PROTOCOL_VERSION_4, NVSP_PROTOCOL_VERSION_5,
6240dcec221SHaiyang Zhang 		NVSP_PROTOCOL_VERSION_6, NVSP_PROTOCOL_VERSION_61
62595790837Sstephen hemminger 	};
62695790837Sstephen hemminger 	struct nvsp_message *init_packet;
62795790837Sstephen hemminger 	int ndis_version, i, ret;
62895fa0405SHaiyang Zhang 
62995fa0405SHaiyang Zhang 	init_packet = &net_device->channel_init_pkt;
63095fa0405SHaiyang Zhang 
631f157e78dSHaiyang Zhang 	/* Negotiate the latest NVSP protocol supported */
632e5a78fadSStephen Hemminger 	for (i = ARRAY_SIZE(ver_list) - 1; i >= 0; i--)
633f157e78dSHaiyang Zhang 		if (negotiate_nvsp_ver(device, net_device, init_packet,
634a1eabb01SHaiyang Zhang 				       ver_list[i])  == 0) {
635a1eabb01SHaiyang Zhang 			net_device->nvsp_version = ver_list[i];
636a1eabb01SHaiyang Zhang 			break;
637a1eabb01SHaiyang Zhang 		}
638a1eabb01SHaiyang Zhang 
639a1eabb01SHaiyang Zhang 	if (i < 0) {
64095fa0405SHaiyang Zhang 		ret = -EPROTO;
64195fa0405SHaiyang Zhang 		goto cleanup;
64295fa0405SHaiyang Zhang 	}
643f157e78dSHaiyang Zhang 
64496854bbdSAndrea Parri (Microsoft) 	if (hv_is_isolation_supported() && net_device->nvsp_version < NVSP_PROTOCOL_VERSION_61) {
64596854bbdSAndrea Parri (Microsoft) 		netdev_err(ndev, "Invalid NVSP version 0x%x (expected >= 0x%x) from the host supporting isolation\n",
64696854bbdSAndrea Parri (Microsoft) 			   net_device->nvsp_version, NVSP_PROTOCOL_VERSION_61);
64796854bbdSAndrea Parri (Microsoft) 		ret = -EPROTO;
64896854bbdSAndrea Parri (Microsoft) 		goto cleanup;
64996854bbdSAndrea Parri (Microsoft) 	}
65096854bbdSAndrea Parri (Microsoft) 
651f157e78dSHaiyang Zhang 	pr_debug("Negotiated NVSP version:%x\n", net_device->nvsp_version);
652f157e78dSHaiyang Zhang 
65395fa0405SHaiyang Zhang 	/* Send the ndis version */
65495fa0405SHaiyang Zhang 	memset(init_packet, 0, sizeof(struct nvsp_message));
65595fa0405SHaiyang Zhang 
656a1eabb01SHaiyang Zhang 	if (net_device->nvsp_version <= NVSP_PROTOCOL_VERSION_4)
6571f73db49SKY Srinivasan 		ndis_version = 0x00060001;
658a1eabb01SHaiyang Zhang 	else
659a1eabb01SHaiyang Zhang 		ndis_version = 0x0006001e;
66095fa0405SHaiyang Zhang 
66195fa0405SHaiyang Zhang 	init_packet->hdr.msg_type = NVSP_MSG1_TYPE_SEND_NDIS_VER;
66295fa0405SHaiyang Zhang 	init_packet->msg.v1_msg.
66395fa0405SHaiyang Zhang 		send_ndis_ver.ndis_major_ver =
66495fa0405SHaiyang Zhang 				(ndis_version & 0xFFFF0000) >> 16;
66595fa0405SHaiyang Zhang 	init_packet->msg.v1_msg.
66695fa0405SHaiyang Zhang 		send_ndis_ver.ndis_minor_ver =
66795fa0405SHaiyang Zhang 				ndis_version & 0xFFFF;
66895fa0405SHaiyang Zhang 
669ec966381SStephen Hemminger 	trace_nvsp_send(ndev, init_packet);
670ec966381SStephen Hemminger 
67195fa0405SHaiyang Zhang 	/* Send the init request */
67295fa0405SHaiyang Zhang 	ret = vmbus_sendpacket(device->channel, init_packet,
67395fa0405SHaiyang Zhang 				sizeof(struct nvsp_message),
6744d18fcc9SAndres Beltran 				VMBUS_RQST_ID_NO_RESPONSE,
67595fa0405SHaiyang Zhang 				VM_PKT_DATA_INBAND, 0);
67695fa0405SHaiyang Zhang 	if (ret != 0)
67795fa0405SHaiyang Zhang 		goto cleanup;
67895fa0405SHaiyang Zhang 
67999d3016dSHaiyang Zhang 
6808b532797Sstephen hemminger 	ret = netvsc_init_buf(device, net_device, device_info);
68195fa0405SHaiyang Zhang 
68295fa0405SHaiyang Zhang cleanup:
68395fa0405SHaiyang Zhang 	return ret;
68495fa0405SHaiyang Zhang }
68595fa0405SHaiyang Zhang 
68695fa0405SHaiyang Zhang /*
68795fa0405SHaiyang Zhang  * netvsc_device_remove - Callback when the root bus device is removed
68895fa0405SHaiyang Zhang  */
netvsc_device_remove(struct hv_device * device)689e08f3ea5SStephen Hemminger void netvsc_device_remove(struct hv_device *device)
69095fa0405SHaiyang Zhang {
6913d541ac5SVitaly Kuznetsov 	struct net_device *ndev = hv_get_drvdata(device);
6923d541ac5SVitaly Kuznetsov 	struct net_device_context *net_device_ctx = netdev_priv(ndev);
69379e8cbe7Sstephen hemminger 	struct netvsc_device *net_device
69479e8cbe7Sstephen hemminger 		= rtnl_dereference(net_device_ctx->nvdev);
69515a863bfSstephen hemminger 	int i;
69695fa0405SHaiyang Zhang 
697a56d99d7SMohammed Gamal 	/*
698a56d99d7SMohammed Gamal 	 * Revoke receive buffer. If host is pre-Win2016 then tear down
699a56d99d7SMohammed Gamal 	 * receive buffer GPADL. Do the same for send buffer.
700a56d99d7SMohammed Gamal 	 */
7013f076effSMohammed Gamal 	netvsc_revoke_recv_buf(device, net_device, ndev);
702a56d99d7SMohammed Gamal 	if (vmbus_proto_version < VERSION_WIN10)
7033f076effSMohammed Gamal 		netvsc_teardown_recv_gpadl(device, net_device, ndev);
704a56d99d7SMohammed Gamal 
7053f076effSMohammed Gamal 	netvsc_revoke_send_buf(device, net_device, ndev);
706a56d99d7SMohammed Gamal 	if (vmbus_proto_version < VERSION_WIN10)
7073f076effSMohammed Gamal 		netvsc_teardown_send_gpadl(device, net_device, ndev);
70895fa0405SHaiyang Zhang 
709545a8e79Sstephen hemminger 	RCU_INIT_POINTER(net_device_ctx->nvdev, NULL);
71095fa0405SHaiyang Zhang 
711ac504767SAndrea Parri (Microsoft) 	/* Disable NAPI and disassociate its context from the device. */
712ac504767SAndrea Parri (Microsoft) 	for (i = 0; i < net_device->num_chn; i++) {
713ac504767SAndrea Parri (Microsoft) 		/* See also vmbus_reset_channel_cb(). */
71422a77c0fSSouradeep Chakrabarti 		/* only disable enabled NAPI channel */
71522a77c0fSSouradeep Chakrabarti 		if (i < ndev->real_num_rx_queues)
716ac504767SAndrea Parri (Microsoft) 			napi_disable(&net_device->chan_table[i].napi);
71722a77c0fSSouradeep Chakrabarti 
7188348e046SStephen Hemminger 		netif_napi_del(&net_device->chan_table[i].napi);
719ac504767SAndrea Parri (Microsoft) 	}
7208348e046SStephen Hemminger 
72195fa0405SHaiyang Zhang 	/*
72295fa0405SHaiyang Zhang 	 * At this point, no one should be accessing net_device
72395fa0405SHaiyang Zhang 	 * except in here
72495fa0405SHaiyang Zhang 	 */
72593ba2222SVitaly Kuznetsov 	netdev_dbg(ndev, "net device safe to remove\n");
72695fa0405SHaiyang Zhang 
72795fa0405SHaiyang Zhang 	/* Now, we can close the channel safely */
72895fa0405SHaiyang Zhang 	vmbus_close(device->channel);
72995fa0405SHaiyang Zhang 
730a56d99d7SMohammed Gamal 	/*
731a56d99d7SMohammed Gamal 	 * If host is Win2016 or higher then we do the GPADL tear down
732a56d99d7SMohammed Gamal 	 * here after VMBus is closed.
733a56d99d7SMohammed Gamal 	*/
7347992894cSMohammed Gamal 	if (vmbus_proto_version >= VERSION_WIN10) {
7353f076effSMohammed Gamal 		netvsc_teardown_recv_gpadl(device, net_device, ndev);
7363f076effSMohammed Gamal 		netvsc_teardown_send_gpadl(device, net_device, ndev);
7377992894cSMohammed Gamal 	}
7380cf73780SVitaly Kuznetsov 
73995fa0405SHaiyang Zhang 	/* Release all resources */
740545a8e79Sstephen hemminger 	free_netvsc_device_rcu(net_device);
74195fa0405SHaiyang Zhang }
74295fa0405SHaiyang Zhang 
/*
 * Transmit flow-control thresholds, expressed as the percentage of the
 * outbound ring buffer that is still available for writing:
 *  - HIWATER: netvsc_send_tx_complete() may wake a stopped TX queue once
 *    more than this percentage is available;
 *  - LOWATER: netvsc_send_pkt() stops the TX queue after a successful send
 *    when less than this percentage was available.
 */
74433be96e4SHaiyang Zhang #define RING_AVAIL_PERCENT_HIWATER 20
74533be96e4SHaiyang Zhang #define RING_AVAIL_PERCENT_LOWATER 10
74533be96e4SHaiyang Zhang 
/*
 * Release send-buffer section @index by toggling its bit in the section
 * bitmap of @net_device.
 */
static inline void netvsc_free_send_slot(struct netvsc_device *net_device,
					 u32 index)
{
	unsigned long *section_map = net_device->send_section_map;

	sync_change_bit(index, section_map);
}
751c25aaf81SKY Srinivasan 
netvsc_send_tx_complete(struct net_device * ndev,struct netvsc_device * net_device,struct vmbus_channel * channel,const struct vmpacket_descriptor * desc,int budget)752c347b927SStephen Hemminger static void netvsc_send_tx_complete(struct net_device *ndev,
753c347b927SStephen Hemminger 				    struct netvsc_device *net_device,
754c347b927SStephen Hemminger 				    struct vmbus_channel *channel,
755f9645430Sstephen hemminger 				    const struct vmpacket_descriptor *desc,
756f9645430Sstephen hemminger 				    int budget)
75795fa0405SHaiyang Zhang {
75809af87d1SSimon Xiao 	struct net_device_context *ndev_ctx = netdev_priv(ndev);
7594d18fcc9SAndres Beltran 	struct sk_buff *skb;
7605b54dac8SHaiyang Zhang 	u16 q_idx = 0;
7615b54dac8SHaiyang Zhang 	int queue_sends;
7624d18fcc9SAndres Beltran 	u64 cmd_rqst;
7634d18fcc9SAndres Beltran 
76426894cd9SAndrea Parri (Microsoft) 	cmd_rqst = channel->request_addr_callback(channel, desc->trans_id);
7654d18fcc9SAndres Beltran 	if (cmd_rqst == VMBUS_RQST_ERROR) {
76626894cd9SAndrea Parri (Microsoft) 		netdev_err(ndev, "Invalid transaction ID %llx\n", desc->trans_id);
7674d18fcc9SAndres Beltran 		return;
7684d18fcc9SAndres Beltran 	}
7694d18fcc9SAndres Beltran 
7704d18fcc9SAndres Beltran 	skb = (struct sk_buff *)(unsigned long)cmd_rqst;
77133be96e4SHaiyang Zhang 
77295fa0405SHaiyang Zhang 	/* Notify the layer above us */
773bc304dd3SStephen Hemminger 	if (likely(skb)) {
774846da38dSTianyu Lan 		struct hv_netvsc_packet *packet
775bc304dd3SStephen Hemminger 			= (struct hv_netvsc_packet *)skb->cb;
776793e3955Sstephen hemminger 		u32 send_index = packet->send_buf_index;
7771cb9d3b6SHaiyang Zhang 		struct netvsc_stats_tx *tx_stats;
778bc304dd3SStephen Hemminger 
779c25aaf81SKY Srinivasan 		if (send_index != NETVSC_INVALID_INDEX)
780c25aaf81SKY Srinivasan 			netvsc_free_send_slot(net_device, send_index);
781793e3955Sstephen hemminger 		q_idx = packet->q_idx;
782bc304dd3SStephen Hemminger 
7836c80f3fcSSimon Xiao 		tx_stats = &net_device->chan_table[q_idx].tx_stats;
784793e3955Sstephen hemminger 
785793e3955Sstephen hemminger 		u64_stats_update_begin(&tx_stats->syncp);
786793e3955Sstephen hemminger 		tx_stats->packets += packet->total_packets;
787793e3955Sstephen hemminger 		tx_stats->bytes += packet->total_bytes;
788793e3955Sstephen hemminger 		u64_stats_update_end(&tx_stats->syncp);
789793e3955Sstephen hemminger 
790846da38dSTianyu Lan 		netvsc_dma_unmap(ndev_ctx->device_ctx, packet);
791f9645430Sstephen hemminger 		napi_consume_skb(skb, budget);
7925b54dac8SHaiyang Zhang 	}
79395fa0405SHaiyang Zhang 
794b8b835a8Sstephen hemminger 	queue_sends =
795b8b835a8Sstephen hemminger 		atomic_dec_return(&net_device->chan_table[q_idx].queue_sends);
7961d06825bSHaiyang Zhang 
7977b2ee50cSStephen Hemminger 	if (unlikely(net_device->destroy)) {
7987b2ee50cSStephen Hemminger 		if (queue_sends == 0)
799dc5cd894SHaiyang Zhang 			wake_up(&net_device->wait_drain);
8007b2ee50cSStephen Hemminger 	} else {
8017b2ee50cSStephen Hemminger 		struct netdev_queue *txq = netdev_get_tx_queue(ndev, q_idx);
802dc5cd894SHaiyang Zhang 
8031b704c4aSHaiyang Zhang 		if (netif_tx_queue_stopped(txq) && !net_device->tx_disable &&
8046b1f8376SLong Li 		    (hv_get_avail_to_write_percent(&channel->outbound) >
8056b1f8376SLong Li 		     RING_AVAIL_PERCENT_HIWATER || queue_sends < 1)) {
8067b2ee50cSStephen Hemminger 			netif_tx_wake_queue(txq);
80709af87d1SSimon Xiao 			ndev_ctx->eth_stats.wake_queue++;
80809af87d1SSimon Xiao 		}
809bc304dd3SStephen Hemminger 	}
8107b2ee50cSStephen Hemminger }
811bc304dd3SStephen Hemminger 
netvsc_send_completion(struct net_device * ndev,struct netvsc_device * net_device,struct vmbus_channel * incoming_channel,const struct vmpacket_descriptor * desc,int budget)812c347b927SStephen Hemminger static void netvsc_send_completion(struct net_device *ndev,
813c347b927SStephen Hemminger 				   struct netvsc_device *net_device,
814bc304dd3SStephen Hemminger 				   struct vmbus_channel *incoming_channel,
815f9645430Sstephen hemminger 				   const struct vmpacket_descriptor *desc,
816f9645430Sstephen hemminger 				   int budget)
817bc304dd3SStephen Hemminger {
8188b31f8c9SLong Li 	const struct nvsp_message *nvsp_packet;
81944144185SAndres Beltran 	u32 msglen = hv_pkt_datalen(desc);
8208b31f8c9SLong Li 	struct nvsp_message *pkt_rqst;
8218b31f8c9SLong Li 	u64 cmd_rqst;
822dca5161fSMichael Kelley 	u32 status;
8238b31f8c9SLong Li 
8248b31f8c9SLong Li 	/* First check if this is a VMBUS completion without data payload */
8258b31f8c9SLong Li 	if (!msglen) {
826bf5fd8caSAndrea Parri (Microsoft) 		cmd_rqst = incoming_channel->request_addr_callback(incoming_channel,
82726894cd9SAndrea Parri (Microsoft) 								   desc->trans_id);
8288b31f8c9SLong Li 		if (cmd_rqst == VMBUS_RQST_ERROR) {
82926894cd9SAndrea Parri (Microsoft) 			netdev_err(ndev, "Invalid transaction ID %llx\n", desc->trans_id);
8308b31f8c9SLong Li 			return;
8318b31f8c9SLong Li 		}
8328b31f8c9SLong Li 
8338b31f8c9SLong Li 		pkt_rqst = (struct nvsp_message *)(uintptr_t)cmd_rqst;
8348b31f8c9SLong Li 		switch (pkt_rqst->hdr.msg_type) {
8358b31f8c9SLong Li 		case NVSP_MSG4_TYPE_SWITCH_DATA_PATH:
8368b31f8c9SLong Li 			complete(&net_device->channel_init_wait);
8378b31f8c9SLong Li 			break;
8388b31f8c9SLong Li 
8398b31f8c9SLong Li 		default:
8408b31f8c9SLong Li 			netdev_err(ndev, "Unexpected VMBUS completion!!\n");
8418b31f8c9SLong Li 		}
8428b31f8c9SLong Li 		return;
8438b31f8c9SLong Li 	}
84444144185SAndres Beltran 
84544144185SAndres Beltran 	/* Ensure packet is big enough to read header fields */
84644144185SAndres Beltran 	if (msglen < sizeof(struct nvsp_message_header)) {
84744144185SAndres Beltran 		netdev_err(ndev, "nvsp_message length too small: %u\n", msglen);
84844144185SAndres Beltran 		return;
84944144185SAndres Beltran 	}
850bc304dd3SStephen Hemminger 
8518b31f8c9SLong Li 	nvsp_packet = hv_pkt_data(desc);
852bc304dd3SStephen Hemminger 	switch (nvsp_packet->hdr.msg_type) {
853bc304dd3SStephen Hemminger 	case NVSP_MSG_TYPE_INIT_COMPLETE:
85444144185SAndres Beltran 		if (msglen < sizeof(struct nvsp_message_header) +
85544144185SAndres Beltran 				sizeof(struct nvsp_message_init_complete)) {
85644144185SAndres Beltran 			netdev_err(ndev, "nvsp_msg length too small: %u\n",
85744144185SAndres Beltran 				   msglen);
85844144185SAndres Beltran 			return;
85944144185SAndres Beltran 		}
86044144185SAndres Beltran 		fallthrough;
86144144185SAndres Beltran 
862bc304dd3SStephen Hemminger 	case NVSP_MSG1_TYPE_SEND_RECV_BUF_COMPLETE:
86344144185SAndres Beltran 		if (msglen < sizeof(struct nvsp_message_header) +
86444144185SAndres Beltran 				sizeof(struct nvsp_1_message_send_receive_buffer_complete)) {
86544144185SAndres Beltran 			netdev_err(ndev, "nvsp_msg1 length too small: %u\n",
86644144185SAndres Beltran 				   msglen);
86744144185SAndres Beltran 			return;
86844144185SAndres Beltran 		}
86944144185SAndres Beltran 		fallthrough;
87044144185SAndres Beltran 
871bc304dd3SStephen Hemminger 	case NVSP_MSG1_TYPE_SEND_SEND_BUF_COMPLETE:
87244144185SAndres Beltran 		if (msglen < sizeof(struct nvsp_message_header) +
87344144185SAndres Beltran 				sizeof(struct nvsp_1_message_send_send_buffer_complete)) {
87444144185SAndres Beltran 			netdev_err(ndev, "nvsp_msg1 length too small: %u\n",
87544144185SAndres Beltran 				   msglen);
87644144185SAndres Beltran 			return;
87744144185SAndres Beltran 		}
87844144185SAndres Beltran 		fallthrough;
87944144185SAndres Beltran 
880bc304dd3SStephen Hemminger 	case NVSP_MSG5_TYPE_SUBCHANNEL:
88144144185SAndres Beltran 		if (msglen < sizeof(struct nvsp_message_header) +
88244144185SAndres Beltran 				sizeof(struct nvsp_5_subchannel_complete)) {
88344144185SAndres Beltran 			netdev_err(ndev, "nvsp_msg5 length too small: %u\n",
88444144185SAndres Beltran 				   msglen);
88544144185SAndres Beltran 			return;
88644144185SAndres Beltran 		}
887bc304dd3SStephen Hemminger 		/* Copy the response back */
888bc304dd3SStephen Hemminger 		memcpy(&net_device->channel_init_pkt, nvsp_packet,
889bc304dd3SStephen Hemminger 		       sizeof(struct nvsp_message));
890bc304dd3SStephen Hemminger 		complete(&net_device->channel_init_wait);
891bc304dd3SStephen Hemminger 		break;
892bc304dd3SStephen Hemminger 
893bc304dd3SStephen Hemminger 	case NVSP_MSG1_TYPE_SEND_RNDIS_PKT_COMPLETE:
894dca5161fSMichael Kelley 		if (msglen < sizeof(struct nvsp_message_header) +
895dca5161fSMichael Kelley 		    sizeof(struct nvsp_1_message_send_rndis_packet_complete)) {
896dca5161fSMichael Kelley 			if (net_ratelimit())
897dca5161fSMichael Kelley 				netdev_err(ndev, "nvsp_rndis_pkt_complete length too small: %u\n",
898dca5161fSMichael Kelley 					   msglen);
899dca5161fSMichael Kelley 			return;
900dca5161fSMichael Kelley 		}
901dca5161fSMichael Kelley 
902dca5161fSMichael Kelley 		/* If status indicates an error, output a message so we know
903dca5161fSMichael Kelley 		 * there's a problem. But process the completion anyway so the
904dca5161fSMichael Kelley 		 * resources are released.
905dca5161fSMichael Kelley 		 */
906dca5161fSMichael Kelley 		status = nvsp_packet->msg.v1_msg.send_rndis_pkt_complete.status;
907dca5161fSMichael Kelley 		if (status != NVSP_STAT_SUCCESS && net_ratelimit())
908dca5161fSMichael Kelley 			netdev_err(ndev, "nvsp_rndis_pkt_complete error status: %x\n",
909dca5161fSMichael Kelley 				   status);
910dca5161fSMichael Kelley 
911c347b927SStephen Hemminger 		netvsc_send_tx_complete(ndev, net_device, incoming_channel,
912c347b927SStephen Hemminger 					desc, budget);
913bc304dd3SStephen Hemminger 		break;
914bc304dd3SStephen Hemminger 
915bc304dd3SStephen Hemminger 	default:
916bc304dd3SStephen Hemminger 		netdev_err(ndev,
917bc304dd3SStephen Hemminger 			   "Unknown send completion type %d received!!\n",
918bc304dd3SStephen Hemminger 			   nvsp_packet->hdr.msg_type);
91995fa0405SHaiyang Zhang 	}
92095fa0405SHaiyang Zhang }
92195fa0405SHaiyang Zhang 
netvsc_get_next_send_section(struct netvsc_device * net_device)922c25aaf81SKY Srinivasan static u32 netvsc_get_next_send_section(struct netvsc_device *net_device)
923c25aaf81SKY Srinivasan {
924b58a1858Sstephen hemminger 	unsigned long *map_addr = net_device->send_section_map;
925b58a1858Sstephen hemminger 	unsigned int i;
926c25aaf81SKY Srinivasan 
927fdfb70d2Sstephen hemminger 	for_each_clear_bit(i, map_addr, net_device->send_section_cnt) {
928b58a1858Sstephen hemminger 		if (sync_test_and_set_bit(i, map_addr) == 0)
929b58a1858Sstephen hemminger 			return i;
930c25aaf81SKY Srinivasan 	}
931b58a1858Sstephen hemminger 
932b58a1858Sstephen hemminger 	return NETVSC_INVALID_INDEX;
933c25aaf81SKY Srinivasan }
934c25aaf81SKY Srinivasan 
/*
 * netvsc_copy_to_send_buf - Copy a packet's pages into a send-buffer section
 *
 * The data described by @pb is copied back to back into section
 * @section_index of the send buffer, starting @pend_size bytes into the
 * section.  Only the first rmsg_pgcnt entries are copied for a partial
 * copy (cp_partial), otherwise all page_buf_cnt entries.
 *
 * When @xmit_more is set and the packet length is not a multiple of
 * pkt_align, the RNDIS message length and the packet's total length are
 * grown by the missing bytes and the padding is zero-filled after the data.
 */
static void netvsc_copy_to_send_buf(struct netvsc_device *net_device,
				    unsigned int section_index,
				    u32 pend_size,
				    struct hv_netvsc_packet *packet,
				    struct rndis_message *rndis_msg,
				    struct hv_page_buffer *pb,
				    bool xmit_more)
{
	char *dest = net_device->send_buf;
	u32 nr_pages;
	u32 pad_len = 0;
	u32 tail;
	u32 idx;

	/* Locate the write position inside the chosen section */
	dest += section_index * net_device->send_section_size;
	dest += pend_size;

	if (packet->cp_partial)
		nr_pages = packet->rmsg_pgcnt;
	else
		nr_pages = packet->page_buf_cnt;

	/* Bytes by which the packet overshoots the alignment boundary */
	tail = packet->total_data_buflen & (net_device->pkt_align - 1);
	if (xmit_more && tail) {
		pad_len = net_device->pkt_align - tail;
		rndis_msg->msg_len += pad_len;
		packet->total_data_buflen += pad_len;
	}

	for (idx = 0; idx < nr_pages; idx++) {
		const char *page = phys_to_virt(pb[idx].pfn << HV_HYP_PAGE_SHIFT);
		u32 chunk = pb[idx].len;

		memcpy(dest, page + pb[idx].offset, chunk);
		dest += chunk;
	}

	if (pad_len)
		memset(dest, 0, pad_len);
}
972c25aaf81SKY Srinivasan 
netvsc_dma_unmap(struct hv_device * hv_dev,struct hv_netvsc_packet * packet)973846da38dSTianyu Lan void netvsc_dma_unmap(struct hv_device *hv_dev,
974846da38dSTianyu Lan 		      struct hv_netvsc_packet *packet)
975846da38dSTianyu Lan {
976846da38dSTianyu Lan 	int i;
977846da38dSTianyu Lan 
978846da38dSTianyu Lan 	if (!hv_is_isolation_supported())
979846da38dSTianyu Lan 		return;
980846da38dSTianyu Lan 
981846da38dSTianyu Lan 	if (!packet->dma_range)
982846da38dSTianyu Lan 		return;
983846da38dSTianyu Lan 
98499f1c460SMichael Kelley 	for (i = 0; i < packet->page_buf_cnt; i++)
985846da38dSTianyu Lan 		dma_unmap_single(&hv_dev->device, packet->dma_range[i].dma,
986846da38dSTianyu Lan 				 packet->dma_range[i].mapping_size,
987846da38dSTianyu Lan 				 DMA_TO_DEVICE);
988846da38dSTianyu Lan 
989846da38dSTianyu Lan 	kfree(packet->dma_range);
990846da38dSTianyu Lan }
991846da38dSTianyu Lan 
992846da38dSTianyu Lan /* netvsc_dma_map - Map swiotlb bounce buffer with data page of
993846da38dSTianyu Lan  * packet sent by vmbus_sendpacket_pagebuffer() in the Isolation
994846da38dSTianyu Lan  * VM.
995846da38dSTianyu Lan  *
996846da38dSTianyu Lan  * In isolation VM, netvsc send buffer has been marked visible to
997846da38dSTianyu Lan  * host and so the data copied to send buffer doesn't need to use
998846da38dSTianyu Lan  * bounce buffer. The data pages handled by vmbus_sendpacket_pagebuffer()
999846da38dSTianyu Lan  * may not be copied to send buffer and so these pages need to be
1000846da38dSTianyu Lan  * mapped with swiotlb bounce buffer. netvsc_dma_map() is to do
1001846da38dSTianyu Lan  * that. The pfns in the struct hv_page_buffer need to be converted
1002846da38dSTianyu Lan  * to bounce buffer's pfn. The loop here is necessary because the
1003846da38dSTianyu Lan  * entries in the page buffer array are not necessarily full
1004846da38dSTianyu Lan  * pages of data.  Each entry in the array has a separate offset and
1005846da38dSTianyu Lan  * len that may be non-zero, even for entries in the middle of the
1006846da38dSTianyu Lan  * array.  And the entries are not physically contiguous.  So each
1007846da38dSTianyu Lan  * entry must be individually mapped rather than as a contiguous unit.
1008846da38dSTianyu Lan  * So not use dma_map_sg() here.
1009846da38dSTianyu Lan  */
netvsc_dma_map(struct hv_device * hv_dev,struct hv_netvsc_packet * packet,struct hv_page_buffer * pb)1010846da38dSTianyu Lan static int netvsc_dma_map(struct hv_device *hv_dev,
1011846da38dSTianyu Lan 			  struct hv_netvsc_packet *packet,
1012846da38dSTianyu Lan 			  struct hv_page_buffer *pb)
1013846da38dSTianyu Lan {
101499f1c460SMichael Kelley 	u32 page_count = packet->page_buf_cnt;
1015846da38dSTianyu Lan 	dma_addr_t dma;
1016846da38dSTianyu Lan 	int i;
1017846da38dSTianyu Lan 
1018846da38dSTianyu Lan 	if (!hv_is_isolation_supported())
1019846da38dSTianyu Lan 		return 0;
1020846da38dSTianyu Lan 
1021846da38dSTianyu Lan 	packet->dma_range = kcalloc(page_count,
1022846da38dSTianyu Lan 				    sizeof(*packet->dma_range),
1023c6aa9d3bSMichael Kelley 				    GFP_ATOMIC);
1024846da38dSTianyu Lan 	if (!packet->dma_range)
1025846da38dSTianyu Lan 		return -ENOMEM;
1026846da38dSTianyu Lan 
1027846da38dSTianyu Lan 	for (i = 0; i < page_count; i++) {
1028846da38dSTianyu Lan 		char *src = phys_to_virt((pb[i].pfn << HV_HYP_PAGE_SHIFT)
1029846da38dSTianyu Lan 					 + pb[i].offset);
1030846da38dSTianyu Lan 		u32 len = pb[i].len;
1031846da38dSTianyu Lan 
1032846da38dSTianyu Lan 		dma = dma_map_single(&hv_dev->device, src, len,
1033846da38dSTianyu Lan 				     DMA_TO_DEVICE);
1034846da38dSTianyu Lan 		if (dma_mapping_error(&hv_dev->device, dma)) {
1035846da38dSTianyu Lan 			kfree(packet->dma_range);
1036846da38dSTianyu Lan 			return -ENOMEM;
1037846da38dSTianyu Lan 		}
1038846da38dSTianyu Lan 
1039846da38dSTianyu Lan 		/* pb[].offset and pb[].len are not changed during dma mapping
1040846da38dSTianyu Lan 		 * and so not reassign.
1041846da38dSTianyu Lan 		 */
1042846da38dSTianyu Lan 		packet->dma_range[i].dma = dma;
1043846da38dSTianyu Lan 		packet->dma_range[i].mapping_size = len;
1044846da38dSTianyu Lan 		pb[i].pfn = dma >> HV_HYP_PAGE_SHIFT;
1045846da38dSTianyu Lan 	}
1046846da38dSTianyu Lan 
1047846da38dSTianyu Lan 	return 0;
1048846da38dSTianyu Lan }
1049846da38dSTianyu Lan 
netvsc_send_pkt(struct hv_device * device,struct hv_netvsc_packet * packet,struct netvsc_device * net_device,struct hv_page_buffer * pb,struct sk_buff * skb)10503a8963acSStephen Hemminger static inline int netvsc_send_pkt(
10510a1275caSVitaly Kuznetsov 	struct hv_device *device,
10527c3877f2SHaiyang Zhang 	struct hv_netvsc_packet *packet,
1053a9f2e2d6SKY Srinivasan 	struct netvsc_device *net_device,
105402b6de01Sstephen hemminger 	struct hv_page_buffer *pb,
10553a3d9a0aSKY Srinivasan 	struct sk_buff *skb)
105695fa0405SHaiyang Zhang {
10577c3877f2SHaiyang Zhang 	struct nvsp_message nvmsg;
1058ec966381SStephen Hemminger 	struct nvsp_1_message_send_rndis_packet *rpkt =
1059956a25c9SJoe Perches 		&nvmsg.msg.v1_msg.send_rndis_pkt;
1060956a25c9SJoe Perches 	struct netvsc_channel * const nvchan =
1061956a25c9SJoe Perches 		&net_device->chan_table[packet->q_idx];
1062b8b835a8Sstephen hemminger 	struct vmbus_channel *out_channel = nvchan->channel;
10630a1275caSVitaly Kuznetsov 	struct net_device *ndev = hv_get_drvdata(device);
106409af87d1SSimon Xiao 	struct net_device_context *ndev_ctx = netdev_priv(ndev);
1065b8b835a8Sstephen hemminger 	struct netdev_queue *txq = netdev_get_tx_queue(ndev, packet->q_idx);
10667c3877f2SHaiyang Zhang 	u64 req_id;
10677c3877f2SHaiyang Zhang 	int ret;
10686b1f8376SLong Li 	u32 ring_avail = hv_get_avail_to_write_percent(&out_channel->outbound);
1069c25aaf81SKY Srinivasan 
1070505e3f00SAndrea Parri (Microsoft) 	memset(&nvmsg, 0, sizeof(struct nvsp_message));
10717c3877f2SHaiyang Zhang 	nvmsg.hdr.msg_type = NVSP_MSG1_TYPE_SEND_RNDIS_PKT;
1072956a25c9SJoe Perches 	if (skb)
1073956a25c9SJoe Perches 		rpkt->channel_type = 0;		/* 0 is RMC_DATA */
10747c3877f2SHaiyang Zhang 	else
1075956a25c9SJoe Perches 		rpkt->channel_type = 1;		/* 1 is RMC_CONTROL */
1076956a25c9SJoe Perches 
1077956a25c9SJoe Perches 	rpkt->send_buf_section_index = packet->send_buf_index;
1078956a25c9SJoe Perches 	if (packet->send_buf_index == NETVSC_INVALID_INDEX)
1079956a25c9SJoe Perches 		rpkt->send_buf_section_size = 0;
1080956a25c9SJoe Perches 	else
1081956a25c9SJoe Perches 		rpkt->send_buf_section_size = packet->total_data_buflen;
108295fa0405SHaiyang Zhang 
10833a3d9a0aSKY Srinivasan 	req_id = (ulong)skb;
1084f1ea3cd7SHaiyang Zhang 
1085c3582a2cSHaiyang Zhang 	if (out_channel->rescind)
1086c3582a2cSHaiyang Zhang 		return -ENODEV;
1087c3582a2cSHaiyang Zhang 
1088ec966381SStephen Hemminger 	trace_nvsp_send_pkt(ndev, out_channel, rpkt);
1089ec966381SStephen Hemminger 
1090846da38dSTianyu Lan 	packet->dma_range = NULL;
109195fa0405SHaiyang Zhang 	if (packet->page_buf_cnt) {
109202b6de01Sstephen hemminger 		if (packet->cp_partial)
109302b6de01Sstephen hemminger 			pb += packet->rmsg_pgcnt;
109402b6de01Sstephen hemminger 
1095846da38dSTianyu Lan 		ret = netvsc_dma_map(ndev_ctx->device_ctx, packet, pb);
1096846da38dSTianyu Lan 		if (ret) {
1097846da38dSTianyu Lan 			ret = -EAGAIN;
1098846da38dSTianyu Lan 			goto exit;
1099846da38dSTianyu Lan 		}
1100846da38dSTianyu Lan 
11015a668d8cSstephen hemminger 		ret = vmbus_sendpacket_pagebuffer(out_channel,
110202b6de01Sstephen hemminger 						  pb, packet->page_buf_cnt,
11035a668d8cSstephen hemminger 						  &nvmsg, sizeof(nvmsg),
11045a668d8cSstephen hemminger 						  req_id);
1105846da38dSTianyu Lan 
1106846da38dSTianyu Lan 		if (ret)
1107846da38dSTianyu Lan 			netvsc_dma_unmap(ndev_ctx->device_ctx, packet);
110895fa0405SHaiyang Zhang 	} else {
11095dd0fb9bSstephen hemminger 		ret = vmbus_sendpacket(out_channel,
11105dd0fb9bSstephen hemminger 				       &nvmsg, sizeof(nvmsg),
11115dd0fb9bSstephen hemminger 				       req_id, VM_PKT_DATA_INBAND,
11123454323cSStephen Hemminger 				       VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED);
111395fa0405SHaiyang Zhang 	}
111495fa0405SHaiyang Zhang 
1115846da38dSTianyu Lan exit:
11161d06825bSHaiyang Zhang 	if (ret == 0) {
1117b8b835a8Sstephen hemminger 		atomic_inc_return(&nvchan->queue_sends);
11185b54dac8SHaiyang Zhang 
111909af87d1SSimon Xiao 		if (ring_avail < RING_AVAIL_PERCENT_LOWATER) {
1120b8b835a8Sstephen hemminger 			netif_tx_stop_queue(txq);
112109af87d1SSimon Xiao 			ndev_ctx->eth_stats.stop_queue++;
112209af87d1SSimon Xiao 		}
11231d06825bSHaiyang Zhang 	} else if (ret == -EAGAIN) {
1124b8b835a8Sstephen hemminger 		netif_tx_stop_queue(txq);
112509af87d1SSimon Xiao 		ndev_ctx->eth_stats.stop_queue++;
11261d06825bSHaiyang Zhang 	} else {
11274a2176c6Sstephen hemminger 		netdev_err(ndev,
11284a2176c6Sstephen hemminger 			   "Unable to send packet pages %u len %u, ret %d\n",
11294a2176c6Sstephen hemminger 			   packet->page_buf_cnt, packet->total_data_buflen,
11304a2176c6Sstephen hemminger 			   ret);
11311d06825bSHaiyang Zhang 	}
113295fa0405SHaiyang Zhang 
113393aa4792SHaiyang Zhang 	if (netif_tx_queue_stopped(txq) &&
113493aa4792SHaiyang Zhang 	    atomic_read(&nvchan->queue_sends) < 1 &&
113593aa4792SHaiyang Zhang 	    !net_device->tx_disable) {
113693aa4792SHaiyang Zhang 		netif_tx_wake_queue(txq);
113793aa4792SHaiyang Zhang 		ndev_ctx->eth_stats.wake_queue++;
113893aa4792SHaiyang Zhang 		if (ret == -EAGAIN)
113993aa4792SHaiyang Zhang 			ret = -ENOSPC;
114093aa4792SHaiyang Zhang 	}
114193aa4792SHaiyang Zhang 
11427c3877f2SHaiyang Zhang 	return ret;
11437c3877f2SHaiyang Zhang }
11447c3877f2SHaiyang Zhang 
1145c85e4924SHaiyang Zhang /* Move packet out of multi send data (msd), and clear msd */
move_pkt_msd(struct hv_netvsc_packet ** msd_send,struct sk_buff ** msd_skb,struct multi_send_data * msdp)1146c85e4924SHaiyang Zhang static inline void move_pkt_msd(struct hv_netvsc_packet **msd_send,
1147c85e4924SHaiyang Zhang 				struct sk_buff **msd_skb,
1148c85e4924SHaiyang Zhang 				struct multi_send_data *msdp)
1149c85e4924SHaiyang Zhang {
1150c85e4924SHaiyang Zhang 	*msd_skb = msdp->skb;
1151c85e4924SHaiyang Zhang 	*msd_send = msdp->pkt;
1152c85e4924SHaiyang Zhang 	msdp->skb = NULL;
1153c85e4924SHaiyang Zhang 	msdp->pkt = NULL;
1154c85e4924SHaiyang Zhang 	msdp->count = 0;
1155c85e4924SHaiyang Zhang }
1156c85e4924SHaiyang Zhang 
11572a926f79Sstephen hemminger /* RCU already held by caller */
1158bd49fea7SShachar Raindel /* Batching/bouncing logic is designed to attempt to optimize
1159bd49fea7SShachar Raindel  * performance.
1160bd49fea7SShachar Raindel  *
1161bd49fea7SShachar Raindel  * For small, non-LSO packets we copy the packet to a send buffer
1162bd49fea7SShachar Raindel  * which is pre-registered with the Hyper-V side. This enables the
1163bd49fea7SShachar Raindel  * hypervisor to avoid remapping the aperture to access the packet
1164bd49fea7SShachar Raindel  * descriptor and data.
1165bd49fea7SShachar Raindel  *
1166bd49fea7SShachar Raindel  * If we already started using a buffer and the netdev is transmitting
1167bd49fea7SShachar Raindel  * a burst of packets, keep on copying into the buffer until it is
1168bd49fea7SShachar Raindel  * full or we are done collecting a burst. If there is an existing
1169bd49fea7SShachar Raindel  * buffer with space for the RNDIS descriptor but not the packet, copy
1170bd49fea7SShachar Raindel  * the RNDIS descriptor to the buffer, keeping the packet in place.
1171bd49fea7SShachar Raindel  *
1172bd49fea7SShachar Raindel  * If we do batching and send more than one packet using a single
1173bd49fea7SShachar Raindel  * NetVSC message, free the SKBs of the packets copied, except for the
1174bd49fea7SShachar Raindel  * last packet. This is done to streamline the handling of the case
1175bd49fea7SShachar Raindel  * where the last packet only had the RNDIS descriptor copied to the
1176bd49fea7SShachar Raindel  * send buffer, with the data pointers included in the NetVSC message.
1177bd49fea7SShachar Raindel  */
netvsc_send(struct net_device * ndev,struct hv_netvsc_packet * packet,struct rndis_message * rndis_msg,struct hv_page_buffer * pb,struct sk_buff * skb,bool xdp_tx)1178cfd8afd9SStephen Hemminger int netvsc_send(struct net_device *ndev,
117924476760SKY Srinivasan 		struct hv_netvsc_packet *packet,
1180a9f2e2d6SKY Srinivasan 		struct rndis_message *rndis_msg,
118102b6de01Sstephen hemminger 		struct hv_page_buffer *pb,
1182351e1581SHaiyang Zhang 		struct sk_buff *skb,
1183351e1581SHaiyang Zhang 		bool xdp_tx)
11847c3877f2SHaiyang Zhang {
1185cfd8afd9SStephen Hemminger 	struct net_device_context *ndev_ctx = netdev_priv(ndev);
11863962981fSstephen hemminger 	struct netvsc_device *net_device
1187867047c4Sstephen hemminger 		= rcu_dereference_bh(ndev_ctx->nvdev);
11882a926f79Sstephen hemminger 	struct hv_device *device = ndev_ctx->device_ctx;
11896c4c137eSStephen Hemminger 	int ret = 0;
1190b8b835a8Sstephen hemminger 	struct netvsc_channel *nvchan;
11917c3877f2SHaiyang Zhang 	u32 pktlen = packet->total_data_buflen, msd_len = 0;
11927c3877f2SHaiyang Zhang 	unsigned int section_index = NETVSC_INVALID_INDEX;
11937c3877f2SHaiyang Zhang 	struct multi_send_data *msdp;
11947c3877f2SHaiyang Zhang 	struct hv_netvsc_packet *msd_send = NULL, *cur_send = NULL;
1195c85e4924SHaiyang Zhang 	struct sk_buff *msd_skb = NULL;
1196cfd8afd9SStephen Hemminger 	bool try_batch, xmit_more;
11977c3877f2SHaiyang Zhang 
1198592b4fe8Sstephen hemminger 	/* If device is rescinded, return error and packet will get dropped. */
11992a926f79Sstephen hemminger 	if (unlikely(!net_device || net_device->destroy))
12007c3877f2SHaiyang Zhang 		return -ENODEV;
12017c3877f2SHaiyang Zhang 
1202b8b835a8Sstephen hemminger 	nvchan = &net_device->chan_table[packet->q_idx];
12037c3877f2SHaiyang Zhang 	packet->send_buf_index = NETVSC_INVALID_INDEX;
1204aa0a34beSHaiyang Zhang 	packet->cp_partial = false;
12057c3877f2SHaiyang Zhang 
1206351e1581SHaiyang Zhang 	/* Send a control message or XDP packet directly without accessing
1207351e1581SHaiyang Zhang 	 * msd (Multi-Send Data) field which may be changed during data packet
1208351e1581SHaiyang Zhang 	 * processing.
1209cf8190e4SHaiyang Zhang 	 */
1210351e1581SHaiyang Zhang 	if (!skb || xdp_tx)
121112f69661SStephen Hemminger 		return netvsc_send_pkt(device, packet, net_device, pb, skb);
1212cf8190e4SHaiyang Zhang 
12137c3877f2SHaiyang Zhang 	/* batch packets in send buffer if possible */
1214b8b835a8Sstephen hemminger 	msdp = &nvchan->msd;
12157c3877f2SHaiyang Zhang 	if (msdp->pkt)
12167c3877f2SHaiyang Zhang 		msd_len = msdp->pkt->total_data_buflen;
12177c3877f2SHaiyang Zhang 
1218ebc1dcf6Sstephen hemminger 	try_batch =  msd_len > 0 && msdp->count < net_device->max_pkt;
1219aa0a34beSHaiyang Zhang 	if (try_batch && msd_len + pktlen + net_device->pkt_align <
12207c3877f2SHaiyang Zhang 	    net_device->send_section_size) {
12217c3877f2SHaiyang Zhang 		section_index = msdp->pkt->send_buf_index;
12227c3877f2SHaiyang Zhang 
1223aa0a34beSHaiyang Zhang 	} else if (try_batch && msd_len + packet->rmsg_size <
1224aa0a34beSHaiyang Zhang 		   net_device->send_section_size) {
1225aa0a34beSHaiyang Zhang 		section_index = msdp->pkt->send_buf_index;
1226aa0a34beSHaiyang Zhang 		packet->cp_partial = true;
1227aa0a34beSHaiyang Zhang 
1228ebc1dcf6Sstephen hemminger 	} else if (pktlen + net_device->pkt_align <
12297c3877f2SHaiyang Zhang 		   net_device->send_section_size) {
12307c3877f2SHaiyang Zhang 		section_index = netvsc_get_next_send_section(net_device);
1231cad5c197Sstephen hemminger 		if (unlikely(section_index == NETVSC_INVALID_INDEX)) {
1232cad5c197Sstephen hemminger 			++ndev_ctx->eth_stats.tx_send_full;
1233cad5c197Sstephen hemminger 		} else {
1234c85e4924SHaiyang Zhang 			move_pkt_msd(&msd_send, &msd_skb, msdp);
12357c3877f2SHaiyang Zhang 			msd_len = 0;
12367c3877f2SHaiyang Zhang 		}
12377c3877f2SHaiyang Zhang 	}
12387c3877f2SHaiyang Zhang 
1239cfd8afd9SStephen Hemminger 	/* Keep aggregating only if stack says more data is coming
1240cfd8afd9SStephen Hemminger 	 * and not doing mixed modes send and not flow blocked
1241cfd8afd9SStephen Hemminger 	 */
12426b16f9eeSFlorian Westphal 	xmit_more = netdev_xmit_more() &&
1243cfd8afd9SStephen Hemminger 		!packet->cp_partial &&
1244cfd8afd9SStephen Hemminger 		!netif_xmit_stopped(netdev_get_tx_queue(ndev, packet->q_idx));
1245cfd8afd9SStephen Hemminger 
12467c3877f2SHaiyang Zhang 	if (section_index != NETVSC_INVALID_INDEX) {
12477c3877f2SHaiyang Zhang 		netvsc_copy_to_send_buf(net_device,
12487c3877f2SHaiyang Zhang 					section_index, msd_len,
1249cfd8afd9SStephen Hemminger 					packet, rndis_msg, pb, xmit_more);
1250b08cc791SKY Srinivasan 
1251aa0a34beSHaiyang Zhang 		packet->send_buf_index = section_index;
1252aa0a34beSHaiyang Zhang 
1253aa0a34beSHaiyang Zhang 		if (packet->cp_partial) {
1254aa0a34beSHaiyang Zhang 			packet->page_buf_cnt -= packet->rmsg_pgcnt;
1255aa0a34beSHaiyang Zhang 			packet->total_data_buflen = msd_len + packet->rmsg_size;
1256aa0a34beSHaiyang Zhang 		} else {
1257aa0a34beSHaiyang Zhang 			packet->page_buf_cnt = 0;
1258aa0a34beSHaiyang Zhang 			packet->total_data_buflen += msd_len;
1259aa0a34beSHaiyang Zhang 		}
12607c3877f2SHaiyang Zhang 
1261793e3955Sstephen hemminger 		if (msdp->pkt) {
1262793e3955Sstephen hemminger 			packet->total_packets += msdp->pkt->total_packets;
1263793e3955Sstephen hemminger 			packet->total_bytes += msdp->pkt->total_bytes;
1264793e3955Sstephen hemminger 		}
1265793e3955Sstephen hemminger 
1266c85e4924SHaiyang Zhang 		if (msdp->skb)
126717db4bceSStephen Hemminger 			dev_consume_skb_any(msdp->skb);
1268ee90b812SHaiyang Zhang 
1269cfd8afd9SStephen Hemminger 		if (xmit_more) {
1270c85e4924SHaiyang Zhang 			msdp->skb = skb;
12717c3877f2SHaiyang Zhang 			msdp->pkt = packet;
12727c3877f2SHaiyang Zhang 			msdp->count++;
12737c3877f2SHaiyang Zhang 		} else {
12747c3877f2SHaiyang Zhang 			cur_send = packet;
1275c85e4924SHaiyang Zhang 			msdp->skb = NULL;
12767c3877f2SHaiyang Zhang 			msdp->pkt = NULL;
12777c3877f2SHaiyang Zhang 			msdp->count = 0;
12787c3877f2SHaiyang Zhang 		}
12797c3877f2SHaiyang Zhang 	} else {
1280c85e4924SHaiyang Zhang 		move_pkt_msd(&msd_send, &msd_skb, msdp);
12817c3877f2SHaiyang Zhang 		cur_send = packet;
12827c3877f2SHaiyang Zhang 	}
12837c3877f2SHaiyang Zhang 
12847c3877f2SHaiyang Zhang 	if (msd_send) {
12856c4c137eSStephen Hemminger 		int m_ret = netvsc_send_pkt(device, msd_send, net_device,
12860a1275caSVitaly Kuznetsov 					    NULL, msd_skb);
12877c3877f2SHaiyang Zhang 
12887c3877f2SHaiyang Zhang 		if (m_ret != 0) {
12897c3877f2SHaiyang Zhang 			netvsc_free_send_slot(net_device,
12907c3877f2SHaiyang Zhang 					      msd_send->send_buf_index);
1291c85e4924SHaiyang Zhang 			dev_kfree_skb_any(msd_skb);
12927c3877f2SHaiyang Zhang 		}
12937c3877f2SHaiyang Zhang 	}
12947c3877f2SHaiyang Zhang 
12957c3877f2SHaiyang Zhang 	if (cur_send)
12960a1275caSVitaly Kuznetsov 		ret = netvsc_send_pkt(device, cur_send, net_device, pb, skb);
12977c3877f2SHaiyang Zhang 
12987aab5159SJerry Snitselaar 	if (ret != 0 && section_index != NETVSC_INVALID_INDEX)
1299d953ca4dSHaiyang Zhang 		netvsc_free_send_slot(net_device, section_index);
1300d953ca4dSHaiyang Zhang 
130195fa0405SHaiyang Zhang 	return ret;
130295fa0405SHaiyang Zhang }
130395fa0405SHaiyang Zhang 
13047426b1a5Sstephen hemminger /* Send pending recv completions */
send_recv_completions(struct net_device * ndev,struct netvsc_device * nvdev,struct netvsc_channel * nvchan)1305cad5c197Sstephen hemminger static int send_recv_completions(struct net_device *ndev,
1306cad5c197Sstephen hemminger 				 struct netvsc_device *nvdev,
1307cad5c197Sstephen hemminger 				 struct netvsc_channel *nvchan)
130895fa0405SHaiyang Zhang {
13097426b1a5Sstephen hemminger 	struct multi_recv_comp *mrc = &nvchan->mrc;
13107426b1a5Sstephen hemminger 	struct recv_comp_msg {
13117426b1a5Sstephen hemminger 		struct nvsp_message_header hdr;
13127426b1a5Sstephen hemminger 		u32 status;
13137426b1a5Sstephen hemminger 	}  __packed;
13147426b1a5Sstephen hemminger 	struct recv_comp_msg msg = {
13157426b1a5Sstephen hemminger 		.hdr.msg_type = NVSP_MSG1_TYPE_SEND_RNDIS_PKT_COMPLETE,
13167426b1a5Sstephen hemminger 	};
131795fa0405SHaiyang Zhang 	int ret;
131895fa0405SHaiyang Zhang 
13197426b1a5Sstephen hemminger 	while (mrc->first != mrc->next) {
13207426b1a5Sstephen hemminger 		const struct recv_comp_data *rcd
13217426b1a5Sstephen hemminger 			= mrc->slots + mrc->first;
132295fa0405SHaiyang Zhang 
13237426b1a5Sstephen hemminger 		msg.status = rcd->status;
13247426b1a5Sstephen hemminger 		ret = vmbus_sendpacket(nvchan->channel, &msg, sizeof(msg),
13257426b1a5Sstephen hemminger 				       rcd->tid, VM_PKT_COMP, 0);
1326cad5c197Sstephen hemminger 		if (unlikely(ret)) {
1327cad5c197Sstephen hemminger 			struct net_device_context *ndev_ctx = netdev_priv(ndev);
1328cad5c197Sstephen hemminger 
1329cad5c197Sstephen hemminger 			++ndev_ctx->eth_stats.rx_comp_busy;
1330c0b558e5SHaiyang Zhang 			return ret;
1331cad5c197Sstephen hemminger 		}
13327426b1a5Sstephen hemminger 
13337426b1a5Sstephen hemminger 		if (++mrc->first == nvdev->recv_completion_cnt)
13347426b1a5Sstephen hemminger 			mrc->first = 0;
133595fa0405SHaiyang Zhang 	}
1336c0b558e5SHaiyang Zhang 
13377426b1a5Sstephen hemminger 	/* receive completion ring has been emptied */
13387426b1a5Sstephen hemminger 	if (unlikely(nvdev->destroy))
13397426b1a5Sstephen hemminger 		wake_up(&nvdev->wait_drain);
13407426b1a5Sstephen hemminger 
13417426b1a5Sstephen hemminger 	return 0;
13427426b1a5Sstephen hemminger }
13437426b1a5Sstephen hemminger 
13447426b1a5Sstephen hemminger /* Count how many receive completions are outstanding */
recv_comp_slot_avail(const struct netvsc_device * nvdev,const struct multi_recv_comp * mrc,u32 * filled,u32 * avail)13457426b1a5Sstephen hemminger static void recv_comp_slot_avail(const struct netvsc_device *nvdev,
13467426b1a5Sstephen hemminger 				 const struct multi_recv_comp *mrc,
1347c0b558e5SHaiyang Zhang 				 u32 *filled, u32 *avail)
1348c0b558e5SHaiyang Zhang {
13497426b1a5Sstephen hemminger 	u32 count = nvdev->recv_completion_cnt;
1350c0b558e5SHaiyang Zhang 
13517426b1a5Sstephen hemminger 	if (mrc->next >= mrc->first)
13527426b1a5Sstephen hemminger 		*filled = mrc->next - mrc->first;
13537426b1a5Sstephen hemminger 	else
13547426b1a5Sstephen hemminger 		*filled = (count - mrc->first) + mrc->next;
1355c0b558e5SHaiyang Zhang 
13567426b1a5Sstephen hemminger 	*avail = count - *filled - 1;
135795fa0405SHaiyang Zhang }
1358c0b558e5SHaiyang Zhang 
13597426b1a5Sstephen hemminger /* Add receive complete to ring to send to host. */
enq_receive_complete(struct net_device * ndev,struct netvsc_device * nvdev,u16 q_idx,u64 tid,u32 status)13607426b1a5Sstephen hemminger static void enq_receive_complete(struct net_device *ndev,
13617426b1a5Sstephen hemminger 				 struct netvsc_device *nvdev, u16 q_idx,
13627426b1a5Sstephen hemminger 				 u64 tid, u32 status)
1363c0b558e5SHaiyang Zhang {
13647426b1a5Sstephen hemminger 	struct netvsc_channel *nvchan = &nvdev->chan_table[q_idx];
13657426b1a5Sstephen hemminger 	struct multi_recv_comp *mrc = &nvchan->mrc;
13667426b1a5Sstephen hemminger 	struct recv_comp_data *rcd;
1367c0b558e5SHaiyang Zhang 	u32 filled, avail;
1368c0b558e5SHaiyang Zhang 
13697426b1a5Sstephen hemminger 	recv_comp_slot_avail(nvdev, mrc, &filled, &avail);
1370c0b558e5SHaiyang Zhang 
13717426b1a5Sstephen hemminger 	if (unlikely(filled > NAPI_POLL_WEIGHT)) {
1372cad5c197Sstephen hemminger 		send_recv_completions(ndev, nvdev, nvchan);
13737426b1a5Sstephen hemminger 		recv_comp_slot_avail(nvdev, mrc, &filled, &avail);
1374c0b558e5SHaiyang Zhang 	}
1375c0b558e5SHaiyang Zhang 
13767426b1a5Sstephen hemminger 	if (unlikely(!avail)) {
13777426b1a5Sstephen hemminger 		netdev_err(ndev, "Recv_comp full buf q:%hd, tid:%llx\n",
13787426b1a5Sstephen hemminger 			   q_idx, tid);
13797426b1a5Sstephen hemminger 		return;
1380c0b558e5SHaiyang Zhang 	}
1381c0b558e5SHaiyang Zhang 
13827426b1a5Sstephen hemminger 	rcd = mrc->slots + mrc->next;
13837426b1a5Sstephen hemminger 	rcd->tid = tid;
13847426b1a5Sstephen hemminger 	rcd->status = status;
1385c0b558e5SHaiyang Zhang 
13867426b1a5Sstephen hemminger 	if (++mrc->next == nvdev->recv_completion_cnt)
13877426b1a5Sstephen hemminger 		mrc->next = 0;
138895fa0405SHaiyang Zhang }
138995fa0405SHaiyang Zhang 
netvsc_receive(struct net_device * ndev,struct netvsc_device * net_device,struct netvsc_channel * nvchan,const struct vmpacket_descriptor * desc)139015a863bfSstephen hemminger static int netvsc_receive(struct net_device *ndev,
1391dc54a08cSstephen hemminger 			  struct netvsc_device *net_device,
1392c8e4eff4SHaiyang Zhang 			  struct netvsc_channel *nvchan,
139344144185SAndres Beltran 			  const struct vmpacket_descriptor *desc)
139495fa0405SHaiyang Zhang {
1395c347b927SStephen Hemminger 	struct net_device_context *net_device_ctx = netdev_priv(ndev);
1396c8e4eff4SHaiyang Zhang 	struct vmbus_channel *channel = nvchan->channel;
1397f3dd3f47Sstephen hemminger 	const struct vmtransfer_page_packet_header *vmxferpage_packet
1398f3dd3f47Sstephen hemminger 		= container_of(desc, const struct vmtransfer_page_packet_header, d);
139944144185SAndres Beltran 	const struct nvsp_message *nvsp = hv_pkt_data(desc);
140044144185SAndres Beltran 	u32 msglen = hv_pkt_datalen(desc);
140115a863bfSstephen hemminger 	u16 q_idx = channel->offermsg.offer.sub_channel_index;
1402dc54a08cSstephen hemminger 	char *recv_buf = net_device->recv_buf;
14034baab261SHaiyang Zhang 	u32 status = NVSP_STAT_SUCCESS;
140445326342SHaiyang Zhang 	int i;
140545326342SHaiyang Zhang 	int count = 0;
140695fa0405SHaiyang Zhang 
140744144185SAndres Beltran 	/* Ensure packet is big enough to read header fields */
140844144185SAndres Beltran 	if (msglen < sizeof(struct nvsp_message_header)) {
140944144185SAndres Beltran 		netif_err(net_device_ctx, rx_err, ndev,
141044144185SAndres Beltran 			  "invalid nvsp header, length too small: %u\n",
141144144185SAndres Beltran 			  msglen);
141244144185SAndres Beltran 		return 0;
141344144185SAndres Beltran 	}
141444144185SAndres Beltran 
141595fa0405SHaiyang Zhang 	/* Make sure this is a valid nvsp packet */
1416dc54a08cSstephen hemminger 	if (unlikely(nvsp->hdr.msg_type != NVSP_MSG1_TYPE_SEND_RNDIS_PKT)) {
1417dc54a08cSstephen hemminger 		netif_err(net_device_ctx, rx_err, ndev,
1418dc54a08cSstephen hemminger 			  "Unknown nvsp packet type received %u\n",
1419dc54a08cSstephen hemminger 			  nvsp->hdr.msg_type);
142015a863bfSstephen hemminger 		return 0;
142195fa0405SHaiyang Zhang 	}
142295fa0405SHaiyang Zhang 
142344144185SAndres Beltran 	/* Validate xfer page pkt header */
142444144185SAndres Beltran 	if ((desc->offset8 << 3) < sizeof(struct vmtransfer_page_packet_header)) {
142544144185SAndres Beltran 		netif_err(net_device_ctx, rx_err, ndev,
142644144185SAndres Beltran 			  "Invalid xfer page pkt, offset too small: %u\n",
142744144185SAndres Beltran 			  desc->offset8 << 3);
142844144185SAndres Beltran 		return 0;
142944144185SAndres Beltran 	}
143044144185SAndres Beltran 
1431dc54a08cSstephen hemminger 	if (unlikely(vmxferpage_packet->xfer_pageset_id != NETVSC_RECEIVE_BUFFER_ID)) {
1432dc54a08cSstephen hemminger 		netif_err(net_device_ctx, rx_err, ndev,
1433dc54a08cSstephen hemminger 			  "Invalid xfer page set id - expecting %x got %x\n",
1434dc54a08cSstephen hemminger 			  NETVSC_RECEIVE_BUFFER_ID,
143595fa0405SHaiyang Zhang 			  vmxferpage_packet->xfer_pageset_id);
143615a863bfSstephen hemminger 		return 0;
143795fa0405SHaiyang Zhang 	}
143895fa0405SHaiyang Zhang 
14394baab261SHaiyang Zhang 	count = vmxferpage_packet->range_cnt;
144095fa0405SHaiyang Zhang 
144144144185SAndres Beltran 	/* Check count for a valid value */
144244144185SAndres Beltran 	if (NETVSC_XFER_HEADER_SIZE(count) > desc->offset8 << 3) {
144344144185SAndres Beltran 		netif_err(net_device_ctx, rx_err, ndev,
144444144185SAndres Beltran 			  "Range count is not valid: %d\n",
144544144185SAndres Beltran 			  count);
144644144185SAndres Beltran 		return 0;
144744144185SAndres Beltran 	}
144844144185SAndres Beltran 
144995fa0405SHaiyang Zhang 	/* Each range represents 1 RNDIS pkt that contains 1 ethernet frame */
14504baab261SHaiyang Zhang 	for (i = 0; i < count; i++) {
1451c5d24bddSHaiyang Zhang 		u32 offset = vmxferpage_packet->ranges[i].byte_offset;
1452dc54a08cSstephen hemminger 		u32 buflen = vmxferpage_packet->ranges[i].byte_count;
1453c5d24bddSHaiyang Zhang 		void *data;
14545c71dadbSHaiyang Zhang 		int ret;
145595fa0405SHaiyang Zhang 
145644144185SAndres Beltran 		if (unlikely(offset > net_device->recv_buf_size ||
145744144185SAndres Beltran 			     buflen > net_device->recv_buf_size - offset)) {
1458c8e4eff4SHaiyang Zhang 			nvchan->rsc.cnt = 0;
1459c5d24bddSHaiyang Zhang 			status = NVSP_STAT_FAIL;
1460c5d24bddSHaiyang Zhang 			netif_err(net_device_ctx, rx_err, ndev,
1461c5d24bddSHaiyang Zhang 				  "Packet offset:%u + len:%u too big\n",
1462c5d24bddSHaiyang Zhang 				  offset, buflen);
1463c5d24bddSHaiyang Zhang 
1464c5d24bddSHaiyang Zhang 			continue;
1465c5d24bddSHaiyang Zhang 		}
1466c5d24bddSHaiyang Zhang 
14670ba35fe9SAndrea Parri (Microsoft) 		/* We're going to copy (sections of) the packet into nvchan->recv_buf;
14680ba35fe9SAndrea Parri (Microsoft) 		 * make sure that nvchan->recv_buf is large enough to hold the packet.
14690ba35fe9SAndrea Parri (Microsoft) 		 */
14700ba35fe9SAndrea Parri (Microsoft) 		if (unlikely(buflen > net_device->recv_section_size)) {
14710ba35fe9SAndrea Parri (Microsoft) 			nvchan->rsc.cnt = 0;
14720ba35fe9SAndrea Parri (Microsoft) 			status = NVSP_STAT_FAIL;
14730ba35fe9SAndrea Parri (Microsoft) 			netif_err(net_device_ctx, rx_err, ndev,
14740ba35fe9SAndrea Parri (Microsoft) 				  "Packet too big: buflen=%u recv_section_size=%u\n",
14750ba35fe9SAndrea Parri (Microsoft) 				  buflen, net_device->recv_section_size);
14760ba35fe9SAndrea Parri (Microsoft) 
14770ba35fe9SAndrea Parri (Microsoft) 			continue;
14780ba35fe9SAndrea Parri (Microsoft) 		}
14790ba35fe9SAndrea Parri (Microsoft) 
1480c5d24bddSHaiyang Zhang 		data = recv_buf + offset;
1481c5d24bddSHaiyang Zhang 
1482c8e4eff4SHaiyang Zhang 		nvchan->rsc.is_last = (i == count - 1);
1483c8e4eff4SHaiyang Zhang 
1484ec966381SStephen Hemminger 		trace_rndis_recv(ndev, q_idx, data);
1485ec966381SStephen Hemminger 
148695fa0405SHaiyang Zhang 		/* Pass it to the upper layer */
14875c71dadbSHaiyang Zhang 		ret = rndis_filter_receive(ndev, net_device,
1488c8e4eff4SHaiyang Zhang 					   nvchan, data, buflen);
14895c71dadbSHaiyang Zhang 
149012bc8dfbSAndrea Parri (Microsoft) 		if (unlikely(ret != NVSP_STAT_SUCCESS)) {
149112bc8dfbSAndrea Parri (Microsoft) 			/* Drop incomplete packet */
149212bc8dfbSAndrea Parri (Microsoft) 			nvchan->rsc.cnt = 0;
14935c71dadbSHaiyang Zhang 			status = NVSP_STAT_FAIL;
149495fa0405SHaiyang Zhang 		}
149512bc8dfbSAndrea Parri (Microsoft) 	}
149695fa0405SHaiyang Zhang 
14977426b1a5Sstephen hemminger 	enq_receive_complete(ndev, net_device, q_idx,
14987426b1a5Sstephen hemminger 			     vmxferpage_packet->d.trans_id, status);
149915a863bfSstephen hemminger 
150015a863bfSstephen hemminger 	return count;
150195fa0405SHaiyang Zhang }
150295fa0405SHaiyang Zhang 
/* Copy the send indirection table carried in @nvmsg into the device
 * context's tx_table.
 *
 * The message is ignored (with an error logged) if it is too short to
 * hold the table descriptor, if the entry count is not
 * VRSS_SEND_TAB_SIZE, or if the table would extend past @msglen.
 */
static void netvsc_send_table(struct net_device *ndev,
			      struct netvsc_device *nvscdev,
			      const struct nvsp_message *nvmsg,
			      u32 msglen)
{
	struct net_device_context *net_device_ctx = netdev_priv(ndev);
	const size_t v6_tab_offset = sizeof(struct nvsp_message_header) +
				     sizeof(union nvsp_6_message_uber);
	const u32 *table;
	size_t tab_bytes;
	u32 entries, tab_offset, idx;

	/* Ensure packet is big enough to read send_table fields */
	if (msglen < sizeof(struct nvsp_message_header) +
		     sizeof(struct nvsp_5_send_indirect_table)) {
		netdev_err(ndev, "nvsp_v5_msg length too small: %u\n", msglen);
		return;
	}

	entries = nvmsg->msg.v5_msg.send_table.count;
	tab_offset = nvmsg->msg.v5_msg.send_table.offset;

	if (entries != VRSS_SEND_TAB_SIZE) {
		netdev_err(ndev, "Received wrong send-table size:%u\n", entries);
		return;
	}

	tab_bytes = entries * sizeof(u32);

	/* If negotiated version <= NVSP_PROTOCOL_VERSION_6, the offset may be
	 * wrong due to a host bug. So fix the offset here.
	 */
	if (nvscdev->nvsp_version <= NVSP_PROTOCOL_VERSION_6 &&
	    msglen >= v6_tab_offset + tab_bytes)
		tab_offset = v6_tab_offset;

	/* Boundary check for all versions */
	if (msglen < tab_bytes || tab_offset > msglen - tab_bytes) {
		netdev_err(ndev, "Received send-table offset too big:%u\n",
			   tab_offset);
		return;
	}

	table = (const void *)nvmsg + tab_offset;

	for (idx = 0; idx < entries; idx++)
		net_device_ctx->tx_table[idx] = table[idx];
}
15485b54dac8SHaiyang Zhang 
/* Record the VF association state announced in @nvmsg.
 *
 * Stores the "allocated" flag and serial number in the device context,
 * completes vf_add when a VF has been allocated, and logs the change.
 * Messages too short to contain the association payload are ignored
 * with an error.
 */
static void netvsc_send_vf(struct net_device *ndev,
			   const struct nvsp_message *nvmsg,
			   u32 msglen)
{
	struct net_device_context *net_device_ctx = netdev_priv(ndev);
	const char *action;

	/* Ensure packet is big enough to read its fields */
	if (msglen < sizeof(struct nvsp_message_header) +
		     sizeof(struct nvsp_4_send_vf_association)) {
		netdev_err(ndev, "nvsp_v4_msg length too small: %u\n", msglen);
		return;
	}

	net_device_ctx->vf_alloc = nvmsg->msg.v4_msg.vf_assoc.allocated;
	net_device_ctx->vf_serial = nvmsg->msg.v4_msg.vf_assoc.serial;

	/* Signal anyone waiting for the VF to show up. */
	if (net_device_ctx->vf_alloc)
		complete(&net_device_ctx->vf_add);

	if (net_device_ctx->vf_alloc)
		action = "added";
	else
		action = "removed";

	netdev_info(ndev, "VF slot %u %s\n",
		    net_device_ctx->vf_serial, action);
}
157271790a27SHaiyang Zhang 
netvsc_receive_inband(struct net_device * ndev,struct netvsc_device * nvscdev,const struct vmpacket_descriptor * desc)1573c347b927SStephen Hemminger static void netvsc_receive_inband(struct net_device *ndev,
1574171c1fd9SHaiyang Zhang 				  struct netvsc_device *nvscdev,
157544144185SAndres Beltran 				  const struct vmpacket_descriptor *desc)
157671790a27SHaiyang Zhang {
157744144185SAndres Beltran 	const struct nvsp_message *nvmsg = hv_pkt_data(desc);
157844144185SAndres Beltran 	u32 msglen = hv_pkt_datalen(desc);
157944144185SAndres Beltran 
158044144185SAndres Beltran 	/* Ensure packet is big enough to read header fields */
158144144185SAndres Beltran 	if (msglen < sizeof(struct nvsp_message_header)) {
158244144185SAndres Beltran 		netdev_err(ndev, "inband nvsp_message length too small: %u\n", msglen);
158344144185SAndres Beltran 		return;
158444144185SAndres Beltran 	}
158544144185SAndres Beltran 
158671790a27SHaiyang Zhang 	switch (nvmsg->hdr.msg_type) {
158771790a27SHaiyang Zhang 	case NVSP_MSG5_TYPE_SEND_INDIRECTION_TABLE:
1588171c1fd9SHaiyang Zhang 		netvsc_send_table(ndev, nvscdev, nvmsg, msglen);
158971790a27SHaiyang Zhang 		break;
159071790a27SHaiyang Zhang 
159171790a27SHaiyang Zhang 	case NVSP_MSG4_TYPE_SEND_VF_ASSOCIATION:
159296854bbdSAndrea Parri (Microsoft) 		if (hv_is_isolation_supported())
159396854bbdSAndrea Parri (Microsoft) 			netdev_err(ndev, "Ignore VF_ASSOCIATION msg from the host supporting isolation\n");
159496854bbdSAndrea Parri (Microsoft) 		else
159544144185SAndres Beltran 			netvsc_send_vf(ndev, nvmsg, msglen);
159671790a27SHaiyang Zhang 		break;
159771790a27SHaiyang Zhang 	}
159871790a27SHaiyang Zhang }
159971790a27SHaiyang Zhang 
netvsc_process_raw_pkt(struct hv_device * device,struct netvsc_channel * nvchan,struct netvsc_device * net_device,struct net_device * ndev,const struct vmpacket_descriptor * desc,int budget)160015a863bfSstephen hemminger static int netvsc_process_raw_pkt(struct hv_device *device,
1601c8e4eff4SHaiyang Zhang 				  struct netvsc_channel *nvchan,
160299a50bb1SK. Y. Srinivasan 				  struct netvsc_device *net_device,
160399a50bb1SK. Y. Srinivasan 				  struct net_device *ndev,
1604f9645430Sstephen hemminger 				  const struct vmpacket_descriptor *desc,
1605f9645430Sstephen hemminger 				  int budget)
160699a50bb1SK. Y. Srinivasan {
1607c8e4eff4SHaiyang Zhang 	struct vmbus_channel *channel = nvchan->channel;
1608c347b927SStephen Hemminger 	const struct nvsp_message *nvmsg = hv_pkt_data(desc);
160999a50bb1SK. Y. Srinivasan 
1610ec966381SStephen Hemminger 	trace_nvsp_recv(ndev, channel, nvmsg);
1611ec966381SStephen Hemminger 
161299a50bb1SK. Y. Srinivasan 	switch (desc->type) {
161399a50bb1SK. Y. Srinivasan 	case VM_PKT_COMP:
161444144185SAndres Beltran 		netvsc_send_completion(ndev, net_device, channel, desc, budget);
161599a50bb1SK. Y. Srinivasan 		break;
161699a50bb1SK. Y. Srinivasan 
161799a50bb1SK. Y. Srinivasan 	case VM_PKT_DATA_USING_XFER_PAGES:
161844144185SAndres Beltran 		return netvsc_receive(ndev, net_device, nvchan, desc);
161999a50bb1SK. Y. Srinivasan 
162099a50bb1SK. Y. Srinivasan 	case VM_PKT_DATA_INBAND:
162144144185SAndres Beltran 		netvsc_receive_inband(ndev, net_device, desc);
162299a50bb1SK. Y. Srinivasan 		break;
162399a50bb1SK. Y. Srinivasan 
162499a50bb1SK. Y. Srinivasan 	default:
162599a50bb1SK. Y. Srinivasan 		netdev_err(ndev, "unhandled packet type %d, tid %llx\n",
1626f4f1c23dSstephen hemminger 			   desc->type, desc->trans_id);
162799a50bb1SK. Y. Srinivasan 		break;
162899a50bb1SK. Y. Srinivasan 	}
162915a863bfSstephen hemminger 
163015a863bfSstephen hemminger 	return 0;
163115a863bfSstephen hemminger }
163215a863bfSstephen hemminger 
netvsc_channel_to_device(struct vmbus_channel * channel)163315a863bfSstephen hemminger static struct hv_device *netvsc_channel_to_device(struct vmbus_channel *channel)
163415a863bfSstephen hemminger {
163515a863bfSstephen hemminger 	struct vmbus_channel *primary = channel->primary_channel;
163615a863bfSstephen hemminger 
163715a863bfSstephen hemminger 	return primary ? primary->device_obj : channel->device_obj;
163815a863bfSstephen hemminger }
163915a863bfSstephen hemminger 
1640262b7f14Sstephen hemminger /* Network processing softirq
1641262b7f14Sstephen hemminger  * Process data in incoming ring buffer from host
1642262b7f14Sstephen hemminger  * Stops when ring is empty or budget is met or exceeded.
1643262b7f14Sstephen hemminger  */
netvsc_poll(struct napi_struct * napi,int budget)164415a863bfSstephen hemminger int netvsc_poll(struct napi_struct *napi, int budget)
164515a863bfSstephen hemminger {
164615a863bfSstephen hemminger 	struct netvsc_channel *nvchan
164715a863bfSstephen hemminger 		= container_of(napi, struct netvsc_channel, napi);
164835fbbccfSstephen hemminger 	struct netvsc_device *net_device = nvchan->net_device;
164915a863bfSstephen hemminger 	struct vmbus_channel *channel = nvchan->channel;
165015a863bfSstephen hemminger 	struct hv_device *device = netvsc_channel_to_device(channel);
165115a863bfSstephen hemminger 	struct net_device *ndev = hv_get_drvdata(device);
165215a863bfSstephen hemminger 	int work_done = 0;
16536b81b193SHaiyang Zhang 	int ret;
165415a863bfSstephen hemminger 
1655f4f1c23dSstephen hemminger 	/* If starting a new interval */
1656f4f1c23dSstephen hemminger 	if (!nvchan->desc)
1657f4f1c23dSstephen hemminger 		nvchan->desc = hv_pkt_iter_first(channel);
165815a863bfSstephen hemminger 
16591cb9d3b6SHaiyang Zhang 	nvchan->xdp_flush = false;
16601cb9d3b6SHaiyang Zhang 
1661f4f1c23dSstephen hemminger 	while (nvchan->desc && work_done < budget) {
1662c8e4eff4SHaiyang Zhang 		work_done += netvsc_process_raw_pkt(device, nvchan, net_device,
1663f9645430Sstephen hemminger 						    ndev, nvchan->desc, budget);
1664f4f1c23dSstephen hemminger 		nvchan->desc = hv_pkt_iter_next(channel, nvchan->desc);
166515a863bfSstephen hemminger 	}
166615a863bfSstephen hemminger 
16671cb9d3b6SHaiyang Zhang 	if (nvchan->xdp_flush)
16681cb9d3b6SHaiyang Zhang 		xdp_do_flush();
16691cb9d3b6SHaiyang Zhang 
16706b81b193SHaiyang Zhang 	/* Send any pending receive completions */
16716b81b193SHaiyang Zhang 	ret = send_recv_completions(ndev, net_device, nvchan);
16726b81b193SHaiyang Zhang 
16736b81b193SHaiyang Zhang 	/* If it did not exhaust NAPI budget this time
1674f4f1c23dSstephen hemminger 	 *  and not doing busy poll
1675f4e40363Sstephen hemminger 	 * then re-enable host interrupts
16766b81b193SHaiyang Zhang 	 *  and reschedule if ring is not empty
16776b81b193SHaiyang Zhang 	 *   or sending receive completion failed.
1678262b7f14Sstephen hemminger 	 */
16796b81b193SHaiyang Zhang 	if (work_done < budget &&
168015a863bfSstephen hemminger 	    napi_complete_done(napi, work_done) &&
16816b81b193SHaiyang Zhang 	    (ret || hv_end_read(&channel->inbound)) &&
1682d64e38aeSStephen Hemminger 	    napi_schedule_prep(napi)) {
16837426b1a5Sstephen hemminger 		hv_begin_read(&channel->inbound);
1684d64e38aeSStephen Hemminger 		__napi_schedule(napi);
16857426b1a5Sstephen hemminger 	}
1686f4f1c23dSstephen hemminger 
1687f4f1c23dSstephen hemminger 	/* Driver may overshoot since multiple packets per descriptor */
1688f4f1c23dSstephen hemminger 	return min(work_done, budget);
168999a50bb1SK. Y. Srinivasan }
169099a50bb1SK. Y. Srinivasan 
1691262b7f14Sstephen hemminger /* Call back when data is available in host ring buffer.
1692262b7f14Sstephen hemminger  * Processing is deferred until network softirq (NAPI)
1693262b7f14Sstephen hemminger  */
netvsc_channel_cb(void * context)16945b54dac8SHaiyang Zhang void netvsc_channel_cb(void *context)
169595fa0405SHaiyang Zhang {
16966de38af6Sstephen hemminger 	struct netvsc_channel *nvchan = context;
169743bf99ceSstephen hemminger 	struct vmbus_channel *channel = nvchan->channel;
169843bf99ceSstephen hemminger 	struct hv_ring_buffer_info *rbi = &channel->inbound;
169943bf99ceSstephen hemminger 
170043bf99ceSstephen hemminger 	/* preload first vmpacket descriptor */
170143bf99ceSstephen hemminger 	prefetch(hv_get_ring_buffer(rbi) + rbi->priv_read_index);
170295fa0405SHaiyang Zhang 
1703f4f1c23dSstephen hemminger 	if (napi_schedule_prep(&nvchan->napi)) {
170452d3b494SAdrian Vladu 		/* disable interrupts from host */
170543bf99ceSstephen hemminger 		hv_begin_read(rbi);
17060d6dd357Sstephen hemminger 
170768633edaSStephen Hemminger 		__napi_schedule_irqoff(&nvchan->napi);
1708f4f1c23dSstephen hemminger 	}
170995fa0405SHaiyang Zhang }
171095fa0405SHaiyang Zhang 
171195fa0405SHaiyang Zhang /*
171295fa0405SHaiyang Zhang  * netvsc_device_add - Callback when the device belonging to this
171395fa0405SHaiyang Zhang  * driver is added
171495fa0405SHaiyang Zhang  */
netvsc_device_add(struct hv_device * device,const struct netvsc_device_info * device_info)17159749fed5Sstephen hemminger struct netvsc_device *netvsc_device_add(struct hv_device *device,
17162c7f83caSstephen hemminger 				const struct netvsc_device_info *device_info)
171795fa0405SHaiyang Zhang {
171888098834SVitaly Kuznetsov 	int i, ret = 0;
171995fa0405SHaiyang Zhang 	struct netvsc_device *net_device;
172088098834SVitaly Kuznetsov 	struct net_device *ndev = hv_get_drvdata(device);
172188098834SVitaly Kuznetsov 	struct net_device_context *net_device_ctx = netdev_priv(ndev);
172295fa0405SHaiyang Zhang 
172388098834SVitaly Kuznetsov 	net_device = alloc_net_device();
1724b1c84927SDan Carpenter 	if (!net_device)
17259749fed5Sstephen hemminger 		return ERR_PTR(-ENOMEM);
172695fa0405SHaiyang Zhang 
17276b0cbe31SHaiyang Zhang 	for (i = 0; i < VRSS_SEND_TAB_SIZE; i++)
17286b0cbe31SHaiyang Zhang 		net_device_ctx->tx_table[i] = 0;
17296b0cbe31SHaiyang Zhang 
173015a863bfSstephen hemminger 	/* Because the device uses NAPI, all the interrupt batching and
173115a863bfSstephen hemminger 	 * control is done via Net softirq, not the channel handling
173215a863bfSstephen hemminger 	 */
173315a863bfSstephen hemminger 	set_channel_read_mode(device->channel, HV_CALL_ISR);
173415a863bfSstephen hemminger 
1735bffb1842SK. Y. Srinivasan 	/* If we're reopening the device we may have multiple queues, fill the
1736bffb1842SK. Y. Srinivasan 	 * chn_table with the default channel to use it before subchannels are
1737bffb1842SK. Y. Srinivasan 	 * opened.
1738bffb1842SK. Y. Srinivasan 	 * Initialize the channel state before we open;
1739bffb1842SK. Y. Srinivasan 	 * we can be interrupted as soon as we open the channel.
1740bffb1842SK. Y. Srinivasan 	 */
1741bffb1842SK. Y. Srinivasan 
1742bffb1842SK. Y. Srinivasan 	for (i = 0; i < VRSS_CHANNEL_MAX; i++) {
1743bffb1842SK. Y. Srinivasan 		struct netvsc_channel *nvchan = &net_device->chan_table[i];
1744bffb1842SK. Y. Srinivasan 
1745bffb1842SK. Y. Srinivasan 		nvchan->channel = device->channel;
174635fbbccfSstephen hemminger 		nvchan->net_device = net_device;
17474a0dee1fSFlorian Fainelli 		u64_stats_init(&nvchan->tx_stats.syncp);
17484a0dee1fSFlorian Fainelli 		u64_stats_init(&nvchan->rx_stats.syncp);
1749351e1581SHaiyang Zhang 
1750b02e5a0eSBjörn Töpel 		ret = xdp_rxq_info_reg(&nvchan->xdp_rxq, ndev, i, 0);
1751351e1581SHaiyang Zhang 
1752351e1581SHaiyang Zhang 		if (ret) {
1753351e1581SHaiyang Zhang 			netdev_err(ndev, "xdp_rxq_info_reg fail: %d\n", ret);
1754351e1581SHaiyang Zhang 			goto cleanup2;
1755351e1581SHaiyang Zhang 		}
1756351e1581SHaiyang Zhang 
1757351e1581SHaiyang Zhang 		ret = xdp_rxq_info_reg_mem_model(&nvchan->xdp_rxq,
1758351e1581SHaiyang Zhang 						 MEM_TYPE_PAGE_SHARED, NULL);
1759351e1581SHaiyang Zhang 
1760351e1581SHaiyang Zhang 		if (ret) {
1761351e1581SHaiyang Zhang 			netdev_err(ndev, "xdp reg_mem_model fail: %d\n", ret);
1762351e1581SHaiyang Zhang 			goto cleanup2;
1763351e1581SHaiyang Zhang 		}
1764bffb1842SK. Y. Srinivasan 	}
1765bffb1842SK. Y. Srinivasan 
17662be0f264Sstephen hemminger 	/* Enable NAPI handler before init callbacks */
1767b48b89f9SJakub Kicinski 	netif_napi_add(ndev, &net_device->chan_table[0].napi, netvsc_poll);
17682be0f264Sstephen hemminger 
176995fa0405SHaiyang Zhang 	/* Open the channel */
1770bf5fd8caSAndrea Parri (Microsoft) 	device->channel->next_request_id_callback = vmbus_next_request_id;
1771bf5fd8caSAndrea Parri (Microsoft) 	device->channel->request_addr_callback = vmbus_request_addr;
17724d18fcc9SAndres Beltran 	device->channel->rqstor_size = netvsc_rqstor_size(netvsc_ring_bytes);
1773adae1e93SAndres Beltran 	device->channel->max_pkt_size = NETVSC_MAX_PKT_SIZE;
1774adae1e93SAndres Beltran 
1775a7f99d0fSStephen Hemminger 	ret = vmbus_open(device->channel, netvsc_ring_bytes,
1776a7f99d0fSStephen Hemminger 			 netvsc_ring_bytes,  NULL, 0,
1777a7f99d0fSStephen Hemminger 			 netvsc_channel_cb, net_device->chan_table);
177895fa0405SHaiyang Zhang 
177995fa0405SHaiyang Zhang 	if (ret != 0) {
178095fa0405SHaiyang Zhang 		netdev_err(ndev, "unable to open channel: %d\n", ret);
178195fa0405SHaiyang Zhang 		goto cleanup;
178295fa0405SHaiyang Zhang 	}
178395fa0405SHaiyang Zhang 
178495fa0405SHaiyang Zhang 	/* Channel is opened */
178593ba2222SVitaly Kuznetsov 	netdev_dbg(ndev, "hv_netvsc channel opened successfully\n");
178695fa0405SHaiyang Zhang 
178715a863bfSstephen hemminger 	napi_enable(&net_device->chan_table[0].napi);
178888098834SVitaly Kuznetsov 
178995fa0405SHaiyang Zhang 	/* Connect with the NetVsp */
17908b532797Sstephen hemminger 	ret = netvsc_connect_vsp(device, net_device, device_info);
179195fa0405SHaiyang Zhang 	if (ret != 0) {
179295fa0405SHaiyang Zhang 		netdev_err(ndev,
179395fa0405SHaiyang Zhang 			"unable to connect to NetVSP - %d\n", ret);
179495fa0405SHaiyang Zhang 		goto close;
179595fa0405SHaiyang Zhang 	}
179695fa0405SHaiyang Zhang 
179712f69661SStephen Hemminger 	/* Writing nvdev pointer unlocks netvsc_send(), make sure chn_table is
179812f69661SStephen Hemminger 	 * populated.
179912f69661SStephen Hemminger 	 */
180012f69661SStephen Hemminger 	rcu_assign_pointer(net_device_ctx->nvdev, net_device);
180112f69661SStephen Hemminger 
18029749fed5Sstephen hemminger 	return net_device;
180395fa0405SHaiyang Zhang 
180495fa0405SHaiyang Zhang close:
180549393347Sstephen hemminger 	RCU_INIT_POINTER(net_device_ctx->nvdev, NULL);
180649393347Sstephen hemminger 	napi_disable(&net_device->chan_table[0].napi);
180715a863bfSstephen hemminger 
180895fa0405SHaiyang Zhang 	/* Now, we can close the channel safely */
180995fa0405SHaiyang Zhang 	vmbus_close(device->channel);
181095fa0405SHaiyang Zhang 
181195fa0405SHaiyang Zhang cleanup:
1812fcfb4a00SStephen Hemminger 	netif_napi_del(&net_device->chan_table[0].napi);
1813351e1581SHaiyang Zhang 
1814351e1581SHaiyang Zhang cleanup2:
1815545a8e79Sstephen hemminger 	free_netvsc_device(&net_device->rcu);
181695fa0405SHaiyang Zhang 
18179749fed5Sstephen hemminger 	return ERR_PTR(ret);
181895fa0405SHaiyang Zhang }
1819