1 /*
2  * Copyright (c) 2013, Cisco Systems, Inc. All rights reserved.
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and/or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  *
32  * Author: Upinder Malhi <umalhi@cisco.com>
33  * Author: Anant Deepak <anadeepa@cisco.com>
34  * Author: Cesare Cantu' <cantuc@cisco.com>
35  * Author: Jeff Squyres <jsquyres@cisco.com>
36  * Author: Kiran Thirumalai <kithirum@cisco.com>
37  * Author: Xuyang Wang <xuywang@cisco.com>
38  * Author: Reese Faucette <rfaucett@cisco.com>
39  *
40  */
41 
42 #include <linux/module.h>
43 #include <linux/inetdevice.h>
44 #include <linux/init.h>
45 #include <linux/slab.h>
46 #include <linux/errno.h>
47 #include <linux/pci.h>
48 #include <linux/netdevice.h>
49 
50 #include <rdma/ib_user_verbs.h>
51 #include <rdma/ib_addr.h>
52 
53 #include "usnic_abi.h"
54 #include "usnic_common_util.h"
55 #include "usnic_ib.h"
56 #include "usnic_ib_qp_grp.h"
57 #include "usnic_log.h"
58 #include "usnic_fwd.h"
59 #include "usnic_debugfs.h"
60 #include "usnic_ib_verbs.h"
61 #include "usnic_transport.h"
62 #include "usnic_uiom.h"
63 #include "usnic_ib_sysfs.h"
64 
/*
 * Log verbosity; exported as a writable module parameter further down in
 * this file (Off=0, Err=1, Info=2, Debug=3 per its parameter description).
 */
unsigned int usnic_log_lvl = USNIC_LOG_LVL_ERR;
/*
 * Module parameter described in this file as "Off=0, On=1 VF sharing
 * amongst QPs"; sharing is on by default.
 */
unsigned int usnic_ib_share_vf = 1;

/* Version banner, printed once by usnic_ib_init(). */
static const char usnic_version[] =
	DRV_NAME ": Cisco VIC (USNIC) Verbs Driver v"
	DRV_VERSION " (" DRV_RELDATE ")\n";

/*
 * List of discovered PF ib devices (linked through ib_dev_link).
 * usnic_ib_ibdev_list_lock is held around every walk and update of the
 * list in this file.
 */
static DEFINE_MUTEX(usnic_ib_ibdev_list_lock);
static LIST_HEAD(usnic_ib_ibdev_list);
74 
75 /* Callback dump funcs */
76 static int usnic_ib_dump_vf_hdr(void *obj, char *buf, int buf_sz)
77 {
78 	struct usnic_ib_vf *vf = obj;
79 	return scnprintf(buf, buf_sz, "PF: %s ", vf->pf->ib_dev.name);
80 }
81 /* End callback dump funcs */
82 
83 static void usnic_ib_dump_vf(struct usnic_ib_vf *vf, char *buf, int buf_sz)
84 {
85 	usnic_vnic_dump(vf->vnic, buf, buf_sz, vf,
86 			usnic_ib_dump_vf_hdr,
87 			usnic_ib_qp_grp_dump_hdr, usnic_ib_qp_grp_dump_rows);
88 }
89 
90 void usnic_ib_log_vf(struct usnic_ib_vf *vf)
91 {
92 	char buf[1000];
93 	usnic_ib_dump_vf(vf, buf, sizeof(buf));
94 	usnic_dbg("%s\n", buf);
95 }
96 
97 /* Start of netdev section */
/*
 * Translate a netdev notifier event code into its symbolic name.
 *
 * The table is indexed directly by the NETDEV_* value (NETDEV_UP == 1 ...
 * NETDEV_JOIN == 0x14), so it must not have gaps: NETDEV_CHANGENAME
 * (0x000A) sits between NETDEV_GOING_DOWN and NETDEV_FEAT_CHANGE.
 * Index 0 is not a real event and is reported as "NETDEV_NONE".
 *
 * Returns a pointer to a static string; "UNKNOWN_NETDEV_EVENT" for any
 * value past the end of the table.
 */
static inline const char *usnic_ib_netdev_event_to_string(unsigned long event)
{
	static const char * const event2str[] = {
		"NETDEV_NONE",			/* 0x00 */
		"NETDEV_UP",			/* 0x01 */
		"NETDEV_DOWN",			/* 0x02 */
		"NETDEV_REBOOT",		/* 0x03 */
		"NETDEV_CHANGE",		/* 0x04 */
		"NETDEV_REGISTER",		/* 0x05 */
		"NETDEV_UNREGISTER",		/* 0x06 */
		"NETDEV_CHANGEMTU",		/* 0x07 */
		"NETDEV_CHANGEADDR",		/* 0x08 */
		"NETDEV_GOING_DOWN",		/* 0x09 */
		"NETDEV_CHANGENAME",		/* 0x0A */
		"NETDEV_FEAT_CHANGE",		/* 0x0B */
		"NETDEV_BONDING_FAILOVER",	/* 0x0C */
		"NETDEV_PRE_UP",		/* 0x0D */
		"NETDEV_PRE_TYPE_CHANGE",	/* 0x0E */
		"NETDEV_POST_TYPE_CHANGE",	/* 0x0F */
		"NETDEV_POST_INIT",		/* 0x10 */
		"NETDEV_UNREGISTER_FINAL",	/* 0x11 */
		"NETDEV_RELEASE",		/* 0x12 */
		"NETDEV_NOTIFY_PEERS",		/* 0x13 */
		"NETDEV_JOIN",			/* 0x14 */
	};

	if (event >= ARRAY_SIZE(event2str))
		return "UNKNOWN_NETDEV_EVENT";

	return event2str[event];
}
115 
116 static void usnic_ib_qp_grp_modify_active_to_err(struct usnic_ib_dev *us_ibdev)
117 {
118 	struct usnic_ib_ucontext *ctx;
119 	struct usnic_ib_qp_grp *qp_grp;
120 	enum ib_qp_state cur_state;
121 	int status;
122 
123 	BUG_ON(!mutex_is_locked(&us_ibdev->usdev_lock));
124 
125 	list_for_each_entry(ctx, &us_ibdev->ctx_list, link) {
126 		list_for_each_entry(qp_grp, &ctx->qp_grp_list, link) {
127 			cur_state = qp_grp->state;
128 			if (cur_state == IB_QPS_INIT ||
129 				cur_state == IB_QPS_RTR ||
130 				cur_state == IB_QPS_RTS) {
131 				status = usnic_ib_qp_grp_modify(qp_grp,
132 								IB_QPS_ERR,
133 								NULL);
134 				if (status) {
135 					usnic_err("Failed to transistion qp grp %u from %s to %s\n",
136 						qp_grp->grp_id,
137 						usnic_ib_qp_grp_state_to_string
138 						(cur_state),
139 						usnic_ib_qp_grp_state_to_string
140 						(IB_QPS_ERR));
141 				}
142 			}
143 		}
144 	}
145 }
146 
147 static void usnic_ib_handle_usdev_event(struct usnic_ib_dev *us_ibdev,
148 					unsigned long event)
149 {
150 	struct net_device *netdev;
151 	struct ib_event ib_event;
152 
153 	memset(&ib_event, 0, sizeof(ib_event));
154 
155 	mutex_lock(&us_ibdev->usdev_lock);
156 	netdev = us_ibdev->netdev;
157 	switch (event) {
158 	case NETDEV_REBOOT:
159 		usnic_info("PF Reset on %s\n", us_ibdev->ib_dev.name);
160 		usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
161 		ib_event.event = IB_EVENT_PORT_ERR;
162 		ib_event.device = &us_ibdev->ib_dev;
163 		ib_event.element.port_num = 1;
164 		ib_dispatch_event(&ib_event);
165 		break;
166 	case NETDEV_UP:
167 	case NETDEV_DOWN:
168 	case NETDEV_CHANGE:
169 		if (!us_ibdev->ufdev->link_up &&
170 				netif_carrier_ok(netdev)) {
171 			usnic_fwd_carrier_up(us_ibdev->ufdev);
172 			usnic_info("Link UP on %s\n", us_ibdev->ib_dev.name);
173 			ib_event.event = IB_EVENT_PORT_ACTIVE;
174 			ib_event.device = &us_ibdev->ib_dev;
175 			ib_event.element.port_num = 1;
176 			ib_dispatch_event(&ib_event);
177 		} else if (us_ibdev->ufdev->link_up &&
178 				!netif_carrier_ok(netdev)) {
179 			usnic_fwd_carrier_down(us_ibdev->ufdev);
180 			usnic_info("Link DOWN on %s\n", us_ibdev->ib_dev.name);
181 			usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
182 			ib_event.event = IB_EVENT_PORT_ERR;
183 			ib_event.device = &us_ibdev->ib_dev;
184 			ib_event.element.port_num = 1;
185 			ib_dispatch_event(&ib_event);
186 		} else {
187 			usnic_dbg("Ignoring %s on %s\n",
188 					usnic_ib_netdev_event_to_string(event),
189 					us_ibdev->ib_dev.name);
190 		}
191 		break;
192 	case NETDEV_CHANGEADDR:
193 		if (!memcmp(us_ibdev->ufdev->mac, netdev->dev_addr,
194 				sizeof(us_ibdev->ufdev->mac))) {
195 			usnic_dbg("Ignoring addr change on %s\n",
196 					us_ibdev->ib_dev.name);
197 		} else {
198 			usnic_info(" %s old mac: %pM new mac: %pM\n",
199 					us_ibdev->ib_dev.name,
200 					us_ibdev->ufdev->mac,
201 					netdev->dev_addr);
202 			usnic_fwd_set_mac(us_ibdev->ufdev, netdev->dev_addr);
203 			usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
204 			ib_event.event = IB_EVENT_GID_CHANGE;
205 			ib_event.device = &us_ibdev->ib_dev;
206 			ib_event.element.port_num = 1;
207 			ib_dispatch_event(&ib_event);
208 		}
209 
210 		break;
211 	case NETDEV_CHANGEMTU:
212 		if (us_ibdev->ufdev->mtu != netdev->mtu) {
213 			usnic_info("MTU Change on %s old: %u new: %u\n",
214 					us_ibdev->ib_dev.name,
215 					us_ibdev->ufdev->mtu, netdev->mtu);
216 			usnic_fwd_set_mtu(us_ibdev->ufdev, netdev->mtu);
217 			usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
218 		} else {
219 			usnic_dbg("Ignoring MTU change on %s\n",
220 					us_ibdev->ib_dev.name);
221 		}
222 		break;
223 	default:
224 		usnic_dbg("Ignoring event %s on %s",
225 				usnic_ib_netdev_event_to_string(event),
226 				us_ibdev->ib_dev.name);
227 	}
228 	mutex_unlock(&us_ibdev->usdev_lock);
229 }
230 
231 static int usnic_ib_netdevice_event(struct notifier_block *notifier,
232 					unsigned long event, void *ptr)
233 {
234 	struct usnic_ib_dev *us_ibdev;
235 
236 	struct net_device *netdev = netdev_notifier_info_to_dev(ptr);
237 
238 	mutex_lock(&usnic_ib_ibdev_list_lock);
239 	list_for_each_entry(us_ibdev, &usnic_ib_ibdev_list, ib_dev_link) {
240 		if (us_ibdev->netdev == netdev) {
241 			usnic_ib_handle_usdev_event(us_ibdev, event);
242 			break;
243 		}
244 	}
245 	mutex_unlock(&usnic_ib_ibdev_list_lock);
246 
247 	return NOTIFY_DONE;
248 }
249 
/*
 * Notifier block for netdevice events; registered in usnic_ib_init() and
 * unregistered in usnic_ib_destroy().
 */
static struct notifier_block usnic_ib_netdevice_notifier = {
	.notifier_call = usnic_ib_netdevice_event
};
253 /* End of netdev section */
254 
255 /* Start of inet section */
256 static int usnic_ib_handle_inet_event(struct usnic_ib_dev *us_ibdev,
257 					unsigned long event, void *ptr)
258 {
259 	struct in_ifaddr *ifa = ptr;
260 	struct ib_event ib_event;
261 
262 	mutex_lock(&us_ibdev->usdev_lock);
263 
264 	switch (event) {
265 	case NETDEV_DOWN:
266 		usnic_info("%s via ip notifiers",
267 				usnic_ib_netdev_event_to_string(event));
268 		usnic_fwd_del_ipaddr(us_ibdev->ufdev);
269 		usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
270 		ib_event.event = IB_EVENT_GID_CHANGE;
271 		ib_event.device = &us_ibdev->ib_dev;
272 		ib_event.element.port_num = 1;
273 		ib_dispatch_event(&ib_event);
274 		break;
275 	case NETDEV_UP:
276 		usnic_fwd_add_ipaddr(us_ibdev->ufdev, ifa->ifa_address);
277 		usnic_info("%s via ip notifiers: ip %pI4",
278 				usnic_ib_netdev_event_to_string(event),
279 				&us_ibdev->ufdev->inaddr);
280 		ib_event.event = IB_EVENT_GID_CHANGE;
281 		ib_event.device = &us_ibdev->ib_dev;
282 		ib_event.element.port_num = 1;
283 		ib_dispatch_event(&ib_event);
284 		break;
285 	default:
286 		usnic_info("Ignoring event %s on %s",
287 				usnic_ib_netdev_event_to_string(event),
288 				us_ibdev->ib_dev.name);
289 	}
290 	mutex_unlock(&us_ibdev->usdev_lock);
291 
292 	return NOTIFY_DONE;
293 }
294 
295 static int usnic_ib_inetaddr_event(struct notifier_block *notifier,
296 					unsigned long event, void *ptr)
297 {
298 	struct usnic_ib_dev *us_ibdev;
299 	struct in_ifaddr *ifa = ptr;
300 	struct net_device *netdev = ifa->ifa_dev->dev;
301 
302 	mutex_lock(&usnic_ib_ibdev_list_lock);
303 	list_for_each_entry(us_ibdev, &usnic_ib_ibdev_list, ib_dev_link) {
304 		if (us_ibdev->netdev == netdev) {
305 			usnic_ib_handle_inet_event(us_ibdev, event, ptr);
306 			break;
307 		}
308 	}
309 	mutex_unlock(&usnic_ib_ibdev_list_lock);
310 
311 	return NOTIFY_DONE;
312 }
/*
 * Notifier block for inet address events; registered in usnic_ib_init()
 * and unregistered in usnic_ib_destroy().
 */
static struct notifier_block usnic_ib_inetaddr_notifier = {
	.notifier_call = usnic_ib_inetaddr_event
};
/* End of inet section */
317 
318 static int usnic_port_immutable(struct ib_device *ibdev, u8 port_num,
319 			        struct ib_port_immutable *immutable)
320 {
321 	struct ib_port_attr attr;
322 	int err;
323 
324 	err = usnic_ib_query_port(ibdev, port_num, &attr);
325 	if (err)
326 		return err;
327 
328 	immutable->pkey_tbl_len = attr.pkey_tbl_len;
329 	immutable->gid_tbl_len = attr.gid_tbl_len;
330 
331 	return 0;
332 }
333 
334 static void usnic_get_dev_fw_str(struct ib_device *device,
335 				 char *str,
336 				 size_t str_len)
337 {
338 	struct usnic_ib_dev *us_ibdev =
339 		container_of(device, struct usnic_ib_dev, ib_dev);
340 	struct ethtool_drvinfo info;
341 
342 	mutex_lock(&us_ibdev->usdev_lock);
343 	us_ibdev->netdev->ethtool_ops->get_drvinfo(us_ibdev->netdev, &info);
344 	mutex_unlock(&us_ibdev->usdev_lock);
345 
346 	snprintf(str, str_len, "%s", info.fw_version);
347 }
348 
349 /* Start of PF discovery section */
350 static void *usnic_ib_device_add(struct pci_dev *dev)
351 {
352 	struct usnic_ib_dev *us_ibdev;
353 	union ib_gid gid;
354 	struct in_ifaddr *in;
355 	struct net_device *netdev;
356 
357 	usnic_dbg("\n");
358 	netdev = pci_get_drvdata(dev);
359 
360 	us_ibdev = (struct usnic_ib_dev *)ib_alloc_device(sizeof(*us_ibdev));
361 	if (!us_ibdev) {
362 		usnic_err("Device %s context alloc failed\n",
363 				netdev_name(pci_get_drvdata(dev)));
364 		return ERR_PTR(-EFAULT);
365 	}
366 
367 	us_ibdev->ufdev = usnic_fwd_dev_alloc(dev);
368 	if (!us_ibdev->ufdev) {
369 		usnic_err("Failed to alloc ufdev for %s\n", pci_name(dev));
370 		goto err_dealloc;
371 	}
372 
373 	mutex_init(&us_ibdev->usdev_lock);
374 	INIT_LIST_HEAD(&us_ibdev->vf_dev_list);
375 	INIT_LIST_HEAD(&us_ibdev->ctx_list);
376 
377 	us_ibdev->pdev = dev;
378 	us_ibdev->netdev = pci_get_drvdata(dev);
379 	us_ibdev->ib_dev.owner = THIS_MODULE;
380 	us_ibdev->ib_dev.node_type = RDMA_NODE_USNIC_UDP;
381 	us_ibdev->ib_dev.phys_port_cnt = USNIC_IB_PORT_CNT;
382 	us_ibdev->ib_dev.num_comp_vectors = USNIC_IB_NUM_COMP_VECTORS;
383 	us_ibdev->ib_dev.dma_device = &dev->dev;
384 	us_ibdev->ib_dev.uverbs_abi_ver = USNIC_UVERBS_ABI_VERSION;
385 	strlcpy(us_ibdev->ib_dev.name, "usnic_%d", IB_DEVICE_NAME_MAX);
386 
387 	us_ibdev->ib_dev.uverbs_cmd_mask =
388 		(1ull << IB_USER_VERBS_CMD_GET_CONTEXT) |
389 		(1ull << IB_USER_VERBS_CMD_QUERY_DEVICE) |
390 		(1ull << IB_USER_VERBS_CMD_QUERY_PORT) |
391 		(1ull << IB_USER_VERBS_CMD_ALLOC_PD) |
392 		(1ull << IB_USER_VERBS_CMD_DEALLOC_PD) |
393 		(1ull << IB_USER_VERBS_CMD_REG_MR) |
394 		(1ull << IB_USER_VERBS_CMD_DEREG_MR) |
395 		(1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
396 		(1ull << IB_USER_VERBS_CMD_CREATE_CQ) |
397 		(1ull << IB_USER_VERBS_CMD_DESTROY_CQ) |
398 		(1ull << IB_USER_VERBS_CMD_CREATE_QP) |
399 		(1ull << IB_USER_VERBS_CMD_MODIFY_QP) |
400 		(1ull << IB_USER_VERBS_CMD_QUERY_QP) |
401 		(1ull << IB_USER_VERBS_CMD_DESTROY_QP) |
402 		(1ull << IB_USER_VERBS_CMD_ATTACH_MCAST) |
403 		(1ull << IB_USER_VERBS_CMD_DETACH_MCAST) |
404 		(1ull << IB_USER_VERBS_CMD_OPEN_QP);
405 
406 	us_ibdev->ib_dev.query_device = usnic_ib_query_device;
407 	us_ibdev->ib_dev.query_port = usnic_ib_query_port;
408 	us_ibdev->ib_dev.query_pkey = usnic_ib_query_pkey;
409 	us_ibdev->ib_dev.query_gid = usnic_ib_query_gid;
410 	us_ibdev->ib_dev.get_link_layer = usnic_ib_port_link_layer;
411 	us_ibdev->ib_dev.alloc_pd = usnic_ib_alloc_pd;
412 	us_ibdev->ib_dev.dealloc_pd = usnic_ib_dealloc_pd;
413 	us_ibdev->ib_dev.create_qp = usnic_ib_create_qp;
414 	us_ibdev->ib_dev.modify_qp = usnic_ib_modify_qp;
415 	us_ibdev->ib_dev.query_qp = usnic_ib_query_qp;
416 	us_ibdev->ib_dev.destroy_qp = usnic_ib_destroy_qp;
417 	us_ibdev->ib_dev.create_cq = usnic_ib_create_cq;
418 	us_ibdev->ib_dev.destroy_cq = usnic_ib_destroy_cq;
419 	us_ibdev->ib_dev.reg_user_mr = usnic_ib_reg_mr;
420 	us_ibdev->ib_dev.dereg_mr = usnic_ib_dereg_mr;
421 	us_ibdev->ib_dev.alloc_ucontext = usnic_ib_alloc_ucontext;
422 	us_ibdev->ib_dev.dealloc_ucontext = usnic_ib_dealloc_ucontext;
423 	us_ibdev->ib_dev.mmap = usnic_ib_mmap;
424 	us_ibdev->ib_dev.create_ah = usnic_ib_create_ah;
425 	us_ibdev->ib_dev.destroy_ah = usnic_ib_destroy_ah;
426 	us_ibdev->ib_dev.post_send = usnic_ib_post_send;
427 	us_ibdev->ib_dev.post_recv = usnic_ib_post_recv;
428 	us_ibdev->ib_dev.poll_cq = usnic_ib_poll_cq;
429 	us_ibdev->ib_dev.req_notify_cq = usnic_ib_req_notify_cq;
430 	us_ibdev->ib_dev.get_dma_mr = usnic_ib_get_dma_mr;
431 	us_ibdev->ib_dev.get_port_immutable = usnic_port_immutable;
432 	us_ibdev->ib_dev.get_dev_fw_str     = usnic_get_dev_fw_str;
433 
434 
435 	if (ib_register_device(&us_ibdev->ib_dev, NULL))
436 		goto err_fwd_dealloc;
437 
438 	usnic_fwd_set_mtu(us_ibdev->ufdev, us_ibdev->netdev->mtu);
439 	usnic_fwd_set_mac(us_ibdev->ufdev, us_ibdev->netdev->dev_addr);
440 	if (netif_carrier_ok(us_ibdev->netdev))
441 		usnic_fwd_carrier_up(us_ibdev->ufdev);
442 
443 	in = ((struct in_device *)(netdev->ip_ptr))->ifa_list;
444 	if (in != NULL)
445 		usnic_fwd_add_ipaddr(us_ibdev->ufdev, in->ifa_address);
446 
447 	usnic_mac_ip_to_gid(us_ibdev->netdev->perm_addr,
448 				us_ibdev->ufdev->inaddr, &gid.raw[0]);
449 	memcpy(&us_ibdev->ib_dev.node_guid, &gid.global.interface_id,
450 		sizeof(gid.global.interface_id));
451 	kref_init(&us_ibdev->vf_cnt);
452 
453 	usnic_info("Added ibdev: %s netdev: %s with mac %pM Link: %u MTU: %u\n",
454 			us_ibdev->ib_dev.name, netdev_name(us_ibdev->netdev),
455 			us_ibdev->ufdev->mac, us_ibdev->ufdev->link_up,
456 			us_ibdev->ufdev->mtu);
457 	return us_ibdev;
458 
459 err_fwd_dealloc:
460 	usnic_fwd_dev_free(us_ibdev->ufdev);
461 err_dealloc:
462 	usnic_err("failed -- deallocing device\n");
463 	ib_dealloc_device(&us_ibdev->ib_dev);
464 	return NULL;
465 }
466 
467 static void usnic_ib_device_remove(struct usnic_ib_dev *us_ibdev)
468 {
469 	usnic_info("Unregistering %s\n", us_ibdev->ib_dev.name);
470 	usnic_ib_sysfs_unregister_usdev(us_ibdev);
471 	usnic_fwd_dev_free(us_ibdev->ufdev);
472 	ib_unregister_device(&us_ibdev->ib_dev);
473 	ib_dealloc_device(&us_ibdev->ib_dev);
474 }
475 
476 static void usnic_ib_undiscover_pf(struct kref *kref)
477 {
478 	struct usnic_ib_dev *us_ibdev, *tmp;
479 	struct pci_dev *dev;
480 	bool found = false;
481 
482 	dev = container_of(kref, struct usnic_ib_dev, vf_cnt)->pdev;
483 	mutex_lock(&usnic_ib_ibdev_list_lock);
484 	list_for_each_entry_safe(us_ibdev, tmp,
485 				&usnic_ib_ibdev_list, ib_dev_link) {
486 		if (us_ibdev->pdev == dev) {
487 			list_del(&us_ibdev->ib_dev_link);
488 			usnic_ib_device_remove(us_ibdev);
489 			found = true;
490 			break;
491 		}
492 	}
493 
494 	WARN(!found, "Failed to remove PF %s\n", pci_name(dev));
495 
496 	mutex_unlock(&usnic_ib_ibdev_list_lock);
497 }
498 
499 static struct usnic_ib_dev *usnic_ib_discover_pf(struct usnic_vnic *vnic)
500 {
501 	struct usnic_ib_dev *us_ibdev;
502 	struct pci_dev *parent_pci, *vf_pci;
503 	int err;
504 
505 	vf_pci = usnic_vnic_get_pdev(vnic);
506 	parent_pci = pci_physfn(vf_pci);
507 
508 	BUG_ON(!parent_pci);
509 
510 	mutex_lock(&usnic_ib_ibdev_list_lock);
511 	list_for_each_entry(us_ibdev, &usnic_ib_ibdev_list, ib_dev_link) {
512 		if (us_ibdev->pdev == parent_pci) {
513 			kref_get(&us_ibdev->vf_cnt);
514 			goto out;
515 		}
516 	}
517 
518 	us_ibdev = usnic_ib_device_add(parent_pci);
519 	if (IS_ERR_OR_NULL(us_ibdev)) {
520 		us_ibdev = us_ibdev ? us_ibdev : ERR_PTR(-EFAULT);
521 		goto out;
522 	}
523 
524 	err = usnic_ib_sysfs_register_usdev(us_ibdev);
525 	if (err) {
526 		usnic_ib_device_remove(us_ibdev);
527 		us_ibdev = ERR_PTR(err);
528 		goto out;
529 	}
530 
531 	list_add(&us_ibdev->ib_dev_link, &usnic_ib_ibdev_list);
532 out:
533 	mutex_unlock(&usnic_ib_ibdev_list_lock);
534 	return us_ibdev;
535 }
536 /* End of PF discovery section */
537 
538 /* Start of PCI section */
539 
/*
 * PCI IDs claimed by this driver: the Cisco VIC user-space NIC function.
 * The all-zero entry terminates the table.
 */
static const struct pci_device_id usnic_ib_pci_ids[] = {
	{PCI_DEVICE(PCI_VENDOR_ID_CISCO, PCI_DEVICE_ID_CISCO_VIC_USPACE_NIC)},
	{0,}
};
544 
545 static int usnic_ib_pci_probe(struct pci_dev *pdev,
546 				const struct pci_device_id *id)
547 {
548 	int err;
549 	struct usnic_ib_dev *pf;
550 	struct usnic_ib_vf *vf;
551 	enum usnic_vnic_res_type res_type;
552 
553 	vf = kzalloc(sizeof(*vf), GFP_KERNEL);
554 	if (!vf)
555 		return -ENOMEM;
556 
557 	err = pci_enable_device(pdev);
558 	if (err) {
559 		usnic_err("Failed to enable %s with err %d\n",
560 				pci_name(pdev), err);
561 		goto out_clean_vf;
562 	}
563 
564 	err = pci_request_regions(pdev, DRV_NAME);
565 	if (err) {
566 		usnic_err("Failed to request region for %s with err %d\n",
567 				pci_name(pdev), err);
568 		goto out_disable_device;
569 	}
570 
571 	pci_set_master(pdev);
572 	pci_set_drvdata(pdev, vf);
573 
574 	vf->vnic = usnic_vnic_alloc(pdev);
575 	if (IS_ERR_OR_NULL(vf->vnic)) {
576 		err = vf->vnic ? PTR_ERR(vf->vnic) : -ENOMEM;
577 		usnic_err("Failed to alloc vnic for %s with err %d\n",
578 				pci_name(pdev), err);
579 		goto out_release_regions;
580 	}
581 
582 	pf = usnic_ib_discover_pf(vf->vnic);
583 	if (IS_ERR_OR_NULL(pf)) {
584 		usnic_err("Failed to discover pf of vnic %s with err%ld\n",
585 				pci_name(pdev), PTR_ERR(pf));
586 		err = pf ? PTR_ERR(pf) : -EFAULT;
587 		goto out_clean_vnic;
588 	}
589 
590 	vf->pf = pf;
591 	spin_lock_init(&vf->lock);
592 	mutex_lock(&pf->usdev_lock);
593 	list_add_tail(&vf->link, &pf->vf_dev_list);
594 	/*
595 	 * Save max settings (will be same for each VF, easier to re-write than
596 	 * to say "if (!set) { set_values(); set=1; }
597 	 */
598 	for (res_type = USNIC_VNIC_RES_TYPE_EOL+1;
599 			res_type < USNIC_VNIC_RES_TYPE_MAX;
600 			res_type++) {
601 		pf->vf_res_cnt[res_type] = usnic_vnic_res_cnt(vf->vnic,
602 								res_type);
603 	}
604 
605 	mutex_unlock(&pf->usdev_lock);
606 
607 	usnic_info("Registering usnic VF %s into PF %s\n", pci_name(pdev),
608 			pf->ib_dev.name);
609 	usnic_ib_log_vf(vf);
610 	return 0;
611 
612 out_clean_vnic:
613 	usnic_vnic_free(vf->vnic);
614 out_release_regions:
615 	pci_set_drvdata(pdev, NULL);
616 	pci_clear_master(pdev);
617 	pci_release_regions(pdev);
618 out_disable_device:
619 	pci_disable_device(pdev);
620 out_clean_vf:
621 	kfree(vf);
622 	return err;
623 }
624 
/*
 * PCI remove for a usnic VF: detach the VF from its PF, drop the VF's
 * reference on the PF and release everything usnic_ib_pci_probe()
 * acquired.
 */
static void usnic_ib_pci_remove(struct pci_dev *pdev)
{
	struct usnic_ib_vf *vf = pci_get_drvdata(pdev);
	struct usnic_ib_dev *pf = vf->pf;

	/* Unlink from the PF's VF list under the PF lock. */
	mutex_lock(&pf->usdev_lock);
	list_del(&vf->link);
	mutex_unlock(&pf->usdev_lock);

	/*
	 * Dropping the last reference runs usnic_ib_undiscover_pf(), which
	 * removes the PF ib device; pf must not be used after this call.
	 */
	kref_put(&pf->vf_cnt, usnic_ib_undiscover_pf);
	usnic_vnic_free(vf->vnic);
	pci_set_drvdata(pdev, NULL);
	pci_clear_master(pdev);
	pci_release_regions(pdev);
	pci_disable_device(pdev);
	kfree(vf);

	usnic_info("Removed VF %s\n", pci_name(pdev));
}
644 
645 /* PCI driver entry points */
/*
 * PCI driver descriptor binding the ID table to the VF probe/remove
 * handlers; registered in usnic_ib_init().
 */
static struct pci_driver usnic_ib_pci_driver = {
	.name = DRV_NAME,
	.id_table = usnic_ib_pci_ids,
	.probe = usnic_ib_pci_probe,
	.remove = usnic_ib_pci_remove,
};
652 /* End of PCI section */
653 
654 /* Start of module section */
655 static int __init usnic_ib_init(void)
656 {
657 	int err;
658 
659 	printk_once(KERN_INFO "%s", usnic_version);
660 
661 	err = usnic_uiom_init(DRV_NAME);
662 	if (err) {
663 		usnic_err("Unable to initalize umem with err %d\n", err);
664 		return err;
665 	}
666 
667 	if (pci_register_driver(&usnic_ib_pci_driver)) {
668 		usnic_err("Unable to register with PCI\n");
669 		goto out_umem_fini;
670 	}
671 
672 	err = register_netdevice_notifier(&usnic_ib_netdevice_notifier);
673 	if (err) {
674 		usnic_err("Failed to register netdev notifier\n");
675 		goto out_pci_unreg;
676 	}
677 
678 	err = register_inetaddr_notifier(&usnic_ib_inetaddr_notifier);
679 	if (err) {
680 		usnic_err("Failed to register inet addr notifier\n");
681 		goto out_unreg_netdev_notifier;
682 	}
683 
684 	err = usnic_transport_init();
685 	if (err) {
686 		usnic_err("Failed to initialize transport\n");
687 		goto out_unreg_inetaddr_notifier;
688 	}
689 
690 	usnic_debugfs_init();
691 
692 	return 0;
693 
694 out_unreg_inetaddr_notifier:
695 	unregister_inetaddr_notifier(&usnic_ib_inetaddr_notifier);
696 out_unreg_netdev_notifier:
697 	unregister_netdevice_notifier(&usnic_ib_netdevice_notifier);
698 out_pci_unreg:
699 	pci_unregister_driver(&usnic_ib_pci_driver);
700 out_umem_fini:
701 	usnic_uiom_fini();
702 
703 	return err;
704 }
705 
/*
 * Module exit: undo usnic_ib_init() in reverse order -- debugfs,
 * transport, inet address notifier, netdevice notifier, PCI driver, umem.
 */
static void __exit usnic_ib_destroy(void)
{
	usnic_dbg("\n");
	usnic_debugfs_exit();
	usnic_transport_fini();
	unregister_inetaddr_notifier(&usnic_ib_inetaddr_notifier);
	unregister_netdevice_notifier(&usnic_ib_netdevice_notifier);
	pci_unregister_driver(&usnic_ib_pci_driver);
	usnic_uiom_fini();
}
716 
/* Module metadata. */
MODULE_DESCRIPTION("Cisco VIC (usNIC) Verbs Driver");
MODULE_AUTHOR("Upinder Malhi <umalhi@cisco.com>");
MODULE_LICENSE("Dual BSD/GPL");
MODULE_VERSION(DRV_VERSION);
/* Both parameters are world-readable and writable by the owner (root). */
module_param(usnic_log_lvl, uint, S_IRUGO | S_IWUSR);
module_param(usnic_ib_share_vf, uint, S_IRUGO | S_IWUSR);
MODULE_PARM_DESC(usnic_log_lvl, " Off=0, Err=1, Info=2, Debug=3");
MODULE_PARM_DESC(usnic_ib_share_vf, "Off=0, On=1 VF sharing amongst QPs");
/* Export the PCI ID table as module device-table information. */
MODULE_DEVICE_TABLE(pci, usnic_ib_pci_ids);

/* Module entry and exit points. */
module_init(usnic_ib_init);
module_exit(usnic_ib_destroy);
729 /* End of module section */
730