2 * Copyright (c) 2013, Cisco Systems, Inc. All rights reserved.
4 * This program is free software; you may redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; version 2 of the License.
8 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
9 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
10 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
11 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
12 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
13 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
14 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
17 * Author: Upinder Malhi <umalhi@cisco.com>
18 * Author: Anant Deepak <anadeepa@cisco.com>
19 * Author: Cesare Cantu' <cantuc@cisco.com>
20 * Author: Jeff Squyres <jsquyres@cisco.com>
21 * Author: Kiran Thirumalai <kithirum@cisco.com>
22 * Author: Xuyang Wang <xuywang@cisco.com>
23 * Author: Reese Faucette <rfaucett@cisco.com>
27 #include <linux/module.h>
28 #include <linux/init.h>
29 #include <linux/slab.h>
30 #include <linux/errno.h>
31 #include <linux/pci.h>
32 #include <linux/netdevice.h>
34 #include <rdma/ib_user_verbs.h>
35 #include <rdma/ib_addr.h>
37 #include "usnic_abi.h"
38 #include "usnic_common_util.h"
40 #include "usnic_ib_qp_grp.h"
41 #include "usnic_log.h"
42 #include "usnic_fwd.h"
43 #include "usnic_debugfs.h"
44 #include "usnic_ib_verbs.h"
45 #include "usnic_transport.h"
46 #include "usnic_uiom.h"
47 #include "usnic_ib_sysfs.h"
/* Log verbosity; starts at error level and is exported as a module parameter further down. */
49 unsigned int usnic_log_lvl = USNIC_LOG_LVL_ERR;
/* VF sharing amongst QPs (0 = off, 1 = on); also exported as a module parameter further down. */
50 unsigned int usnic_ib_share_vf = 1;
/* Version banner, printed once by usnic_ib_init(). */
52 static const char usnic_version[] =
53 DRV_NAME ": Cisco VIC (USNIC) Verbs Driver v"
54 DRV_VERSION " (" DRV_RELDATE ")\n";
/*
 * Global list of PF IB devices (linked through ib_dev_link).  Every walk or
 * modification of the list in this file happens with
 * usnic_ib_ibdev_list_lock held.
 */
56 static DEFINE_MUTEX(usnic_ib_ibdev_list_lock);
57 static LIST_HEAD(usnic_ib_ibdev_list);
59 /* Callback dump funcs */
60 static int usnic_ib_dump_vf_hdr(void *obj, char *buf, int buf_sz)
62 struct usnic_ib_vf *vf = obj;
63 return scnprintf(buf, buf_sz, "PF: %s ", vf->pf->ib_dev.name);
65 /* End callback dump funcs */
/*
 * Render a textual dump of @vf into @buf (capacity @buf_sz bytes) by handing
 * the vnic of the VF, the VF itself and the qp-group header/row dump
 * callbacks to usnic_vnic_dump().
 */
67 static void usnic_ib_dump_vf(struct usnic_ib_vf *vf, char *buf, int buf_sz)
69 usnic_vnic_dump(vf->vnic, buf, buf_sz, vf,
/* NOTE(review): an argument seems to be missing between these two lines (presumably the VF header callback) -- confirm against the original file. */
71 usnic_ib_qp_grp_dump_hdr, usnic_ib_qp_grp_dump_rows);
/*
 * Log a dump of @vf at debug level: the text is produced by
 * usnic_ib_dump_vf() and then emitted through usnic_dbg().
 */
74 void usnic_ib_log_vf(struct usnic_ib_vf *vf)
/* NOTE(review): buf is presumably a local char array (sizeof(buf) is passed as its capacity); its declaration is not visible here -- confirm. */
77 usnic_ib_dump_vf(vf, buf, sizeof(buf));
78 usnic_dbg("%s\n", buf);
81 /* Start of netdev section */
/*
 * usnic_ib_netdev_event_to_string - printable name of a netdev notifier event
 * @event: notifier event code (a NETDEV_* value)
 *
 * Returns a pointer to a constant string, never NULL.  Codes beyond the end
 * of the table yield "UNKNOWN_NETDEV_EVENT".
 *
 * The table is indexed directly by the event code, so it needs exactly one
 * entry per code, in numeric order, starting at 0.  NETDEV_CHANGENAME (0x0A)
 * used to be absent, which shifted every later name down by one slot, and
 * NETDEV_POST_INIT was misspelled; both are corrected here.
 *
 * NOTE(review): the numeric values in the comments below follow
 * include/linux/netdevice.h; re-check the table whenever that list changes.
 */
static inline const char *usnic_ib_netdev_event_to_string(unsigned long event)
{
	/* static const: built once at compile time, not on every call */
	static const char * const event2str[] = {
		"NETDEV_NONE",			/* 0x00 (no such event) */
		"NETDEV_UP",			/* 0x01 */
		"NETDEV_DOWN",			/* 0x02 */
		"NETDEV_REBOOT",		/* 0x03 */
		"NETDEV_CHANGE",		/* 0x04 */
		"NETDEV_REGISTER",		/* 0x05 */
		"NETDEV_UNREGISTER",		/* 0x06 */
		"NETDEV_CHANGEMTU",		/* 0x07 */
		"NETDEV_CHANGEADDR",		/* 0x08 */
		"NETDEV_GOING_DOWN",		/* 0x09 */
		"NETDEV_CHANGENAME",		/* 0x0A */
		"NETDEV_FEAT_CHANGE",		/* 0x0B */
		"NETDEV_BONDING_FAILOVER",	/* 0x0C */
		"NETDEV_PRE_UP",		/* 0x0D */
		"NETDEV_PRE_TYPE_CHANGE",	/* 0x0E */
		"NETDEV_POST_TYPE_CHANGE",	/* 0x0F */
		"NETDEV_POST_INIT",		/* 0x10 */
		"NETDEV_UNREGISTER_FINAL",	/* 0x11 */
		"NETDEV_RELEASE",		/* 0x12 */
		"NETDEV_NOTIFY_PEERS",		/* 0x13 */
		"NETDEV_JOIN",			/* 0x14 */
	};

	if (event >= ARRAY_SIZE(event2str))
		return "UNKNOWN_NETDEV_EVENT";

	return event2str[event];
}
/*
 * Walk every QP group of every user context on @us_ibdev and call
 * usnic_ib_qp_grp_modify() on those currently in INIT, RTR or RTS state.
 * A failed transition is logged with usnic_err().
 *
 * The caller must hold us_ibdev->usdev_lock; this is enforced with BUG_ON().
 *
 * NOTE(review): the target state passed to usnic_ib_qp_grp_modify() is not
 * visible here -- presumably the error state, going by the function name.
 */
100 static void usnic_ib_qp_grp_modify_active_to_err(struct usnic_ib_dev *us_ibdev)
102 struct usnic_ib_ucontext *ctx;
103 struct usnic_ib_qp_grp *qp_grp;
104 enum ib_qp_state cur_state;
/* Both lists below are walked without further locking, hence the lock check. */
107 BUG_ON(!mutex_is_locked(&us_ibdev->usdev_lock));
109 list_for_each_entry(ctx, &us_ibdev->ctx_list, link) {
110 list_for_each_entry(qp_grp, &ctx->qp_grp_list, link) {
111 cur_state = qp_grp->state;
/* Only groups in one of these three states are touched. */
112 if (cur_state == IB_QPS_INIT ||
113 cur_state == IB_QPS_RTR ||
114 cur_state == IB_QPS_RTS) {
115 status = usnic_ib_qp_grp_modify(qp_grp,
119 usnic_err("Failed to transistion qp grp %u from %s to %s\n",
121 usnic_ib_qp_grp_state_to_string
123 usnic_ib_qp_grp_state_to_string
/*
 * Handle one netdev notifier event for the net device behind @us_ibdev.
 *
 * Runs entirely under us_ibdev->usdev_lock.  The current carrier state, MAC
 * address and MTU of the net device are compared with the values cached in
 * us_ibdev->ufdev.  When something changed, the cache is updated, active QP
 * groups are moved out of service through
 * usnic_ib_qp_grp_modify_active_to_err() (not on link-up), and for reset,
 * link and address changes an IB event is dispatched for port 1.  Events
 * that change nothing are only logged at debug level.
 *
 * NOTE(review): the switch statement and most case labels are not visible
 * here; which NETDEV_* codes select the reset and link branches must be
 * confirmed against the original file.
 */
131 static void usnic_ib_handle_usdev_event(struct usnic_ib_dev *us_ibdev,
134 struct net_device *netdev;
135 struct ib_event ib_event;
137 memset(&ib_event, 0, sizeof(ib_event));
139 mutex_lock(&us_ibdev->usdev_lock);
140 netdev = us_ibdev->netdev;
/* PF reset: fail the active QP groups and report a port error. */
143 usnic_info("PF Reset on %s\n", us_ibdev->ib_dev.name);
144 usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
145 ib_event.event = IB_EVENT_PORT_ERR;
146 ib_event.device = &us_ibdev->ib_dev;
147 ib_event.element.port_num = 1;
148 ib_dispatch_event(&ib_event);
/* Link handling: act only when the carrier state differs from the cached link_up flag. */
153 if (!us_ibdev->ufdev->link_up &&
154 netif_carrier_ok(netdev)) {
155 usnic_fwd_carrier_up(us_ibdev->ufdev);
156 usnic_info("Link UP on %s\n", us_ibdev->ib_dev.name);
157 ib_event.event = IB_EVENT_PORT_ACTIVE;
158 ib_event.device = &us_ibdev->ib_dev;
159 ib_event.element.port_num = 1;
160 ib_dispatch_event(&ib_event);
161 } else if (us_ibdev->ufdev->link_up &&
162 !netif_carrier_ok(netdev)) {
163 usnic_fwd_carrier_down(us_ibdev->ufdev);
164 usnic_info("Link DOWN on %s\n", us_ibdev->ib_dev.name);
165 usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
166 ib_event.event = IB_EVENT_PORT_ERR;
167 ib_event.device = &us_ibdev->ib_dev;
168 ib_event.element.port_num = 1;
169 ib_dispatch_event(&ib_event);
171 usnic_dbg("Ignorning %s on %s\n",
172 usnic_ib_netdev_event_to_string(event),
173 us_ibdev->ib_dev.name);
/* MAC change: ignored when the cached MAC already matches; otherwise cache it, fail active QP groups and report a GID change. */
176 case NETDEV_CHANGEADDR:
177 if (!memcmp(us_ibdev->ufdev->mac, netdev->dev_addr,
178 sizeof(us_ibdev->ufdev->mac))) {
179 usnic_dbg("Ignorning addr change on %s\n",
180 us_ibdev->ib_dev.name);
182 usnic_info(" %s old mac: %pM new mac: %pM\n",
183 us_ibdev->ib_dev.name,
184 us_ibdev->ufdev->mac,
186 usnic_fwd_set_mac(us_ibdev->ufdev, netdev->dev_addr);
187 usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
188 ib_event.event = IB_EVENT_GID_CHANGE;
189 ib_event.device = &us_ibdev->ib_dev;
190 ib_event.element.port_num = 1;
191 ib_dispatch_event(&ib_event);
/* MTU change: cache the new MTU and fail active QP groups; no IB event is dispatched in the visible code of this branch. */
195 case NETDEV_CHANGEMTU:
196 if (us_ibdev->ufdev->mtu != netdev->mtu) {
197 usnic_info("MTU Change on %s old: %u new: %u\n",
198 us_ibdev->ib_dev.name,
199 us_ibdev->ufdev->mtu, netdev->mtu);
200 usnic_fwd_set_mtu(us_ibdev->ufdev, netdev->mtu);
201 usnic_ib_qp_grp_modify_active_to_err(us_ibdev);
203 usnic_dbg("Ignoring MTU change on %s\n",
204 us_ibdev->ib_dev.name);
/* Anything else is only logged. */
208 usnic_dbg("Ignorning event %s on %s",
209 usnic_ib_netdev_event_to_string(event),
210 us_ibdev->ib_dev.name);
212 mutex_unlock(&us_ibdev->usdev_lock);
/*
 * Netdevice notifier callback (installed through
 * usnic_ib_netdevice_notifier).
 *
 * Resolves the net device from the notifier payload @ptr and, under
 * usnic_ib_ibdev_list_lock, forwards @event to
 * usnic_ib_handle_usdev_event() for a PF IB device whose netdev matches.
 *
 * NOTE(review): the return statement is not visible here -- confirm which
 * NOTIFY_* value is returned.
 */
215 static int usnic_ib_netdevice_event(struct notifier_block *notifier,
216 unsigned long event, void *ptr)
218 struct usnic_ib_dev *us_ibdev;
220 struct net_device *netdev = netdev_notifier_info_to_dev(ptr);
/* The list lock is held for the whole walk, including the event handler call. */
222 mutex_lock(&usnic_ib_ibdev_list_lock);
223 list_for_each_entry(us_ibdev, &usnic_ib_ibdev_list, ib_dev_link) {
224 if (us_ibdev->netdev == netdev) {
225 usnic_ib_handle_usdev_event(us_ibdev, event);
229 mutex_unlock(&usnic_ib_ibdev_list_lock);
234 static struct notifier_block usnic_ib_netdevice_notifier = {
235 .notifier_call = usnic_ib_netdevice_event
237 /* End of netdev section */
239 /* Start of PF discovery section */
/*
 * Create the IB device that represents the PF @dev.
 *
 * Allocates a struct usnic_ib_dev through ib_alloc_device(), attaches a
 * forwarding device from usnic_fwd_dev_alloc(), fills in the ib_device
 * attributes and verb entry points, registers the device with
 * ib_register_device(), and then seeds the forwarding device with the MTU,
 * MAC and carrier state of the PF net device (the drvdata of @dev).
 *
 * Returns an ERR_PTR when ib_alloc_device() fails.
 * NOTE(review): the success return, the error labels and the return values
 * of the remaining error paths are not visible here -- confirm what callers
 * receive in those cases.
 */
240 static void *usnic_ib_device_add(struct pci_dev *dev)
242 struct usnic_ib_dev *us_ibdev;
247 us_ibdev = (struct usnic_ib_dev *)ib_alloc_device(sizeof(*us_ibdev));
/* A NULL result is mapped to -EFAULT, an error pointer is passed through. */
248 if (IS_ERR_OR_NULL(us_ibdev)) {
249 usnic_err("Device %s context alloc failed\n",
250 netdev_name(pci_get_drvdata(dev)));
251 return ERR_PTR(us_ibdev ? PTR_ERR(us_ibdev) : -EFAULT);
254 us_ibdev->ufdev = usnic_fwd_dev_alloc(dev);
255 if (IS_ERR_OR_NULL(us_ibdev->ufdev)) {
256 usnic_err("Failed to alloc ufdev for %s with err %ld\n",
257 pci_name(dev), PTR_ERR(us_ibdev->ufdev));
261 mutex_init(&us_ibdev->usdev_lock);
262 INIT_LIST_HEAD(&us_ibdev->vf_dev_list);
263 INIT_LIST_HEAD(&us_ibdev->ctx_list);
265 us_ibdev->pdev = dev;
/* The drvdata of the PF PCI device is used as its net device. */
266 us_ibdev->netdev = pci_get_drvdata(dev);
267 us_ibdev->ib_dev.owner = THIS_MODULE;
268 us_ibdev->ib_dev.node_type = RDMA_NODE_USNIC;
269 us_ibdev->ib_dev.phys_port_cnt = USNIC_IB_PORT_CNT;
270 us_ibdev->ib_dev.num_comp_vectors = USNIC_IB_NUM_COMP_VECTORS;
271 us_ibdev->ib_dev.dma_device = &dev->dev;
272 us_ibdev->ib_dev.uverbs_abi_ver = USNIC_UVERBS_ABI_VERSION;
/* Name template. NOTE(review): presumably the IB core replaces %d with a unique index at registration -- confirm. */
273 strlcpy(us_ibdev->ib_dev.name, "usnic_%d", IB_DEVICE_NAME_MAX);
/* One bit per IB_USER_VERBS_CMD_* command listed below. */
275 us_ibdev->ib_dev.uverbs_cmd_mask =
276 (1ull << IB_USER_VERBS_CMD_GET_CONTEXT) |
277 (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE) |
278 (1ull << IB_USER_VERBS_CMD_QUERY_PORT) |
279 (1ull << IB_USER_VERBS_CMD_ALLOC_PD) |
280 (1ull << IB_USER_VERBS_CMD_DEALLOC_PD) |
281 (1ull << IB_USER_VERBS_CMD_REG_MR) |
282 (1ull << IB_USER_VERBS_CMD_DEREG_MR) |
283 (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
284 (1ull << IB_USER_VERBS_CMD_CREATE_CQ) |
285 (1ull << IB_USER_VERBS_CMD_DESTROY_CQ) |
286 (1ull << IB_USER_VERBS_CMD_CREATE_QP) |
287 (1ull << IB_USER_VERBS_CMD_MODIFY_QP) |
288 (1ull << IB_USER_VERBS_CMD_QUERY_QP) |
289 (1ull << IB_USER_VERBS_CMD_DESTROY_QP) |
290 (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST) |
291 (1ull << IB_USER_VERBS_CMD_DETACH_MCAST) |
292 (1ull << IB_USER_VERBS_CMD_OPEN_QP);
/* Hook up the usnic_ib_* verb handlers. */
294 us_ibdev->ib_dev.query_device = usnic_ib_query_device;
295 us_ibdev->ib_dev.query_port = usnic_ib_query_port;
296 us_ibdev->ib_dev.query_pkey = usnic_ib_query_pkey;
297 us_ibdev->ib_dev.query_gid = usnic_ib_query_gid;
298 us_ibdev->ib_dev.get_link_layer = usnic_ib_port_link_layer;
299 us_ibdev->ib_dev.alloc_pd = usnic_ib_alloc_pd;
300 us_ibdev->ib_dev.dealloc_pd = usnic_ib_dealloc_pd;
301 us_ibdev->ib_dev.create_qp = usnic_ib_create_qp;
302 us_ibdev->ib_dev.modify_qp = usnic_ib_modify_qp;
303 us_ibdev->ib_dev.query_qp = usnic_ib_query_qp;
304 us_ibdev->ib_dev.destroy_qp = usnic_ib_destroy_qp;
305 us_ibdev->ib_dev.create_cq = usnic_ib_create_cq;
306 us_ibdev->ib_dev.destroy_cq = usnic_ib_destroy_cq;
307 us_ibdev->ib_dev.reg_user_mr = usnic_ib_reg_mr;
308 us_ibdev->ib_dev.dereg_mr = usnic_ib_dereg_mr;
309 us_ibdev->ib_dev.alloc_ucontext = usnic_ib_alloc_ucontext;
310 us_ibdev->ib_dev.dealloc_ucontext = usnic_ib_dealloc_ucontext;
311 us_ibdev->ib_dev.mmap = usnic_ib_mmap;
312 us_ibdev->ib_dev.create_ah = usnic_ib_create_ah;
313 us_ibdev->ib_dev.destroy_ah = usnic_ib_destroy_ah;
314 us_ibdev->ib_dev.post_send = usnic_ib_post_send;
315 us_ibdev->ib_dev.post_recv = usnic_ib_post_recv;
316 us_ibdev->ib_dev.poll_cq = usnic_ib_poll_cq;
317 us_ibdev->ib_dev.req_notify_cq = usnic_ib_req_notify_cq;
318 us_ibdev->ib_dev.get_dma_mr = usnic_ib_get_dma_mr;
/* A registration failure unwinds through err_fwd_dealloc. */
321 if (ib_register_device(&us_ibdev->ib_dev, NULL))
322 goto err_fwd_dealloc;
/* Seed the forwarding device with the current net device state. */
324 usnic_fwd_set_mtu(us_ibdev->ufdev, us_ibdev->netdev->mtu);
325 usnic_fwd_set_mac(us_ibdev->ufdev, us_ibdev->netdev->dev_addr);
326 if (netif_carrier_ok(us_ibdev->netdev))
327 usnic_fwd_carrier_up(us_ibdev->ufdev);
/* NOTE(review): gid is filled in by code that is not visible here; only its interface_id is copied into node_guid. */
329 memcpy(&us_ibdev->ib_dev.node_guid, &gid.global.interface_id,
330 sizeof(gid.global.interface_id));
/* vf_cnt starts at one reference; it is dropped with kref_put() in usnic_ib_pci_remove(). */
331 kref_init(&us_ibdev->vf_cnt);
333 usnic_info("Added ibdev: %s netdev: %s with mac %pM Link: %u MTU: %u\n",
334 us_ibdev->ib_dev.name, netdev_name(us_ibdev->netdev),
335 us_ibdev->ufdev->mac, us_ibdev->ufdev->link_up,
336 us_ibdev->ufdev->mtu);
/* Error unwinding: release the forwarding device, then the ib_device allocation. */
340 usnic_fwd_dev_free(us_ibdev->ufdev);
342 usnic_err("failed -- deallocing device\n");
343 ib_dealloc_device(&us_ibdev->ib_dev);
347 static void usnic_ib_device_remove(struct usnic_ib_dev *us_ibdev)
349 usnic_info("Unregistering %s\n", us_ibdev->ib_dev.name);
350 usnic_ib_sysfs_unregister_usdev(us_ibdev);
351 usnic_fwd_dev_free(us_ibdev->ufdev);
352 ib_unregister_device(&us_ibdev->ib_dev);
353 ib_dealloc_device(&us_ibdev->ib_dev);
/*
 * kref release callback for the vf_cnt of a PF (passed to kref_put() in
 * usnic_ib_pci_remove()).
 *
 * Looks up, under usnic_ib_ibdev_list_lock, the PF IB device whose pdev
 * matches the one embedding @kref, unlinks it from the global list and
 * removes it with usnic_ib_device_remove().  A WARN is raised when no such
 * device was found.
 *
 * NOTE(review): the declarations of dev and found, and the code that sets
 * found, are not visible here.
 */
356 static void usnic_ib_undiscover_pf(struct kref *kref)
358 struct usnic_ib_dev *us_ibdev, *tmp;
/* Recover the PCI device of the PF that owns this kref. */
362 dev = container_of(kref, struct usnic_ib_dev, vf_cnt)->pdev;
363 mutex_lock(&usnic_ib_ibdev_list_lock);
/* The _safe iterator is used because the matching entry is deleted inside the loop. */
364 list_for_each_entry_safe(us_ibdev, tmp,
365 &usnic_ib_ibdev_list, ib_dev_link) {
366 if (us_ibdev->pdev == dev) {
367 list_del(&us_ibdev->ib_dev_link);
368 usnic_ib_device_remove(us_ibdev);
374 WARN(!found, "Failed to remove PF %s\n", pci_name(dev));
376 mutex_unlock(&usnic_ib_ibdev_list_lock);
/*
 * Find or create the PF IB device that owns the VF behind @vnic.
 *
 * The parent PCI function is obtained with pci_physfn().  Under
 * usnic_ib_ibdev_list_lock the global list is searched for a device with
 * that pdev, and a match gets an extra vf_cnt reference.  The remaining
 * visible code creates a new device with usnic_ib_device_add(), registers
 * its sysfs entries and adds it to the global list (presumably only when no
 * match was found -- the jump that skips it is not visible here).
 *
 * Failures are reported as ERR_PTR values.
 * NOTE(review): the return statement is not visible here.
 */
379 static struct usnic_ib_dev *usnic_ib_discover_pf(struct usnic_vnic *vnic)
381 struct usnic_ib_dev *us_ibdev;
382 struct pci_dev *parent_pci, *vf_pci;
385 vf_pci = usnic_vnic_get_pdev(vnic);
386 parent_pci = pci_physfn(vf_pci);
390 mutex_lock(&usnic_ib_ibdev_list_lock);
391 list_for_each_entry(us_ibdev, &usnic_ib_ibdev_list, ib_dev_link) {
392 if (us_ibdev->pdev == parent_pci) {
/* Known PF: account for one more VF. */
393 kref_get(&us_ibdev->vf_cnt);
398 us_ibdev = usnic_ib_device_add(parent_pci);
/* A NULL result is normalised to ERR_PTR(-EFAULT). */
399 if (IS_ERR_OR_NULL(us_ibdev)) {
400 us_ibdev = (us_ibdev) ? us_ibdev : ERR_PTR(-EFAULT);
404 err = usnic_ib_sysfs_register_usdev(us_ibdev);
/* NOTE(review): usnic_ib_device_remove() also calls usnic_ib_sysfs_unregister_usdev(); verify that this is safe after a failed sysfs registration. */
406 usnic_ib_device_remove(us_ibdev);
407 us_ibdev = ERR_PTR(err);
411 list_add(&us_ibdev->ib_dev_link, &usnic_ib_ibdev_list);
413 mutex_unlock(&usnic_ib_ibdev_list_lock);
416 /* End of PF discovery section */
418 /* Start of PCI section */
/* PCI IDs claimed by this driver: the Cisco VIC user-space NIC function. */
420 static DEFINE_PCI_DEVICE_TABLE(usnic_ib_pci_ids) = {
421 {PCI_DEVICE(PCI_VENDOR_ID_CISCO, PCI_DEVICE_ID_CISCO_VIC_USPACE_NIC)},
/* NOTE(review): the terminating entry and the closing brace are not visible here -- confirm the table is zero-terminated. */
/*
 * PCI probe callback for one usnic VF.
 *
 * Allocates the per-VF state, enables the PCI device, claims its regions,
 * turns on bus mastering, stores the VF as drvdata, allocates the vnic and
 * looks up (or creates) the owning PF through usnic_ib_discover_pf().  The
 * VF is then appended to the vf_dev_list of the PF under usdev_lock, and the
 * resource counts of this VF are recorded per resource type in
 * pf->vf_res_cnt[].
 *
 * The last five statements are the error unwinding: free the vnic, clear
 * drvdata and bus mastering, release the regions and disable the device.
 *
 * NOTE(review): the allocation check after kzalloc(), the error labels, the
 * release of vf on failure and the return statements are not visible here --
 * confirm them against the original file.
 */
425 static int usnic_ib_pci_probe(struct pci_dev *pdev,
426 const struct pci_device_id *id)
429 struct usnic_ib_dev *pf;
430 struct usnic_ib_vf *vf;
431 enum usnic_vnic_res_type res_type;
433 vf = kzalloc(sizeof(*vf), GFP_KERNEL);
437 err = pci_enable_device(pdev);
439 usnic_err("Failed to enable %s with err %d\n",
440 pci_name(pdev), err);
444 err = pci_request_regions(pdev, DRV_NAME);
446 usnic_err("Failed to request region for %s with err %d\n",
447 pci_name(pdev), err);
448 goto out_disable_device;
451 pci_set_master(pdev);
452 pci_set_drvdata(pdev, vf);
454 vf->vnic = usnic_vnic_alloc(pdev);
/* A NULL vnic is reported as -ENOMEM, an error pointer is decoded. */
455 if (IS_ERR_OR_NULL(vf->vnic)) {
456 err = (vf->vnic ? PTR_ERR(vf->vnic) : -ENOMEM);
457 usnic_err("Failed to alloc vnic for %s with err %d\n",
458 pci_name(pdev), err);
459 goto out_release_regions;
462 pf = usnic_ib_discover_pf(vf->vnic);
/* A NULL PF is reported as -EFAULT, an error pointer is decoded. */
463 if (IS_ERR_OR_NULL(pf)) {
464 usnic_err("Failed to discover pf of vnic %s with err%ld\n",
465 pci_name(pdev), PTR_ERR(pf));
466 err = (pf ? PTR_ERR(pf) : -EFAULT);
471 spin_lock_init(&vf->lock);
/* The VF list and vf_res_cnt[] of the PF are updated under its usdev_lock. */
472 mutex_lock(&pf->usdev_lock);
473 list_add_tail(&vf->link, &pf->vf_dev_list);
475 * Save max settings (will be same for each VF, easier to re-write than
476 * to say "if (!set) { set_values(); set=1; }
478 for (res_type = USNIC_VNIC_RES_TYPE_EOL+1;
479 res_type < USNIC_VNIC_RES_TYPE_MAX;
481 pf->vf_res_cnt[res_type] = usnic_vnic_res_cnt(vf->vnic,
485 mutex_unlock(&pf->usdev_lock);
487 usnic_info("Registering usnic VF %s into PF %s\n", pci_name(pdev),
493 usnic_vnic_free(vf->vnic);
495 pci_set_drvdata(pdev, NULL);
496 pci_clear_master(pdev);
497 pci_release_regions(pdev);
499 pci_disable_device(pdev);
/*
 * PCI remove callback for one usnic VF.
 *
 * Drops the reference this VF holds on its PF (when the count reaches zero
 * the PF is torn down by usnic_ib_undiscover_pf()), frees the vnic, and then
 * clears drvdata, disables bus mastering, releases the PCI regions and
 * disables the device.
 *
 * NOTE(review): the statement executed under pf->usdev_lock and the release
 * of vf itself are not visible here -- presumably the VF is unlinked from
 * the VF list of the PF and freed; confirm.
 */
505 static void usnic_ib_pci_remove(struct pci_dev *pdev)
507 struct usnic_ib_vf *vf = pci_get_drvdata(pdev);
508 struct usnic_ib_dev *pf = vf->pf;
510 mutex_lock(&pf->usdev_lock);
512 mutex_unlock(&pf->usdev_lock);
/* pf is not dereferenced after this put in the visible code; the PF may be gone once it returns. */
514 kref_put(&pf->vf_cnt, usnic_ib_undiscover_pf);
515 usnic_vnic_free(vf->vnic);
516 pci_set_drvdata(pdev, NULL);
517 pci_clear_master(pdev);
518 pci_release_regions(pdev);
519 pci_disable_device(pdev);
522 usnic_info("Removed VF %s\n", pci_name(pdev));
525 /* PCI driver entry points */
/*
 * PCI driver descriptor: binds the devices listed in usnic_ib_pci_ids to the
 * probe and remove callbacks defined in this file.
 * NOTE(review): a member line (presumably the driver name) and the closing
 * brace are not visible here.
 */
526 static struct pci_driver usnic_ib_pci_driver = {
528 .id_table = usnic_ib_pci_ids,
529 .probe = usnic_ib_pci_probe,
530 .remove = usnic_ib_pci_remove,
532 /* End of PCI section */
534 /* Start of module section */
/*
 * Module entry point.
 *
 * Prints the version banner once, then brings the driver up in this order:
 * usnic_uiom_init(), PCI driver registration, netdevice notifier
 * registration, usnic_transport_init() and usnic_debugfs_init().  The tail
 * of the function unwinds the notifier and the PCI driver on failure.
 *
 * NOTE(review): the declaration of err, most error labels and the return
 * statements are not visible here.
 */
535 static int __init usnic_ib_init(void)
539 printk_once(KERN_INFO "%s", usnic_version);
541 err = usnic_uiom_init(DRV_NAME);
543 usnic_err("Unable to initalize umem with err %d\n", err);
/* NOTE(review): the result of pci_register_driver() is tested but not stored in err; confirm this path still returns a meaningful error code. */
547 if (pci_register_driver(&usnic_ib_pci_driver)) {
548 usnic_err("Unable to register with PCI\n");
552 err = register_netdevice_notifier(&usnic_ib_netdevice_notifier);
554 usnic_err("Failed to register netdev notifier\n");
558 err = usnic_transport_init();
560 usnic_err("Failed to initialize transport\n");
561 goto out_unreg_netdev_notifier;
564 usnic_debugfs_init();
/* Error unwinding, in reverse order of the setup above. */
568 out_unreg_netdev_notifier:
569 unregister_netdevice_notifier(&usnic_ib_netdevice_notifier);
571 pci_unregister_driver(&usnic_ib_pci_driver);
/*
 * Module exit point: undoes usnic_ib_init() in reverse order -- debugfs,
 * transport, netdevice notifier, then the PCI driver.
 * NOTE(review): the counterpart of usnic_uiom_init() is not visible here;
 * confirm that it is released as well.
 */
578 static void __exit usnic_ib_destroy(void)
581 usnic_debugfs_exit();
582 usnic_transport_fini();
583 unregister_netdevice_notifier(&usnic_ib_netdevice_notifier);
584 pci_unregister_driver(&usnic_ib_pci_driver);
/* Module metadata. */
588 MODULE_DESCRIPTION("Cisco VIC (usNIC) Verbs Driver");
589 MODULE_AUTHOR("Upinder Malhi <umalhi@cisco.com>");
/* NOTE(review): the visible file header only mentions GPL version 2 while the module declares a dual licence -- confirm which is intended. */
590 MODULE_LICENSE("Dual BSD/GPL");
591 MODULE_VERSION(DRV_VERSION);
/* Both tunables are readable by everyone and writable by the owner (S_IRUGO | S_IWUSR). */
592 module_param(usnic_log_lvl, uint, S_IRUGO | S_IWUSR);
593 module_param(usnic_ib_share_vf, uint, S_IRUGO | S_IWUSR);
594 MODULE_PARM_DESC(usnic_log_lvl, " Off=0, Err=1, Info=2, Debug=3");
595 MODULE_PARM_DESC(usnic_ib_share_vf, "Off=0, On=1 VF sharing amongst QPs");
/* Export the PCI ID table with the module. */
596 MODULE_DEVICE_TABLE(pci, usnic_ib_pci_ids);
/* Module load and unload entry points. */
598 module_init(usnic_ib_init);
599 module_exit(usnic_ib_destroy);
600 /* End of module section */