RDMA/ocrdma: Support the new memory registration API
[firefly-linux-kernel-4.4.55.git] / drivers / infiniband / hw / ocrdma / ocrdma_main.c
1 /* This file is part of the Emulex RoCE Device Driver for
2  * RoCE (RDMA over Converged Ethernet) adapters.
3  * Copyright (C) 2012-2015 Emulex. All rights reserved.
4  * EMULEX and SLI are trademarks of Emulex.
5  * www.emulex.com
6  *
7  * This software is available to you under a choice of one of two licenses.
8  * You may choose to be licensed under the terms of the GNU General Public
9  * License (GPL) Version 2, available from the file COPYING in the main
10  * directory of this source tree, or the BSD license below:
11  *
12  * Redistribution and use in source and binary forms, with or without
13  * modification, are permitted provided that the following conditions
14  * are met:
15  *
16  * - Redistributions of source code must retain the above copyright notice,
17  *   this list of conditions and the following disclaimer.
18  *
19  * - Redistributions in binary form must reproduce the above copyright
20  *   notice, this list of conditions and the following disclaimer in
21  *   the documentation and/or other materials provided with the distribution.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
24  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
27  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
30  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
31  * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
32  * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
33  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
34  *
35  * Contact Information:
36  * linux-drivers@emulex.com
37  *
38  * Emulex
39  * 3333 Susan Street
40  * Costa Mesa, CA 92626
41  */
42
43 #include <linux/module.h>
44 #include <linux/idr.h>
45 #include <rdma/ib_verbs.h>
46 #include <rdma/ib_user_verbs.h>
47 #include <rdma/ib_addr.h>
48 #include <rdma/ib_mad.h>
49
50 #include <linux/netdevice.h>
51 #include <net/addrconf.h>
52
53 #include "ocrdma.h"
54 #include "ocrdma_verbs.h"
55 #include "ocrdma_ah.h"
56 #include "be_roce.h"
57 #include "ocrdma_hw.h"
58 #include "ocrdma_stats.h"
59 #include "ocrdma_abi.h"
60
61 MODULE_VERSION(OCRDMA_ROCE_DRV_VERSION);
62 MODULE_DESCRIPTION(OCRDMA_ROCE_DRV_DESC " " OCRDMA_ROCE_DRV_VERSION);
63 MODULE_AUTHOR("Emulex Corporation");
64 MODULE_LICENSE("Dual BSD/GPL");
65
66 static DEFINE_IDR(ocrdma_dev_id);
67
68 void ocrdma_get_guid(struct ocrdma_dev *dev, u8 *guid)
69 {
70         u8 mac_addr[6];
71
72         memcpy(&mac_addr[0], &dev->nic_info.mac_addr[0], ETH_ALEN);
73         guid[0] = mac_addr[0] ^ 2;
74         guid[1] = mac_addr[1];
75         guid[2] = mac_addr[2];
76         guid[3] = 0xff;
77         guid[4] = 0xfe;
78         guid[5] = mac_addr[3];
79         guid[6] = mac_addr[4];
80         guid[7] = mac_addr[5];
81 }
82 static enum rdma_link_layer ocrdma_link_layer(struct ib_device *device,
83                                               u8 port_num)
84 {
85         return IB_LINK_LAYER_ETHERNET;
86 }
87
88 static int ocrdma_port_immutable(struct ib_device *ibdev, u8 port_num,
89                                  struct ib_port_immutable *immutable)
90 {
91         struct ib_port_attr attr;
92         int err;
93
94         err = ocrdma_query_port(ibdev, port_num, &attr);
95         if (err)
96                 return err;
97
98         immutable->pkey_tbl_len = attr.pkey_tbl_len;
99         immutable->gid_tbl_len = attr.gid_tbl_len;
100         immutable->core_cap_flags = RDMA_CORE_PORT_IBA_ROCE;
101         immutable->max_mad_size = IB_MGMT_MAD_SIZE;
102
103         return 0;
104 }
105
106 static int ocrdma_register_device(struct ocrdma_dev *dev)
107 {
108         strlcpy(dev->ibdev.name, "ocrdma%d", IB_DEVICE_NAME_MAX);
109         ocrdma_get_guid(dev, (u8 *)&dev->ibdev.node_guid);
110         memcpy(dev->ibdev.node_desc, OCRDMA_NODE_DESC,
111                sizeof(OCRDMA_NODE_DESC));
112         dev->ibdev.owner = THIS_MODULE;
113         dev->ibdev.uverbs_abi_ver = OCRDMA_ABI_VERSION;
114         dev->ibdev.uverbs_cmd_mask =
115             OCRDMA_UVERBS(GET_CONTEXT) |
116             OCRDMA_UVERBS(QUERY_DEVICE) |
117             OCRDMA_UVERBS(QUERY_PORT) |
118             OCRDMA_UVERBS(ALLOC_PD) |
119             OCRDMA_UVERBS(DEALLOC_PD) |
120             OCRDMA_UVERBS(REG_MR) |
121             OCRDMA_UVERBS(DEREG_MR) |
122             OCRDMA_UVERBS(CREATE_COMP_CHANNEL) |
123             OCRDMA_UVERBS(CREATE_CQ) |
124             OCRDMA_UVERBS(RESIZE_CQ) |
125             OCRDMA_UVERBS(DESTROY_CQ) |
126             OCRDMA_UVERBS(REQ_NOTIFY_CQ) |
127             OCRDMA_UVERBS(CREATE_QP) |
128             OCRDMA_UVERBS(MODIFY_QP) |
129             OCRDMA_UVERBS(QUERY_QP) |
130             OCRDMA_UVERBS(DESTROY_QP) |
131             OCRDMA_UVERBS(POLL_CQ) |
132             OCRDMA_UVERBS(POST_SEND) |
133             OCRDMA_UVERBS(POST_RECV);
134
135         dev->ibdev.uverbs_cmd_mask |=
136             OCRDMA_UVERBS(CREATE_AH) |
137              OCRDMA_UVERBS(MODIFY_AH) |
138              OCRDMA_UVERBS(QUERY_AH) |
139              OCRDMA_UVERBS(DESTROY_AH);
140
141         dev->ibdev.node_type = RDMA_NODE_IB_CA;
142         dev->ibdev.phys_port_cnt = 1;
143         dev->ibdev.num_comp_vectors = dev->eq_cnt;
144
145         /* mandatory verbs. */
146         dev->ibdev.query_device = ocrdma_query_device;
147         dev->ibdev.query_port = ocrdma_query_port;
148         dev->ibdev.modify_port = ocrdma_modify_port;
149         dev->ibdev.query_gid = ocrdma_query_gid;
150         dev->ibdev.get_netdev = ocrdma_get_netdev;
151         dev->ibdev.add_gid = ocrdma_add_gid;
152         dev->ibdev.del_gid = ocrdma_del_gid;
153         dev->ibdev.get_link_layer = ocrdma_link_layer;
154         dev->ibdev.alloc_pd = ocrdma_alloc_pd;
155         dev->ibdev.dealloc_pd = ocrdma_dealloc_pd;
156
157         dev->ibdev.create_cq = ocrdma_create_cq;
158         dev->ibdev.destroy_cq = ocrdma_destroy_cq;
159         dev->ibdev.resize_cq = ocrdma_resize_cq;
160
161         dev->ibdev.create_qp = ocrdma_create_qp;
162         dev->ibdev.modify_qp = ocrdma_modify_qp;
163         dev->ibdev.query_qp = ocrdma_query_qp;
164         dev->ibdev.destroy_qp = ocrdma_destroy_qp;
165
166         dev->ibdev.query_pkey = ocrdma_query_pkey;
167         dev->ibdev.create_ah = ocrdma_create_ah;
168         dev->ibdev.destroy_ah = ocrdma_destroy_ah;
169         dev->ibdev.query_ah = ocrdma_query_ah;
170         dev->ibdev.modify_ah = ocrdma_modify_ah;
171
172         dev->ibdev.poll_cq = ocrdma_poll_cq;
173         dev->ibdev.post_send = ocrdma_post_send;
174         dev->ibdev.post_recv = ocrdma_post_recv;
175         dev->ibdev.req_notify_cq = ocrdma_arm_cq;
176
177         dev->ibdev.get_dma_mr = ocrdma_get_dma_mr;
178         dev->ibdev.reg_phys_mr = ocrdma_reg_kernel_mr;
179         dev->ibdev.dereg_mr = ocrdma_dereg_mr;
180         dev->ibdev.reg_user_mr = ocrdma_reg_user_mr;
181
182         dev->ibdev.alloc_mr = ocrdma_alloc_mr;
183         dev->ibdev.map_mr_sg = ocrdma_map_mr_sg;
184         dev->ibdev.alloc_fast_reg_page_list = ocrdma_alloc_frmr_page_list;
185         dev->ibdev.free_fast_reg_page_list = ocrdma_free_frmr_page_list;
186
187         /* mandatory to support user space verbs consumer. */
188         dev->ibdev.alloc_ucontext = ocrdma_alloc_ucontext;
189         dev->ibdev.dealloc_ucontext = ocrdma_dealloc_ucontext;
190         dev->ibdev.mmap = ocrdma_mmap;
191         dev->ibdev.dma_device = &dev->nic_info.pdev->dev;
192
193         dev->ibdev.process_mad = ocrdma_process_mad;
194         dev->ibdev.get_port_immutable = ocrdma_port_immutable;
195
196         if (ocrdma_get_asic_type(dev) == OCRDMA_ASIC_GEN_SKH_R) {
197                 dev->ibdev.uverbs_cmd_mask |=
198                      OCRDMA_UVERBS(CREATE_SRQ) |
199                      OCRDMA_UVERBS(MODIFY_SRQ) |
200                      OCRDMA_UVERBS(QUERY_SRQ) |
201                      OCRDMA_UVERBS(DESTROY_SRQ) |
202                      OCRDMA_UVERBS(POST_SRQ_RECV);
203
204                 dev->ibdev.create_srq = ocrdma_create_srq;
205                 dev->ibdev.modify_srq = ocrdma_modify_srq;
206                 dev->ibdev.query_srq = ocrdma_query_srq;
207                 dev->ibdev.destroy_srq = ocrdma_destroy_srq;
208                 dev->ibdev.post_srq_recv = ocrdma_post_srq_recv;
209         }
210         return ib_register_device(&dev->ibdev, NULL);
211 }
212
213 static int ocrdma_alloc_resources(struct ocrdma_dev *dev)
214 {
215         mutex_init(&dev->dev_lock);
216         dev->cq_tbl = kzalloc(sizeof(struct ocrdma_cq *) *
217                               OCRDMA_MAX_CQ, GFP_KERNEL);
218         if (!dev->cq_tbl)
219                 goto alloc_err;
220
221         if (dev->attr.max_qp) {
222                 dev->qp_tbl = kzalloc(sizeof(struct ocrdma_qp *) *
223                                       OCRDMA_MAX_QP, GFP_KERNEL);
224                 if (!dev->qp_tbl)
225                         goto alloc_err;
226         }
227
228         dev->stag_arr = kzalloc(sizeof(u64) * OCRDMA_MAX_STAG, GFP_KERNEL);
229         if (dev->stag_arr == NULL)
230                 goto alloc_err;
231
232         ocrdma_alloc_pd_pool(dev);
233
234         spin_lock_init(&dev->av_tbl.lock);
235         spin_lock_init(&dev->flush_q_lock);
236         return 0;
237 alloc_err:
238         pr_err("%s(%d) error.\n", __func__, dev->id);
239         return -ENOMEM;
240 }
241
242 static void ocrdma_free_resources(struct ocrdma_dev *dev)
243 {
244         kfree(dev->stag_arr);
245         kfree(dev->qp_tbl);
246         kfree(dev->cq_tbl);
247 }
248
249 /* OCRDMA sysfs interface */
250 static ssize_t show_rev(struct device *device, struct device_attribute *attr,
251                         char *buf)
252 {
253         struct ocrdma_dev *dev = dev_get_drvdata(device);
254
255         return scnprintf(buf, PAGE_SIZE, "0x%x\n", dev->nic_info.pdev->vendor);
256 }
257
258 static ssize_t show_fw_ver(struct device *device, struct device_attribute *attr,
259                         char *buf)
260 {
261         struct ocrdma_dev *dev = dev_get_drvdata(device);
262
263         return scnprintf(buf, PAGE_SIZE, "%s\n", &dev->attr.fw_ver[0]);
264 }
265
266 static ssize_t show_hca_type(struct device *device,
267                              struct device_attribute *attr, char *buf)
268 {
269         struct ocrdma_dev *dev = dev_get_drvdata(device);
270
271         return scnprintf(buf, PAGE_SIZE, "%s\n", &dev->model_number[0]);
272 }
273
274 static DEVICE_ATTR(hw_rev, S_IRUGO, show_rev, NULL);
275 static DEVICE_ATTR(fw_ver, S_IRUGO, show_fw_ver, NULL);
276 static DEVICE_ATTR(hca_type, S_IRUGO, show_hca_type, NULL);
277
278 static struct device_attribute *ocrdma_attributes[] = {
279         &dev_attr_hw_rev,
280         &dev_attr_fw_ver,
281         &dev_attr_hca_type
282 };
283
284 static void ocrdma_remove_sysfiles(struct ocrdma_dev *dev)
285 {
286         int i;
287
288         for (i = 0; i < ARRAY_SIZE(ocrdma_attributes); i++)
289                 device_remove_file(&dev->ibdev.dev, ocrdma_attributes[i]);
290 }
291
292 static struct ocrdma_dev *ocrdma_add(struct be_dev_info *dev_info)
293 {
294         int status = 0, i;
295         struct ocrdma_dev *dev;
296
297         dev = (struct ocrdma_dev *)ib_alloc_device(sizeof(struct ocrdma_dev));
298         if (!dev) {
299                 pr_err("Unable to allocate ib device\n");
300                 return NULL;
301         }
302         dev->mbx_cmd = kzalloc(sizeof(struct ocrdma_mqe_emb_cmd), GFP_KERNEL);
303         if (!dev->mbx_cmd)
304                 goto idr_err;
305
306         memcpy(&dev->nic_info, dev_info, sizeof(*dev_info));
307         dev->id = idr_alloc(&ocrdma_dev_id, NULL, 0, 0, GFP_KERNEL);
308         if (dev->id < 0)
309                 goto idr_err;
310
311         status = ocrdma_init_hw(dev);
312         if (status)
313                 goto init_err;
314
315         status = ocrdma_alloc_resources(dev);
316         if (status)
317                 goto alloc_err;
318
319         ocrdma_init_service_level(dev);
320         status = ocrdma_register_device(dev);
321         if (status)
322                 goto alloc_err;
323
324         for (i = 0; i < ARRAY_SIZE(ocrdma_attributes); i++)
325                 if (device_create_file(&dev->ibdev.dev, ocrdma_attributes[i]))
326                         goto sysfs_err;
327         /* Init stats */
328         ocrdma_add_port_stats(dev);
329         /* Interrupt Moderation */
330         INIT_DELAYED_WORK(&dev->eqd_work, ocrdma_eqd_set_task);
331         schedule_delayed_work(&dev->eqd_work, msecs_to_jiffies(1000));
332
333         pr_info("%s %s: %s \"%s\" port %d\n",
334                 dev_name(&dev->nic_info.pdev->dev), hca_name(dev),
335                 port_speed_string(dev), dev->model_number,
336                 dev->hba_port_num);
337         pr_info("%s ocrdma%d driver loaded successfully\n",
338                 dev_name(&dev->nic_info.pdev->dev), dev->id);
339         return dev;
340
341 sysfs_err:
342         ocrdma_remove_sysfiles(dev);
343 alloc_err:
344         ocrdma_free_resources(dev);
345         ocrdma_cleanup_hw(dev);
346 init_err:
347         idr_remove(&ocrdma_dev_id, dev->id);
348 idr_err:
349         kfree(dev->mbx_cmd);
350         ib_dealloc_device(&dev->ibdev);
351         pr_err("%s() leaving. ret=%d\n", __func__, status);
352         return NULL;
353 }
354
355 static void ocrdma_remove_free(struct ocrdma_dev *dev)
356 {
357
358         idr_remove(&ocrdma_dev_id, dev->id);
359         kfree(dev->mbx_cmd);
360         ib_dealloc_device(&dev->ibdev);
361 }
362
363 static void ocrdma_remove(struct ocrdma_dev *dev)
364 {
365         /* first unregister with stack to stop all the active traffic
366          * of the registered clients.
367          */
368         cancel_delayed_work_sync(&dev->eqd_work);
369         ocrdma_remove_sysfiles(dev);
370         ib_unregister_device(&dev->ibdev);
371
372         ocrdma_rem_port_stats(dev);
373         ocrdma_free_resources(dev);
374         ocrdma_cleanup_hw(dev);
375         ocrdma_remove_free(dev);
376 }
377
378 static int ocrdma_open(struct ocrdma_dev *dev)
379 {
380         struct ib_event port_event;
381
382         port_event.event = IB_EVENT_PORT_ACTIVE;
383         port_event.element.port_num = 1;
384         port_event.device = &dev->ibdev;
385         ib_dispatch_event(&port_event);
386         return 0;
387 }
388
389 static int ocrdma_close(struct ocrdma_dev *dev)
390 {
391         int i;
392         struct ocrdma_qp *qp, **cur_qp;
393         struct ib_event err_event;
394         struct ib_qp_attr attrs;
395         int attr_mask = IB_QP_STATE;
396
397         attrs.qp_state = IB_QPS_ERR;
398         mutex_lock(&dev->dev_lock);
399         if (dev->qp_tbl) {
400                 cur_qp = dev->qp_tbl;
401                 for (i = 0; i < OCRDMA_MAX_QP; i++) {
402                         qp = cur_qp[i];
403                         if (qp && qp->ibqp.qp_type != IB_QPT_GSI) {
404                                 /* change the QP state to ERROR */
405                                 _ocrdma_modify_qp(&qp->ibqp, &attrs, attr_mask);
406
407                                 err_event.event = IB_EVENT_QP_FATAL;
408                                 err_event.element.qp = &qp->ibqp;
409                                 err_event.device = &dev->ibdev;
410                                 ib_dispatch_event(&err_event);
411                         }
412                 }
413         }
414         mutex_unlock(&dev->dev_lock);
415
416         err_event.event = IB_EVENT_PORT_ERR;
417         err_event.element.port_num = 1;
418         err_event.device = &dev->ibdev;
419         ib_dispatch_event(&err_event);
420         return 0;
421 }
422
/*
 * Handle the shutdown notification: run the device-down handling and
 * then remove the device.  ocrdma_remove() releases @dev, so it must not
 * be used after this returns.
 */
static void ocrdma_shutdown(struct ocrdma_dev *dev)
{
	ocrdma_close(dev);
	ocrdma_remove(dev);
}
428
429 /* event handling via NIC driver ensures that all the NIC specific
430  * initialization done before RoCE driver notifies
431  * event to stack.
432  */
433 static void ocrdma_event_handler(struct ocrdma_dev *dev, u32 event)
434 {
435         switch (event) {
436         case BE_DEV_UP:
437                 ocrdma_open(dev);
438                 break;
439         case BE_DEV_DOWN:
440                 ocrdma_close(dev);
441                 break;
442         case BE_DEV_SHUTDOWN:
443                 ocrdma_shutdown(dev);
444                 break;
445         }
446 }
447
448 static struct ocrdma_driver ocrdma_drv = {
449         .name                   = "ocrdma_driver",
450         .add                    = ocrdma_add,
451         .remove                 = ocrdma_remove,
452         .state_change_handler   = ocrdma_event_handler,
453         .be_abi_version         = OCRDMA_BE_ROCE_ABI_VERSION,
454 };
455
456 static int __init ocrdma_init_module(void)
457 {
458         int status;
459
460         ocrdma_init_debugfs();
461
462         status = be_roce_register_driver(&ocrdma_drv);
463         if (status)
464                 goto err_be_reg;
465
466         return 0;
467
468 err_be_reg:
469
470         return status;
471 }
472
473 static void __exit ocrdma_exit_module(void)
474 {
475         be_roce_unregister_driver(&ocrdma_drv);
476         ocrdma_rem_debugfs();
477         idr_destroy(&ocrdma_dev_id);
478 }
479
/* Hook the load/unload handlers into the module loader. */
module_init(ocrdma_init_module);
module_exit(ocrdma_exit_module);