Loading...
1/*
2 * Copyright (c) 2016 Hisilicon Limited.
3 * Copyright (c) 2007, 2008 Mellanox Technologies. All rights reserved.
4 *
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
10 *
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
13 * conditions are met:
14 *
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
17 * disclaimer.
18 *
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
23 *
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31 * SOFTWARE.
32 */
33#include <linux/acpi.h>
34#include <linux/module.h>
35#include <linux/pci.h>
36#include <rdma/ib_addr.h>
37#include <rdma/ib_smi.h>
38#include <rdma/ib_user_verbs.h>
39#include <rdma/ib_cache.h>
40#include "hns_roce_common.h"
41#include "hns_roce_device.h"
42#include "hns_roce_hem.h"
43
44static int hns_roce_set_mac(struct hns_roce_dev *hr_dev, u32 port,
45 const u8 *addr)
46{
47 u8 phy_port;
48 u32 i;
49
50 if (hr_dev->pci_dev->revision >= PCI_REVISION_ID_HIP09)
51 return 0;
52
53 if (!memcmp(hr_dev->dev_addr[port], addr, ETH_ALEN))
54 return 0;
55
56 for (i = 0; i < ETH_ALEN; i++)
57 hr_dev->dev_addr[port][i] = addr[i];
58
59 phy_port = hr_dev->iboe.phy_port[port];
60 return hr_dev->hw->set_mac(hr_dev, phy_port, addr);
61}
62
63static int hns_roce_add_gid(const struct ib_gid_attr *attr, void **context)
64{
65 struct hns_roce_dev *hr_dev = to_hr_dev(attr->device);
66 u32 port = attr->port_num - 1;
67 int ret;
68
69 if (port >= hr_dev->caps.num_ports)
70 return -EINVAL;
71
72 ret = hr_dev->hw->set_gid(hr_dev, attr->index, &attr->gid, attr);
73
74 return ret;
75}
76
77static int hns_roce_del_gid(const struct ib_gid_attr *attr, void **context)
78{
79 struct hns_roce_dev *hr_dev = to_hr_dev(attr->device);
80 u32 port = attr->port_num - 1;
81 int ret;
82
83 if (port >= hr_dev->caps.num_ports)
84 return -EINVAL;
85
86 ret = hr_dev->hw->set_gid(hr_dev, attr->index, NULL, NULL);
87
88 return ret;
89}
90
91static int handle_en_event(struct hns_roce_dev *hr_dev, u32 port,
92 unsigned long event)
93{
94 struct device *dev = hr_dev->dev;
95 struct net_device *netdev;
96 int ret = 0;
97
98 netdev = hr_dev->iboe.netdevs[port];
99 if (!netdev) {
100 dev_err(dev, "can't find netdev on port(%u)!\n", port);
101 return -ENODEV;
102 }
103
104 switch (event) {
105 case NETDEV_UP:
106 case NETDEV_CHANGE:
107 case NETDEV_REGISTER:
108 case NETDEV_CHANGEADDR:
109 ret = hns_roce_set_mac(hr_dev, port, netdev->dev_addr);
110 break;
111 case NETDEV_DOWN:
112 /*
113 * In v1 engine, only support all ports closed together.
114 */
115 break;
116 default:
117 dev_dbg(dev, "NETDEV event = 0x%x!\n", (u32)(event));
118 break;
119 }
120
121 return ret;
122}
123
124static int hns_roce_netdev_event(struct notifier_block *self,
125 unsigned long event, void *ptr)
126{
127 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
128 struct hns_roce_ib_iboe *iboe = NULL;
129 struct hns_roce_dev *hr_dev = NULL;
130 int ret;
131 u32 port;
132
133 hr_dev = container_of(self, struct hns_roce_dev, iboe.nb);
134 iboe = &hr_dev->iboe;
135
136 for (port = 0; port < hr_dev->caps.num_ports; port++) {
137 if (dev == iboe->netdevs[port]) {
138 ret = handle_en_event(hr_dev, port, event);
139 if (ret)
140 return NOTIFY_DONE;
141 break;
142 }
143 }
144
145 return NOTIFY_DONE;
146}
147
148static int hns_roce_setup_mtu_mac(struct hns_roce_dev *hr_dev)
149{
150 int ret;
151 u8 i;
152
153 for (i = 0; i < hr_dev->caps.num_ports; i++) {
154 ret = hns_roce_set_mac(hr_dev, i,
155 hr_dev->iboe.netdevs[i]->dev_addr);
156 if (ret)
157 return ret;
158 }
159
160 return 0;
161}
162
163static int hns_roce_query_device(struct ib_device *ib_dev,
164 struct ib_device_attr *props,
165 struct ib_udata *uhw)
166{
167 struct hns_roce_dev *hr_dev = to_hr_dev(ib_dev);
168
169 memset(props, 0, sizeof(*props));
170
171 props->fw_ver = hr_dev->caps.fw_ver;
172 props->sys_image_guid = cpu_to_be64(hr_dev->sys_image_guid);
173 props->max_mr_size = (u64)(~(0ULL));
174 props->page_size_cap = hr_dev->caps.page_size_cap;
175 props->vendor_id = hr_dev->vendor_id;
176 props->vendor_part_id = hr_dev->vendor_part_id;
177 props->hw_ver = hr_dev->hw_rev;
178 props->max_qp = hr_dev->caps.num_qps;
179 props->max_qp_wr = hr_dev->caps.max_wqes;
180 props->device_cap_flags = IB_DEVICE_PORT_ACTIVE_EVENT |
181 IB_DEVICE_RC_RNR_NAK_GEN;
182 props->max_send_sge = hr_dev->caps.max_sq_sg;
183 props->max_recv_sge = hr_dev->caps.max_rq_sg;
184 props->max_sge_rd = 1;
185 props->max_cq = hr_dev->caps.num_cqs;
186 props->max_cqe = hr_dev->caps.max_cqes;
187 props->max_mr = hr_dev->caps.num_mtpts;
188 props->max_pd = hr_dev->caps.num_pds;
189 props->max_qp_rd_atom = hr_dev->caps.max_qp_dest_rdma;
190 props->max_qp_init_rd_atom = hr_dev->caps.max_qp_init_rdma;
191 props->atomic_cap = hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_ATOMIC ?
192 IB_ATOMIC_HCA : IB_ATOMIC_NONE;
193 props->max_pkeys = 1;
194 props->local_ca_ack_delay = hr_dev->caps.local_ca_ack_delay;
195 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ) {
196 props->max_srq = hr_dev->caps.num_srqs;
197 props->max_srq_wr = hr_dev->caps.max_srq_wrs;
198 props->max_srq_sge = hr_dev->caps.max_srq_sges;
199 }
200
201 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_FRMR &&
202 hr_dev->pci_dev->revision >= PCI_REVISION_ID_HIP09) {
203 props->device_cap_flags |= IB_DEVICE_MEM_MGT_EXTENSIONS;
204 props->max_fast_reg_page_list_len = HNS_ROCE_FRMR_MAX_PA;
205 }
206
207 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_XRC)
208 props->device_cap_flags |= IB_DEVICE_XRC;
209
210 return 0;
211}
212
213static int hns_roce_query_port(struct ib_device *ib_dev, u32 port_num,
214 struct ib_port_attr *props)
215{
216 struct hns_roce_dev *hr_dev = to_hr_dev(ib_dev);
217 struct device *dev = hr_dev->dev;
218 struct net_device *net_dev;
219 unsigned long flags;
220 enum ib_mtu mtu;
221 u32 port;
222 int ret;
223
224 port = port_num - 1;
225
226 /* props being zeroed by the caller, avoid zeroing it here */
227
228 props->max_mtu = hr_dev->caps.max_mtu;
229 props->gid_tbl_len = hr_dev->caps.gid_table_len[port];
230 props->port_cap_flags = IB_PORT_CM_SUP | IB_PORT_REINIT_SUP |
231 IB_PORT_VENDOR_CLASS_SUP |
232 IB_PORT_BOOT_MGMT_SUP;
233 props->max_msg_sz = HNS_ROCE_MAX_MSG_LEN;
234 props->pkey_tbl_len = 1;
235 ret = ib_get_eth_speed(ib_dev, port_num, &props->active_speed,
236 &props->active_width);
237 if (ret)
238 ibdev_warn(ib_dev, "failed to get speed, ret = %d.\n", ret);
239
240 spin_lock_irqsave(&hr_dev->iboe.lock, flags);
241
242 net_dev = hr_dev->iboe.netdevs[port];
243 if (!net_dev) {
244 spin_unlock_irqrestore(&hr_dev->iboe.lock, flags);
245 dev_err(dev, "find netdev %u failed!\n", port);
246 return -EINVAL;
247 }
248
249 mtu = iboe_get_mtu(net_dev->mtu);
250 props->active_mtu = mtu ? min(props->max_mtu, mtu) : IB_MTU_256;
251 props->state = netif_running(net_dev) && netif_carrier_ok(net_dev) ?
252 IB_PORT_ACTIVE :
253 IB_PORT_DOWN;
254 props->phys_state = props->state == IB_PORT_ACTIVE ?
255 IB_PORT_PHYS_STATE_LINK_UP :
256 IB_PORT_PHYS_STATE_DISABLED;
257
258 spin_unlock_irqrestore(&hr_dev->iboe.lock, flags);
259
260 return 0;
261}
262
263static enum rdma_link_layer hns_roce_get_link_layer(struct ib_device *device,
264 u32 port_num)
265{
266 return IB_LINK_LAYER_ETHERNET;
267}
268
269static int hns_roce_query_pkey(struct ib_device *ib_dev, u32 port, u16 index,
270 u16 *pkey)
271{
272 if (index > 0)
273 return -EINVAL;
274
275 *pkey = PKEY_ID;
276
277 return 0;
278}
279
280static int hns_roce_modify_device(struct ib_device *ib_dev, int mask,
281 struct ib_device_modify *props)
282{
283 unsigned long flags;
284
285 if (mask & ~IB_DEVICE_MODIFY_NODE_DESC)
286 return -EOPNOTSUPP;
287
288 if (mask & IB_DEVICE_MODIFY_NODE_DESC) {
289 spin_lock_irqsave(&to_hr_dev(ib_dev)->sm_lock, flags);
290 memcpy(ib_dev->node_desc, props->node_desc, NODE_DESC_SIZE);
291 spin_unlock_irqrestore(&to_hr_dev(ib_dev)->sm_lock, flags);
292 }
293
294 return 0;
295}
296
297struct hns_user_mmap_entry *
298hns_roce_user_mmap_entry_insert(struct ib_ucontext *ucontext, u64 address,
299 size_t length,
300 enum hns_roce_mmap_type mmap_type)
301{
302 struct hns_user_mmap_entry *entry;
303 int ret;
304
305 entry = kzalloc(sizeof(*entry), GFP_KERNEL);
306 if (!entry)
307 return NULL;
308
309 entry->address = address;
310 entry->mmap_type = mmap_type;
311
312 switch (mmap_type) {
313 /* pgoff 0 must be used by DB for compatibility */
314 case HNS_ROCE_MMAP_TYPE_DB:
315 ret = rdma_user_mmap_entry_insert_exact(
316 ucontext, &entry->rdma_entry, length, 0);
317 break;
318 case HNS_ROCE_MMAP_TYPE_DWQE:
319 ret = rdma_user_mmap_entry_insert_range(
320 ucontext, &entry->rdma_entry, length, 1,
321 U32_MAX);
322 break;
323 default:
324 ret = -EINVAL;
325 break;
326 }
327
328 if (ret) {
329 kfree(entry);
330 return NULL;
331 }
332
333 return entry;
334}
335
336static void hns_roce_dealloc_uar_entry(struct hns_roce_ucontext *context)
337{
338 if (context->db_mmap_entry)
339 rdma_user_mmap_entry_remove(
340 &context->db_mmap_entry->rdma_entry);
341}
342
343static int hns_roce_alloc_uar_entry(struct ib_ucontext *uctx)
344{
345 struct hns_roce_ucontext *context = to_hr_ucontext(uctx);
346 u64 address;
347
348 address = context->uar.pfn << PAGE_SHIFT;
349 context->db_mmap_entry = hns_roce_user_mmap_entry_insert(
350 uctx, address, PAGE_SIZE, HNS_ROCE_MMAP_TYPE_DB);
351 if (!context->db_mmap_entry)
352 return -ENOMEM;
353
354 return 0;
355}
356
357static int hns_roce_alloc_ucontext(struct ib_ucontext *uctx,
358 struct ib_udata *udata)
359{
360 struct hns_roce_ucontext *context = to_hr_ucontext(uctx);
361 struct hns_roce_dev *hr_dev = to_hr_dev(uctx->device);
362 struct hns_roce_ib_alloc_ucontext_resp resp = {};
363 struct hns_roce_ib_alloc_ucontext ucmd = {};
364 int ret = -EAGAIN;
365
366 if (!hr_dev->active)
367 goto error_out;
368
369 resp.qp_tab_size = hr_dev->caps.num_qps;
370 resp.srq_tab_size = hr_dev->caps.num_srqs;
371
372 ret = ib_copy_from_udata(&ucmd, udata,
373 min(udata->inlen, sizeof(ucmd)));
374 if (ret)
375 goto error_out;
376
377 if (hr_dev->pci_dev->revision >= PCI_REVISION_ID_HIP09)
378 context->config = ucmd.config & HNS_ROCE_EXSGE_FLAGS;
379
380 if (context->config & HNS_ROCE_EXSGE_FLAGS) {
381 resp.config |= HNS_ROCE_RSP_EXSGE_FLAGS;
382 resp.max_inline_data = hr_dev->caps.max_sq_inline;
383 }
384
385 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_RQ_INLINE) {
386 context->config |= ucmd.config & HNS_ROCE_RQ_INLINE_FLAGS;
387 if (context->config & HNS_ROCE_RQ_INLINE_FLAGS)
388 resp.config |= HNS_ROCE_RSP_RQ_INLINE_FLAGS;
389 }
390
391 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_CQE_INLINE) {
392 context->config |= ucmd.config & HNS_ROCE_CQE_INLINE_FLAGS;
393 if (context->config & HNS_ROCE_CQE_INLINE_FLAGS)
394 resp.config |= HNS_ROCE_RSP_CQE_INLINE_FLAGS;
395 }
396
397 ret = hns_roce_uar_alloc(hr_dev, &context->uar);
398 if (ret)
399 goto error_out;
400
401 ret = hns_roce_alloc_uar_entry(uctx);
402 if (ret)
403 goto error_fail_uar_entry;
404
405 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_CQ_RECORD_DB ||
406 hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_QP_RECORD_DB) {
407 INIT_LIST_HEAD(&context->page_list);
408 mutex_init(&context->page_mutex);
409 }
410
411 resp.cqe_size = hr_dev->caps.cqe_sz;
412
413 ret = ib_copy_to_udata(udata, &resp,
414 min(udata->outlen, sizeof(resp)));
415 if (ret)
416 goto error_fail_copy_to_udata;
417
418 return 0;
419
420error_fail_copy_to_udata:
421 hns_roce_dealloc_uar_entry(context);
422
423error_fail_uar_entry:
424 ida_free(&hr_dev->uar_ida.ida, (int)context->uar.logic_idx);
425
426error_out:
427 atomic64_inc(&hr_dev->dfx_cnt[HNS_ROCE_DFX_UCTX_ALLOC_ERR_CNT]);
428
429 return ret;
430}
431
432static void hns_roce_dealloc_ucontext(struct ib_ucontext *ibcontext)
433{
434 struct hns_roce_ucontext *context = to_hr_ucontext(ibcontext);
435 struct hns_roce_dev *hr_dev = to_hr_dev(ibcontext->device);
436
437 hns_roce_dealloc_uar_entry(context);
438
439 ida_free(&hr_dev->uar_ida.ida, (int)context->uar.logic_idx);
440}
441
442static int hns_roce_mmap(struct ib_ucontext *uctx, struct vm_area_struct *vma)
443{
444 struct hns_roce_dev *hr_dev = to_hr_dev(uctx->device);
445 struct rdma_user_mmap_entry *rdma_entry;
446 struct hns_user_mmap_entry *entry;
447 phys_addr_t pfn;
448 pgprot_t prot;
449 int ret;
450
451 rdma_entry = rdma_user_mmap_entry_get_pgoff(uctx, vma->vm_pgoff);
452 if (!rdma_entry) {
453 atomic64_inc(&hr_dev->dfx_cnt[HNS_ROCE_DFX_MMAP_ERR_CNT]);
454 return -EINVAL;
455 }
456
457 entry = to_hns_mmap(rdma_entry);
458 pfn = entry->address >> PAGE_SHIFT;
459
460 switch (entry->mmap_type) {
461 case HNS_ROCE_MMAP_TYPE_DB:
462 case HNS_ROCE_MMAP_TYPE_DWQE:
463 prot = pgprot_device(vma->vm_page_prot);
464 break;
465 default:
466 ret = -EINVAL;
467 goto out;
468 }
469
470 ret = rdma_user_mmap_io(uctx, vma, pfn, rdma_entry->npages * PAGE_SIZE,
471 prot, rdma_entry);
472
473out:
474 rdma_user_mmap_entry_put(rdma_entry);
475 if (ret)
476 atomic64_inc(&hr_dev->dfx_cnt[HNS_ROCE_DFX_MMAP_ERR_CNT]);
477
478 return ret;
479}
480
481static void hns_roce_free_mmap(struct rdma_user_mmap_entry *rdma_entry)
482{
483 struct hns_user_mmap_entry *entry = to_hns_mmap(rdma_entry);
484
485 kfree(entry);
486}
487
488static int hns_roce_port_immutable(struct ib_device *ib_dev, u32 port_num,
489 struct ib_port_immutable *immutable)
490{
491 struct ib_port_attr attr;
492 int ret;
493
494 ret = ib_query_port(ib_dev, port_num, &attr);
495 if (ret)
496 return ret;
497
498 immutable->pkey_tbl_len = attr.pkey_tbl_len;
499 immutable->gid_tbl_len = attr.gid_tbl_len;
500
501 immutable->max_mad_size = IB_MGMT_MAD_SIZE;
502 immutable->core_cap_flags = RDMA_CORE_PORT_IBA_ROCE;
503 if (to_hr_dev(ib_dev)->caps.flags & HNS_ROCE_CAP_FLAG_ROCE_V1_V2)
504 immutable->core_cap_flags |= RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP;
505
506 return 0;
507}
508
509static void hns_roce_disassociate_ucontext(struct ib_ucontext *ibcontext)
510{
511}
512
513static void hns_roce_get_fw_ver(struct ib_device *device, char *str)
514{
515 u64 fw_ver = to_hr_dev(device)->caps.fw_ver;
516 unsigned int major, minor, sub_minor;
517
518 major = upper_32_bits(fw_ver);
519 minor = high_16_bits(lower_32_bits(fw_ver));
520 sub_minor = low_16_bits(fw_ver);
521
522 snprintf(str, IB_FW_VERSION_NAME_MAX, "%u.%u.%04u", major, minor,
523 sub_minor);
524}
525
526#define HNS_ROCE_HW_CNT(ename, cname) \
527 [HNS_ROCE_HW_##ename##_CNT].name = cname
528
529static const struct rdma_stat_desc hns_roce_port_stats_descs[] = {
530 HNS_ROCE_HW_CNT(RX_RC_PKT, "rx_rc_pkt"),
531 HNS_ROCE_HW_CNT(RX_UC_PKT, "rx_uc_pkt"),
532 HNS_ROCE_HW_CNT(RX_UD_PKT, "rx_ud_pkt"),
533 HNS_ROCE_HW_CNT(RX_XRC_PKT, "rx_xrc_pkt"),
534 HNS_ROCE_HW_CNT(RX_PKT, "rx_pkt"),
535 HNS_ROCE_HW_CNT(RX_ERR_PKT, "rx_err_pkt"),
536 HNS_ROCE_HW_CNT(RX_CNP_PKT, "rx_cnp_pkt"),
537 HNS_ROCE_HW_CNT(TX_RC_PKT, "tx_rc_pkt"),
538 HNS_ROCE_HW_CNT(TX_UC_PKT, "tx_uc_pkt"),
539 HNS_ROCE_HW_CNT(TX_UD_PKT, "tx_ud_pkt"),
540 HNS_ROCE_HW_CNT(TX_XRC_PKT, "tx_xrc_pkt"),
541 HNS_ROCE_HW_CNT(TX_PKT, "tx_pkt"),
542 HNS_ROCE_HW_CNT(TX_ERR_PKT, "tx_err_pkt"),
543 HNS_ROCE_HW_CNT(TX_CNP_PKT, "tx_cnp_pkt"),
544 HNS_ROCE_HW_CNT(TRP_GET_MPT_ERR_PKT, "trp_get_mpt_err_pkt"),
545 HNS_ROCE_HW_CNT(TRP_GET_IRRL_ERR_PKT, "trp_get_irrl_err_pkt"),
546 HNS_ROCE_HW_CNT(ECN_DB, "ecn_doorbell"),
547 HNS_ROCE_HW_CNT(RX_BUF, "rx_buffer"),
548 HNS_ROCE_HW_CNT(TRP_RX_SOF, "trp_rx_sof"),
549 HNS_ROCE_HW_CNT(CQ_CQE, "cq_cqe"),
550 HNS_ROCE_HW_CNT(CQ_POE, "cq_poe"),
551 HNS_ROCE_HW_CNT(CQ_NOTIFY, "cq_notify"),
552};
553
554static struct rdma_hw_stats *hns_roce_alloc_hw_port_stats(
555 struct ib_device *device, u32 port_num)
556{
557 struct hns_roce_dev *hr_dev = to_hr_dev(device);
558
559 if (port_num > hr_dev->caps.num_ports) {
560 ibdev_err(device, "invalid port num.\n");
561 return NULL;
562 }
563
564 return rdma_alloc_hw_stats_struct(hns_roce_port_stats_descs,
565 ARRAY_SIZE(hns_roce_port_stats_descs),
566 RDMA_HW_STATS_DEFAULT_LIFESPAN);
567}
568
569static int hns_roce_get_hw_stats(struct ib_device *device,
570 struct rdma_hw_stats *stats,
571 u32 port, int index)
572{
573 struct hns_roce_dev *hr_dev = to_hr_dev(device);
574 int num_counters = HNS_ROCE_HW_CNT_TOTAL;
575 int ret;
576
577 if (port == 0)
578 return 0;
579
580 if (port > hr_dev->caps.num_ports)
581 return -EINVAL;
582
583 ret = hr_dev->hw->query_hw_counter(hr_dev, stats->value, port,
584 &num_counters);
585 if (ret) {
586 ibdev_err(device, "failed to query hw counter, ret = %d\n",
587 ret);
588 return ret;
589 }
590
591 return num_counters;
592}
593
594static void hns_roce_unregister_device(struct hns_roce_dev *hr_dev)
595{
596 struct hns_roce_ib_iboe *iboe = &hr_dev->iboe;
597
598 hr_dev->active = false;
599 unregister_netdevice_notifier(&iboe->nb);
600 ib_unregister_device(&hr_dev->ib_dev);
601}
602
603static const struct ib_device_ops hns_roce_dev_ops = {
604 .owner = THIS_MODULE,
605 .driver_id = RDMA_DRIVER_HNS,
606 .uverbs_abi_ver = 1,
607 .uverbs_no_driver_id_binding = 1,
608
609 .get_dev_fw_str = hns_roce_get_fw_ver,
610 .add_gid = hns_roce_add_gid,
611 .alloc_pd = hns_roce_alloc_pd,
612 .alloc_ucontext = hns_roce_alloc_ucontext,
613 .create_ah = hns_roce_create_ah,
614 .create_user_ah = hns_roce_create_ah,
615 .create_cq = hns_roce_create_cq,
616 .create_qp = hns_roce_create_qp,
617 .dealloc_pd = hns_roce_dealloc_pd,
618 .dealloc_ucontext = hns_roce_dealloc_ucontext,
619 .del_gid = hns_roce_del_gid,
620 .dereg_mr = hns_roce_dereg_mr,
621 .destroy_ah = hns_roce_destroy_ah,
622 .destroy_cq = hns_roce_destroy_cq,
623 .disassociate_ucontext = hns_roce_disassociate_ucontext,
624 .get_dma_mr = hns_roce_get_dma_mr,
625 .get_link_layer = hns_roce_get_link_layer,
626 .get_port_immutable = hns_roce_port_immutable,
627 .mmap = hns_roce_mmap,
628 .mmap_free = hns_roce_free_mmap,
629 .modify_device = hns_roce_modify_device,
630 .modify_qp = hns_roce_modify_qp,
631 .query_ah = hns_roce_query_ah,
632 .query_device = hns_roce_query_device,
633 .query_pkey = hns_roce_query_pkey,
634 .query_port = hns_roce_query_port,
635 .reg_user_mr = hns_roce_reg_user_mr,
636
637 INIT_RDMA_OBJ_SIZE(ib_ah, hns_roce_ah, ibah),
638 INIT_RDMA_OBJ_SIZE(ib_cq, hns_roce_cq, ib_cq),
639 INIT_RDMA_OBJ_SIZE(ib_pd, hns_roce_pd, ibpd),
640 INIT_RDMA_OBJ_SIZE(ib_qp, hns_roce_qp, ibqp),
641 INIT_RDMA_OBJ_SIZE(ib_ucontext, hns_roce_ucontext, ibucontext),
642};
643
644static const struct ib_device_ops hns_roce_dev_hw_stats_ops = {
645 .alloc_hw_port_stats = hns_roce_alloc_hw_port_stats,
646 .get_hw_stats = hns_roce_get_hw_stats,
647};
648
649static const struct ib_device_ops hns_roce_dev_mr_ops = {
650 .rereg_user_mr = hns_roce_rereg_user_mr,
651};
652
653static const struct ib_device_ops hns_roce_dev_mw_ops = {
654 .alloc_mw = hns_roce_alloc_mw,
655 .dealloc_mw = hns_roce_dealloc_mw,
656
657 INIT_RDMA_OBJ_SIZE(ib_mw, hns_roce_mw, ibmw),
658};
659
660static const struct ib_device_ops hns_roce_dev_frmr_ops = {
661 .alloc_mr = hns_roce_alloc_mr,
662 .map_mr_sg = hns_roce_map_mr_sg,
663};
664
665static const struct ib_device_ops hns_roce_dev_srq_ops = {
666 .create_srq = hns_roce_create_srq,
667 .destroy_srq = hns_roce_destroy_srq,
668
669 INIT_RDMA_OBJ_SIZE(ib_srq, hns_roce_srq, ibsrq),
670};
671
672static const struct ib_device_ops hns_roce_dev_xrcd_ops = {
673 .alloc_xrcd = hns_roce_alloc_xrcd,
674 .dealloc_xrcd = hns_roce_dealloc_xrcd,
675
676 INIT_RDMA_OBJ_SIZE(ib_xrcd, hns_roce_xrcd, ibxrcd),
677};
678
679static const struct ib_device_ops hns_roce_dev_restrack_ops = {
680 .fill_res_cq_entry = hns_roce_fill_res_cq_entry,
681 .fill_res_cq_entry_raw = hns_roce_fill_res_cq_entry_raw,
682 .fill_res_qp_entry = hns_roce_fill_res_qp_entry,
683 .fill_res_qp_entry_raw = hns_roce_fill_res_qp_entry_raw,
684 .fill_res_mr_entry = hns_roce_fill_res_mr_entry,
685 .fill_res_mr_entry_raw = hns_roce_fill_res_mr_entry_raw,
686 .fill_res_srq_entry = hns_roce_fill_res_srq_entry,
687 .fill_res_srq_entry_raw = hns_roce_fill_res_srq_entry_raw,
688};
689
690static int hns_roce_register_device(struct hns_roce_dev *hr_dev)
691{
692 int ret;
693 struct hns_roce_ib_iboe *iboe = NULL;
694 struct ib_device *ib_dev = NULL;
695 struct device *dev = hr_dev->dev;
696 unsigned int i;
697
698 iboe = &hr_dev->iboe;
699 spin_lock_init(&iboe->lock);
700
701 ib_dev = &hr_dev->ib_dev;
702
703 ib_dev->node_type = RDMA_NODE_IB_CA;
704 ib_dev->dev.parent = dev;
705
706 ib_dev->phys_port_cnt = hr_dev->caps.num_ports;
707 ib_dev->local_dma_lkey = hr_dev->caps.reserved_lkey;
708 ib_dev->num_comp_vectors = hr_dev->caps.num_comp_vectors;
709
710 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_REREG_MR)
711 ib_set_device_ops(ib_dev, &hns_roce_dev_mr_ops);
712
713 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_MW)
714 ib_set_device_ops(ib_dev, &hns_roce_dev_mw_ops);
715
716 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_FRMR)
717 ib_set_device_ops(ib_dev, &hns_roce_dev_frmr_ops);
718
719 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ) {
720 ib_set_device_ops(ib_dev, &hns_roce_dev_srq_ops);
721 ib_set_device_ops(ib_dev, hr_dev->hw->hns_roce_dev_srq_ops);
722 }
723
724 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_XRC)
725 ib_set_device_ops(ib_dev, &hns_roce_dev_xrcd_ops);
726
727 if (hr_dev->pci_dev->revision >= PCI_REVISION_ID_HIP09 &&
728 !hr_dev->is_vf)
729 ib_set_device_ops(ib_dev, &hns_roce_dev_hw_stats_ops);
730
731 ib_set_device_ops(ib_dev, hr_dev->hw->hns_roce_dev_ops);
732 ib_set_device_ops(ib_dev, &hns_roce_dev_ops);
733 ib_set_device_ops(ib_dev, &hns_roce_dev_restrack_ops);
734 for (i = 0; i < hr_dev->caps.num_ports; i++) {
735 if (!hr_dev->iboe.netdevs[i])
736 continue;
737
738 ret = ib_device_set_netdev(ib_dev, hr_dev->iboe.netdevs[i],
739 i + 1);
740 if (ret)
741 return ret;
742 }
743 dma_set_max_seg_size(dev, UINT_MAX);
744 ret = ib_register_device(ib_dev, "hns_%d", dev);
745 if (ret) {
746 dev_err(dev, "ib_register_device failed!\n");
747 return ret;
748 }
749
750 ret = hns_roce_setup_mtu_mac(hr_dev);
751 if (ret) {
752 dev_err(dev, "setup_mtu_mac failed!\n");
753 goto error_failed_setup_mtu_mac;
754 }
755
756 iboe->nb.notifier_call = hns_roce_netdev_event;
757 ret = register_netdevice_notifier(&iboe->nb);
758 if (ret) {
759 dev_err(dev, "register_netdevice_notifier failed!\n");
760 goto error_failed_setup_mtu_mac;
761 }
762
763 hr_dev->active = true;
764 return 0;
765
766error_failed_setup_mtu_mac:
767 ib_unregister_device(ib_dev);
768
769 return ret;
770}
771
772static int hns_roce_init_hem(struct hns_roce_dev *hr_dev)
773{
774 struct device *dev = hr_dev->dev;
775 int ret;
776
777 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->mr_table.mtpt_table,
778 HEM_TYPE_MTPT, hr_dev->caps.mtpt_entry_sz,
779 hr_dev->caps.num_mtpts);
780 if (ret) {
781 dev_err(dev, "failed to init MTPT context memory, aborting.\n");
782 return ret;
783 }
784
785 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->qp_table.qp_table,
786 HEM_TYPE_QPC, hr_dev->caps.qpc_sz,
787 hr_dev->caps.num_qps);
788 if (ret) {
789 dev_err(dev, "failed to init QP context memory, aborting.\n");
790 goto err_unmap_dmpt;
791 }
792
793 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->qp_table.irrl_table,
794 HEM_TYPE_IRRL,
795 hr_dev->caps.irrl_entry_sz *
796 hr_dev->caps.max_qp_init_rdma,
797 hr_dev->caps.num_qps);
798 if (ret) {
799 dev_err(dev, "failed to init irrl_table memory, aborting.\n");
800 goto err_unmap_qp;
801 }
802
803 if (hr_dev->caps.trrl_entry_sz) {
804 ret = hns_roce_init_hem_table(hr_dev,
805 &hr_dev->qp_table.trrl_table,
806 HEM_TYPE_TRRL,
807 hr_dev->caps.trrl_entry_sz *
808 hr_dev->caps.max_qp_dest_rdma,
809 hr_dev->caps.num_qps);
810 if (ret) {
811 dev_err(dev,
812 "failed to init trrl_table memory, aborting.\n");
813 goto err_unmap_irrl;
814 }
815 }
816
817 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->cq_table.table,
818 HEM_TYPE_CQC, hr_dev->caps.cqc_entry_sz,
819 hr_dev->caps.num_cqs);
820 if (ret) {
821 dev_err(dev, "failed to init CQ context memory, aborting.\n");
822 goto err_unmap_trrl;
823 }
824
825 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ) {
826 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->srq_table.table,
827 HEM_TYPE_SRQC,
828 hr_dev->caps.srqc_entry_sz,
829 hr_dev->caps.num_srqs);
830 if (ret) {
831 dev_err(dev,
832 "failed to init SRQ context memory, aborting.\n");
833 goto err_unmap_cq;
834 }
835 }
836
837 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_QP_FLOW_CTRL) {
838 ret = hns_roce_init_hem_table(hr_dev,
839 &hr_dev->qp_table.sccc_table,
840 HEM_TYPE_SCCC,
841 hr_dev->caps.sccc_sz,
842 hr_dev->caps.num_qps);
843 if (ret) {
844 dev_err(dev,
845 "failed to init SCC context memory, aborting.\n");
846 goto err_unmap_srq;
847 }
848 }
849
850 if (hr_dev->caps.qpc_timer_entry_sz) {
851 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->qpc_timer_table,
852 HEM_TYPE_QPC_TIMER,
853 hr_dev->caps.qpc_timer_entry_sz,
854 hr_dev->caps.qpc_timer_bt_num);
855 if (ret) {
856 dev_err(dev,
857 "failed to init QPC timer memory, aborting.\n");
858 goto err_unmap_ctx;
859 }
860 }
861
862 if (hr_dev->caps.cqc_timer_entry_sz) {
863 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->cqc_timer_table,
864 HEM_TYPE_CQC_TIMER,
865 hr_dev->caps.cqc_timer_entry_sz,
866 hr_dev->caps.cqc_timer_bt_num);
867 if (ret) {
868 dev_err(dev,
869 "failed to init CQC timer memory, aborting.\n");
870 goto err_unmap_qpc_timer;
871 }
872 }
873
874 if (hr_dev->caps.gmv_entry_sz) {
875 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->gmv_table,
876 HEM_TYPE_GMV,
877 hr_dev->caps.gmv_entry_sz,
878 hr_dev->caps.gmv_entry_num);
879 if (ret) {
880 dev_err(dev,
881 "failed to init gmv table memory, ret = %d\n",
882 ret);
883 goto err_unmap_cqc_timer;
884 }
885 }
886
887 return 0;
888
889err_unmap_cqc_timer:
890 if (hr_dev->caps.cqc_timer_entry_sz)
891 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->cqc_timer_table);
892
893err_unmap_qpc_timer:
894 if (hr_dev->caps.qpc_timer_entry_sz)
895 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->qpc_timer_table);
896
897err_unmap_ctx:
898 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_QP_FLOW_CTRL)
899 hns_roce_cleanup_hem_table(hr_dev,
900 &hr_dev->qp_table.sccc_table);
901err_unmap_srq:
902 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ)
903 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->srq_table.table);
904
905err_unmap_cq:
906 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->cq_table.table);
907
908err_unmap_trrl:
909 if (hr_dev->caps.trrl_entry_sz)
910 hns_roce_cleanup_hem_table(hr_dev,
911 &hr_dev->qp_table.trrl_table);
912
913err_unmap_irrl:
914 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->qp_table.irrl_table);
915
916err_unmap_qp:
917 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->qp_table.qp_table);
918
919err_unmap_dmpt:
920 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->mr_table.mtpt_table);
921
922 return ret;
923}
924
925/**
926 * hns_roce_setup_hca - setup host channel adapter
927 * @hr_dev: pointer to hns roce device
928 * Return : int
929 */
930static int hns_roce_setup_hca(struct hns_roce_dev *hr_dev)
931{
932 struct device *dev = hr_dev->dev;
933 int ret;
934
935 spin_lock_init(&hr_dev->sm_lock);
936
937 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_CQ_RECORD_DB ||
938 hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_QP_RECORD_DB) {
939 INIT_LIST_HEAD(&hr_dev->pgdir_list);
940 mutex_init(&hr_dev->pgdir_mutex);
941 }
942
943 hns_roce_init_uar_table(hr_dev);
944
945 ret = hns_roce_uar_alloc(hr_dev, &hr_dev->priv_uar);
946 if (ret) {
947 dev_err(dev, "failed to allocate priv_uar.\n");
948 goto err_uar_table_free;
949 }
950
951 ret = hns_roce_init_qp_table(hr_dev);
952 if (ret) {
953 dev_err(dev, "failed to init qp_table.\n");
954 goto err_uar_table_free;
955 }
956
957 hns_roce_init_pd_table(hr_dev);
958
959 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_XRC)
960 hns_roce_init_xrcd_table(hr_dev);
961
962 hns_roce_init_mr_table(hr_dev);
963
964 hns_roce_init_cq_table(hr_dev);
965
966 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ)
967 hns_roce_init_srq_table(hr_dev);
968
969 return 0;
970
971err_uar_table_free:
972 ida_destroy(&hr_dev->uar_ida.ida);
973 return ret;
974}
975
976static void check_and_get_armed_cq(struct list_head *cq_list, struct ib_cq *cq)
977{
978 struct hns_roce_cq *hr_cq = to_hr_cq(cq);
979 unsigned long flags;
980
981 spin_lock_irqsave(&hr_cq->lock, flags);
982 if (cq->comp_handler) {
983 if (!hr_cq->is_armed) {
984 hr_cq->is_armed = 1;
985 list_add_tail(&hr_cq->node, cq_list);
986 }
987 }
988 spin_unlock_irqrestore(&hr_cq->lock, flags);
989}
990
991void hns_roce_handle_device_err(struct hns_roce_dev *hr_dev)
992{
993 struct hns_roce_qp *hr_qp;
994 struct hns_roce_cq *hr_cq;
995 struct list_head cq_list;
996 unsigned long flags_qp;
997 unsigned long flags;
998
999 INIT_LIST_HEAD(&cq_list);
1000
1001 spin_lock_irqsave(&hr_dev->qp_list_lock, flags);
1002 list_for_each_entry(hr_qp, &hr_dev->qp_list, node) {
1003 spin_lock_irqsave(&hr_qp->sq.lock, flags_qp);
1004 if (hr_qp->sq.tail != hr_qp->sq.head)
1005 check_and_get_armed_cq(&cq_list, hr_qp->ibqp.send_cq);
1006 spin_unlock_irqrestore(&hr_qp->sq.lock, flags_qp);
1007
1008 spin_lock_irqsave(&hr_qp->rq.lock, flags_qp);
1009 if ((!hr_qp->ibqp.srq) && (hr_qp->rq.tail != hr_qp->rq.head))
1010 check_and_get_armed_cq(&cq_list, hr_qp->ibqp.recv_cq);
1011 spin_unlock_irqrestore(&hr_qp->rq.lock, flags_qp);
1012 }
1013
1014 list_for_each_entry(hr_cq, &cq_list, node)
1015 hns_roce_cq_completion(hr_dev, hr_cq->cqn);
1016
1017 spin_unlock_irqrestore(&hr_dev->qp_list_lock, flags);
1018}
1019
1020static int hns_roce_alloc_dfx_cnt(struct hns_roce_dev *hr_dev)
1021{
1022 hr_dev->dfx_cnt = kvcalloc(HNS_ROCE_DFX_CNT_TOTAL, sizeof(atomic64_t),
1023 GFP_KERNEL);
1024 if (!hr_dev->dfx_cnt)
1025 return -ENOMEM;
1026
1027 return 0;
1028}
1029
1030static void hns_roce_dealloc_dfx_cnt(struct hns_roce_dev *hr_dev)
1031{
1032 kvfree(hr_dev->dfx_cnt);
1033}
1034
1035int hns_roce_init(struct hns_roce_dev *hr_dev)
1036{
1037 struct device *dev = hr_dev->dev;
1038 int ret;
1039
1040 hr_dev->is_reset = false;
1041
1042 ret = hns_roce_alloc_dfx_cnt(hr_dev);
1043 if (ret)
1044 return ret;
1045
1046 if (hr_dev->hw->cmq_init) {
1047 ret = hr_dev->hw->cmq_init(hr_dev);
1048 if (ret) {
1049 dev_err(dev, "init RoCE Command Queue failed!\n");
1050 goto error_failed_alloc_dfx_cnt;
1051 }
1052 }
1053
1054 ret = hr_dev->hw->hw_profile(hr_dev);
1055 if (ret) {
1056 dev_err(dev, "get RoCE engine profile failed!\n");
1057 goto error_failed_cmd_init;
1058 }
1059
1060 ret = hns_roce_cmd_init(hr_dev);
1061 if (ret) {
1062 dev_err(dev, "cmd init failed!\n");
1063 goto error_failed_cmd_init;
1064 }
1065
1066 /* EQ depends on poll mode, event mode depends on EQ */
1067 ret = hr_dev->hw->init_eq(hr_dev);
1068 if (ret) {
1069 dev_err(dev, "eq init failed!\n");
1070 goto error_failed_eq_table;
1071 }
1072
1073 if (hr_dev->cmd_mod) {
1074 ret = hns_roce_cmd_use_events(hr_dev);
1075 if (ret)
1076 dev_warn(dev,
1077 "Cmd event mode failed, set back to poll!\n");
1078 }
1079
1080 ret = hns_roce_init_hem(hr_dev);
1081 if (ret) {
1082 dev_err(dev, "init HEM(Hardware Entry Memory) failed!\n");
1083 goto error_failed_init_hem;
1084 }
1085
1086 ret = hns_roce_setup_hca(hr_dev);
1087 if (ret) {
1088 dev_err(dev, "setup hca failed!\n");
1089 goto error_failed_setup_hca;
1090 }
1091
1092 if (hr_dev->hw->hw_init) {
1093 ret = hr_dev->hw->hw_init(hr_dev);
1094 if (ret) {
1095 dev_err(dev, "hw_init failed!\n");
1096 goto error_failed_engine_init;
1097 }
1098 }
1099
1100 INIT_LIST_HEAD(&hr_dev->qp_list);
1101 spin_lock_init(&hr_dev->qp_list_lock);
1102 INIT_LIST_HEAD(&hr_dev->dip_list);
1103 spin_lock_init(&hr_dev->dip_list_lock);
1104
1105 ret = hns_roce_register_device(hr_dev);
1106 if (ret)
1107 goto error_failed_register_device;
1108
1109 hns_roce_register_debugfs(hr_dev);
1110
1111 return 0;
1112
1113error_failed_register_device:
1114 if (hr_dev->hw->hw_exit)
1115 hr_dev->hw->hw_exit(hr_dev);
1116
1117error_failed_engine_init:
1118 hns_roce_cleanup_bitmap(hr_dev);
1119
1120error_failed_setup_hca:
1121 hns_roce_cleanup_hem(hr_dev);
1122
1123error_failed_init_hem:
1124 if (hr_dev->cmd_mod)
1125 hns_roce_cmd_use_polling(hr_dev);
1126 hr_dev->hw->cleanup_eq(hr_dev);
1127
1128error_failed_eq_table:
1129 hns_roce_cmd_cleanup(hr_dev);
1130
1131error_failed_cmd_init:
1132 if (hr_dev->hw->cmq_exit)
1133 hr_dev->hw->cmq_exit(hr_dev);
1134
1135error_failed_alloc_dfx_cnt:
1136 hns_roce_dealloc_dfx_cnt(hr_dev);
1137
1138 return ret;
1139}
1140
1141void hns_roce_exit(struct hns_roce_dev *hr_dev)
1142{
1143 hns_roce_unregister_debugfs(hr_dev);
1144 hns_roce_unregister_device(hr_dev);
1145
1146 if (hr_dev->hw->hw_exit)
1147 hr_dev->hw->hw_exit(hr_dev);
1148 hns_roce_cleanup_bitmap(hr_dev);
1149 hns_roce_cleanup_hem(hr_dev);
1150
1151 if (hr_dev->cmd_mod)
1152 hns_roce_cmd_use_polling(hr_dev);
1153
1154 hr_dev->hw->cleanup_eq(hr_dev);
1155 hns_roce_cmd_cleanup(hr_dev);
1156 if (hr_dev->hw->cmq_exit)
1157 hr_dev->hw->cmq_exit(hr_dev);
1158 hns_roce_dealloc_dfx_cnt(hr_dev);
1159}
1160
1161MODULE_LICENSE("Dual BSD/GPL");
1162MODULE_AUTHOR("Wei Hu <xavier.huwei@huawei.com>");
1163MODULE_AUTHOR("Nenglong Zhao <zhaonenglong@hisilicon.com>");
1164MODULE_AUTHOR("Lijun Ou <oulijun@huawei.com>");
1165MODULE_DESCRIPTION("HNS RoCE Driver");
1/*
2 * Copyright (c) 2016 Hisilicon Limited.
3 * Copyright (c) 2007, 2008 Mellanox Technologies. All rights reserved.
4 *
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
10 *
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
13 * conditions are met:
14 *
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
17 * disclaimer.
18 *
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
23 *
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31 * SOFTWARE.
32 */
33#include <linux/acpi.h>
34#include <linux/of_platform.h>
35#include <linux/module.h>
36#include <rdma/ib_addr.h>
37#include <rdma/ib_smi.h>
38#include <rdma/ib_user_verbs.h>
39#include <rdma/ib_cache.h>
40#include "hns_roce_common.h"
41#include "hns_roce_device.h"
42#include <rdma/hns-abi.h>
43#include "hns_roce_hem.h"
44
45/**
46 * hns_get_gid_index - Get gid index.
47 * @hr_dev: pointer to structure hns_roce_dev.
48 * @port: port, value range: 0 ~ MAX
49 * @gid_index: gid_index, value range: 0 ~ MAX
50 * Description:
51 * N ports shared gids, allocation method as follow:
52 * GID[0][0], GID[1][0],.....GID[N - 1][0],
53 * GID[0][0], GID[1][0],.....GID[N - 1][0],
54 * And so on
55 */
56int hns_get_gid_index(struct hns_roce_dev *hr_dev, u8 port, int gid_index)
57{
58 return gid_index * hr_dev->caps.num_ports + port;
59}
60
61static int hns_roce_set_mac(struct hns_roce_dev *hr_dev, u8 port, u8 *addr)
62{
63 u8 phy_port;
64 u32 i = 0;
65
66 if (!memcmp(hr_dev->dev_addr[port], addr, ETH_ALEN))
67 return 0;
68
69 for (i = 0; i < ETH_ALEN; i++)
70 hr_dev->dev_addr[port][i] = addr[i];
71
72 phy_port = hr_dev->iboe.phy_port[port];
73 return hr_dev->hw->set_mac(hr_dev, phy_port, addr);
74}
75
76static int hns_roce_add_gid(const struct ib_gid_attr *attr, void **context)
77{
78 struct hns_roce_dev *hr_dev = to_hr_dev(attr->device);
79 u8 port = attr->port_num - 1;
80 int ret;
81
82 if (port >= hr_dev->caps.num_ports)
83 return -EINVAL;
84
85 ret = hr_dev->hw->set_gid(hr_dev, port, attr->index, &attr->gid, attr);
86
87 return ret;
88}
89
90static int hns_roce_del_gid(const struct ib_gid_attr *attr, void **context)
91{
92 struct hns_roce_dev *hr_dev = to_hr_dev(attr->device);
93 struct ib_gid_attr zattr = { };
94 u8 port = attr->port_num - 1;
95 int ret;
96
97 if (port >= hr_dev->caps.num_ports)
98 return -EINVAL;
99
100 ret = hr_dev->hw->set_gid(hr_dev, port, attr->index, &zgid, &zattr);
101
102 return ret;
103}
104
105static int handle_en_event(struct hns_roce_dev *hr_dev, u8 port,
106 unsigned long event)
107{
108 struct device *dev = hr_dev->dev;
109 struct net_device *netdev;
110 int ret = 0;
111
112 netdev = hr_dev->iboe.netdevs[port];
113 if (!netdev) {
114 dev_err(dev, "port(%d) can't find netdev\n", port);
115 return -ENODEV;
116 }
117
118 switch (event) {
119 case NETDEV_UP:
120 case NETDEV_CHANGE:
121 case NETDEV_REGISTER:
122 case NETDEV_CHANGEADDR:
123 ret = hns_roce_set_mac(hr_dev, port, netdev->dev_addr);
124 break;
125 case NETDEV_DOWN:
126 /*
127 * In v1 engine, only support all ports closed together.
128 */
129 break;
130 default:
131 dev_dbg(dev, "NETDEV event = 0x%x!\n", (u32)(event));
132 break;
133 }
134
135 return ret;
136}
137
138static int hns_roce_netdev_event(struct notifier_block *self,
139 unsigned long event, void *ptr)
140{
141 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
142 struct hns_roce_ib_iboe *iboe = NULL;
143 struct hns_roce_dev *hr_dev = NULL;
144 u8 port = 0;
145 int ret = 0;
146
147 hr_dev = container_of(self, struct hns_roce_dev, iboe.nb);
148 iboe = &hr_dev->iboe;
149
150 for (port = 0; port < hr_dev->caps.num_ports; port++) {
151 if (dev == iboe->netdevs[port]) {
152 ret = handle_en_event(hr_dev, port, event);
153 if (ret)
154 return NOTIFY_DONE;
155 break;
156 }
157 }
158
159 return NOTIFY_DONE;
160}
161
162static int hns_roce_setup_mtu_mac(struct hns_roce_dev *hr_dev)
163{
164 int ret;
165 u8 i;
166
167 for (i = 0; i < hr_dev->caps.num_ports; i++) {
168 if (hr_dev->hw->set_mtu)
169 hr_dev->hw->set_mtu(hr_dev, hr_dev->iboe.phy_port[i],
170 hr_dev->caps.max_mtu);
171 ret = hns_roce_set_mac(hr_dev, i,
172 hr_dev->iboe.netdevs[i]->dev_addr);
173 if (ret)
174 return ret;
175 }
176
177 return 0;
178}
179
180static int hns_roce_query_device(struct ib_device *ib_dev,
181 struct ib_device_attr *props,
182 struct ib_udata *uhw)
183{
184 struct hns_roce_dev *hr_dev = to_hr_dev(ib_dev);
185
186 memset(props, 0, sizeof(*props));
187
188 props->fw_ver = hr_dev->caps.fw_ver;
189 props->sys_image_guid = cpu_to_be64(hr_dev->sys_image_guid);
190 props->max_mr_size = (u64)(~(0ULL));
191 props->page_size_cap = hr_dev->caps.page_size_cap;
192 props->vendor_id = hr_dev->vendor_id;
193 props->vendor_part_id = hr_dev->vendor_part_id;
194 props->hw_ver = hr_dev->hw_rev;
195 props->max_qp = hr_dev->caps.num_qps;
196 props->max_qp_wr = hr_dev->caps.max_wqes;
197 props->device_cap_flags = IB_DEVICE_PORT_ACTIVE_EVENT |
198 IB_DEVICE_RC_RNR_NAK_GEN;
199 props->max_send_sge = hr_dev->caps.max_sq_sg;
200 props->max_recv_sge = hr_dev->caps.max_rq_sg;
201 props->max_sge_rd = 1;
202 props->max_cq = hr_dev->caps.num_cqs;
203 props->max_cqe = hr_dev->caps.max_cqes;
204 props->max_mr = hr_dev->caps.num_mtpts;
205 props->max_pd = hr_dev->caps.num_pds;
206 props->max_qp_rd_atom = hr_dev->caps.max_qp_dest_rdma;
207 props->max_qp_init_rd_atom = hr_dev->caps.max_qp_init_rdma;
208 props->atomic_cap = hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_ATOMIC ?
209 IB_ATOMIC_HCA : IB_ATOMIC_NONE;
210 props->max_pkeys = 1;
211 props->local_ca_ack_delay = hr_dev->caps.local_ca_ack_delay;
212 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ) {
213 props->max_srq = hr_dev->caps.max_srqs;
214 props->max_srq_wr = hr_dev->caps.max_srq_wrs;
215 props->max_srq_sge = hr_dev->caps.max_srq_sges;
216 }
217
218 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_FRMR) {
219 props->device_cap_flags |= IB_DEVICE_MEM_MGT_EXTENSIONS;
220 props->max_fast_reg_page_list_len = HNS_ROCE_FRMR_MAX_PA;
221 }
222
223 return 0;
224}
225
226static int hns_roce_query_port(struct ib_device *ib_dev, u8 port_num,
227 struct ib_port_attr *props)
228{
229 struct hns_roce_dev *hr_dev = to_hr_dev(ib_dev);
230 struct device *dev = hr_dev->dev;
231 struct net_device *net_dev;
232 unsigned long flags;
233 enum ib_mtu mtu;
234 u8 port;
235
236 assert(port_num > 0);
237 port = port_num - 1;
238
239 /* props being zeroed by the caller, avoid zeroing it here */
240
241 props->max_mtu = hr_dev->caps.max_mtu;
242 props->gid_tbl_len = hr_dev->caps.gid_table_len[port];
243 props->port_cap_flags = IB_PORT_CM_SUP | IB_PORT_REINIT_SUP |
244 IB_PORT_VENDOR_CLASS_SUP |
245 IB_PORT_BOOT_MGMT_SUP;
246 props->max_msg_sz = HNS_ROCE_MAX_MSG_LEN;
247 props->pkey_tbl_len = 1;
248 props->active_width = IB_WIDTH_4X;
249 props->active_speed = 1;
250
251 spin_lock_irqsave(&hr_dev->iboe.lock, flags);
252
253 net_dev = hr_dev->iboe.netdevs[port];
254 if (!net_dev) {
255 spin_unlock_irqrestore(&hr_dev->iboe.lock, flags);
256 dev_err(dev, "find netdev %d failed!\r\n", port);
257 return -EINVAL;
258 }
259
260 mtu = iboe_get_mtu(net_dev->mtu);
261 props->active_mtu = mtu ? min(props->max_mtu, mtu) : IB_MTU_256;
262 props->state = (netif_running(net_dev) && netif_carrier_ok(net_dev)) ?
263 IB_PORT_ACTIVE : IB_PORT_DOWN;
264 props->phys_state = (props->state == IB_PORT_ACTIVE) ?
265 IB_PORT_PHYS_STATE_LINK_UP :
266 IB_PORT_PHYS_STATE_DISABLED;
267
268 spin_unlock_irqrestore(&hr_dev->iboe.lock, flags);
269
270 return 0;
271}
272
273static enum rdma_link_layer hns_roce_get_link_layer(struct ib_device *device,
274 u8 port_num)
275{
276 return IB_LINK_LAYER_ETHERNET;
277}
278
279static int hns_roce_query_pkey(struct ib_device *ib_dev, u8 port, u16 index,
280 u16 *pkey)
281{
282 *pkey = PKEY_ID;
283
284 return 0;
285}
286
287static int hns_roce_modify_device(struct ib_device *ib_dev, int mask,
288 struct ib_device_modify *props)
289{
290 unsigned long flags;
291
292 if (mask & ~IB_DEVICE_MODIFY_NODE_DESC)
293 return -EOPNOTSUPP;
294
295 if (mask & IB_DEVICE_MODIFY_NODE_DESC) {
296 spin_lock_irqsave(&to_hr_dev(ib_dev)->sm_lock, flags);
297 memcpy(ib_dev->node_desc, props->node_desc, NODE_DESC_SIZE);
298 spin_unlock_irqrestore(&to_hr_dev(ib_dev)->sm_lock, flags);
299 }
300
301 return 0;
302}
303
304static int hns_roce_modify_port(struct ib_device *ib_dev, u8 port_num, int mask,
305 struct ib_port_modify *props)
306{
307 return 0;
308}
309
310static int hns_roce_alloc_ucontext(struct ib_ucontext *uctx,
311 struct ib_udata *udata)
312{
313 int ret;
314 struct hns_roce_ucontext *context = to_hr_ucontext(uctx);
315 struct hns_roce_ib_alloc_ucontext_resp resp = {};
316 struct hns_roce_dev *hr_dev = to_hr_dev(uctx->device);
317
318 if (!hr_dev->active)
319 return -EAGAIN;
320
321 resp.qp_tab_size = hr_dev->caps.num_qps;
322
323 ret = hns_roce_uar_alloc(hr_dev, &context->uar);
324 if (ret)
325 goto error_fail_uar_alloc;
326
327 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_RECORD_DB) {
328 INIT_LIST_HEAD(&context->page_list);
329 mutex_init(&context->page_mutex);
330 }
331
332 ret = ib_copy_to_udata(udata, &resp, sizeof(resp));
333 if (ret)
334 goto error_fail_copy_to_udata;
335
336 return 0;
337
338error_fail_copy_to_udata:
339 hns_roce_uar_free(hr_dev, &context->uar);
340
341error_fail_uar_alloc:
342 return ret;
343}
344
345static void hns_roce_dealloc_ucontext(struct ib_ucontext *ibcontext)
346{
347 struct hns_roce_ucontext *context = to_hr_ucontext(ibcontext);
348
349 hns_roce_uar_free(to_hr_dev(ibcontext->device), &context->uar);
350}
351
352static int hns_roce_mmap(struct ib_ucontext *context,
353 struct vm_area_struct *vma)
354{
355 struct hns_roce_dev *hr_dev = to_hr_dev(context->device);
356
357 switch (vma->vm_pgoff) {
358 case 0:
359 return rdma_user_mmap_io(context, vma,
360 to_hr_ucontext(context)->uar.pfn,
361 PAGE_SIZE,
362 pgprot_noncached(vma->vm_page_prot));
363
364 /* vm_pgoff: 1 -- TPTR */
365 case 1:
366 if (!hr_dev->tptr_dma_addr || !hr_dev->tptr_size)
367 return -EINVAL;
368 /*
369 * FIXME: using io_remap_pfn_range on the dma address returned
370 * by dma_alloc_coherent is totally wrong.
371 */
372 return rdma_user_mmap_io(context, vma,
373 hr_dev->tptr_dma_addr >> PAGE_SHIFT,
374 hr_dev->tptr_size,
375 vma->vm_page_prot);
376
377 default:
378 return -EINVAL;
379 }
380}
381
382static int hns_roce_port_immutable(struct ib_device *ib_dev, u8 port_num,
383 struct ib_port_immutable *immutable)
384{
385 struct ib_port_attr attr;
386 int ret;
387
388 ret = ib_query_port(ib_dev, port_num, &attr);
389 if (ret)
390 return ret;
391
392 immutable->pkey_tbl_len = attr.pkey_tbl_len;
393 immutable->gid_tbl_len = attr.gid_tbl_len;
394
395 immutable->max_mad_size = IB_MGMT_MAD_SIZE;
396 immutable->core_cap_flags = RDMA_CORE_PORT_IBA_ROCE;
397 if (to_hr_dev(ib_dev)->caps.flags & HNS_ROCE_CAP_FLAG_ROCE_V1_V2)
398 immutable->core_cap_flags |= RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP;
399
400 return 0;
401}
402
403static void hns_roce_disassociate_ucontext(struct ib_ucontext *ibcontext)
404{
405}
406
407static void hns_roce_unregister_device(struct hns_roce_dev *hr_dev)
408{
409 struct hns_roce_ib_iboe *iboe = &hr_dev->iboe;
410
411 hr_dev->active = false;
412 unregister_netdevice_notifier(&iboe->nb);
413 ib_unregister_device(&hr_dev->ib_dev);
414}
415
416static const struct ib_device_ops hns_roce_dev_ops = {
417 .owner = THIS_MODULE,
418 .driver_id = RDMA_DRIVER_HNS,
419 .uverbs_abi_ver = 1,
420 .uverbs_no_driver_id_binding = 1,
421
422 .add_gid = hns_roce_add_gid,
423 .alloc_pd = hns_roce_alloc_pd,
424 .alloc_ucontext = hns_roce_alloc_ucontext,
425 .create_ah = hns_roce_create_ah,
426 .create_cq = hns_roce_ib_create_cq,
427 .create_qp = hns_roce_create_qp,
428 .dealloc_pd = hns_roce_dealloc_pd,
429 .dealloc_ucontext = hns_roce_dealloc_ucontext,
430 .del_gid = hns_roce_del_gid,
431 .dereg_mr = hns_roce_dereg_mr,
432 .destroy_ah = hns_roce_destroy_ah,
433 .destroy_cq = hns_roce_ib_destroy_cq,
434 .disassociate_ucontext = hns_roce_disassociate_ucontext,
435 .fill_res_entry = hns_roce_fill_res_entry,
436 .get_dma_mr = hns_roce_get_dma_mr,
437 .get_link_layer = hns_roce_get_link_layer,
438 .get_port_immutable = hns_roce_port_immutable,
439 .mmap = hns_roce_mmap,
440 .modify_device = hns_roce_modify_device,
441 .modify_port = hns_roce_modify_port,
442 .modify_qp = hns_roce_modify_qp,
443 .query_ah = hns_roce_query_ah,
444 .query_device = hns_roce_query_device,
445 .query_pkey = hns_roce_query_pkey,
446 .query_port = hns_roce_query_port,
447 .reg_user_mr = hns_roce_reg_user_mr,
448
449 INIT_RDMA_OBJ_SIZE(ib_ah, hns_roce_ah, ibah),
450 INIT_RDMA_OBJ_SIZE(ib_cq, hns_roce_cq, ib_cq),
451 INIT_RDMA_OBJ_SIZE(ib_pd, hns_roce_pd, ibpd),
452 INIT_RDMA_OBJ_SIZE(ib_ucontext, hns_roce_ucontext, ibucontext),
453};
454
455static const struct ib_device_ops hns_roce_dev_mr_ops = {
456 .rereg_user_mr = hns_roce_rereg_user_mr,
457};
458
459static const struct ib_device_ops hns_roce_dev_mw_ops = {
460 .alloc_mw = hns_roce_alloc_mw,
461 .dealloc_mw = hns_roce_dealloc_mw,
462};
463
464static const struct ib_device_ops hns_roce_dev_frmr_ops = {
465 .alloc_mr = hns_roce_alloc_mr,
466 .map_mr_sg = hns_roce_map_mr_sg,
467};
468
469static const struct ib_device_ops hns_roce_dev_srq_ops = {
470 .create_srq = hns_roce_create_srq,
471 .destroy_srq = hns_roce_destroy_srq,
472
473 INIT_RDMA_OBJ_SIZE(ib_srq, hns_roce_srq, ibsrq),
474};
475
476static int hns_roce_register_device(struct hns_roce_dev *hr_dev)
477{
478 int ret;
479 struct hns_roce_ib_iboe *iboe = NULL;
480 struct ib_device *ib_dev = NULL;
481 struct device *dev = hr_dev->dev;
482 unsigned int i;
483
484 iboe = &hr_dev->iboe;
485 spin_lock_init(&iboe->lock);
486
487 ib_dev = &hr_dev->ib_dev;
488
489 ib_dev->node_type = RDMA_NODE_IB_CA;
490 ib_dev->dev.parent = dev;
491
492 ib_dev->phys_port_cnt = hr_dev->caps.num_ports;
493 ib_dev->local_dma_lkey = hr_dev->caps.reserved_lkey;
494 ib_dev->num_comp_vectors = hr_dev->caps.num_comp_vectors;
495 ib_dev->uverbs_cmd_mask =
496 (1ULL << IB_USER_VERBS_CMD_GET_CONTEXT) |
497 (1ULL << IB_USER_VERBS_CMD_QUERY_DEVICE) |
498 (1ULL << IB_USER_VERBS_CMD_QUERY_PORT) |
499 (1ULL << IB_USER_VERBS_CMD_ALLOC_PD) |
500 (1ULL << IB_USER_VERBS_CMD_DEALLOC_PD) |
501 (1ULL << IB_USER_VERBS_CMD_REG_MR) |
502 (1ULL << IB_USER_VERBS_CMD_DEREG_MR) |
503 (1ULL << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
504 (1ULL << IB_USER_VERBS_CMD_CREATE_CQ) |
505 (1ULL << IB_USER_VERBS_CMD_DESTROY_CQ) |
506 (1ULL << IB_USER_VERBS_CMD_CREATE_QP) |
507 (1ULL << IB_USER_VERBS_CMD_MODIFY_QP) |
508 (1ULL << IB_USER_VERBS_CMD_QUERY_QP) |
509 (1ULL << IB_USER_VERBS_CMD_DESTROY_QP);
510
511 ib_dev->uverbs_ex_cmd_mask |=
512 (1ULL << IB_USER_VERBS_EX_CMD_MODIFY_CQ);
513
514 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_REREG_MR) {
515 ib_dev->uverbs_cmd_mask |= (1ULL << IB_USER_VERBS_CMD_REREG_MR);
516 ib_set_device_ops(ib_dev, &hns_roce_dev_mr_ops);
517 }
518
519 /* MW */
520 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_MW) {
521 ib_dev->uverbs_cmd_mask |=
522 (1ULL << IB_USER_VERBS_CMD_ALLOC_MW) |
523 (1ULL << IB_USER_VERBS_CMD_DEALLOC_MW);
524 ib_set_device_ops(ib_dev, &hns_roce_dev_mw_ops);
525 }
526
527 /* FRMR */
528 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_FRMR)
529 ib_set_device_ops(ib_dev, &hns_roce_dev_frmr_ops);
530
531 /* SRQ */
532 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ) {
533 ib_dev->uverbs_cmd_mask |=
534 (1ULL << IB_USER_VERBS_CMD_CREATE_SRQ) |
535 (1ULL << IB_USER_VERBS_CMD_MODIFY_SRQ) |
536 (1ULL << IB_USER_VERBS_CMD_QUERY_SRQ) |
537 (1ULL << IB_USER_VERBS_CMD_DESTROY_SRQ) |
538 (1ULL << IB_USER_VERBS_CMD_POST_SRQ_RECV);
539 ib_set_device_ops(ib_dev, &hns_roce_dev_srq_ops);
540 ib_set_device_ops(ib_dev, hr_dev->hw->hns_roce_dev_srq_ops);
541 }
542
543 ib_set_device_ops(ib_dev, hr_dev->hw->hns_roce_dev_ops);
544 ib_set_device_ops(ib_dev, &hns_roce_dev_ops);
545 for (i = 0; i < hr_dev->caps.num_ports; i++) {
546 if (!hr_dev->iboe.netdevs[i])
547 continue;
548
549 ret = ib_device_set_netdev(ib_dev, hr_dev->iboe.netdevs[i],
550 i + 1);
551 if (ret)
552 return ret;
553 }
554 ret = ib_register_device(ib_dev, "hns_%d");
555 if (ret) {
556 dev_err(dev, "ib_register_device failed!\n");
557 return ret;
558 }
559
560 ret = hns_roce_setup_mtu_mac(hr_dev);
561 if (ret) {
562 dev_err(dev, "setup_mtu_mac failed!\n");
563 goto error_failed_setup_mtu_mac;
564 }
565
566 iboe->nb.notifier_call = hns_roce_netdev_event;
567 ret = register_netdevice_notifier(&iboe->nb);
568 if (ret) {
569 dev_err(dev, "register_netdevice_notifier failed!\n");
570 goto error_failed_setup_mtu_mac;
571 }
572
573 hr_dev->active = true;
574 return 0;
575
576error_failed_setup_mtu_mac:
577 ib_unregister_device(ib_dev);
578
579 return ret;
580}
581
582static int hns_roce_init_hem(struct hns_roce_dev *hr_dev)
583{
584 int ret;
585 struct device *dev = hr_dev->dev;
586
587 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->mr_table.mtt_table,
588 HEM_TYPE_MTT, hr_dev->caps.mtt_entry_sz,
589 hr_dev->caps.num_mtt_segs, 1);
590 if (ret) {
591 dev_err(dev, "Failed to init MTT context memory, aborting.\n");
592 return ret;
593 }
594
595 if (hns_roce_check_whether_mhop(hr_dev, HEM_TYPE_CQE)) {
596 ret = hns_roce_init_hem_table(hr_dev,
597 &hr_dev->mr_table.mtt_cqe_table,
598 HEM_TYPE_CQE, hr_dev->caps.mtt_entry_sz,
599 hr_dev->caps.num_cqe_segs, 1);
600 if (ret) {
601 dev_err(dev, "Failed to init MTT CQE context memory, aborting.\n");
602 goto err_unmap_cqe;
603 }
604 }
605
606 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->mr_table.mtpt_table,
607 HEM_TYPE_MTPT, hr_dev->caps.mtpt_entry_sz,
608 hr_dev->caps.num_mtpts, 1);
609 if (ret) {
610 dev_err(dev, "Failed to init MTPT context memory, aborting.\n");
611 goto err_unmap_mtt;
612 }
613
614 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->qp_table.qp_table,
615 HEM_TYPE_QPC, hr_dev->caps.qpc_entry_sz,
616 hr_dev->caps.num_qps, 1);
617 if (ret) {
618 dev_err(dev, "Failed to init QP context memory, aborting.\n");
619 goto err_unmap_dmpt;
620 }
621
622 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->qp_table.irrl_table,
623 HEM_TYPE_IRRL,
624 hr_dev->caps.irrl_entry_sz *
625 hr_dev->caps.max_qp_init_rdma,
626 hr_dev->caps.num_qps, 1);
627 if (ret) {
628 dev_err(dev, "Failed to init irrl_table memory, aborting.\n");
629 goto err_unmap_qp;
630 }
631
632 if (hr_dev->caps.trrl_entry_sz) {
633 ret = hns_roce_init_hem_table(hr_dev,
634 &hr_dev->qp_table.trrl_table,
635 HEM_TYPE_TRRL,
636 hr_dev->caps.trrl_entry_sz *
637 hr_dev->caps.max_qp_dest_rdma,
638 hr_dev->caps.num_qps, 1);
639 if (ret) {
640 dev_err(dev,
641 "Failed to init trrl_table memory, aborting.\n");
642 goto err_unmap_irrl;
643 }
644 }
645
646 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->cq_table.table,
647 HEM_TYPE_CQC, hr_dev->caps.cqc_entry_sz,
648 hr_dev->caps.num_cqs, 1);
649 if (ret) {
650 dev_err(dev, "Failed to init CQ context memory, aborting.\n");
651 goto err_unmap_trrl;
652 }
653
654 if (hr_dev->caps.srqc_entry_sz) {
655 ret = hns_roce_init_hem_table(hr_dev, &hr_dev->srq_table.table,
656 HEM_TYPE_SRQC,
657 hr_dev->caps.srqc_entry_sz,
658 hr_dev->caps.num_srqs, 1);
659 if (ret) {
660 dev_err(dev,
661 "Failed to init SRQ context memory, aborting.\n");
662 goto err_unmap_cq;
663 }
664 }
665
666 if (hr_dev->caps.num_srqwqe_segs) {
667 ret = hns_roce_init_hem_table(hr_dev,
668 &hr_dev->mr_table.mtt_srqwqe_table,
669 HEM_TYPE_SRQWQE,
670 hr_dev->caps.mtt_entry_sz,
671 hr_dev->caps.num_srqwqe_segs, 1);
672 if (ret) {
673 dev_err(dev,
674 "Failed to init MTT srqwqe memory, aborting.\n");
675 goto err_unmap_srq;
676 }
677 }
678
679 if (hr_dev->caps.num_idx_segs) {
680 ret = hns_roce_init_hem_table(hr_dev,
681 &hr_dev->mr_table.mtt_idx_table,
682 HEM_TYPE_IDX,
683 hr_dev->caps.idx_entry_sz,
684 hr_dev->caps.num_idx_segs, 1);
685 if (ret) {
686 dev_err(dev,
687 "Failed to init MTT idx memory, aborting.\n");
688 goto err_unmap_srqwqe;
689 }
690 }
691
692 if (hr_dev->caps.sccc_entry_sz) {
693 ret = hns_roce_init_hem_table(hr_dev,
694 &hr_dev->qp_table.sccc_table,
695 HEM_TYPE_SCCC,
696 hr_dev->caps.sccc_entry_sz,
697 hr_dev->caps.num_qps, 1);
698 if (ret) {
699 dev_err(dev,
700 "Failed to init SCC context memory, aborting.\n");
701 goto err_unmap_idx;
702 }
703 }
704
705 if (hr_dev->caps.qpc_timer_entry_sz) {
706 ret = hns_roce_init_hem_table(hr_dev,
707 &hr_dev->qpc_timer_table,
708 HEM_TYPE_QPC_TIMER,
709 hr_dev->caps.qpc_timer_entry_sz,
710 hr_dev->caps.num_qpc_timer, 1);
711 if (ret) {
712 dev_err(dev,
713 "Failed to init QPC timer memory, aborting.\n");
714 goto err_unmap_ctx;
715 }
716 }
717
718 if (hr_dev->caps.cqc_timer_entry_sz) {
719 ret = hns_roce_init_hem_table(hr_dev,
720 &hr_dev->cqc_timer_table,
721 HEM_TYPE_CQC_TIMER,
722 hr_dev->caps.cqc_timer_entry_sz,
723 hr_dev->caps.num_cqc_timer, 1);
724 if (ret) {
725 dev_err(dev,
726 "Failed to init CQC timer memory, aborting.\n");
727 goto err_unmap_qpc_timer;
728 }
729 }
730
731 return 0;
732
733err_unmap_qpc_timer:
734 if (hr_dev->caps.qpc_timer_entry_sz)
735 hns_roce_cleanup_hem_table(hr_dev,
736 &hr_dev->qpc_timer_table);
737
738err_unmap_ctx:
739 if (hr_dev->caps.sccc_entry_sz)
740 hns_roce_cleanup_hem_table(hr_dev,
741 &hr_dev->qp_table.sccc_table);
742
743err_unmap_idx:
744 if (hr_dev->caps.num_idx_segs)
745 hns_roce_cleanup_hem_table(hr_dev,
746 &hr_dev->mr_table.mtt_idx_table);
747
748err_unmap_srqwqe:
749 if (hr_dev->caps.num_srqwqe_segs)
750 hns_roce_cleanup_hem_table(hr_dev,
751 &hr_dev->mr_table.mtt_srqwqe_table);
752
753err_unmap_srq:
754 if (hr_dev->caps.srqc_entry_sz)
755 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->srq_table.table);
756
757err_unmap_cq:
758 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->cq_table.table);
759
760err_unmap_trrl:
761 if (hr_dev->caps.trrl_entry_sz)
762 hns_roce_cleanup_hem_table(hr_dev,
763 &hr_dev->qp_table.trrl_table);
764
765err_unmap_irrl:
766 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->qp_table.irrl_table);
767
768err_unmap_qp:
769 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->qp_table.qp_table);
770
771err_unmap_dmpt:
772 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->mr_table.mtpt_table);
773
774err_unmap_mtt:
775 if (hns_roce_check_whether_mhop(hr_dev, HEM_TYPE_CQE))
776 hns_roce_cleanup_hem_table(hr_dev,
777 &hr_dev->mr_table.mtt_cqe_table);
778
779err_unmap_cqe:
780 hns_roce_cleanup_hem_table(hr_dev, &hr_dev->mr_table.mtt_table);
781
782 return ret;
783}
784
785/**
786 * hns_roce_setup_hca - setup host channel adapter
787 * @hr_dev: pointer to hns roce device
788 * Return : int
789 */
790static int hns_roce_setup_hca(struct hns_roce_dev *hr_dev)
791{
792 int ret;
793 struct device *dev = hr_dev->dev;
794
795 spin_lock_init(&hr_dev->sm_lock);
796 spin_lock_init(&hr_dev->bt_cmd_lock);
797
798 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_RECORD_DB) {
799 INIT_LIST_HEAD(&hr_dev->pgdir_list);
800 mutex_init(&hr_dev->pgdir_mutex);
801 }
802
803 ret = hns_roce_init_uar_table(hr_dev);
804 if (ret) {
805 dev_err(dev, "Failed to initialize uar table. aborting\n");
806 return ret;
807 }
808
809 ret = hns_roce_uar_alloc(hr_dev, &hr_dev->priv_uar);
810 if (ret) {
811 dev_err(dev, "Failed to allocate priv_uar.\n");
812 goto err_uar_table_free;
813 }
814
815 ret = hns_roce_init_pd_table(hr_dev);
816 if (ret) {
817 dev_err(dev, "Failed to init protected domain table.\n");
818 goto err_uar_alloc_free;
819 }
820
821 ret = hns_roce_init_mr_table(hr_dev);
822 if (ret) {
823 dev_err(dev, "Failed to init memory region table.\n");
824 goto err_pd_table_free;
825 }
826
827 ret = hns_roce_init_cq_table(hr_dev);
828 if (ret) {
829 dev_err(dev, "Failed to init completion queue table.\n");
830 goto err_mr_table_free;
831 }
832
833 ret = hns_roce_init_qp_table(hr_dev);
834 if (ret) {
835 dev_err(dev, "Failed to init queue pair table.\n");
836 goto err_cq_table_free;
837 }
838
839 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ) {
840 ret = hns_roce_init_srq_table(hr_dev);
841 if (ret) {
842 dev_err(dev,
843 "Failed to init share receive queue table.\n");
844 goto err_qp_table_free;
845 }
846 }
847
848 return 0;
849
850err_qp_table_free:
851 if (hr_dev->caps.flags & HNS_ROCE_CAP_FLAG_SRQ)
852 hns_roce_cleanup_qp_table(hr_dev);
853
854err_cq_table_free:
855 hns_roce_cleanup_cq_table(hr_dev);
856
857err_mr_table_free:
858 hns_roce_cleanup_mr_table(hr_dev);
859
860err_pd_table_free:
861 hns_roce_cleanup_pd_table(hr_dev);
862
863err_uar_alloc_free:
864 hns_roce_uar_free(hr_dev, &hr_dev->priv_uar);
865
866err_uar_table_free:
867 hns_roce_cleanup_uar_table(hr_dev);
868 return ret;
869}
870
871int hns_roce_init(struct hns_roce_dev *hr_dev)
872{
873 int ret;
874 struct device *dev = hr_dev->dev;
875
876 if (hr_dev->hw->reset) {
877 ret = hr_dev->hw->reset(hr_dev, true);
878 if (ret) {
879 dev_err(dev, "Reset RoCE engine failed!\n");
880 return ret;
881 }
882 }
883 hr_dev->is_reset = false;
884
885 if (hr_dev->hw->cmq_init) {
886 ret = hr_dev->hw->cmq_init(hr_dev);
887 if (ret) {
888 dev_err(dev, "Init RoCE Command Queue failed!\n");
889 goto error_failed_cmq_init;
890 }
891 }
892
893 ret = hr_dev->hw->hw_profile(hr_dev);
894 if (ret) {
895 dev_err(dev, "Get RoCE engine profile failed!\n");
896 goto error_failed_cmd_init;
897 }
898
899 ret = hns_roce_cmd_init(hr_dev);
900 if (ret) {
901 dev_err(dev, "cmd init failed!\n");
902 goto error_failed_cmd_init;
903 }
904
905 /* EQ depends on poll mode, event mode depends on EQ */
906 ret = hr_dev->hw->init_eq(hr_dev);
907 if (ret) {
908 dev_err(dev, "eq init failed!\n");
909 goto error_failed_eq_table;
910 }
911
912 if (hr_dev->cmd_mod) {
913 ret = hns_roce_cmd_use_events(hr_dev);
914 if (ret) {
915 dev_warn(dev,
916 "Cmd event mode failed, set back to poll!\n");
917 hns_roce_cmd_use_polling(hr_dev);
918 }
919 }
920
921 ret = hns_roce_init_hem(hr_dev);
922 if (ret) {
923 dev_err(dev, "init HEM(Hardware Entry Memory) failed!\n");
924 goto error_failed_init_hem;
925 }
926
927 ret = hns_roce_setup_hca(hr_dev);
928 if (ret) {
929 dev_err(dev, "setup hca failed!\n");
930 goto error_failed_setup_hca;
931 }
932
933 if (hr_dev->hw->hw_init) {
934 ret = hr_dev->hw->hw_init(hr_dev);
935 if (ret) {
936 dev_err(dev, "hw_init failed!\n");
937 goto error_failed_engine_init;
938 }
939 }
940
941 ret = hns_roce_register_device(hr_dev);
942 if (ret)
943 goto error_failed_register_device;
944
945 return 0;
946
947error_failed_register_device:
948 if (hr_dev->hw->hw_exit)
949 hr_dev->hw->hw_exit(hr_dev);
950
951error_failed_engine_init:
952 hns_roce_cleanup_bitmap(hr_dev);
953
954error_failed_setup_hca:
955 hns_roce_cleanup_hem(hr_dev);
956
957error_failed_init_hem:
958 if (hr_dev->cmd_mod)
959 hns_roce_cmd_use_polling(hr_dev);
960 hr_dev->hw->cleanup_eq(hr_dev);
961
962error_failed_eq_table:
963 hns_roce_cmd_cleanup(hr_dev);
964
965error_failed_cmd_init:
966 if (hr_dev->hw->cmq_exit)
967 hr_dev->hw->cmq_exit(hr_dev);
968
969error_failed_cmq_init:
970 if (hr_dev->hw->reset) {
971 if (hr_dev->hw->reset(hr_dev, false))
972 dev_err(dev, "Dereset RoCE engine failed!\n");
973 }
974
975 return ret;
976}
977
978void hns_roce_exit(struct hns_roce_dev *hr_dev)
979{
980 hns_roce_unregister_device(hr_dev);
981
982 if (hr_dev->hw->hw_exit)
983 hr_dev->hw->hw_exit(hr_dev);
984 hns_roce_cleanup_bitmap(hr_dev);
985 hns_roce_cleanup_hem(hr_dev);
986
987 if (hr_dev->cmd_mod)
988 hns_roce_cmd_use_polling(hr_dev);
989
990 hr_dev->hw->cleanup_eq(hr_dev);
991 hns_roce_cmd_cleanup(hr_dev);
992 if (hr_dev->hw->cmq_exit)
993 hr_dev->hw->cmq_exit(hr_dev);
994 if (hr_dev->hw->reset)
995 hr_dev->hw->reset(hr_dev, false);
996}
997
998MODULE_LICENSE("Dual BSD/GPL");
999MODULE_AUTHOR("Wei Hu <xavier.huwei@huawei.com>");
1000MODULE_AUTHOR("Nenglong Zhao <zhaonenglong@hisilicon.com>");
1001MODULE_AUTHOR("Lijun Ou <oulijun@huawei.com>");
1002MODULE_DESCRIPTION("HNS RoCE Driver");