Loading...
1// SPDX-License-Identifier: GPL-2.0 OR BSD-2-Clause
2/*
3 * Copyright 2018-2021 Amazon.com, Inc. or its affiliates. All rights reserved.
4 */
5
6#include "efa_com.h"
7#include "efa_regs_defs.h"
8
9#define ADMIN_CMD_TIMEOUT_US 30000000 /* usecs */
10
11#define EFA_REG_READ_TIMEOUT_US 50000 /* usecs */
12#define EFA_MMIO_READ_INVALID 0xffffffff
13
14#define EFA_POLL_INTERVAL_MS 100 /* msecs */
15
16#define EFA_ASYNC_QUEUE_DEPTH 16
17#define EFA_ADMIN_QUEUE_DEPTH 32
18
19#define EFA_CTRL_MAJOR 0
20#define EFA_CTRL_MINOR 0
21#define EFA_CTRL_SUB_MINOR 1
22
23enum efa_cmd_status {
24 EFA_CMD_SUBMITTED,
25 EFA_CMD_COMPLETED,
26};
27
28struct efa_comp_ctx {
29 struct completion wait_event;
30 struct efa_admin_acq_entry *user_cqe;
31 u32 comp_size;
32 enum efa_cmd_status status;
33 u8 cmd_opcode;
34 u8 occupied;
35};
36
37static const char *efa_com_cmd_str(u8 cmd)
38{
39#define EFA_CMD_STR_CASE(_cmd) case EFA_ADMIN_##_cmd: return #_cmd
40
41 switch (cmd) {
42 EFA_CMD_STR_CASE(CREATE_QP);
43 EFA_CMD_STR_CASE(MODIFY_QP);
44 EFA_CMD_STR_CASE(QUERY_QP);
45 EFA_CMD_STR_CASE(DESTROY_QP);
46 EFA_CMD_STR_CASE(CREATE_AH);
47 EFA_CMD_STR_CASE(DESTROY_AH);
48 EFA_CMD_STR_CASE(REG_MR);
49 EFA_CMD_STR_CASE(DEREG_MR);
50 EFA_CMD_STR_CASE(CREATE_CQ);
51 EFA_CMD_STR_CASE(DESTROY_CQ);
52 EFA_CMD_STR_CASE(GET_FEATURE);
53 EFA_CMD_STR_CASE(SET_FEATURE);
54 EFA_CMD_STR_CASE(GET_STATS);
55 EFA_CMD_STR_CASE(ALLOC_PD);
56 EFA_CMD_STR_CASE(DEALLOC_PD);
57 EFA_CMD_STR_CASE(ALLOC_UAR);
58 EFA_CMD_STR_CASE(DEALLOC_UAR);
59 EFA_CMD_STR_CASE(CREATE_EQ);
60 EFA_CMD_STR_CASE(DESTROY_EQ);
61 default: return "unknown command opcode";
62 }
63#undef EFA_CMD_STR_CASE
64}
65
66void efa_com_set_dma_addr(dma_addr_t addr, u32 *addr_high, u32 *addr_low)
67{
68 *addr_low = lower_32_bits(addr);
69 *addr_high = upper_32_bits(addr);
70}
71
72static u32 efa_com_reg_read32(struct efa_com_dev *edev, u16 offset)
73{
74 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
75 struct efa_admin_mmio_req_read_less_resp *read_resp;
76 unsigned long exp_time;
77 u32 mmio_read_reg = 0;
78 u32 err;
79
80 read_resp = mmio_read->read_resp;
81
82 spin_lock(&mmio_read->lock);
83 mmio_read->seq_num++;
84
85 /* trash DMA req_id to identify when hardware is done */
86 read_resp->req_id = mmio_read->seq_num + 0x9aL;
87 EFA_SET(&mmio_read_reg, EFA_REGS_MMIO_REG_READ_REG_OFF, offset);
88 EFA_SET(&mmio_read_reg, EFA_REGS_MMIO_REG_READ_REQ_ID,
89 mmio_read->seq_num);
90
91 writel(mmio_read_reg, edev->reg_bar + EFA_REGS_MMIO_REG_READ_OFF);
92
93 exp_time = jiffies + usecs_to_jiffies(mmio_read->mmio_read_timeout);
94 do {
95 if (READ_ONCE(read_resp->req_id) == mmio_read->seq_num)
96 break;
97 udelay(1);
98 } while (time_is_after_jiffies(exp_time));
99
100 if (read_resp->req_id != mmio_read->seq_num) {
101 ibdev_err_ratelimited(
102 edev->efa_dev,
103 "Reading register timed out. expected: req id[%u] offset[%#x] actual: req id[%u] offset[%#x]\n",
104 mmio_read->seq_num, offset, read_resp->req_id,
105 read_resp->reg_off);
106 err = EFA_MMIO_READ_INVALID;
107 goto out;
108 }
109
110 if (read_resp->reg_off != offset) {
111 ibdev_err_ratelimited(
112 edev->efa_dev,
113 "Reading register failed: wrong offset provided\n");
114 err = EFA_MMIO_READ_INVALID;
115 goto out;
116 }
117
118 err = read_resp->reg_val;
119out:
120 spin_unlock(&mmio_read->lock);
121 return err;
122}
123
124static int efa_com_admin_init_sq(struct efa_com_dev *edev)
125{
126 struct efa_com_admin_queue *aq = &edev->aq;
127 struct efa_com_admin_sq *sq = &aq->sq;
128 u16 size = aq->depth * sizeof(*sq->entries);
129 u32 aq_caps = 0;
130 u32 addr_high;
131 u32 addr_low;
132
133 sq->entries =
134 dma_alloc_coherent(aq->dmadev, size, &sq->dma_addr, GFP_KERNEL);
135 if (!sq->entries)
136 return -ENOMEM;
137
138 spin_lock_init(&sq->lock);
139
140 sq->cc = 0;
141 sq->pc = 0;
142 sq->phase = 1;
143
144 sq->db_addr = (u32 __iomem *)(edev->reg_bar + EFA_REGS_AQ_PROD_DB_OFF);
145
146 addr_high = upper_32_bits(sq->dma_addr);
147 addr_low = lower_32_bits(sq->dma_addr);
148
149 writel(addr_low, edev->reg_bar + EFA_REGS_AQ_BASE_LO_OFF);
150 writel(addr_high, edev->reg_bar + EFA_REGS_AQ_BASE_HI_OFF);
151
152 EFA_SET(&aq_caps, EFA_REGS_AQ_CAPS_AQ_DEPTH, aq->depth);
153 EFA_SET(&aq_caps, EFA_REGS_AQ_CAPS_AQ_ENTRY_SIZE,
154 sizeof(struct efa_admin_aq_entry));
155
156 writel(aq_caps, edev->reg_bar + EFA_REGS_AQ_CAPS_OFF);
157
158 return 0;
159}
160
161static int efa_com_admin_init_cq(struct efa_com_dev *edev)
162{
163 struct efa_com_admin_queue *aq = &edev->aq;
164 struct efa_com_admin_cq *cq = &aq->cq;
165 u16 size = aq->depth * sizeof(*cq->entries);
166 u32 acq_caps = 0;
167 u32 addr_high;
168 u32 addr_low;
169
170 cq->entries =
171 dma_alloc_coherent(aq->dmadev, size, &cq->dma_addr, GFP_KERNEL);
172 if (!cq->entries)
173 return -ENOMEM;
174
175 spin_lock_init(&cq->lock);
176
177 cq->cc = 0;
178 cq->phase = 1;
179
180 addr_high = upper_32_bits(cq->dma_addr);
181 addr_low = lower_32_bits(cq->dma_addr);
182
183 writel(addr_low, edev->reg_bar + EFA_REGS_ACQ_BASE_LO_OFF);
184 writel(addr_high, edev->reg_bar + EFA_REGS_ACQ_BASE_HI_OFF);
185
186 EFA_SET(&acq_caps, EFA_REGS_ACQ_CAPS_ACQ_DEPTH, aq->depth);
187 EFA_SET(&acq_caps, EFA_REGS_ACQ_CAPS_ACQ_ENTRY_SIZE,
188 sizeof(struct efa_admin_acq_entry));
189 EFA_SET(&acq_caps, EFA_REGS_ACQ_CAPS_ACQ_MSIX_VECTOR,
190 aq->msix_vector_idx);
191
192 writel(acq_caps, edev->reg_bar + EFA_REGS_ACQ_CAPS_OFF);
193
194 return 0;
195}
196
197static int efa_com_admin_init_aenq(struct efa_com_dev *edev,
198 struct efa_aenq_handlers *aenq_handlers)
199{
200 struct efa_com_aenq *aenq = &edev->aenq;
201 u32 addr_low, addr_high;
202 u32 aenq_caps = 0;
203 u16 size;
204
205 if (!aenq_handlers) {
206 ibdev_err(edev->efa_dev, "aenq handlers pointer is NULL\n");
207 return -EINVAL;
208 }
209
210 size = EFA_ASYNC_QUEUE_DEPTH * sizeof(*aenq->entries);
211 aenq->entries = dma_alloc_coherent(edev->dmadev, size, &aenq->dma_addr,
212 GFP_KERNEL);
213 if (!aenq->entries)
214 return -ENOMEM;
215
216 aenq->aenq_handlers = aenq_handlers;
217 aenq->depth = EFA_ASYNC_QUEUE_DEPTH;
218 aenq->cc = 0;
219 aenq->phase = 1;
220
221 addr_low = lower_32_bits(aenq->dma_addr);
222 addr_high = upper_32_bits(aenq->dma_addr);
223
224 writel(addr_low, edev->reg_bar + EFA_REGS_AENQ_BASE_LO_OFF);
225 writel(addr_high, edev->reg_bar + EFA_REGS_AENQ_BASE_HI_OFF);
226
227 EFA_SET(&aenq_caps, EFA_REGS_AENQ_CAPS_AENQ_DEPTH, aenq->depth);
228 EFA_SET(&aenq_caps, EFA_REGS_AENQ_CAPS_AENQ_ENTRY_SIZE,
229 sizeof(struct efa_admin_aenq_entry));
230 EFA_SET(&aenq_caps, EFA_REGS_AENQ_CAPS_AENQ_MSIX_VECTOR,
231 aenq->msix_vector_idx);
232 writel(aenq_caps, edev->reg_bar + EFA_REGS_AENQ_CAPS_OFF);
233
234 /*
235 * Init cons_db to mark that all entries in the queue
236 * are initially available
237 */
238 writel(edev->aenq.cc, edev->reg_bar + EFA_REGS_AENQ_CONS_DB_OFF);
239
240 return 0;
241}
242
243/* ID to be used with efa_com_get_comp_ctx */
244static u16 efa_com_alloc_ctx_id(struct efa_com_admin_queue *aq)
245{
246 u16 ctx_id;
247
248 spin_lock(&aq->comp_ctx_lock);
249 ctx_id = aq->comp_ctx_pool[aq->comp_ctx_pool_next];
250 aq->comp_ctx_pool_next++;
251 spin_unlock(&aq->comp_ctx_lock);
252
253 return ctx_id;
254}
255
256static void efa_com_dealloc_ctx_id(struct efa_com_admin_queue *aq,
257 u16 ctx_id)
258{
259 spin_lock(&aq->comp_ctx_lock);
260 aq->comp_ctx_pool_next--;
261 aq->comp_ctx_pool[aq->comp_ctx_pool_next] = ctx_id;
262 spin_unlock(&aq->comp_ctx_lock);
263}
264
265static inline void efa_com_put_comp_ctx(struct efa_com_admin_queue *aq,
266 struct efa_comp_ctx *comp_ctx)
267{
268 u16 cmd_id = EFA_GET(&comp_ctx->user_cqe->acq_common_descriptor.command,
269 EFA_ADMIN_ACQ_COMMON_DESC_COMMAND_ID);
270 u16 ctx_id = cmd_id & (aq->depth - 1);
271
272 ibdev_dbg(aq->efa_dev, "Put completion command_id %#x\n", cmd_id);
273 comp_ctx->occupied = 0;
274 efa_com_dealloc_ctx_id(aq, ctx_id);
275}
276
277static struct efa_comp_ctx *efa_com_get_comp_ctx(struct efa_com_admin_queue *aq,
278 u16 cmd_id, bool capture)
279{
280 u16 ctx_id = cmd_id & (aq->depth - 1);
281
282 if (aq->comp_ctx[ctx_id].occupied && capture) {
283 ibdev_err_ratelimited(
284 aq->efa_dev,
285 "Completion context for command_id %#x is occupied\n",
286 cmd_id);
287 return NULL;
288 }
289
290 if (capture) {
291 aq->comp_ctx[ctx_id].occupied = 1;
292 ibdev_dbg(aq->efa_dev,
293 "Take completion ctxt for command_id %#x\n", cmd_id);
294 }
295
296 return &aq->comp_ctx[ctx_id];
297}
298
299static struct efa_comp_ctx *__efa_com_submit_admin_cmd(struct efa_com_admin_queue *aq,
300 struct efa_admin_aq_entry *cmd,
301 size_t cmd_size_in_bytes,
302 struct efa_admin_acq_entry *comp,
303 size_t comp_size_in_bytes)
304{
305 struct efa_admin_aq_entry *aqe;
306 struct efa_comp_ctx *comp_ctx;
307 u16 queue_size_mask;
308 u16 cmd_id;
309 u16 ctx_id;
310 u16 pi;
311
312 queue_size_mask = aq->depth - 1;
313 pi = aq->sq.pc & queue_size_mask;
314
315 ctx_id = efa_com_alloc_ctx_id(aq);
316
317 /* cmd_id LSBs are the ctx_id and MSBs are entropy bits from pc */
318 cmd_id = ctx_id & queue_size_mask;
319 cmd_id |= aq->sq.pc & ~queue_size_mask;
320 cmd_id &= EFA_ADMIN_AQ_COMMON_DESC_COMMAND_ID_MASK;
321
322 cmd->aq_common_descriptor.command_id = cmd_id;
323 EFA_SET(&cmd->aq_common_descriptor.flags,
324 EFA_ADMIN_AQ_COMMON_DESC_PHASE, aq->sq.phase);
325
326 comp_ctx = efa_com_get_comp_ctx(aq, cmd_id, true);
327 if (!comp_ctx) {
328 efa_com_dealloc_ctx_id(aq, ctx_id);
329 return ERR_PTR(-EINVAL);
330 }
331
332 comp_ctx->status = EFA_CMD_SUBMITTED;
333 comp_ctx->comp_size = comp_size_in_bytes;
334 comp_ctx->user_cqe = comp;
335 comp_ctx->cmd_opcode = cmd->aq_common_descriptor.opcode;
336
337 reinit_completion(&comp_ctx->wait_event);
338
339 aqe = &aq->sq.entries[pi];
340 memset(aqe, 0, sizeof(*aqe));
341 memcpy(aqe, cmd, cmd_size_in_bytes);
342
343 aq->sq.pc++;
344 atomic64_inc(&aq->stats.submitted_cmd);
345
346 if ((aq->sq.pc & queue_size_mask) == 0)
347 aq->sq.phase = !aq->sq.phase;
348
349 /* barrier not needed in case of writel */
350 writel(aq->sq.pc, aq->sq.db_addr);
351
352 return comp_ctx;
353}
354
355static inline int efa_com_init_comp_ctxt(struct efa_com_admin_queue *aq)
356{
357 size_t pool_size = aq->depth * sizeof(*aq->comp_ctx_pool);
358 size_t size = aq->depth * sizeof(struct efa_comp_ctx);
359 struct efa_comp_ctx *comp_ctx;
360 u16 i;
361
362 aq->comp_ctx = devm_kzalloc(aq->dmadev, size, GFP_KERNEL);
363 aq->comp_ctx_pool = devm_kzalloc(aq->dmadev, pool_size, GFP_KERNEL);
364 if (!aq->comp_ctx || !aq->comp_ctx_pool) {
365 devm_kfree(aq->dmadev, aq->comp_ctx_pool);
366 devm_kfree(aq->dmadev, aq->comp_ctx);
367 return -ENOMEM;
368 }
369
370 for (i = 0; i < aq->depth; i++) {
371 comp_ctx = efa_com_get_comp_ctx(aq, i, false);
372 if (comp_ctx)
373 init_completion(&comp_ctx->wait_event);
374
375 aq->comp_ctx_pool[i] = i;
376 }
377
378 spin_lock_init(&aq->comp_ctx_lock);
379
380 aq->comp_ctx_pool_next = 0;
381
382 return 0;
383}
384
385static struct efa_comp_ctx *efa_com_submit_admin_cmd(struct efa_com_admin_queue *aq,
386 struct efa_admin_aq_entry *cmd,
387 size_t cmd_size_in_bytes,
388 struct efa_admin_acq_entry *comp,
389 size_t comp_size_in_bytes)
390{
391 struct efa_comp_ctx *comp_ctx;
392
393 spin_lock(&aq->sq.lock);
394 if (!test_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state)) {
395 ibdev_err_ratelimited(aq->efa_dev, "Admin queue is closed\n");
396 spin_unlock(&aq->sq.lock);
397 return ERR_PTR(-ENODEV);
398 }
399
400 comp_ctx = __efa_com_submit_admin_cmd(aq, cmd, cmd_size_in_bytes, comp,
401 comp_size_in_bytes);
402 spin_unlock(&aq->sq.lock);
403 if (IS_ERR(comp_ctx))
404 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
405
406 return comp_ctx;
407}
408
409static void efa_com_handle_single_admin_completion(struct efa_com_admin_queue *aq,
410 struct efa_admin_acq_entry *cqe)
411{
412 struct efa_comp_ctx *comp_ctx;
413 u16 cmd_id;
414
415 cmd_id = EFA_GET(&cqe->acq_common_descriptor.command,
416 EFA_ADMIN_ACQ_COMMON_DESC_COMMAND_ID);
417
418 comp_ctx = efa_com_get_comp_ctx(aq, cmd_id, false);
419 if (!comp_ctx) {
420 ibdev_err(aq->efa_dev,
421 "comp_ctx is NULL. Changing the admin queue running state\n");
422 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
423 return;
424 }
425
426 comp_ctx->status = EFA_CMD_COMPLETED;
427 memcpy(comp_ctx->user_cqe, cqe, comp_ctx->comp_size);
428
429 if (!test_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state))
430 complete(&comp_ctx->wait_event);
431}
432
433static void efa_com_handle_admin_completion(struct efa_com_admin_queue *aq)
434{
435 struct efa_admin_acq_entry *cqe;
436 u16 queue_size_mask;
437 u16 comp_num = 0;
438 u8 phase;
439 u16 ci;
440
441 queue_size_mask = aq->depth - 1;
442
443 ci = aq->cq.cc & queue_size_mask;
444 phase = aq->cq.phase;
445
446 cqe = &aq->cq.entries[ci];
447
448 /* Go over all the completions */
449 while ((READ_ONCE(cqe->acq_common_descriptor.flags) &
450 EFA_ADMIN_ACQ_COMMON_DESC_PHASE_MASK) == phase) {
451 /*
452 * Do not read the rest of the completion entry before the
453 * phase bit was validated
454 */
455 dma_rmb();
456 efa_com_handle_single_admin_completion(aq, cqe);
457
458 ci++;
459 comp_num++;
460 if (ci == aq->depth) {
461 ci = 0;
462 phase = !phase;
463 }
464
465 cqe = &aq->cq.entries[ci];
466 }
467
468 aq->cq.cc += comp_num;
469 aq->cq.phase = phase;
470 aq->sq.cc += comp_num;
471 atomic64_add(comp_num, &aq->stats.completed_cmd);
472}
473
474static int efa_com_comp_status_to_errno(u8 comp_status)
475{
476 switch (comp_status) {
477 case EFA_ADMIN_SUCCESS:
478 return 0;
479 case EFA_ADMIN_RESOURCE_ALLOCATION_FAILURE:
480 return -ENOMEM;
481 case EFA_ADMIN_UNSUPPORTED_OPCODE:
482 return -EOPNOTSUPP;
483 case EFA_ADMIN_BAD_OPCODE:
484 case EFA_ADMIN_MALFORMED_REQUEST:
485 case EFA_ADMIN_ILLEGAL_PARAMETER:
486 case EFA_ADMIN_UNKNOWN_ERROR:
487 return -EINVAL;
488 default:
489 return -EINVAL;
490 }
491}
492
493static int efa_com_wait_and_process_admin_cq_polling(struct efa_comp_ctx *comp_ctx,
494 struct efa_com_admin_queue *aq)
495{
496 unsigned long timeout;
497 unsigned long flags;
498 int err;
499
500 timeout = jiffies + usecs_to_jiffies(aq->completion_timeout);
501
502 while (1) {
503 spin_lock_irqsave(&aq->cq.lock, flags);
504 efa_com_handle_admin_completion(aq);
505 spin_unlock_irqrestore(&aq->cq.lock, flags);
506
507 if (comp_ctx->status != EFA_CMD_SUBMITTED)
508 break;
509
510 if (time_is_before_jiffies(timeout)) {
511 ibdev_err_ratelimited(
512 aq->efa_dev,
513 "Wait for completion (polling) timeout\n");
514 /* EFA didn't have any completion */
515 atomic64_inc(&aq->stats.no_completion);
516
517 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
518 err = -ETIME;
519 goto out;
520 }
521
522 msleep(aq->poll_interval);
523 }
524
525 err = efa_com_comp_status_to_errno(comp_ctx->user_cqe->acq_common_descriptor.status);
526out:
527 efa_com_put_comp_ctx(aq, comp_ctx);
528 return err;
529}
530
531static int efa_com_wait_and_process_admin_cq_interrupts(struct efa_comp_ctx *comp_ctx,
532 struct efa_com_admin_queue *aq)
533{
534 unsigned long flags;
535 int err;
536
537 wait_for_completion_timeout(&comp_ctx->wait_event,
538 usecs_to_jiffies(aq->completion_timeout));
539
540 /*
541 * In case the command wasn't completed find out the root cause.
542 * There might be 2 kinds of errors
543 * 1) No completion (timeout reached)
544 * 2) There is completion but the device didn't get any msi-x interrupt.
545 */
546 if (comp_ctx->status == EFA_CMD_SUBMITTED) {
547 spin_lock_irqsave(&aq->cq.lock, flags);
548 efa_com_handle_admin_completion(aq);
549 spin_unlock_irqrestore(&aq->cq.lock, flags);
550
551 atomic64_inc(&aq->stats.no_completion);
552
553 if (comp_ctx->status == EFA_CMD_COMPLETED)
554 ibdev_err_ratelimited(
555 aq->efa_dev,
556 "The device sent a completion but the driver didn't receive any MSI-X interrupt for admin cmd %s(%d) status %d (ctx: 0x%p, sq producer: %d, sq consumer: %d, cq consumer: %d)\n",
557 efa_com_cmd_str(comp_ctx->cmd_opcode),
558 comp_ctx->cmd_opcode, comp_ctx->status,
559 comp_ctx, aq->sq.pc, aq->sq.cc, aq->cq.cc);
560 else
561 ibdev_err_ratelimited(
562 aq->efa_dev,
563 "The device didn't send any completion for admin cmd %s(%d) status %d (ctx 0x%p, sq producer: %d, sq consumer: %d, cq consumer: %d)\n",
564 efa_com_cmd_str(comp_ctx->cmd_opcode),
565 comp_ctx->cmd_opcode, comp_ctx->status,
566 comp_ctx, aq->sq.pc, aq->sq.cc, aq->cq.cc);
567
568 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
569 err = -ETIME;
570 goto out;
571 }
572
573 err = efa_com_comp_status_to_errno(comp_ctx->user_cqe->acq_common_descriptor.status);
574out:
575 efa_com_put_comp_ctx(aq, comp_ctx);
576 return err;
577}
578
579/*
580 * There are two types to wait for completion.
581 * Polling mode - wait until the completion is available.
582 * Async mode - wait on wait queue until the completion is ready
583 * (or the timeout expired).
584 * It is expected that the IRQ called efa_com_handle_admin_completion
585 * to mark the completions.
586 */
587static int efa_com_wait_and_process_admin_cq(struct efa_comp_ctx *comp_ctx,
588 struct efa_com_admin_queue *aq)
589{
590 if (test_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state))
591 return efa_com_wait_and_process_admin_cq_polling(comp_ctx, aq);
592
593 return efa_com_wait_and_process_admin_cq_interrupts(comp_ctx, aq);
594}
595
596/**
597 * efa_com_cmd_exec - Execute admin command
598 * @aq: admin queue.
599 * @cmd: the admin command to execute.
600 * @cmd_size: the command size.
601 * @comp: command completion return entry.
602 * @comp_size: command completion size.
603 * Submit an admin command and then wait until the device will return a
604 * completion.
605 * The completion will be copied into comp.
606 *
607 * @return - 0 on success, negative value on failure.
608 */
609int efa_com_cmd_exec(struct efa_com_admin_queue *aq,
610 struct efa_admin_aq_entry *cmd,
611 size_t cmd_size,
612 struct efa_admin_acq_entry *comp,
613 size_t comp_size)
614{
615 struct efa_comp_ctx *comp_ctx;
616 int err;
617
618 might_sleep();
619
620 /* In case of queue FULL */
621 down(&aq->avail_cmds);
622
623 ibdev_dbg(aq->efa_dev, "%s (opcode %d)\n",
624 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
625 cmd->aq_common_descriptor.opcode);
626 comp_ctx = efa_com_submit_admin_cmd(aq, cmd, cmd_size, comp, comp_size);
627 if (IS_ERR(comp_ctx)) {
628 ibdev_err_ratelimited(
629 aq->efa_dev,
630 "Failed to submit command %s (opcode %u) err %ld\n",
631 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
632 cmd->aq_common_descriptor.opcode, PTR_ERR(comp_ctx));
633
634 up(&aq->avail_cmds);
635 atomic64_inc(&aq->stats.cmd_err);
636 return PTR_ERR(comp_ctx);
637 }
638
639 err = efa_com_wait_and_process_admin_cq(comp_ctx, aq);
640 if (err) {
641 ibdev_err_ratelimited(
642 aq->efa_dev,
643 "Failed to process command %s (opcode %u) comp_status %d err %d\n",
644 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
645 cmd->aq_common_descriptor.opcode,
646 comp_ctx->user_cqe->acq_common_descriptor.status, err);
647 atomic64_inc(&aq->stats.cmd_err);
648 }
649
650 up(&aq->avail_cmds);
651
652 return err;
653}
654
655/**
656 * efa_com_admin_destroy - Destroy the admin and the async events queues.
657 * @edev: EFA communication layer struct
658 */
659void efa_com_admin_destroy(struct efa_com_dev *edev)
660{
661 struct efa_com_admin_queue *aq = &edev->aq;
662 struct efa_com_aenq *aenq = &edev->aenq;
663 struct efa_com_admin_cq *cq = &aq->cq;
664 struct efa_com_admin_sq *sq = &aq->sq;
665 u16 size;
666
667 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
668
669 devm_kfree(edev->dmadev, aq->comp_ctx_pool);
670 devm_kfree(edev->dmadev, aq->comp_ctx);
671
672 size = aq->depth * sizeof(*sq->entries);
673 dma_free_coherent(edev->dmadev, size, sq->entries, sq->dma_addr);
674
675 size = aq->depth * sizeof(*cq->entries);
676 dma_free_coherent(edev->dmadev, size, cq->entries, cq->dma_addr);
677
678 size = aenq->depth * sizeof(*aenq->entries);
679 dma_free_coherent(edev->dmadev, size, aenq->entries, aenq->dma_addr);
680}
681
682/**
683 * efa_com_set_admin_polling_mode - Set the admin completion queue polling mode
684 * @edev: EFA communication layer struct
685 * @polling: Enable/Disable polling mode
686 *
687 * Set the admin completion mode.
688 */
689void efa_com_set_admin_polling_mode(struct efa_com_dev *edev, bool polling)
690{
691 u32 mask_value = 0;
692
693 if (polling)
694 EFA_SET(&mask_value, EFA_REGS_INTR_MASK_EN, 1);
695
696 writel(mask_value, edev->reg_bar + EFA_REGS_INTR_MASK_OFF);
697 if (polling)
698 set_bit(EFA_AQ_STATE_POLLING_BIT, &edev->aq.state);
699 else
700 clear_bit(EFA_AQ_STATE_POLLING_BIT, &edev->aq.state);
701}
702
703static void efa_com_stats_init(struct efa_com_dev *edev)
704{
705 atomic64_t *s = (atomic64_t *)&edev->aq.stats;
706 int i;
707
708 for (i = 0; i < sizeof(edev->aq.stats) / sizeof(*s); i++, s++)
709 atomic64_set(s, 0);
710}
711
712/**
713 * efa_com_admin_init - Init the admin and the async queues
714 * @edev: EFA communication layer struct
715 * @aenq_handlers: Those handlers to be called upon event.
716 *
717 * Initialize the admin submission and completion queues.
718 * Initialize the asynchronous events notification queues.
719 *
720 * @return - 0 on success, negative value on failure.
721 */
722int efa_com_admin_init(struct efa_com_dev *edev,
723 struct efa_aenq_handlers *aenq_handlers)
724{
725 struct efa_com_admin_queue *aq = &edev->aq;
726 u32 timeout;
727 u32 dev_sts;
728 u32 cap;
729 int err;
730
731 dev_sts = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
732 if (!EFA_GET(&dev_sts, EFA_REGS_DEV_STS_READY)) {
733 ibdev_err(edev->efa_dev,
734 "Device isn't ready, abort com init %#x\n", dev_sts);
735 return -ENODEV;
736 }
737
738 aq->depth = EFA_ADMIN_QUEUE_DEPTH;
739
740 aq->dmadev = edev->dmadev;
741 aq->efa_dev = edev->efa_dev;
742 set_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state);
743
744 sema_init(&aq->avail_cmds, aq->depth);
745
746 efa_com_stats_init(edev);
747
748 err = efa_com_init_comp_ctxt(aq);
749 if (err)
750 return err;
751
752 err = efa_com_admin_init_sq(edev);
753 if (err)
754 goto err_destroy_comp_ctxt;
755
756 err = efa_com_admin_init_cq(edev);
757 if (err)
758 goto err_destroy_sq;
759
760 efa_com_set_admin_polling_mode(edev, false);
761
762 err = efa_com_admin_init_aenq(edev, aenq_handlers);
763 if (err)
764 goto err_destroy_cq;
765
766 cap = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
767 timeout = EFA_GET(&cap, EFA_REGS_CAPS_ADMIN_CMD_TO);
768 if (timeout)
769 /* the resolution of timeout reg is 100ms */
770 aq->completion_timeout = timeout * 100000;
771 else
772 aq->completion_timeout = ADMIN_CMD_TIMEOUT_US;
773
774 aq->poll_interval = EFA_POLL_INTERVAL_MS;
775
776 set_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
777
778 return 0;
779
780err_destroy_cq:
781 dma_free_coherent(edev->dmadev, aq->depth * sizeof(*aq->cq.entries),
782 aq->cq.entries, aq->cq.dma_addr);
783err_destroy_sq:
784 dma_free_coherent(edev->dmadev, aq->depth * sizeof(*aq->sq.entries),
785 aq->sq.entries, aq->sq.dma_addr);
786err_destroy_comp_ctxt:
787 devm_kfree(edev->dmadev, aq->comp_ctx);
788
789 return err;
790}
791
792/**
793 * efa_com_admin_q_comp_intr_handler - admin queue interrupt handler
794 * @edev: EFA communication layer struct
795 *
796 * This method goes over the admin completion queue and wakes up
797 * all the pending threads that wait on the commands wait event.
798 *
799 * Note: Should be called after MSI-X interrupt.
800 */
801void efa_com_admin_q_comp_intr_handler(struct efa_com_dev *edev)
802{
803 unsigned long flags;
804
805 spin_lock_irqsave(&edev->aq.cq.lock, flags);
806 efa_com_handle_admin_completion(&edev->aq);
807 spin_unlock_irqrestore(&edev->aq.cq.lock, flags);
808}
809
810/*
811 * efa_handle_specific_aenq_event:
812 * return the handler that is relevant to the specific event group
813 */
814static efa_aenq_handler efa_com_get_specific_aenq_cb(struct efa_com_dev *edev,
815 u16 group)
816{
817 struct efa_aenq_handlers *aenq_handlers = edev->aenq.aenq_handlers;
818
819 if (group < EFA_MAX_HANDLERS && aenq_handlers->handlers[group])
820 return aenq_handlers->handlers[group];
821
822 return aenq_handlers->unimplemented_handler;
823}
824
825/**
826 * efa_com_aenq_intr_handler - AENQ interrupt handler
827 * @edev: EFA communication layer struct
828 * @data: Data of interrupt handler.
829 *
830 * Go over the async event notification queue and call the proper aenq handler.
831 */
832void efa_com_aenq_intr_handler(struct efa_com_dev *edev, void *data)
833{
834 struct efa_admin_aenq_common_desc *aenq_common;
835 struct efa_com_aenq *aenq = &edev->aenq;
836 struct efa_admin_aenq_entry *aenq_e;
837 efa_aenq_handler handler_cb;
838 u32 processed = 0;
839 u8 phase;
840 u32 ci;
841
842 ci = aenq->cc & (aenq->depth - 1);
843 phase = aenq->phase;
844 aenq_e = &aenq->entries[ci]; /* Get first entry */
845 aenq_common = &aenq_e->aenq_common_desc;
846
847 /* Go over all the events */
848 while ((READ_ONCE(aenq_common->flags) &
849 EFA_ADMIN_AENQ_COMMON_DESC_PHASE_MASK) == phase) {
850 /*
851 * Do not read the rest of the completion entry before the
852 * phase bit was validated
853 */
854 dma_rmb();
855
856 /* Handle specific event*/
857 handler_cb = efa_com_get_specific_aenq_cb(edev,
858 aenq_common->group);
859 handler_cb(data, aenq_e); /* call the actual event handler*/
860
861 /* Get next event entry */
862 ci++;
863 processed++;
864
865 if (ci == aenq->depth) {
866 ci = 0;
867 phase = !phase;
868 }
869 aenq_e = &aenq->entries[ci];
870 aenq_common = &aenq_e->aenq_common_desc;
871 }
872
873 aenq->cc += processed;
874 aenq->phase = phase;
875
876 /* Don't update aenq doorbell if there weren't any processed events */
877 if (!processed)
878 return;
879
880 /* barrier not needed in case of writel */
881 writel(aenq->cc, edev->reg_bar + EFA_REGS_AENQ_CONS_DB_OFF);
882}
883
884static void efa_com_mmio_reg_read_resp_addr_init(struct efa_com_dev *edev)
885{
886 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
887 u32 addr_high;
888 u32 addr_low;
889
890 /* dma_addr_bits is unknown at this point */
891 addr_high = (mmio_read->read_resp_dma_addr >> 32) & GENMASK(31, 0);
892 addr_low = mmio_read->read_resp_dma_addr & GENMASK(31, 0);
893
894 writel(addr_high, edev->reg_bar + EFA_REGS_MMIO_RESP_HI_OFF);
895 writel(addr_low, edev->reg_bar + EFA_REGS_MMIO_RESP_LO_OFF);
896}
897
898int efa_com_mmio_reg_read_init(struct efa_com_dev *edev)
899{
900 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
901
902 spin_lock_init(&mmio_read->lock);
903 mmio_read->read_resp =
904 dma_alloc_coherent(edev->dmadev, sizeof(*mmio_read->read_resp),
905 &mmio_read->read_resp_dma_addr, GFP_KERNEL);
906 if (!mmio_read->read_resp)
907 return -ENOMEM;
908
909 efa_com_mmio_reg_read_resp_addr_init(edev);
910
911 mmio_read->read_resp->req_id = 0;
912 mmio_read->seq_num = 0;
913 mmio_read->mmio_read_timeout = EFA_REG_READ_TIMEOUT_US;
914
915 return 0;
916}
917
918void efa_com_mmio_reg_read_destroy(struct efa_com_dev *edev)
919{
920 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
921
922 dma_free_coherent(edev->dmadev, sizeof(*mmio_read->read_resp),
923 mmio_read->read_resp, mmio_read->read_resp_dma_addr);
924}
925
926int efa_com_validate_version(struct efa_com_dev *edev)
927{
928 u32 min_ctrl_ver = 0;
929 u32 ctrl_ver_masked;
930 u32 min_ver = 0;
931 u32 ctrl_ver;
932 u32 ver;
933
934 /*
935 * Make sure the EFA version and the controller version are at least
936 * as the driver expects
937 */
938 ver = efa_com_reg_read32(edev, EFA_REGS_VERSION_OFF);
939 ctrl_ver = efa_com_reg_read32(edev,
940 EFA_REGS_CONTROLLER_VERSION_OFF);
941
942 ibdev_dbg(edev->efa_dev, "efa device version: %d.%d\n",
943 EFA_GET(&ver, EFA_REGS_VERSION_MAJOR_VERSION),
944 EFA_GET(&ver, EFA_REGS_VERSION_MINOR_VERSION));
945
946 EFA_SET(&min_ver, EFA_REGS_VERSION_MAJOR_VERSION,
947 EFA_ADMIN_API_VERSION_MAJOR);
948 EFA_SET(&min_ver, EFA_REGS_VERSION_MINOR_VERSION,
949 EFA_ADMIN_API_VERSION_MINOR);
950 if (ver < min_ver) {
951 ibdev_err(edev->efa_dev,
952 "EFA version is lower than the minimal version the driver supports\n");
953 return -EOPNOTSUPP;
954 }
955
956 ibdev_dbg(
957 edev->efa_dev,
958 "efa controller version: %d.%d.%d implementation version %d\n",
959 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION),
960 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION),
961 EFA_GET(&ctrl_ver,
962 EFA_REGS_CONTROLLER_VERSION_SUBMINOR_VERSION),
963 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_IMPL_ID));
964
965 ctrl_ver_masked =
966 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION) |
967 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION) |
968 EFA_GET(&ctrl_ver,
969 EFA_REGS_CONTROLLER_VERSION_SUBMINOR_VERSION);
970
971 EFA_SET(&min_ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION,
972 EFA_CTRL_MAJOR);
973 EFA_SET(&min_ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION,
974 EFA_CTRL_MINOR);
975 EFA_SET(&min_ctrl_ver, EFA_REGS_CONTROLLER_VERSION_SUBMINOR_VERSION,
976 EFA_CTRL_SUB_MINOR);
977 /* Validate the ctrl version without the implementation ID */
978 if (ctrl_ver_masked < min_ctrl_ver) {
979 ibdev_err(edev->efa_dev,
980 "EFA ctrl version is lower than the minimal ctrl version the driver supports\n");
981 return -EOPNOTSUPP;
982 }
983
984 return 0;
985}
986
987/**
988 * efa_com_get_dma_width - Retrieve physical dma address width the device
989 * supports.
990 * @edev: EFA communication layer struct
991 *
992 * Retrieve the maximum physical address bits the device can handle.
993 *
994 * @return: > 0 on Success and negative value otherwise.
995 */
996int efa_com_get_dma_width(struct efa_com_dev *edev)
997{
998 u32 caps = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
999 int width;
1000
1001 width = EFA_GET(&caps, EFA_REGS_CAPS_DMA_ADDR_WIDTH);
1002
1003 ibdev_dbg(edev->efa_dev, "DMA width: %d\n", width);
1004
1005 if (width < 32 || width > 64) {
1006 ibdev_err(edev->efa_dev, "DMA width illegal value: %d\n", width);
1007 return -EINVAL;
1008 }
1009
1010 edev->dma_addr_bits = width;
1011
1012 return width;
1013}
1014
1015static int wait_for_reset_state(struct efa_com_dev *edev, u32 timeout, int on)
1016{
1017 u32 val, i;
1018
1019 for (i = 0; i < timeout; i++) {
1020 val = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
1021
1022 if (EFA_GET(&val, EFA_REGS_DEV_STS_RESET_IN_PROGRESS) == on)
1023 return 0;
1024
1025 ibdev_dbg(edev->efa_dev, "Reset indication val %d\n", val);
1026 msleep(EFA_POLL_INTERVAL_MS);
1027 }
1028
1029 return -ETIME;
1030}
1031
1032/**
1033 * efa_com_dev_reset - Perform device FLR to the device.
1034 * @edev: EFA communication layer struct
1035 * @reset_reason: Specify what is the trigger for the reset in case of an error.
1036 *
1037 * @return - 0 on success, negative value on failure.
1038 */
1039int efa_com_dev_reset(struct efa_com_dev *edev,
1040 enum efa_regs_reset_reason_types reset_reason)
1041{
1042 u32 stat, timeout, cap;
1043 u32 reset_val = 0;
1044 int err;
1045
1046 stat = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
1047 cap = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
1048
1049 if (!EFA_GET(&stat, EFA_REGS_DEV_STS_READY)) {
1050 ibdev_err(edev->efa_dev,
1051 "Device isn't ready, can't reset device\n");
1052 return -EINVAL;
1053 }
1054
1055 timeout = EFA_GET(&cap, EFA_REGS_CAPS_RESET_TIMEOUT);
1056 if (!timeout) {
1057 ibdev_err(edev->efa_dev, "Invalid timeout value\n");
1058 return -EINVAL;
1059 }
1060
1061 /* start reset */
1062 EFA_SET(&reset_val, EFA_REGS_DEV_CTL_DEV_RESET, 1);
1063 EFA_SET(&reset_val, EFA_REGS_DEV_CTL_RESET_REASON, reset_reason);
1064 writel(reset_val, edev->reg_bar + EFA_REGS_DEV_CTL_OFF);
1065
1066 /* reset clears the mmio readless address, restore it */
1067 efa_com_mmio_reg_read_resp_addr_init(edev);
1068
1069 err = wait_for_reset_state(edev, timeout, 1);
1070 if (err) {
1071 ibdev_err(edev->efa_dev, "Reset indication didn't turn on\n");
1072 return err;
1073 }
1074
1075 /* reset done */
1076 writel(0, edev->reg_bar + EFA_REGS_DEV_CTL_OFF);
1077 err = wait_for_reset_state(edev, timeout, 0);
1078 if (err) {
1079 ibdev_err(edev->efa_dev, "Reset indication didn't turn off\n");
1080 return err;
1081 }
1082
1083 timeout = EFA_GET(&cap, EFA_REGS_CAPS_ADMIN_CMD_TO);
1084 if (timeout)
1085 /* the resolution of timeout reg is 100ms */
1086 edev->aq.completion_timeout = timeout * 100000;
1087 else
1088 edev->aq.completion_timeout = ADMIN_CMD_TIMEOUT_US;
1089
1090 return 0;
1091}
1092
1093static int efa_com_create_eq(struct efa_com_dev *edev,
1094 struct efa_com_create_eq_params *params,
1095 struct efa_com_create_eq_result *result)
1096{
1097 struct efa_com_admin_queue *aq = &edev->aq;
1098 struct efa_admin_create_eq_resp resp = {};
1099 struct efa_admin_create_eq_cmd cmd = {};
1100 int err;
1101
1102 cmd.aq_common_descriptor.opcode = EFA_ADMIN_CREATE_EQ;
1103 EFA_SET(&cmd.caps, EFA_ADMIN_CREATE_EQ_CMD_ENTRY_SIZE_WORDS,
1104 params->entry_size_in_bytes / 4);
1105 cmd.depth = params->depth;
1106 cmd.event_bitmask = params->event_bitmask;
1107 cmd.msix_vec = params->msix_vec;
1108
1109 efa_com_set_dma_addr(params->dma_addr, &cmd.ba.mem_addr_high,
1110 &cmd.ba.mem_addr_low);
1111
1112 err = efa_com_cmd_exec(aq,
1113 (struct efa_admin_aq_entry *)&cmd,
1114 sizeof(cmd),
1115 (struct efa_admin_acq_entry *)&resp,
1116 sizeof(resp));
1117 if (err) {
1118 ibdev_err_ratelimited(edev->efa_dev,
1119 "Failed to create eq[%d]\n", err);
1120 return err;
1121 }
1122
1123 result->eqn = resp.eqn;
1124
1125 return 0;
1126}
1127
1128static void efa_com_destroy_eq(struct efa_com_dev *edev,
1129 struct efa_com_destroy_eq_params *params)
1130{
1131 struct efa_com_admin_queue *aq = &edev->aq;
1132 struct efa_admin_destroy_eq_resp resp = {};
1133 struct efa_admin_destroy_eq_cmd cmd = {};
1134 int err;
1135
1136 cmd.aq_common_descriptor.opcode = EFA_ADMIN_DESTROY_EQ;
1137 cmd.eqn = params->eqn;
1138
1139 err = efa_com_cmd_exec(aq,
1140 (struct efa_admin_aq_entry *)&cmd,
1141 sizeof(cmd),
1142 (struct efa_admin_acq_entry *)&resp,
1143 sizeof(resp));
1144 if (err)
1145 ibdev_err_ratelimited(edev->efa_dev,
1146 "Failed to destroy EQ-%u [%d]\n", cmd.eqn,
1147 err);
1148}
1149
1150static void efa_com_arm_eq(struct efa_com_dev *edev, struct efa_com_eq *eeq)
1151{
1152 u32 val = 0;
1153
1154 EFA_SET(&val, EFA_REGS_EQ_DB_EQN, eeq->eqn);
1155 EFA_SET(&val, EFA_REGS_EQ_DB_ARM, 1);
1156
1157 writel(val, edev->reg_bar + EFA_REGS_EQ_DB_OFF);
1158}
1159
1160void efa_com_eq_comp_intr_handler(struct efa_com_dev *edev,
1161 struct efa_com_eq *eeq)
1162{
1163 struct efa_admin_eqe *eqe;
1164 u32 processed = 0;
1165 u8 phase;
1166 u32 ci;
1167
1168 ci = eeq->cc & (eeq->depth - 1);
1169 phase = eeq->phase;
1170 eqe = &eeq->eqes[ci];
1171
1172 /* Go over all the events */
1173 while ((READ_ONCE(eqe->common) & EFA_ADMIN_EQE_PHASE_MASK) == phase) {
1174 /*
1175 * Do not read the rest of the completion entry before the
1176 * phase bit was validated
1177 */
1178 dma_rmb();
1179
1180 eeq->cb(eeq, eqe);
1181
1182 /* Get next event entry */
1183 ci++;
1184 processed++;
1185
1186 if (ci == eeq->depth) {
1187 ci = 0;
1188 phase = !phase;
1189 }
1190
1191 eqe = &eeq->eqes[ci];
1192 }
1193
1194 eeq->cc += processed;
1195 eeq->phase = phase;
1196 efa_com_arm_eq(eeq->edev, eeq);
1197}
1198
1199void efa_com_eq_destroy(struct efa_com_dev *edev, struct efa_com_eq *eeq)
1200{
1201 struct efa_com_destroy_eq_params params = {
1202 .eqn = eeq->eqn,
1203 };
1204
1205 efa_com_destroy_eq(edev, ¶ms);
1206 dma_free_coherent(edev->dmadev, eeq->depth * sizeof(*eeq->eqes),
1207 eeq->eqes, eeq->dma_addr);
1208}
1209
1210int efa_com_eq_init(struct efa_com_dev *edev, struct efa_com_eq *eeq,
1211 efa_eqe_handler cb, u16 depth, u8 msix_vec)
1212{
1213 struct efa_com_create_eq_params params = {};
1214 struct efa_com_create_eq_result result = {};
1215 int err;
1216
1217 params.depth = depth;
1218 params.entry_size_in_bytes = sizeof(*eeq->eqes);
1219 EFA_SET(¶ms.event_bitmask,
1220 EFA_ADMIN_CREATE_EQ_CMD_COMPLETION_EVENTS, 1);
1221 params.msix_vec = msix_vec;
1222
1223 eeq->eqes = dma_alloc_coherent(edev->dmadev,
1224 params.depth * sizeof(*eeq->eqes),
1225 ¶ms.dma_addr, GFP_KERNEL);
1226 if (!eeq->eqes)
1227 return -ENOMEM;
1228
1229 err = efa_com_create_eq(edev, ¶ms, &result);
1230 if (err)
1231 goto err_free_coherent;
1232
1233 eeq->eqn = result.eqn;
1234 eeq->edev = edev;
1235 eeq->dma_addr = params.dma_addr;
1236 eeq->phase = 1;
1237 eeq->depth = params.depth;
1238 eeq->cb = cb;
1239 efa_com_arm_eq(edev, eeq);
1240
1241 return 0;
1242
1243err_free_coherent:
1244 dma_free_coherent(edev->dmadev, params.depth * sizeof(*eeq->eqes),
1245 eeq->eqes, params.dma_addr);
1246 return err;
1247}
1// SPDX-License-Identifier: GPL-2.0 OR BSD-2-Clause
2/*
3 * Copyright 2018-2019 Amazon.com, Inc. or its affiliates. All rights reserved.
4 */
5
6#include "efa_com.h"
7#include "efa_regs_defs.h"
8
9#define ADMIN_CMD_TIMEOUT_US 30000000 /* usecs */
10
11#define EFA_REG_READ_TIMEOUT_US 50000 /* usecs */
12#define EFA_MMIO_READ_INVALID 0xffffffff
13
14#define EFA_POLL_INTERVAL_MS 100 /* msecs */
15
16#define EFA_ASYNC_QUEUE_DEPTH 16
17#define EFA_ADMIN_QUEUE_DEPTH 32
18
19#define MIN_EFA_VER\
20 ((EFA_ADMIN_API_VERSION_MAJOR << EFA_REGS_VERSION_MAJOR_VERSION_SHIFT) | \
21 (EFA_ADMIN_API_VERSION_MINOR & EFA_REGS_VERSION_MINOR_VERSION_MASK))
22
23#define EFA_CTRL_MAJOR 0
24#define EFA_CTRL_MINOR 0
25#define EFA_CTRL_SUB_MINOR 1
26
27#define MIN_EFA_CTRL_VER \
28 (((EFA_CTRL_MAJOR) << \
29 (EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION_SHIFT)) | \
30 ((EFA_CTRL_MINOR) << \
31 (EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION_SHIFT)) | \
32 (EFA_CTRL_SUB_MINOR))
33
34#define EFA_DMA_ADDR_TO_UINT32_LOW(x) ((u32)((u64)(x)))
35#define EFA_DMA_ADDR_TO_UINT32_HIGH(x) ((u32)(((u64)(x)) >> 32))
36
37#define EFA_REGS_ADMIN_INTR_MASK 1
38
39enum efa_cmd_status {
40 EFA_CMD_SUBMITTED,
41 EFA_CMD_COMPLETED,
42};
43
44struct efa_comp_ctx {
45 struct completion wait_event;
46 struct efa_admin_acq_entry *user_cqe;
47 u32 comp_size;
48 enum efa_cmd_status status;
49 /* status from the device */
50 u8 comp_status;
51 u8 cmd_opcode;
52 u8 occupied;
53};
54
55static const char *efa_com_cmd_str(u8 cmd)
56{
57#define EFA_CMD_STR_CASE(_cmd) case EFA_ADMIN_##_cmd: return #_cmd
58
59 switch (cmd) {
60 EFA_CMD_STR_CASE(CREATE_QP);
61 EFA_CMD_STR_CASE(MODIFY_QP);
62 EFA_CMD_STR_CASE(QUERY_QP);
63 EFA_CMD_STR_CASE(DESTROY_QP);
64 EFA_CMD_STR_CASE(CREATE_AH);
65 EFA_CMD_STR_CASE(DESTROY_AH);
66 EFA_CMD_STR_CASE(REG_MR);
67 EFA_CMD_STR_CASE(DEREG_MR);
68 EFA_CMD_STR_CASE(CREATE_CQ);
69 EFA_CMD_STR_CASE(DESTROY_CQ);
70 EFA_CMD_STR_CASE(GET_FEATURE);
71 EFA_CMD_STR_CASE(SET_FEATURE);
72 EFA_CMD_STR_CASE(GET_STATS);
73 EFA_CMD_STR_CASE(ALLOC_PD);
74 EFA_CMD_STR_CASE(DEALLOC_PD);
75 EFA_CMD_STR_CASE(ALLOC_UAR);
76 EFA_CMD_STR_CASE(DEALLOC_UAR);
77 default: return "unknown command opcode";
78 }
79#undef EFA_CMD_STR_CASE
80}
81
82static u32 efa_com_reg_read32(struct efa_com_dev *edev, u16 offset)
83{
84 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
85 struct efa_admin_mmio_req_read_less_resp *read_resp;
86 unsigned long exp_time;
87 u32 mmio_read_reg;
88 u32 err;
89
90 read_resp = mmio_read->read_resp;
91
92 spin_lock(&mmio_read->lock);
93 mmio_read->seq_num++;
94
95 /* trash DMA req_id to identify when hardware is done */
96 read_resp->req_id = mmio_read->seq_num + 0x9aL;
97 mmio_read_reg = (offset << EFA_REGS_MMIO_REG_READ_REG_OFF_SHIFT) &
98 EFA_REGS_MMIO_REG_READ_REG_OFF_MASK;
99 mmio_read_reg |= mmio_read->seq_num &
100 EFA_REGS_MMIO_REG_READ_REQ_ID_MASK;
101
102 writel(mmio_read_reg, edev->reg_bar + EFA_REGS_MMIO_REG_READ_OFF);
103
104 exp_time = jiffies + usecs_to_jiffies(mmio_read->mmio_read_timeout);
105 do {
106 if (READ_ONCE(read_resp->req_id) == mmio_read->seq_num)
107 break;
108 udelay(1);
109 } while (time_is_after_jiffies(exp_time));
110
111 if (read_resp->req_id != mmio_read->seq_num) {
112 ibdev_err_ratelimited(
113 edev->efa_dev,
114 "Reading register timed out. expected: req id[%u] offset[%#x] actual: req id[%u] offset[%#x]\n",
115 mmio_read->seq_num, offset, read_resp->req_id,
116 read_resp->reg_off);
117 err = EFA_MMIO_READ_INVALID;
118 goto out;
119 }
120
121 if (read_resp->reg_off != offset) {
122 ibdev_err_ratelimited(
123 edev->efa_dev,
124 "Reading register failed: wrong offset provided\n");
125 err = EFA_MMIO_READ_INVALID;
126 goto out;
127 }
128
129 err = read_resp->reg_val;
130out:
131 spin_unlock(&mmio_read->lock);
132 return err;
133}
134
135static int efa_com_admin_init_sq(struct efa_com_dev *edev)
136{
137 struct efa_com_admin_queue *aq = &edev->aq;
138 struct efa_com_admin_sq *sq = &aq->sq;
139 u16 size = aq->depth * sizeof(*sq->entries);
140 u32 addr_high;
141 u32 addr_low;
142 u32 aq_caps;
143
144 sq->entries =
145 dma_alloc_coherent(aq->dmadev, size, &sq->dma_addr, GFP_KERNEL);
146 if (!sq->entries)
147 return -ENOMEM;
148
149 spin_lock_init(&sq->lock);
150
151 sq->cc = 0;
152 sq->pc = 0;
153 sq->phase = 1;
154
155 sq->db_addr = (u32 __iomem *)(edev->reg_bar + EFA_REGS_AQ_PROD_DB_OFF);
156
157 addr_high = EFA_DMA_ADDR_TO_UINT32_HIGH(sq->dma_addr);
158 addr_low = EFA_DMA_ADDR_TO_UINT32_LOW(sq->dma_addr);
159
160 writel(addr_low, edev->reg_bar + EFA_REGS_AQ_BASE_LO_OFF);
161 writel(addr_high, edev->reg_bar + EFA_REGS_AQ_BASE_HI_OFF);
162
163 aq_caps = aq->depth & EFA_REGS_AQ_CAPS_AQ_DEPTH_MASK;
164 aq_caps |= (sizeof(struct efa_admin_aq_entry) <<
165 EFA_REGS_AQ_CAPS_AQ_ENTRY_SIZE_SHIFT) &
166 EFA_REGS_AQ_CAPS_AQ_ENTRY_SIZE_MASK;
167
168 writel(aq_caps, edev->reg_bar + EFA_REGS_AQ_CAPS_OFF);
169
170 return 0;
171}
172
173static int efa_com_admin_init_cq(struct efa_com_dev *edev)
174{
175 struct efa_com_admin_queue *aq = &edev->aq;
176 struct efa_com_admin_cq *cq = &aq->cq;
177 u16 size = aq->depth * sizeof(*cq->entries);
178 u32 addr_high;
179 u32 addr_low;
180 u32 acq_caps;
181
182 cq->entries =
183 dma_alloc_coherent(aq->dmadev, size, &cq->dma_addr, GFP_KERNEL);
184 if (!cq->entries)
185 return -ENOMEM;
186
187 spin_lock_init(&cq->lock);
188
189 cq->cc = 0;
190 cq->phase = 1;
191
192 addr_high = EFA_DMA_ADDR_TO_UINT32_HIGH(cq->dma_addr);
193 addr_low = EFA_DMA_ADDR_TO_UINT32_LOW(cq->dma_addr);
194
195 writel(addr_low, edev->reg_bar + EFA_REGS_ACQ_BASE_LO_OFF);
196 writel(addr_high, edev->reg_bar + EFA_REGS_ACQ_BASE_HI_OFF);
197
198 acq_caps = aq->depth & EFA_REGS_ACQ_CAPS_ACQ_DEPTH_MASK;
199 acq_caps |= (sizeof(struct efa_admin_acq_entry) <<
200 EFA_REGS_ACQ_CAPS_ACQ_ENTRY_SIZE_SHIFT) &
201 EFA_REGS_ACQ_CAPS_ACQ_ENTRY_SIZE_MASK;
202 acq_caps |= (aq->msix_vector_idx <<
203 EFA_REGS_ACQ_CAPS_ACQ_MSIX_VECTOR_SHIFT) &
204 EFA_REGS_ACQ_CAPS_ACQ_MSIX_VECTOR_MASK;
205
206 writel(acq_caps, edev->reg_bar + EFA_REGS_ACQ_CAPS_OFF);
207
208 return 0;
209}
210
211static int efa_com_admin_init_aenq(struct efa_com_dev *edev,
212 struct efa_aenq_handlers *aenq_handlers)
213{
214 struct efa_com_aenq *aenq = &edev->aenq;
215 u32 addr_low, addr_high, aenq_caps;
216 u16 size;
217
218 if (!aenq_handlers) {
219 ibdev_err(edev->efa_dev, "aenq handlers pointer is NULL\n");
220 return -EINVAL;
221 }
222
223 size = EFA_ASYNC_QUEUE_DEPTH * sizeof(*aenq->entries);
224 aenq->entries = dma_alloc_coherent(edev->dmadev, size, &aenq->dma_addr,
225 GFP_KERNEL);
226 if (!aenq->entries)
227 return -ENOMEM;
228
229 aenq->aenq_handlers = aenq_handlers;
230 aenq->depth = EFA_ASYNC_QUEUE_DEPTH;
231 aenq->cc = 0;
232 aenq->phase = 1;
233
234 addr_low = EFA_DMA_ADDR_TO_UINT32_LOW(aenq->dma_addr);
235 addr_high = EFA_DMA_ADDR_TO_UINT32_HIGH(aenq->dma_addr);
236
237 writel(addr_low, edev->reg_bar + EFA_REGS_AENQ_BASE_LO_OFF);
238 writel(addr_high, edev->reg_bar + EFA_REGS_AENQ_BASE_HI_OFF);
239
240 aenq_caps = aenq->depth & EFA_REGS_AENQ_CAPS_AENQ_DEPTH_MASK;
241 aenq_caps |= (sizeof(struct efa_admin_aenq_entry) <<
242 EFA_REGS_AENQ_CAPS_AENQ_ENTRY_SIZE_SHIFT) &
243 EFA_REGS_AENQ_CAPS_AENQ_ENTRY_SIZE_MASK;
244 aenq_caps |= (aenq->msix_vector_idx
245 << EFA_REGS_AENQ_CAPS_AENQ_MSIX_VECTOR_SHIFT) &
246 EFA_REGS_AENQ_CAPS_AENQ_MSIX_VECTOR_MASK;
247 writel(aenq_caps, edev->reg_bar + EFA_REGS_AENQ_CAPS_OFF);
248
249 /*
250 * Init cons_db to mark that all entries in the queue
251 * are initially available
252 */
253 writel(edev->aenq.cc, edev->reg_bar + EFA_REGS_AENQ_CONS_DB_OFF);
254
255 return 0;
256}
257
258/* ID to be used with efa_com_get_comp_ctx */
259static u16 efa_com_alloc_ctx_id(struct efa_com_admin_queue *aq)
260{
261 u16 ctx_id;
262
263 spin_lock(&aq->comp_ctx_lock);
264 ctx_id = aq->comp_ctx_pool[aq->comp_ctx_pool_next];
265 aq->comp_ctx_pool_next++;
266 spin_unlock(&aq->comp_ctx_lock);
267
268 return ctx_id;
269}
270
271static void efa_com_dealloc_ctx_id(struct efa_com_admin_queue *aq,
272 u16 ctx_id)
273{
274 spin_lock(&aq->comp_ctx_lock);
275 aq->comp_ctx_pool_next--;
276 aq->comp_ctx_pool[aq->comp_ctx_pool_next] = ctx_id;
277 spin_unlock(&aq->comp_ctx_lock);
278}
279
280static inline void efa_com_put_comp_ctx(struct efa_com_admin_queue *aq,
281 struct efa_comp_ctx *comp_ctx)
282{
283 u16 cmd_id = comp_ctx->user_cqe->acq_common_descriptor.command &
284 EFA_ADMIN_ACQ_COMMON_DESC_COMMAND_ID_MASK;
285 u16 ctx_id = cmd_id & (aq->depth - 1);
286
287 ibdev_dbg(aq->efa_dev, "Put completion command_id %#x\n", cmd_id);
288 comp_ctx->occupied = 0;
289 efa_com_dealloc_ctx_id(aq, ctx_id);
290}
291
292static struct efa_comp_ctx *efa_com_get_comp_ctx(struct efa_com_admin_queue *aq,
293 u16 cmd_id, bool capture)
294{
295 u16 ctx_id = cmd_id & (aq->depth - 1);
296
297 if (aq->comp_ctx[ctx_id].occupied && capture) {
298 ibdev_err_ratelimited(
299 aq->efa_dev,
300 "Completion context for command_id %#x is occupied\n",
301 cmd_id);
302 return NULL;
303 }
304
305 if (capture) {
306 aq->comp_ctx[ctx_id].occupied = 1;
307 ibdev_dbg(aq->efa_dev,
308 "Take completion ctxt for command_id %#x\n", cmd_id);
309 }
310
311 return &aq->comp_ctx[ctx_id];
312}
313
314static struct efa_comp_ctx *__efa_com_submit_admin_cmd(struct efa_com_admin_queue *aq,
315 struct efa_admin_aq_entry *cmd,
316 size_t cmd_size_in_bytes,
317 struct efa_admin_acq_entry *comp,
318 size_t comp_size_in_bytes)
319{
320 struct efa_comp_ctx *comp_ctx;
321 u16 queue_size_mask;
322 u16 cmd_id;
323 u16 ctx_id;
324 u16 pi;
325
326 queue_size_mask = aq->depth - 1;
327 pi = aq->sq.pc & queue_size_mask;
328
329 ctx_id = efa_com_alloc_ctx_id(aq);
330
331 /* cmd_id LSBs are the ctx_id and MSBs are entropy bits from pc */
332 cmd_id = ctx_id & queue_size_mask;
333 cmd_id |= aq->sq.pc & ~queue_size_mask;
334 cmd_id &= EFA_ADMIN_AQ_COMMON_DESC_COMMAND_ID_MASK;
335
336 cmd->aq_common_descriptor.command_id = cmd_id;
337 cmd->aq_common_descriptor.flags |= aq->sq.phase &
338 EFA_ADMIN_AQ_COMMON_DESC_PHASE_MASK;
339
340 comp_ctx = efa_com_get_comp_ctx(aq, cmd_id, true);
341 if (!comp_ctx) {
342 efa_com_dealloc_ctx_id(aq, ctx_id);
343 return ERR_PTR(-EINVAL);
344 }
345
346 comp_ctx->status = EFA_CMD_SUBMITTED;
347 comp_ctx->comp_size = comp_size_in_bytes;
348 comp_ctx->user_cqe = comp;
349 comp_ctx->cmd_opcode = cmd->aq_common_descriptor.opcode;
350
351 reinit_completion(&comp_ctx->wait_event);
352
353 memcpy(&aq->sq.entries[pi], cmd, cmd_size_in_bytes);
354
355 aq->sq.pc++;
356 atomic64_inc(&aq->stats.submitted_cmd);
357
358 if ((aq->sq.pc & queue_size_mask) == 0)
359 aq->sq.phase = !aq->sq.phase;
360
361 /* barrier not needed in case of writel */
362 writel(aq->sq.pc, aq->sq.db_addr);
363
364 return comp_ctx;
365}
366
367static inline int efa_com_init_comp_ctxt(struct efa_com_admin_queue *aq)
368{
369 size_t pool_size = aq->depth * sizeof(*aq->comp_ctx_pool);
370 size_t size = aq->depth * sizeof(struct efa_comp_ctx);
371 struct efa_comp_ctx *comp_ctx;
372 u16 i;
373
374 aq->comp_ctx = devm_kzalloc(aq->dmadev, size, GFP_KERNEL);
375 aq->comp_ctx_pool = devm_kzalloc(aq->dmadev, pool_size, GFP_KERNEL);
376 if (!aq->comp_ctx || !aq->comp_ctx_pool) {
377 devm_kfree(aq->dmadev, aq->comp_ctx_pool);
378 devm_kfree(aq->dmadev, aq->comp_ctx);
379 return -ENOMEM;
380 }
381
382 for (i = 0; i < aq->depth; i++) {
383 comp_ctx = efa_com_get_comp_ctx(aq, i, false);
384 if (comp_ctx)
385 init_completion(&comp_ctx->wait_event);
386
387 aq->comp_ctx_pool[i] = i;
388 }
389
390 spin_lock_init(&aq->comp_ctx_lock);
391
392 aq->comp_ctx_pool_next = 0;
393
394 return 0;
395}
396
397static struct efa_comp_ctx *efa_com_submit_admin_cmd(struct efa_com_admin_queue *aq,
398 struct efa_admin_aq_entry *cmd,
399 size_t cmd_size_in_bytes,
400 struct efa_admin_acq_entry *comp,
401 size_t comp_size_in_bytes)
402{
403 struct efa_comp_ctx *comp_ctx;
404
405 spin_lock(&aq->sq.lock);
406 if (!test_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state)) {
407 ibdev_err_ratelimited(aq->efa_dev, "Admin queue is closed\n");
408 spin_unlock(&aq->sq.lock);
409 return ERR_PTR(-ENODEV);
410 }
411
412 comp_ctx = __efa_com_submit_admin_cmd(aq, cmd, cmd_size_in_bytes, comp,
413 comp_size_in_bytes);
414 spin_unlock(&aq->sq.lock);
415 if (IS_ERR(comp_ctx))
416 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
417
418 return comp_ctx;
419}
420
421static void efa_com_handle_single_admin_completion(struct efa_com_admin_queue *aq,
422 struct efa_admin_acq_entry *cqe)
423{
424 struct efa_comp_ctx *comp_ctx;
425 u16 cmd_id;
426
427 cmd_id = cqe->acq_common_descriptor.command &
428 EFA_ADMIN_ACQ_COMMON_DESC_COMMAND_ID_MASK;
429
430 comp_ctx = efa_com_get_comp_ctx(aq, cmd_id, false);
431 if (!comp_ctx) {
432 ibdev_err(aq->efa_dev,
433 "comp_ctx is NULL. Changing the admin queue running state\n");
434 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
435 return;
436 }
437
438 comp_ctx->status = EFA_CMD_COMPLETED;
439 comp_ctx->comp_status = cqe->acq_common_descriptor.status;
440 if (comp_ctx->user_cqe)
441 memcpy(comp_ctx->user_cqe, cqe, comp_ctx->comp_size);
442
443 if (!test_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state))
444 complete(&comp_ctx->wait_event);
445}
446
447static void efa_com_handle_admin_completion(struct efa_com_admin_queue *aq)
448{
449 struct efa_admin_acq_entry *cqe;
450 u16 queue_size_mask;
451 u16 comp_num = 0;
452 u8 phase;
453 u16 ci;
454
455 queue_size_mask = aq->depth - 1;
456
457 ci = aq->cq.cc & queue_size_mask;
458 phase = aq->cq.phase;
459
460 cqe = &aq->cq.entries[ci];
461
462 /* Go over all the completions */
463 while ((READ_ONCE(cqe->acq_common_descriptor.flags) &
464 EFA_ADMIN_ACQ_COMMON_DESC_PHASE_MASK) == phase) {
465 /*
466 * Do not read the rest of the completion entry before the
467 * phase bit was validated
468 */
469 dma_rmb();
470 efa_com_handle_single_admin_completion(aq, cqe);
471
472 ci++;
473 comp_num++;
474 if (ci == aq->depth) {
475 ci = 0;
476 phase = !phase;
477 }
478
479 cqe = &aq->cq.entries[ci];
480 }
481
482 aq->cq.cc += comp_num;
483 aq->cq.phase = phase;
484 aq->sq.cc += comp_num;
485 atomic64_add(comp_num, &aq->stats.completed_cmd);
486}
487
488static int efa_com_comp_status_to_errno(u8 comp_status)
489{
490 switch (comp_status) {
491 case EFA_ADMIN_SUCCESS:
492 return 0;
493 case EFA_ADMIN_RESOURCE_ALLOCATION_FAILURE:
494 return -ENOMEM;
495 case EFA_ADMIN_UNSUPPORTED_OPCODE:
496 return -EOPNOTSUPP;
497 case EFA_ADMIN_BAD_OPCODE:
498 case EFA_ADMIN_MALFORMED_REQUEST:
499 case EFA_ADMIN_ILLEGAL_PARAMETER:
500 case EFA_ADMIN_UNKNOWN_ERROR:
501 return -EINVAL;
502 default:
503 return -EINVAL;
504 }
505}
506
507static int efa_com_wait_and_process_admin_cq_polling(struct efa_comp_ctx *comp_ctx,
508 struct efa_com_admin_queue *aq)
509{
510 unsigned long timeout;
511 unsigned long flags;
512 int err;
513
514 timeout = jiffies + usecs_to_jiffies(aq->completion_timeout);
515
516 while (1) {
517 spin_lock_irqsave(&aq->cq.lock, flags);
518 efa_com_handle_admin_completion(aq);
519 spin_unlock_irqrestore(&aq->cq.lock, flags);
520
521 if (comp_ctx->status != EFA_CMD_SUBMITTED)
522 break;
523
524 if (time_is_before_jiffies(timeout)) {
525 ibdev_err_ratelimited(
526 aq->efa_dev,
527 "Wait for completion (polling) timeout\n");
528 /* EFA didn't have any completion */
529 atomic64_inc(&aq->stats.no_completion);
530
531 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
532 err = -ETIME;
533 goto out;
534 }
535
536 msleep(aq->poll_interval);
537 }
538
539 err = efa_com_comp_status_to_errno(comp_ctx->comp_status);
540out:
541 efa_com_put_comp_ctx(aq, comp_ctx);
542 return err;
543}
544
545static int efa_com_wait_and_process_admin_cq_interrupts(struct efa_comp_ctx *comp_ctx,
546 struct efa_com_admin_queue *aq)
547{
548 unsigned long flags;
549 int err;
550
551 wait_for_completion_timeout(&comp_ctx->wait_event,
552 usecs_to_jiffies(aq->completion_timeout));
553
554 /*
555 * In case the command wasn't completed find out the root cause.
556 * There might be 2 kinds of errors
557 * 1) No completion (timeout reached)
558 * 2) There is completion but the device didn't get any msi-x interrupt.
559 */
560 if (comp_ctx->status == EFA_CMD_SUBMITTED) {
561 spin_lock_irqsave(&aq->cq.lock, flags);
562 efa_com_handle_admin_completion(aq);
563 spin_unlock_irqrestore(&aq->cq.lock, flags);
564
565 atomic64_inc(&aq->stats.no_completion);
566
567 if (comp_ctx->status == EFA_CMD_COMPLETED)
568 ibdev_err_ratelimited(
569 aq->efa_dev,
570 "The device sent a completion but the driver didn't receive any MSI-X interrupt for admin cmd %s(%d) status %d (ctx: 0x%p, sq producer: %d, sq consumer: %d, cq consumer: %d)\n",
571 efa_com_cmd_str(comp_ctx->cmd_opcode),
572 comp_ctx->cmd_opcode, comp_ctx->status,
573 comp_ctx, aq->sq.pc, aq->sq.cc, aq->cq.cc);
574 else
575 ibdev_err_ratelimited(
576 aq->efa_dev,
577 "The device didn't send any completion for admin cmd %s(%d) status %d (ctx 0x%p, sq producer: %d, sq consumer: %d, cq consumer: %d)\n",
578 efa_com_cmd_str(comp_ctx->cmd_opcode),
579 comp_ctx->cmd_opcode, comp_ctx->status,
580 comp_ctx, aq->sq.pc, aq->sq.cc, aq->cq.cc);
581
582 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
583 err = -ETIME;
584 goto out;
585 }
586
587 err = efa_com_comp_status_to_errno(comp_ctx->comp_status);
588out:
589 efa_com_put_comp_ctx(aq, comp_ctx);
590 return err;
591}
592
593/*
594 * There are two types to wait for completion.
595 * Polling mode - wait until the completion is available.
596 * Async mode - wait on wait queue until the completion is ready
597 * (or the timeout expired).
598 * It is expected that the IRQ called efa_com_handle_admin_completion
599 * to mark the completions.
600 */
601static int efa_com_wait_and_process_admin_cq(struct efa_comp_ctx *comp_ctx,
602 struct efa_com_admin_queue *aq)
603{
604 if (test_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state))
605 return efa_com_wait_and_process_admin_cq_polling(comp_ctx, aq);
606
607 return efa_com_wait_and_process_admin_cq_interrupts(comp_ctx, aq);
608}
609
610/**
611 * efa_com_cmd_exec - Execute admin command
612 * @aq: admin queue.
613 * @cmd: the admin command to execute.
614 * @cmd_size: the command size.
615 * @comp: command completion return entry.
616 * @comp_size: command completion size.
617 * Submit an admin command and then wait until the device will return a
618 * completion.
619 * The completion will be copied into comp.
620 *
621 * @return - 0 on success, negative value on failure.
622 */
623int efa_com_cmd_exec(struct efa_com_admin_queue *aq,
624 struct efa_admin_aq_entry *cmd,
625 size_t cmd_size,
626 struct efa_admin_acq_entry *comp,
627 size_t comp_size)
628{
629 struct efa_comp_ctx *comp_ctx;
630 int err;
631
632 might_sleep();
633
634 /* In case of queue FULL */
635 down(&aq->avail_cmds);
636
637 ibdev_dbg(aq->efa_dev, "%s (opcode %d)\n",
638 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
639 cmd->aq_common_descriptor.opcode);
640 comp_ctx = efa_com_submit_admin_cmd(aq, cmd, cmd_size, comp, comp_size);
641 if (IS_ERR(comp_ctx)) {
642 ibdev_err_ratelimited(
643 aq->efa_dev,
644 "Failed to submit command %s (opcode %u) err %ld\n",
645 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
646 cmd->aq_common_descriptor.opcode, PTR_ERR(comp_ctx));
647
648 up(&aq->avail_cmds);
649 return PTR_ERR(comp_ctx);
650 }
651
652 err = efa_com_wait_and_process_admin_cq(comp_ctx, aq);
653 if (err)
654 ibdev_err_ratelimited(
655 aq->efa_dev,
656 "Failed to process command %s (opcode %u) comp_status %d err %d\n",
657 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
658 cmd->aq_common_descriptor.opcode, comp_ctx->comp_status,
659 err);
660
661 up(&aq->avail_cmds);
662
663 return err;
664}
665
666/**
667 * efa_com_admin_destroy - Destroy the admin and the async events queues.
668 * @edev: EFA communication layer struct
669 */
670void efa_com_admin_destroy(struct efa_com_dev *edev)
671{
672 struct efa_com_admin_queue *aq = &edev->aq;
673 struct efa_com_aenq *aenq = &edev->aenq;
674 struct efa_com_admin_cq *cq = &aq->cq;
675 struct efa_com_admin_sq *sq = &aq->sq;
676 u16 size;
677
678 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
679
680 devm_kfree(edev->dmadev, aq->comp_ctx_pool);
681 devm_kfree(edev->dmadev, aq->comp_ctx);
682
683 size = aq->depth * sizeof(*sq->entries);
684 dma_free_coherent(edev->dmadev, size, sq->entries, sq->dma_addr);
685
686 size = aq->depth * sizeof(*cq->entries);
687 dma_free_coherent(edev->dmadev, size, cq->entries, cq->dma_addr);
688
689 size = aenq->depth * sizeof(*aenq->entries);
690 dma_free_coherent(edev->dmadev, size, aenq->entries, aenq->dma_addr);
691}
692
693/**
694 * efa_com_set_admin_polling_mode - Set the admin completion queue polling mode
695 * @edev: EFA communication layer struct
696 * @polling: Enable/Disable polling mode
697 *
698 * Set the admin completion mode.
699 */
700void efa_com_set_admin_polling_mode(struct efa_com_dev *edev, bool polling)
701{
702 u32 mask_value = 0;
703
704 if (polling)
705 mask_value = EFA_REGS_ADMIN_INTR_MASK;
706
707 writel(mask_value, edev->reg_bar + EFA_REGS_INTR_MASK_OFF);
708 if (polling)
709 set_bit(EFA_AQ_STATE_POLLING_BIT, &edev->aq.state);
710 else
711 clear_bit(EFA_AQ_STATE_POLLING_BIT, &edev->aq.state);
712}
713
714static void efa_com_stats_init(struct efa_com_dev *edev)
715{
716 atomic64_t *s = (atomic64_t *)&edev->aq.stats;
717 int i;
718
719 for (i = 0; i < sizeof(edev->aq.stats) / sizeof(*s); i++, s++)
720 atomic64_set(s, 0);
721}
722
723/**
724 * efa_com_admin_init - Init the admin and the async queues
725 * @edev: EFA communication layer struct
726 * @aenq_handlers: Those handlers to be called upon event.
727 *
728 * Initialize the admin submission and completion queues.
729 * Initialize the asynchronous events notification queues.
730 *
731 * @return - 0 on success, negative value on failure.
732 */
733int efa_com_admin_init(struct efa_com_dev *edev,
734 struct efa_aenq_handlers *aenq_handlers)
735{
736 struct efa_com_admin_queue *aq = &edev->aq;
737 u32 timeout;
738 u32 dev_sts;
739 u32 cap;
740 int err;
741
742 dev_sts = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
743 if (!(dev_sts & EFA_REGS_DEV_STS_READY_MASK)) {
744 ibdev_err(edev->efa_dev,
745 "Device isn't ready, abort com init %#x\n", dev_sts);
746 return -ENODEV;
747 }
748
749 aq->depth = EFA_ADMIN_QUEUE_DEPTH;
750
751 aq->dmadev = edev->dmadev;
752 aq->efa_dev = edev->efa_dev;
753 set_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state);
754
755 sema_init(&aq->avail_cmds, aq->depth);
756
757 efa_com_stats_init(edev);
758
759 err = efa_com_init_comp_ctxt(aq);
760 if (err)
761 return err;
762
763 err = efa_com_admin_init_sq(edev);
764 if (err)
765 goto err_destroy_comp_ctxt;
766
767 err = efa_com_admin_init_cq(edev);
768 if (err)
769 goto err_destroy_sq;
770
771 efa_com_set_admin_polling_mode(edev, false);
772
773 err = efa_com_admin_init_aenq(edev, aenq_handlers);
774 if (err)
775 goto err_destroy_cq;
776
777 cap = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
778 timeout = (cap & EFA_REGS_CAPS_ADMIN_CMD_TO_MASK) >>
779 EFA_REGS_CAPS_ADMIN_CMD_TO_SHIFT;
780 if (timeout)
781 /* the resolution of timeout reg is 100ms */
782 aq->completion_timeout = timeout * 100000;
783 else
784 aq->completion_timeout = ADMIN_CMD_TIMEOUT_US;
785
786 aq->poll_interval = EFA_POLL_INTERVAL_MS;
787
788 set_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
789
790 return 0;
791
792err_destroy_cq:
793 dma_free_coherent(edev->dmadev, aq->depth * sizeof(*aq->cq.entries),
794 aq->cq.entries, aq->cq.dma_addr);
795err_destroy_sq:
796 dma_free_coherent(edev->dmadev, aq->depth * sizeof(*aq->sq.entries),
797 aq->sq.entries, aq->sq.dma_addr);
798err_destroy_comp_ctxt:
799 devm_kfree(edev->dmadev, aq->comp_ctx);
800
801 return err;
802}
803
804/**
805 * efa_com_admin_q_comp_intr_handler - admin queue interrupt handler
806 * @edev: EFA communication layer struct
807 *
808 * This method goes over the admin completion queue and wakes up
809 * all the pending threads that wait on the commands wait event.
810 *
811 * @note: Should be called after MSI-X interrupt.
812 */
813void efa_com_admin_q_comp_intr_handler(struct efa_com_dev *edev)
814{
815 unsigned long flags;
816
817 spin_lock_irqsave(&edev->aq.cq.lock, flags);
818 efa_com_handle_admin_completion(&edev->aq);
819 spin_unlock_irqrestore(&edev->aq.cq.lock, flags);
820}
821
822/*
823 * efa_handle_specific_aenq_event:
824 * return the handler that is relevant to the specific event group
825 */
826static efa_aenq_handler efa_com_get_specific_aenq_cb(struct efa_com_dev *edev,
827 u16 group)
828{
829 struct efa_aenq_handlers *aenq_handlers = edev->aenq.aenq_handlers;
830
831 if (group < EFA_MAX_HANDLERS && aenq_handlers->handlers[group])
832 return aenq_handlers->handlers[group];
833
834 return aenq_handlers->unimplemented_handler;
835}
836
837/**
838 * efa_com_aenq_intr_handler - AENQ interrupt handler
839 * @edev: EFA communication layer struct
840 * @data: Data of interrupt handler.
841 *
842 * Go over the async event notification queue and call the proper aenq handler.
843 */
844void efa_com_aenq_intr_handler(struct efa_com_dev *edev, void *data)
845{
846 struct efa_admin_aenq_common_desc *aenq_common;
847 struct efa_com_aenq *aenq = &edev->aenq;
848 struct efa_admin_aenq_entry *aenq_e;
849 efa_aenq_handler handler_cb;
850 u32 processed = 0;
851 u8 phase;
852 u32 ci;
853
854 ci = aenq->cc & (aenq->depth - 1);
855 phase = aenq->phase;
856 aenq_e = &aenq->entries[ci]; /* Get first entry */
857 aenq_common = &aenq_e->aenq_common_desc;
858
859 /* Go over all the events */
860 while ((READ_ONCE(aenq_common->flags) &
861 EFA_ADMIN_AENQ_COMMON_DESC_PHASE_MASK) == phase) {
862 /*
863 * Do not read the rest of the completion entry before the
864 * phase bit was validated
865 */
866 dma_rmb();
867
868 /* Handle specific event*/
869 handler_cb = efa_com_get_specific_aenq_cb(edev,
870 aenq_common->group);
871 handler_cb(data, aenq_e); /* call the actual event handler*/
872
873 /* Get next event entry */
874 ci++;
875 processed++;
876
877 if (ci == aenq->depth) {
878 ci = 0;
879 phase = !phase;
880 }
881 aenq_e = &aenq->entries[ci];
882 aenq_common = &aenq_e->aenq_common_desc;
883 }
884
885 aenq->cc += processed;
886 aenq->phase = phase;
887
888 /* Don't update aenq doorbell if there weren't any processed events */
889 if (!processed)
890 return;
891
892 /* barrier not needed in case of writel */
893 writel(aenq->cc, edev->reg_bar + EFA_REGS_AENQ_CONS_DB_OFF);
894}
895
896static void efa_com_mmio_reg_read_resp_addr_init(struct efa_com_dev *edev)
897{
898 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
899 u32 addr_high;
900 u32 addr_low;
901
902 /* dma_addr_bits is unknown at this point */
903 addr_high = (mmio_read->read_resp_dma_addr >> 32) & GENMASK(31, 0);
904 addr_low = mmio_read->read_resp_dma_addr & GENMASK(31, 0);
905
906 writel(addr_high, edev->reg_bar + EFA_REGS_MMIO_RESP_HI_OFF);
907 writel(addr_low, edev->reg_bar + EFA_REGS_MMIO_RESP_LO_OFF);
908}
909
910int efa_com_mmio_reg_read_init(struct efa_com_dev *edev)
911{
912 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
913
914 spin_lock_init(&mmio_read->lock);
915 mmio_read->read_resp =
916 dma_alloc_coherent(edev->dmadev, sizeof(*mmio_read->read_resp),
917 &mmio_read->read_resp_dma_addr, GFP_KERNEL);
918 if (!mmio_read->read_resp)
919 return -ENOMEM;
920
921 efa_com_mmio_reg_read_resp_addr_init(edev);
922
923 mmio_read->read_resp->req_id = 0;
924 mmio_read->seq_num = 0;
925 mmio_read->mmio_read_timeout = EFA_REG_READ_TIMEOUT_US;
926
927 return 0;
928}
929
930void efa_com_mmio_reg_read_destroy(struct efa_com_dev *edev)
931{
932 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
933
934 dma_free_coherent(edev->dmadev, sizeof(*mmio_read->read_resp),
935 mmio_read->read_resp, mmio_read->read_resp_dma_addr);
936}
937
938int efa_com_validate_version(struct efa_com_dev *edev)
939{
940 u32 ctrl_ver_masked;
941 u32 ctrl_ver;
942 u32 ver;
943
944 /*
945 * Make sure the EFA version and the controller version are at least
946 * as the driver expects
947 */
948 ver = efa_com_reg_read32(edev, EFA_REGS_VERSION_OFF);
949 ctrl_ver = efa_com_reg_read32(edev,
950 EFA_REGS_CONTROLLER_VERSION_OFF);
951
952 ibdev_dbg(edev->efa_dev, "efa device version: %d.%d\n",
953 (ver & EFA_REGS_VERSION_MAJOR_VERSION_MASK) >>
954 EFA_REGS_VERSION_MAJOR_VERSION_SHIFT,
955 ver & EFA_REGS_VERSION_MINOR_VERSION_MASK);
956
957 if (ver < MIN_EFA_VER) {
958 ibdev_err(edev->efa_dev,
959 "EFA version is lower than the minimal version the driver supports\n");
960 return -EOPNOTSUPP;
961 }
962
963 ibdev_dbg(edev->efa_dev,
964 "efa controller version: %d.%d.%d implementation version %d\n",
965 (ctrl_ver & EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION_MASK) >>
966 EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION_SHIFT,
967 (ctrl_ver & EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION_MASK) >>
968 EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION_SHIFT,
969 (ctrl_ver & EFA_REGS_CONTROLLER_VERSION_SUBMINOR_VERSION_MASK),
970 (ctrl_ver & EFA_REGS_CONTROLLER_VERSION_IMPL_ID_MASK) >>
971 EFA_REGS_CONTROLLER_VERSION_IMPL_ID_SHIFT);
972
973 ctrl_ver_masked =
974 (ctrl_ver & EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION_MASK) |
975 (ctrl_ver & EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION_MASK) |
976 (ctrl_ver & EFA_REGS_CONTROLLER_VERSION_SUBMINOR_VERSION_MASK);
977
978 /* Validate the ctrl version without the implementation ID */
979 if (ctrl_ver_masked < MIN_EFA_CTRL_VER) {
980 ibdev_err(edev->efa_dev,
981 "EFA ctrl version is lower than the minimal ctrl version the driver supports\n");
982 return -EOPNOTSUPP;
983 }
984
985 return 0;
986}
987
988/**
989 * efa_com_get_dma_width - Retrieve physical dma address width the device
990 * supports.
991 * @edev: EFA communication layer struct
992 *
993 * Retrieve the maximum physical address bits the device can handle.
994 *
995 * @return: > 0 on Success and negative value otherwise.
996 */
997int efa_com_get_dma_width(struct efa_com_dev *edev)
998{
999 u32 caps = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
1000 int width;
1001
1002 width = (caps & EFA_REGS_CAPS_DMA_ADDR_WIDTH_MASK) >>
1003 EFA_REGS_CAPS_DMA_ADDR_WIDTH_SHIFT;
1004
1005 ibdev_dbg(edev->efa_dev, "DMA width: %d\n", width);
1006
1007 if (width < 32 || width > 64) {
1008 ibdev_err(edev->efa_dev, "DMA width illegal value: %d\n", width);
1009 return -EINVAL;
1010 }
1011
1012 edev->dma_addr_bits = width;
1013
1014 return width;
1015}
1016
1017static int wait_for_reset_state(struct efa_com_dev *edev, u32 timeout,
1018 u16 exp_state)
1019{
1020 u32 val, i;
1021
1022 for (i = 0; i < timeout; i++) {
1023 val = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
1024
1025 if ((val & EFA_REGS_DEV_STS_RESET_IN_PROGRESS_MASK) ==
1026 exp_state)
1027 return 0;
1028
1029 ibdev_dbg(edev->efa_dev, "Reset indication val %d\n", val);
1030 msleep(EFA_POLL_INTERVAL_MS);
1031 }
1032
1033 return -ETIME;
1034}
1035
1036/**
1037 * efa_com_dev_reset - Perform device FLR to the device.
1038 * @edev: EFA communication layer struct
1039 * @reset_reason: Specify what is the trigger for the reset in case of an error.
1040 *
1041 * @return - 0 on success, negative value on failure.
1042 */
1043int efa_com_dev_reset(struct efa_com_dev *edev,
1044 enum efa_regs_reset_reason_types reset_reason)
1045{
1046 u32 stat, timeout, cap, reset_val;
1047 int err;
1048
1049 stat = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
1050 cap = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
1051
1052 if (!(stat & EFA_REGS_DEV_STS_READY_MASK)) {
1053 ibdev_err(edev->efa_dev,
1054 "Device isn't ready, can't reset device\n");
1055 return -EINVAL;
1056 }
1057
1058 timeout = (cap & EFA_REGS_CAPS_RESET_TIMEOUT_MASK) >>
1059 EFA_REGS_CAPS_RESET_TIMEOUT_SHIFT;
1060 if (!timeout) {
1061 ibdev_err(edev->efa_dev, "Invalid timeout value\n");
1062 return -EINVAL;
1063 }
1064
1065 /* start reset */
1066 reset_val = EFA_REGS_DEV_CTL_DEV_RESET_MASK;
1067 reset_val |= (reset_reason << EFA_REGS_DEV_CTL_RESET_REASON_SHIFT) &
1068 EFA_REGS_DEV_CTL_RESET_REASON_MASK;
1069 writel(reset_val, edev->reg_bar + EFA_REGS_DEV_CTL_OFF);
1070
1071 /* reset clears the mmio readless address, restore it */
1072 efa_com_mmio_reg_read_resp_addr_init(edev);
1073
1074 err = wait_for_reset_state(edev, timeout,
1075 EFA_REGS_DEV_STS_RESET_IN_PROGRESS_MASK);
1076 if (err) {
1077 ibdev_err(edev->efa_dev, "Reset indication didn't turn on\n");
1078 return err;
1079 }
1080
1081 /* reset done */
1082 writel(0, edev->reg_bar + EFA_REGS_DEV_CTL_OFF);
1083 err = wait_for_reset_state(edev, timeout, 0);
1084 if (err) {
1085 ibdev_err(edev->efa_dev, "Reset indication didn't turn off\n");
1086 return err;
1087 }
1088
1089 timeout = (cap & EFA_REGS_CAPS_ADMIN_CMD_TO_MASK) >>
1090 EFA_REGS_CAPS_ADMIN_CMD_TO_SHIFT;
1091 if (timeout)
1092 /* the resolution of timeout reg is 100ms */
1093 edev->aq.completion_timeout = timeout * 100000;
1094 else
1095 edev->aq.completion_timeout = ADMIN_CMD_TIMEOUT_US;
1096
1097 return 0;
1098}