WIP FPC-III support
[linux/fpc-iii.git] / drivers / infiniband / hw / efa / efa_com.c
blob336bc2c57bb1d0eb83bd1c0819c4964e99ca0451
1 // SPDX-License-Identifier: GPL-2.0 OR BSD-2-Clause
2 /*
3 * Copyright 2018-2020 Amazon.com, Inc. or its affiliates. All rights reserved.
4 */
6 #include "efa_com.h"
7 #include "efa_regs_defs.h"
9 #define ADMIN_CMD_TIMEOUT_US 30000000 /* usecs */
11 #define EFA_REG_READ_TIMEOUT_US 50000 /* usecs */
12 #define EFA_MMIO_READ_INVALID 0xffffffff
14 #define EFA_POLL_INTERVAL_MS 100 /* msecs */
16 #define EFA_ASYNC_QUEUE_DEPTH 16
17 #define EFA_ADMIN_QUEUE_DEPTH 32
19 #define EFA_CTRL_MAJOR 0
20 #define EFA_CTRL_MINOR 0
21 #define EFA_CTRL_SUB_MINOR 1
23 #define EFA_DMA_ADDR_TO_UINT32_LOW(x) ((u32)((u64)(x)))
24 #define EFA_DMA_ADDR_TO_UINT32_HIGH(x) ((u32)(((u64)(x)) >> 32))
26 enum efa_cmd_status {
27 EFA_CMD_SUBMITTED,
28 EFA_CMD_COMPLETED,
31 struct efa_comp_ctx {
32 struct completion wait_event;
33 struct efa_admin_acq_entry *user_cqe;
34 u32 comp_size;
35 enum efa_cmd_status status;
36 /* status from the device */
37 u8 comp_status;
38 u8 cmd_opcode;
39 u8 occupied;
42 static const char *efa_com_cmd_str(u8 cmd)
44 #define EFA_CMD_STR_CASE(_cmd) case EFA_ADMIN_##_cmd: return #_cmd
46 switch (cmd) {
47 EFA_CMD_STR_CASE(CREATE_QP);
48 EFA_CMD_STR_CASE(MODIFY_QP);
49 EFA_CMD_STR_CASE(QUERY_QP);
50 EFA_CMD_STR_CASE(DESTROY_QP);
51 EFA_CMD_STR_CASE(CREATE_AH);
52 EFA_CMD_STR_CASE(DESTROY_AH);
53 EFA_CMD_STR_CASE(REG_MR);
54 EFA_CMD_STR_CASE(DEREG_MR);
55 EFA_CMD_STR_CASE(CREATE_CQ);
56 EFA_CMD_STR_CASE(DESTROY_CQ);
57 EFA_CMD_STR_CASE(GET_FEATURE);
58 EFA_CMD_STR_CASE(SET_FEATURE);
59 EFA_CMD_STR_CASE(GET_STATS);
60 EFA_CMD_STR_CASE(ALLOC_PD);
61 EFA_CMD_STR_CASE(DEALLOC_PD);
62 EFA_CMD_STR_CASE(ALLOC_UAR);
63 EFA_CMD_STR_CASE(DEALLOC_UAR);
64 default: return "unknown command opcode";
66 #undef EFA_CMD_STR_CASE
69 static u32 efa_com_reg_read32(struct efa_com_dev *edev, u16 offset)
71 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
72 struct efa_admin_mmio_req_read_less_resp *read_resp;
73 unsigned long exp_time;
74 u32 mmio_read_reg = 0;
75 u32 err;
77 read_resp = mmio_read->read_resp;
79 spin_lock(&mmio_read->lock);
80 mmio_read->seq_num++;
82 /* trash DMA req_id to identify when hardware is done */
83 read_resp->req_id = mmio_read->seq_num + 0x9aL;
84 EFA_SET(&mmio_read_reg, EFA_REGS_MMIO_REG_READ_REG_OFF, offset);
85 EFA_SET(&mmio_read_reg, EFA_REGS_MMIO_REG_READ_REQ_ID,
86 mmio_read->seq_num);
88 writel(mmio_read_reg, edev->reg_bar + EFA_REGS_MMIO_REG_READ_OFF);
90 exp_time = jiffies + usecs_to_jiffies(mmio_read->mmio_read_timeout);
91 do {
92 if (READ_ONCE(read_resp->req_id) == mmio_read->seq_num)
93 break;
94 udelay(1);
95 } while (time_is_after_jiffies(exp_time));
97 if (read_resp->req_id != mmio_read->seq_num) {
98 ibdev_err_ratelimited(
99 edev->efa_dev,
100 "Reading register timed out. expected: req id[%u] offset[%#x] actual: req id[%u] offset[%#x]\n",
101 mmio_read->seq_num, offset, read_resp->req_id,
102 read_resp->reg_off);
103 err = EFA_MMIO_READ_INVALID;
104 goto out;
107 if (read_resp->reg_off != offset) {
108 ibdev_err_ratelimited(
109 edev->efa_dev,
110 "Reading register failed: wrong offset provided\n");
111 err = EFA_MMIO_READ_INVALID;
112 goto out;
115 err = read_resp->reg_val;
116 out:
117 spin_unlock(&mmio_read->lock);
118 return err;
121 static int efa_com_admin_init_sq(struct efa_com_dev *edev)
123 struct efa_com_admin_queue *aq = &edev->aq;
124 struct efa_com_admin_sq *sq = &aq->sq;
125 u16 size = aq->depth * sizeof(*sq->entries);
126 u32 aq_caps = 0;
127 u32 addr_high;
128 u32 addr_low;
130 sq->entries =
131 dma_alloc_coherent(aq->dmadev, size, &sq->dma_addr, GFP_KERNEL);
132 if (!sq->entries)
133 return -ENOMEM;
135 spin_lock_init(&sq->lock);
137 sq->cc = 0;
138 sq->pc = 0;
139 sq->phase = 1;
141 sq->db_addr = (u32 __iomem *)(edev->reg_bar + EFA_REGS_AQ_PROD_DB_OFF);
143 addr_high = EFA_DMA_ADDR_TO_UINT32_HIGH(sq->dma_addr);
144 addr_low = EFA_DMA_ADDR_TO_UINT32_LOW(sq->dma_addr);
146 writel(addr_low, edev->reg_bar + EFA_REGS_AQ_BASE_LO_OFF);
147 writel(addr_high, edev->reg_bar + EFA_REGS_AQ_BASE_HI_OFF);
149 EFA_SET(&aq_caps, EFA_REGS_AQ_CAPS_AQ_DEPTH, aq->depth);
150 EFA_SET(&aq_caps, EFA_REGS_AQ_CAPS_AQ_ENTRY_SIZE,
151 sizeof(struct efa_admin_aq_entry));
153 writel(aq_caps, edev->reg_bar + EFA_REGS_AQ_CAPS_OFF);
155 return 0;
158 static int efa_com_admin_init_cq(struct efa_com_dev *edev)
160 struct efa_com_admin_queue *aq = &edev->aq;
161 struct efa_com_admin_cq *cq = &aq->cq;
162 u16 size = aq->depth * sizeof(*cq->entries);
163 u32 acq_caps = 0;
164 u32 addr_high;
165 u32 addr_low;
167 cq->entries =
168 dma_alloc_coherent(aq->dmadev, size, &cq->dma_addr, GFP_KERNEL);
169 if (!cq->entries)
170 return -ENOMEM;
172 spin_lock_init(&cq->lock);
174 cq->cc = 0;
175 cq->phase = 1;
177 addr_high = EFA_DMA_ADDR_TO_UINT32_HIGH(cq->dma_addr);
178 addr_low = EFA_DMA_ADDR_TO_UINT32_LOW(cq->dma_addr);
180 writel(addr_low, edev->reg_bar + EFA_REGS_ACQ_BASE_LO_OFF);
181 writel(addr_high, edev->reg_bar + EFA_REGS_ACQ_BASE_HI_OFF);
183 EFA_SET(&acq_caps, EFA_REGS_ACQ_CAPS_ACQ_DEPTH, aq->depth);
184 EFA_SET(&acq_caps, EFA_REGS_ACQ_CAPS_ACQ_ENTRY_SIZE,
185 sizeof(struct efa_admin_acq_entry));
186 EFA_SET(&acq_caps, EFA_REGS_ACQ_CAPS_ACQ_MSIX_VECTOR,
187 aq->msix_vector_idx);
189 writel(acq_caps, edev->reg_bar + EFA_REGS_ACQ_CAPS_OFF);
191 return 0;
194 static int efa_com_admin_init_aenq(struct efa_com_dev *edev,
195 struct efa_aenq_handlers *aenq_handlers)
197 struct efa_com_aenq *aenq = &edev->aenq;
198 u32 addr_low, addr_high;
199 u32 aenq_caps = 0;
200 u16 size;
202 if (!aenq_handlers) {
203 ibdev_err(edev->efa_dev, "aenq handlers pointer is NULL\n");
204 return -EINVAL;
207 size = EFA_ASYNC_QUEUE_DEPTH * sizeof(*aenq->entries);
208 aenq->entries = dma_alloc_coherent(edev->dmadev, size, &aenq->dma_addr,
209 GFP_KERNEL);
210 if (!aenq->entries)
211 return -ENOMEM;
213 aenq->aenq_handlers = aenq_handlers;
214 aenq->depth = EFA_ASYNC_QUEUE_DEPTH;
215 aenq->cc = 0;
216 aenq->phase = 1;
218 addr_low = EFA_DMA_ADDR_TO_UINT32_LOW(aenq->dma_addr);
219 addr_high = EFA_DMA_ADDR_TO_UINT32_HIGH(aenq->dma_addr);
221 writel(addr_low, edev->reg_bar + EFA_REGS_AENQ_BASE_LO_OFF);
222 writel(addr_high, edev->reg_bar + EFA_REGS_AENQ_BASE_HI_OFF);
224 EFA_SET(&aenq_caps, EFA_REGS_AENQ_CAPS_AENQ_DEPTH, aenq->depth);
225 EFA_SET(&aenq_caps, EFA_REGS_AENQ_CAPS_AENQ_ENTRY_SIZE,
226 sizeof(struct efa_admin_aenq_entry));
227 EFA_SET(&aenq_caps, EFA_REGS_AENQ_CAPS_AENQ_MSIX_VECTOR,
228 aenq->msix_vector_idx);
229 writel(aenq_caps, edev->reg_bar + EFA_REGS_AENQ_CAPS_OFF);
232 * Init cons_db to mark that all entries in the queue
233 * are initially available
235 writel(edev->aenq.cc, edev->reg_bar + EFA_REGS_AENQ_CONS_DB_OFF);
237 return 0;
240 /* ID to be used with efa_com_get_comp_ctx */
241 static u16 efa_com_alloc_ctx_id(struct efa_com_admin_queue *aq)
243 u16 ctx_id;
245 spin_lock(&aq->comp_ctx_lock);
246 ctx_id = aq->comp_ctx_pool[aq->comp_ctx_pool_next];
247 aq->comp_ctx_pool_next++;
248 spin_unlock(&aq->comp_ctx_lock);
250 return ctx_id;
253 static void efa_com_dealloc_ctx_id(struct efa_com_admin_queue *aq,
254 u16 ctx_id)
256 spin_lock(&aq->comp_ctx_lock);
257 aq->comp_ctx_pool_next--;
258 aq->comp_ctx_pool[aq->comp_ctx_pool_next] = ctx_id;
259 spin_unlock(&aq->comp_ctx_lock);
262 static inline void efa_com_put_comp_ctx(struct efa_com_admin_queue *aq,
263 struct efa_comp_ctx *comp_ctx)
265 u16 cmd_id = EFA_GET(&comp_ctx->user_cqe->acq_common_descriptor.command,
266 EFA_ADMIN_ACQ_COMMON_DESC_COMMAND_ID);
267 u16 ctx_id = cmd_id & (aq->depth - 1);
269 ibdev_dbg(aq->efa_dev, "Put completion command_id %#x\n", cmd_id);
270 comp_ctx->occupied = 0;
271 efa_com_dealloc_ctx_id(aq, ctx_id);
274 static struct efa_comp_ctx *efa_com_get_comp_ctx(struct efa_com_admin_queue *aq,
275 u16 cmd_id, bool capture)
277 u16 ctx_id = cmd_id & (aq->depth - 1);
279 if (aq->comp_ctx[ctx_id].occupied && capture) {
280 ibdev_err_ratelimited(
281 aq->efa_dev,
282 "Completion context for command_id %#x is occupied\n",
283 cmd_id);
284 return NULL;
287 if (capture) {
288 aq->comp_ctx[ctx_id].occupied = 1;
289 ibdev_dbg(aq->efa_dev,
290 "Take completion ctxt for command_id %#x\n", cmd_id);
293 return &aq->comp_ctx[ctx_id];
296 static struct efa_comp_ctx *__efa_com_submit_admin_cmd(struct efa_com_admin_queue *aq,
297 struct efa_admin_aq_entry *cmd,
298 size_t cmd_size_in_bytes,
299 struct efa_admin_acq_entry *comp,
300 size_t comp_size_in_bytes)
302 struct efa_admin_aq_entry *aqe;
303 struct efa_comp_ctx *comp_ctx;
304 u16 queue_size_mask;
305 u16 cmd_id;
306 u16 ctx_id;
307 u16 pi;
309 queue_size_mask = aq->depth - 1;
310 pi = aq->sq.pc & queue_size_mask;
312 ctx_id = efa_com_alloc_ctx_id(aq);
314 /* cmd_id LSBs are the ctx_id and MSBs are entropy bits from pc */
315 cmd_id = ctx_id & queue_size_mask;
316 cmd_id |= aq->sq.pc & ~queue_size_mask;
317 cmd_id &= EFA_ADMIN_AQ_COMMON_DESC_COMMAND_ID_MASK;
319 cmd->aq_common_descriptor.command_id = cmd_id;
320 EFA_SET(&cmd->aq_common_descriptor.flags,
321 EFA_ADMIN_AQ_COMMON_DESC_PHASE, aq->sq.phase);
323 comp_ctx = efa_com_get_comp_ctx(aq, cmd_id, true);
324 if (!comp_ctx) {
325 efa_com_dealloc_ctx_id(aq, ctx_id);
326 return ERR_PTR(-EINVAL);
329 comp_ctx->status = EFA_CMD_SUBMITTED;
330 comp_ctx->comp_size = comp_size_in_bytes;
331 comp_ctx->user_cqe = comp;
332 comp_ctx->cmd_opcode = cmd->aq_common_descriptor.opcode;
334 reinit_completion(&comp_ctx->wait_event);
336 aqe = &aq->sq.entries[pi];
337 memset(aqe, 0, sizeof(*aqe));
338 memcpy(aqe, cmd, cmd_size_in_bytes);
340 aq->sq.pc++;
341 atomic64_inc(&aq->stats.submitted_cmd);
343 if ((aq->sq.pc & queue_size_mask) == 0)
344 aq->sq.phase = !aq->sq.phase;
346 /* barrier not needed in case of writel */
347 writel(aq->sq.pc, aq->sq.db_addr);
349 return comp_ctx;
352 static inline int efa_com_init_comp_ctxt(struct efa_com_admin_queue *aq)
354 size_t pool_size = aq->depth * sizeof(*aq->comp_ctx_pool);
355 size_t size = aq->depth * sizeof(struct efa_comp_ctx);
356 struct efa_comp_ctx *comp_ctx;
357 u16 i;
359 aq->comp_ctx = devm_kzalloc(aq->dmadev, size, GFP_KERNEL);
360 aq->comp_ctx_pool = devm_kzalloc(aq->dmadev, pool_size, GFP_KERNEL);
361 if (!aq->comp_ctx || !aq->comp_ctx_pool) {
362 devm_kfree(aq->dmadev, aq->comp_ctx_pool);
363 devm_kfree(aq->dmadev, aq->comp_ctx);
364 return -ENOMEM;
367 for (i = 0; i < aq->depth; i++) {
368 comp_ctx = efa_com_get_comp_ctx(aq, i, false);
369 if (comp_ctx)
370 init_completion(&comp_ctx->wait_event);
372 aq->comp_ctx_pool[i] = i;
375 spin_lock_init(&aq->comp_ctx_lock);
377 aq->comp_ctx_pool_next = 0;
379 return 0;
382 static struct efa_comp_ctx *efa_com_submit_admin_cmd(struct efa_com_admin_queue *aq,
383 struct efa_admin_aq_entry *cmd,
384 size_t cmd_size_in_bytes,
385 struct efa_admin_acq_entry *comp,
386 size_t comp_size_in_bytes)
388 struct efa_comp_ctx *comp_ctx;
390 spin_lock(&aq->sq.lock);
391 if (!test_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state)) {
392 ibdev_err_ratelimited(aq->efa_dev, "Admin queue is closed\n");
393 spin_unlock(&aq->sq.lock);
394 return ERR_PTR(-ENODEV);
397 comp_ctx = __efa_com_submit_admin_cmd(aq, cmd, cmd_size_in_bytes, comp,
398 comp_size_in_bytes);
399 spin_unlock(&aq->sq.lock);
400 if (IS_ERR(comp_ctx))
401 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
403 return comp_ctx;
406 static void efa_com_handle_single_admin_completion(struct efa_com_admin_queue *aq,
407 struct efa_admin_acq_entry *cqe)
409 struct efa_comp_ctx *comp_ctx;
410 u16 cmd_id;
412 cmd_id = EFA_GET(&cqe->acq_common_descriptor.command,
413 EFA_ADMIN_ACQ_COMMON_DESC_COMMAND_ID);
415 comp_ctx = efa_com_get_comp_ctx(aq, cmd_id, false);
416 if (!comp_ctx) {
417 ibdev_err(aq->efa_dev,
418 "comp_ctx is NULL. Changing the admin queue running state\n");
419 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
420 return;
423 comp_ctx->status = EFA_CMD_COMPLETED;
424 comp_ctx->comp_status = cqe->acq_common_descriptor.status;
425 if (comp_ctx->user_cqe)
426 memcpy(comp_ctx->user_cqe, cqe, comp_ctx->comp_size);
428 if (!test_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state))
429 complete(&comp_ctx->wait_event);
432 static void efa_com_handle_admin_completion(struct efa_com_admin_queue *aq)
434 struct efa_admin_acq_entry *cqe;
435 u16 queue_size_mask;
436 u16 comp_num = 0;
437 u8 phase;
438 u16 ci;
440 queue_size_mask = aq->depth - 1;
442 ci = aq->cq.cc & queue_size_mask;
443 phase = aq->cq.phase;
445 cqe = &aq->cq.entries[ci];
447 /* Go over all the completions */
448 while ((READ_ONCE(cqe->acq_common_descriptor.flags) &
449 EFA_ADMIN_ACQ_COMMON_DESC_PHASE_MASK) == phase) {
451 * Do not read the rest of the completion entry before the
452 * phase bit was validated
454 dma_rmb();
455 efa_com_handle_single_admin_completion(aq, cqe);
457 ci++;
458 comp_num++;
459 if (ci == aq->depth) {
460 ci = 0;
461 phase = !phase;
464 cqe = &aq->cq.entries[ci];
467 aq->cq.cc += comp_num;
468 aq->cq.phase = phase;
469 aq->sq.cc += comp_num;
470 atomic64_add(comp_num, &aq->stats.completed_cmd);
473 static int efa_com_comp_status_to_errno(u8 comp_status)
475 switch (comp_status) {
476 case EFA_ADMIN_SUCCESS:
477 return 0;
478 case EFA_ADMIN_RESOURCE_ALLOCATION_FAILURE:
479 return -ENOMEM;
480 case EFA_ADMIN_UNSUPPORTED_OPCODE:
481 return -EOPNOTSUPP;
482 case EFA_ADMIN_BAD_OPCODE:
483 case EFA_ADMIN_MALFORMED_REQUEST:
484 case EFA_ADMIN_ILLEGAL_PARAMETER:
485 case EFA_ADMIN_UNKNOWN_ERROR:
486 return -EINVAL;
487 default:
488 return -EINVAL;
492 static int efa_com_wait_and_process_admin_cq_polling(struct efa_comp_ctx *comp_ctx,
493 struct efa_com_admin_queue *aq)
495 unsigned long timeout;
496 unsigned long flags;
497 int err;
499 timeout = jiffies + usecs_to_jiffies(aq->completion_timeout);
501 while (1) {
502 spin_lock_irqsave(&aq->cq.lock, flags);
503 efa_com_handle_admin_completion(aq);
504 spin_unlock_irqrestore(&aq->cq.lock, flags);
506 if (comp_ctx->status != EFA_CMD_SUBMITTED)
507 break;
509 if (time_is_before_jiffies(timeout)) {
510 ibdev_err_ratelimited(
511 aq->efa_dev,
512 "Wait for completion (polling) timeout\n");
513 /* EFA didn't have any completion */
514 atomic64_inc(&aq->stats.no_completion);
516 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
517 err = -ETIME;
518 goto out;
521 msleep(aq->poll_interval);
524 err = efa_com_comp_status_to_errno(comp_ctx->comp_status);
525 out:
526 efa_com_put_comp_ctx(aq, comp_ctx);
527 return err;
530 static int efa_com_wait_and_process_admin_cq_interrupts(struct efa_comp_ctx *comp_ctx,
531 struct efa_com_admin_queue *aq)
533 unsigned long flags;
534 int err;
536 wait_for_completion_timeout(&comp_ctx->wait_event,
537 usecs_to_jiffies(aq->completion_timeout));
540 * In case the command wasn't completed find out the root cause.
541 * There might be 2 kinds of errors
542 * 1) No completion (timeout reached)
543 * 2) There is completion but the device didn't get any msi-x interrupt.
545 if (comp_ctx->status == EFA_CMD_SUBMITTED) {
546 spin_lock_irqsave(&aq->cq.lock, flags);
547 efa_com_handle_admin_completion(aq);
548 spin_unlock_irqrestore(&aq->cq.lock, flags);
550 atomic64_inc(&aq->stats.no_completion);
552 if (comp_ctx->status == EFA_CMD_COMPLETED)
553 ibdev_err_ratelimited(
554 aq->efa_dev,
555 "The device sent a completion but the driver didn't receive any MSI-X interrupt for admin cmd %s(%d) status %d (ctx: 0x%p, sq producer: %d, sq consumer: %d, cq consumer: %d)\n",
556 efa_com_cmd_str(comp_ctx->cmd_opcode),
557 comp_ctx->cmd_opcode, comp_ctx->status,
558 comp_ctx, aq->sq.pc, aq->sq.cc, aq->cq.cc);
559 else
560 ibdev_err_ratelimited(
561 aq->efa_dev,
562 "The device didn't send any completion for admin cmd %s(%d) status %d (ctx 0x%p, sq producer: %d, sq consumer: %d, cq consumer: %d)\n",
563 efa_com_cmd_str(comp_ctx->cmd_opcode),
564 comp_ctx->cmd_opcode, comp_ctx->status,
565 comp_ctx, aq->sq.pc, aq->sq.cc, aq->cq.cc);
567 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
568 err = -ETIME;
569 goto out;
572 err = efa_com_comp_status_to_errno(comp_ctx->comp_status);
573 out:
574 efa_com_put_comp_ctx(aq, comp_ctx);
575 return err;
579 * There are two types to wait for completion.
580 * Polling mode - wait until the completion is available.
581 * Async mode - wait on wait queue until the completion is ready
582 * (or the timeout expired).
583 * It is expected that the IRQ called efa_com_handle_admin_completion
584 * to mark the completions.
586 static int efa_com_wait_and_process_admin_cq(struct efa_comp_ctx *comp_ctx,
587 struct efa_com_admin_queue *aq)
589 if (test_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state))
590 return efa_com_wait_and_process_admin_cq_polling(comp_ctx, aq);
592 return efa_com_wait_and_process_admin_cq_interrupts(comp_ctx, aq);
596 * efa_com_cmd_exec - Execute admin command
597 * @aq: admin queue.
598 * @cmd: the admin command to execute.
599 * @cmd_size: the command size.
600 * @comp: command completion return entry.
601 * @comp_size: command completion size.
602 * Submit an admin command and then wait until the device will return a
603 * completion.
604 * The completion will be copied into comp.
606 * @return - 0 on success, negative value on failure.
608 int efa_com_cmd_exec(struct efa_com_admin_queue *aq,
609 struct efa_admin_aq_entry *cmd,
610 size_t cmd_size,
611 struct efa_admin_acq_entry *comp,
612 size_t comp_size)
614 struct efa_comp_ctx *comp_ctx;
615 int err;
617 might_sleep();
619 /* In case of queue FULL */
620 down(&aq->avail_cmds);
622 ibdev_dbg(aq->efa_dev, "%s (opcode %d)\n",
623 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
624 cmd->aq_common_descriptor.opcode);
625 comp_ctx = efa_com_submit_admin_cmd(aq, cmd, cmd_size, comp, comp_size);
626 if (IS_ERR(comp_ctx)) {
627 ibdev_err_ratelimited(
628 aq->efa_dev,
629 "Failed to submit command %s (opcode %u) err %ld\n",
630 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
631 cmd->aq_common_descriptor.opcode, PTR_ERR(comp_ctx));
633 up(&aq->avail_cmds);
634 atomic64_inc(&aq->stats.cmd_err);
635 return PTR_ERR(comp_ctx);
638 err = efa_com_wait_and_process_admin_cq(comp_ctx, aq);
639 if (err) {
640 ibdev_err_ratelimited(
641 aq->efa_dev,
642 "Failed to process command %s (opcode %u) comp_status %d err %d\n",
643 efa_com_cmd_str(cmd->aq_common_descriptor.opcode),
644 cmd->aq_common_descriptor.opcode, comp_ctx->comp_status,
645 err);
646 atomic64_inc(&aq->stats.cmd_err);
649 up(&aq->avail_cmds);
651 return err;
655 * efa_com_admin_destroy - Destroy the admin and the async events queues.
656 * @edev: EFA communication layer struct
658 void efa_com_admin_destroy(struct efa_com_dev *edev)
660 struct efa_com_admin_queue *aq = &edev->aq;
661 struct efa_com_aenq *aenq = &edev->aenq;
662 struct efa_com_admin_cq *cq = &aq->cq;
663 struct efa_com_admin_sq *sq = &aq->sq;
664 u16 size;
666 clear_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
668 devm_kfree(edev->dmadev, aq->comp_ctx_pool);
669 devm_kfree(edev->dmadev, aq->comp_ctx);
671 size = aq->depth * sizeof(*sq->entries);
672 dma_free_coherent(edev->dmadev, size, sq->entries, sq->dma_addr);
674 size = aq->depth * sizeof(*cq->entries);
675 dma_free_coherent(edev->dmadev, size, cq->entries, cq->dma_addr);
677 size = aenq->depth * sizeof(*aenq->entries);
678 dma_free_coherent(edev->dmadev, size, aenq->entries, aenq->dma_addr);
682 * efa_com_set_admin_polling_mode - Set the admin completion queue polling mode
683 * @edev: EFA communication layer struct
684 * @polling: Enable/Disable polling mode
686 * Set the admin completion mode.
688 void efa_com_set_admin_polling_mode(struct efa_com_dev *edev, bool polling)
690 u32 mask_value = 0;
692 if (polling)
693 EFA_SET(&mask_value, EFA_REGS_INTR_MASK_EN, 1);
695 writel(mask_value, edev->reg_bar + EFA_REGS_INTR_MASK_OFF);
696 if (polling)
697 set_bit(EFA_AQ_STATE_POLLING_BIT, &edev->aq.state);
698 else
699 clear_bit(EFA_AQ_STATE_POLLING_BIT, &edev->aq.state);
702 static void efa_com_stats_init(struct efa_com_dev *edev)
704 atomic64_t *s = (atomic64_t *)&edev->aq.stats;
705 int i;
707 for (i = 0; i < sizeof(edev->aq.stats) / sizeof(*s); i++, s++)
708 atomic64_set(s, 0);
712 * efa_com_admin_init - Init the admin and the async queues
713 * @edev: EFA communication layer struct
714 * @aenq_handlers: Those handlers to be called upon event.
716 * Initialize the admin submission and completion queues.
717 * Initialize the asynchronous events notification queues.
719 * @return - 0 on success, negative value on failure.
721 int efa_com_admin_init(struct efa_com_dev *edev,
722 struct efa_aenq_handlers *aenq_handlers)
724 struct efa_com_admin_queue *aq = &edev->aq;
725 u32 timeout;
726 u32 dev_sts;
727 u32 cap;
728 int err;
730 dev_sts = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
731 if (!EFA_GET(&dev_sts, EFA_REGS_DEV_STS_READY)) {
732 ibdev_err(edev->efa_dev,
733 "Device isn't ready, abort com init %#x\n", dev_sts);
734 return -ENODEV;
737 aq->depth = EFA_ADMIN_QUEUE_DEPTH;
739 aq->dmadev = edev->dmadev;
740 aq->efa_dev = edev->efa_dev;
741 set_bit(EFA_AQ_STATE_POLLING_BIT, &aq->state);
743 sema_init(&aq->avail_cmds, aq->depth);
745 efa_com_stats_init(edev);
747 err = efa_com_init_comp_ctxt(aq);
748 if (err)
749 return err;
751 err = efa_com_admin_init_sq(edev);
752 if (err)
753 goto err_destroy_comp_ctxt;
755 err = efa_com_admin_init_cq(edev);
756 if (err)
757 goto err_destroy_sq;
759 efa_com_set_admin_polling_mode(edev, false);
761 err = efa_com_admin_init_aenq(edev, aenq_handlers);
762 if (err)
763 goto err_destroy_cq;
765 cap = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
766 timeout = EFA_GET(&cap, EFA_REGS_CAPS_ADMIN_CMD_TO);
767 if (timeout)
768 /* the resolution of timeout reg is 100ms */
769 aq->completion_timeout = timeout * 100000;
770 else
771 aq->completion_timeout = ADMIN_CMD_TIMEOUT_US;
773 aq->poll_interval = EFA_POLL_INTERVAL_MS;
775 set_bit(EFA_AQ_STATE_RUNNING_BIT, &aq->state);
777 return 0;
779 err_destroy_cq:
780 dma_free_coherent(edev->dmadev, aq->depth * sizeof(*aq->cq.entries),
781 aq->cq.entries, aq->cq.dma_addr);
782 err_destroy_sq:
783 dma_free_coherent(edev->dmadev, aq->depth * sizeof(*aq->sq.entries),
784 aq->sq.entries, aq->sq.dma_addr);
785 err_destroy_comp_ctxt:
786 devm_kfree(edev->dmadev, aq->comp_ctx);
788 return err;
792 * efa_com_admin_q_comp_intr_handler - admin queue interrupt handler
793 * @edev: EFA communication layer struct
795 * This method goes over the admin completion queue and wakes up
796 * all the pending threads that wait on the commands wait event.
798 * @note: Should be called after MSI-X interrupt.
800 void efa_com_admin_q_comp_intr_handler(struct efa_com_dev *edev)
802 unsigned long flags;
804 spin_lock_irqsave(&edev->aq.cq.lock, flags);
805 efa_com_handle_admin_completion(&edev->aq);
806 spin_unlock_irqrestore(&edev->aq.cq.lock, flags);
810 * efa_handle_specific_aenq_event:
811 * return the handler that is relevant to the specific event group
813 static efa_aenq_handler efa_com_get_specific_aenq_cb(struct efa_com_dev *edev,
814 u16 group)
816 struct efa_aenq_handlers *aenq_handlers = edev->aenq.aenq_handlers;
818 if (group < EFA_MAX_HANDLERS && aenq_handlers->handlers[group])
819 return aenq_handlers->handlers[group];
821 return aenq_handlers->unimplemented_handler;
825 * efa_com_aenq_intr_handler - AENQ interrupt handler
826 * @edev: EFA communication layer struct
827 * @data: Data of interrupt handler.
829 * Go over the async event notification queue and call the proper aenq handler.
831 void efa_com_aenq_intr_handler(struct efa_com_dev *edev, void *data)
833 struct efa_admin_aenq_common_desc *aenq_common;
834 struct efa_com_aenq *aenq = &edev->aenq;
835 struct efa_admin_aenq_entry *aenq_e;
836 efa_aenq_handler handler_cb;
837 u32 processed = 0;
838 u8 phase;
839 u32 ci;
841 ci = aenq->cc & (aenq->depth - 1);
842 phase = aenq->phase;
843 aenq_e = &aenq->entries[ci]; /* Get first entry */
844 aenq_common = &aenq_e->aenq_common_desc;
846 /* Go over all the events */
847 while ((READ_ONCE(aenq_common->flags) &
848 EFA_ADMIN_AENQ_COMMON_DESC_PHASE_MASK) == phase) {
850 * Do not read the rest of the completion entry before the
851 * phase bit was validated
853 dma_rmb();
855 /* Handle specific event*/
856 handler_cb = efa_com_get_specific_aenq_cb(edev,
857 aenq_common->group);
858 handler_cb(data, aenq_e); /* call the actual event handler*/
860 /* Get next event entry */
861 ci++;
862 processed++;
864 if (ci == aenq->depth) {
865 ci = 0;
866 phase = !phase;
868 aenq_e = &aenq->entries[ci];
869 aenq_common = &aenq_e->aenq_common_desc;
872 aenq->cc += processed;
873 aenq->phase = phase;
875 /* Don't update aenq doorbell if there weren't any processed events */
876 if (!processed)
877 return;
879 /* barrier not needed in case of writel */
880 writel(aenq->cc, edev->reg_bar + EFA_REGS_AENQ_CONS_DB_OFF);
883 static void efa_com_mmio_reg_read_resp_addr_init(struct efa_com_dev *edev)
885 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
886 u32 addr_high;
887 u32 addr_low;
889 /* dma_addr_bits is unknown at this point */
890 addr_high = (mmio_read->read_resp_dma_addr >> 32) & GENMASK(31, 0);
891 addr_low = mmio_read->read_resp_dma_addr & GENMASK(31, 0);
893 writel(addr_high, edev->reg_bar + EFA_REGS_MMIO_RESP_HI_OFF);
894 writel(addr_low, edev->reg_bar + EFA_REGS_MMIO_RESP_LO_OFF);
897 int efa_com_mmio_reg_read_init(struct efa_com_dev *edev)
899 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
901 spin_lock_init(&mmio_read->lock);
902 mmio_read->read_resp =
903 dma_alloc_coherent(edev->dmadev, sizeof(*mmio_read->read_resp),
904 &mmio_read->read_resp_dma_addr, GFP_KERNEL);
905 if (!mmio_read->read_resp)
906 return -ENOMEM;
908 efa_com_mmio_reg_read_resp_addr_init(edev);
910 mmio_read->read_resp->req_id = 0;
911 mmio_read->seq_num = 0;
912 mmio_read->mmio_read_timeout = EFA_REG_READ_TIMEOUT_US;
914 return 0;
917 void efa_com_mmio_reg_read_destroy(struct efa_com_dev *edev)
919 struct efa_com_mmio_read *mmio_read = &edev->mmio_read;
921 dma_free_coherent(edev->dmadev, sizeof(*mmio_read->read_resp),
922 mmio_read->read_resp, mmio_read->read_resp_dma_addr);
925 int efa_com_validate_version(struct efa_com_dev *edev)
927 u32 min_ctrl_ver = 0;
928 u32 ctrl_ver_masked;
929 u32 min_ver = 0;
930 u32 ctrl_ver;
931 u32 ver;
934 * Make sure the EFA version and the controller version are at least
935 * as the driver expects
937 ver = efa_com_reg_read32(edev, EFA_REGS_VERSION_OFF);
938 ctrl_ver = efa_com_reg_read32(edev,
939 EFA_REGS_CONTROLLER_VERSION_OFF);
941 ibdev_dbg(edev->efa_dev, "efa device version: %d.%d\n",
942 EFA_GET(&ver, EFA_REGS_VERSION_MAJOR_VERSION),
943 EFA_GET(&ver, EFA_REGS_VERSION_MINOR_VERSION));
945 EFA_SET(&min_ver, EFA_REGS_VERSION_MAJOR_VERSION,
946 EFA_ADMIN_API_VERSION_MAJOR);
947 EFA_SET(&min_ver, EFA_REGS_VERSION_MINOR_VERSION,
948 EFA_ADMIN_API_VERSION_MINOR);
949 if (ver < min_ver) {
950 ibdev_err(edev->efa_dev,
951 "EFA version is lower than the minimal version the driver supports\n");
952 return -EOPNOTSUPP;
955 ibdev_dbg(
956 edev->efa_dev,
957 "efa controller version: %d.%d.%d implementation version %d\n",
958 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION),
959 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION),
960 EFA_GET(&ctrl_ver,
961 EFA_REGS_CONTROLLER_VERSION_SUBMINOR_VERSION),
962 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_IMPL_ID));
964 ctrl_ver_masked =
965 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION) |
966 EFA_GET(&ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION) |
967 EFA_GET(&ctrl_ver,
968 EFA_REGS_CONTROLLER_VERSION_SUBMINOR_VERSION);
970 EFA_SET(&min_ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MAJOR_VERSION,
971 EFA_CTRL_MAJOR);
972 EFA_SET(&min_ctrl_ver, EFA_REGS_CONTROLLER_VERSION_MINOR_VERSION,
973 EFA_CTRL_MINOR);
974 EFA_SET(&min_ctrl_ver, EFA_REGS_CONTROLLER_VERSION_SUBMINOR_VERSION,
975 EFA_CTRL_SUB_MINOR);
976 /* Validate the ctrl version without the implementation ID */
977 if (ctrl_ver_masked < min_ctrl_ver) {
978 ibdev_err(edev->efa_dev,
979 "EFA ctrl version is lower than the minimal ctrl version the driver supports\n");
980 return -EOPNOTSUPP;
983 return 0;
987 * efa_com_get_dma_width - Retrieve physical dma address width the device
988 * supports.
989 * @edev: EFA communication layer struct
991 * Retrieve the maximum physical address bits the device can handle.
993 * @return: > 0 on Success and negative value otherwise.
995 int efa_com_get_dma_width(struct efa_com_dev *edev)
997 u32 caps = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
998 int width;
1000 width = EFA_GET(&caps, EFA_REGS_CAPS_DMA_ADDR_WIDTH);
1002 ibdev_dbg(edev->efa_dev, "DMA width: %d\n", width);
1004 if (width < 32 || width > 64) {
1005 ibdev_err(edev->efa_dev, "DMA width illegal value: %d\n", width);
1006 return -EINVAL;
1009 edev->dma_addr_bits = width;
1011 return width;
1014 static int wait_for_reset_state(struct efa_com_dev *edev, u32 timeout, int on)
1016 u32 val, i;
1018 for (i = 0; i < timeout; i++) {
1019 val = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
1021 if (EFA_GET(&val, EFA_REGS_DEV_STS_RESET_IN_PROGRESS) == on)
1022 return 0;
1024 ibdev_dbg(edev->efa_dev, "Reset indication val %d\n", val);
1025 msleep(EFA_POLL_INTERVAL_MS);
1028 return -ETIME;
1032 * efa_com_dev_reset - Perform device FLR to the device.
1033 * @edev: EFA communication layer struct
1034 * @reset_reason: Specify what is the trigger for the reset in case of an error.
1036 * @return - 0 on success, negative value on failure.
1038 int efa_com_dev_reset(struct efa_com_dev *edev,
1039 enum efa_regs_reset_reason_types reset_reason)
1041 u32 stat, timeout, cap;
1042 u32 reset_val = 0;
1043 int err;
1045 stat = efa_com_reg_read32(edev, EFA_REGS_DEV_STS_OFF);
1046 cap = efa_com_reg_read32(edev, EFA_REGS_CAPS_OFF);
1048 if (!EFA_GET(&stat, EFA_REGS_DEV_STS_READY)) {
1049 ibdev_err(edev->efa_dev,
1050 "Device isn't ready, can't reset device\n");
1051 return -EINVAL;
1054 timeout = EFA_GET(&cap, EFA_REGS_CAPS_RESET_TIMEOUT);
1055 if (!timeout) {
1056 ibdev_err(edev->efa_dev, "Invalid timeout value\n");
1057 return -EINVAL;
1060 /* start reset */
1061 EFA_SET(&reset_val, EFA_REGS_DEV_CTL_DEV_RESET, 1);
1062 EFA_SET(&reset_val, EFA_REGS_DEV_CTL_RESET_REASON, reset_reason);
1063 writel(reset_val, edev->reg_bar + EFA_REGS_DEV_CTL_OFF);
1065 /* reset clears the mmio readless address, restore it */
1066 efa_com_mmio_reg_read_resp_addr_init(edev);
1068 err = wait_for_reset_state(edev, timeout, 1);
1069 if (err) {
1070 ibdev_err(edev->efa_dev, "Reset indication didn't turn on\n");
1071 return err;
1074 /* reset done */
1075 writel(0, edev->reg_bar + EFA_REGS_DEV_CTL_OFF);
1076 err = wait_for_reset_state(edev, timeout, 0);
1077 if (err) {
1078 ibdev_err(edev->efa_dev, "Reset indication didn't turn off\n");
1079 return err;
1082 timeout = EFA_GET(&cap, EFA_REGS_CAPS_ADMIN_CMD_TO);
1083 if (timeout)
1084 /* the resolution of timeout reg is 100ms */
1085 edev->aq.completion_timeout = timeout * 100000;
1086 else
1087 edev->aq.completion_timeout = ADMIN_CMD_TIMEOUT_US;
1089 return 0;