| // SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause |
| |
| /* Authors: Cheng Xu <chengyou@linux.alibaba.com> */ |
| /* Kai Shen <kaishen@linux.alibaba.com> */ |
| /* Copyright (c) 2020-2022, Alibaba Group. */ |
| |
| #include "erdma.h" |
| |
| static void arm_cmdq_cq(struct erdma_cmdq *cmdq) |
| { |
| struct erdma_dev *dev = container_of(cmdq, struct erdma_dev, cmdq); |
| u64 db_data = FIELD_PREP(ERDMA_CQDB_CI_MASK, cmdq->cq.ci) | |
| FIELD_PREP(ERDMA_CQDB_ARM_MASK, 1) | |
| FIELD_PREP(ERDMA_CQDB_CMDSN_MASK, cmdq->cq.cmdsn) | |
| FIELD_PREP(ERDMA_CQDB_IDX_MASK, cmdq->cq.cmdsn); |
| |
| *cmdq->cq.db_record = db_data; |
| writeq(db_data, dev->func_bar + ERDMA_CMDQ_CQDB_REG); |
| |
| atomic64_inc(&cmdq->cq.armed_num); |
| } |
| |
| static void kick_cmdq_db(struct erdma_cmdq *cmdq) |
| { |
| struct erdma_dev *dev = container_of(cmdq, struct erdma_dev, cmdq); |
| u64 db_data = FIELD_PREP(ERDMA_CMD_HDR_WQEBB_INDEX_MASK, cmdq->sq.pi); |
| |
| *cmdq->sq.db_record = db_data; |
| writeq(db_data, dev->func_bar + ERDMA_CMDQ_SQDB_REG); |
| } |
| |
| static struct erdma_comp_wait *get_comp_wait(struct erdma_cmdq *cmdq) |
| { |
| int comp_idx; |
| |
| spin_lock(&cmdq->lock); |
| comp_idx = find_first_zero_bit(cmdq->comp_wait_bitmap, |
| cmdq->max_outstandings); |
| if (comp_idx == cmdq->max_outstandings) { |
| spin_unlock(&cmdq->lock); |
| return ERR_PTR(-ENOMEM); |
| } |
| |
| __set_bit(comp_idx, cmdq->comp_wait_bitmap); |
| spin_unlock(&cmdq->lock); |
| |
| return &cmdq->wait_pool[comp_idx]; |
| } |
| |
| static void put_comp_wait(struct erdma_cmdq *cmdq, |
| struct erdma_comp_wait *comp_wait) |
| { |
| int used; |
| |
| cmdq->wait_pool[comp_wait->ctx_id].cmd_status = ERDMA_CMD_STATUS_INIT; |
| spin_lock(&cmdq->lock); |
| used = __test_and_clear_bit(comp_wait->ctx_id, cmdq->comp_wait_bitmap); |
| spin_unlock(&cmdq->lock); |
| |
| WARN_ON(!used); |
| } |
| |
| static int erdma_cmdq_wait_res_init(struct erdma_dev *dev, |
| struct erdma_cmdq *cmdq) |
| { |
| int i; |
| |
| cmdq->wait_pool = |
| devm_kcalloc(&dev->pdev->dev, cmdq->max_outstandings, |
| sizeof(struct erdma_comp_wait), GFP_KERNEL); |
| if (!cmdq->wait_pool) |
| return -ENOMEM; |
| |
| spin_lock_init(&cmdq->lock); |
| cmdq->comp_wait_bitmap = devm_bitmap_zalloc( |
| &dev->pdev->dev, cmdq->max_outstandings, GFP_KERNEL); |
| if (!cmdq->comp_wait_bitmap) |
| return -ENOMEM; |
| |
| for (i = 0; i < cmdq->max_outstandings; i++) { |
| init_completion(&cmdq->wait_pool[i].wait_event); |
| cmdq->wait_pool[i].ctx_id = i; |
| } |
| |
| return 0; |
| } |
| |
| static int erdma_cmdq_sq_init(struct erdma_dev *dev) |
| { |
| struct erdma_cmdq *cmdq = &dev->cmdq; |
| struct erdma_cmdq_sq *sq = &cmdq->sq; |
| u32 buf_size; |
| |
| sq->wqebb_cnt = SQEBB_COUNT(ERDMA_CMDQ_SQE_SIZE); |
| sq->depth = cmdq->max_outstandings * sq->wqebb_cnt; |
| |
| buf_size = sq->depth << SQEBB_SHIFT; |
| |
| sq->qbuf = |
| dma_alloc_coherent(&dev->pdev->dev, WARPPED_BUFSIZE(buf_size), |
| &sq->qbuf_dma_addr, GFP_KERNEL); |
| if (!sq->qbuf) |
| return -ENOMEM; |
| |
| sq->db_record = (u64 *)(sq->qbuf + buf_size); |
| |
| spin_lock_init(&sq->lock); |
| |
| erdma_reg_write32(dev, ERDMA_REGS_CMDQ_SQ_ADDR_H_REG, |
| upper_32_bits(sq->qbuf_dma_addr)); |
| erdma_reg_write32(dev, ERDMA_REGS_CMDQ_SQ_ADDR_L_REG, |
| lower_32_bits(sq->qbuf_dma_addr)); |
| erdma_reg_write32(dev, ERDMA_REGS_CMDQ_DEPTH_REG, sq->depth); |
| erdma_reg_write64(dev, ERDMA_CMDQ_SQ_DB_HOST_ADDR_REG, |
| sq->qbuf_dma_addr + buf_size); |
| |
| return 0; |
| } |
| |
| static int erdma_cmdq_cq_init(struct erdma_dev *dev) |
| { |
| struct erdma_cmdq *cmdq = &dev->cmdq; |
| struct erdma_cmdq_cq *cq = &cmdq->cq; |
| u32 buf_size; |
| |
| cq->depth = cmdq->sq.depth; |
| buf_size = cq->depth << CQE_SHIFT; |
| |
| cq->qbuf = |
| dma_alloc_coherent(&dev->pdev->dev, WARPPED_BUFSIZE(buf_size), |
| &cq->qbuf_dma_addr, GFP_KERNEL | __GFP_ZERO); |
| if (!cq->qbuf) |
| return -ENOMEM; |
| |
| spin_lock_init(&cq->lock); |
| |
| cq->db_record = (u64 *)(cq->qbuf + buf_size); |
| |
| atomic64_set(&cq->armed_num, 0); |
| |
| erdma_reg_write32(dev, ERDMA_REGS_CMDQ_CQ_ADDR_H_REG, |
| upper_32_bits(cq->qbuf_dma_addr)); |
| erdma_reg_write32(dev, ERDMA_REGS_CMDQ_CQ_ADDR_L_REG, |
| lower_32_bits(cq->qbuf_dma_addr)); |
| erdma_reg_write64(dev, ERDMA_CMDQ_CQ_DB_HOST_ADDR_REG, |
| cq->qbuf_dma_addr + buf_size); |
| |
| return 0; |
| } |
| |
| static int erdma_cmdq_eq_init(struct erdma_dev *dev) |
| { |
| struct erdma_cmdq *cmdq = &dev->cmdq; |
| struct erdma_eq *eq = &cmdq->eq; |
| u32 buf_size; |
| |
| eq->depth = cmdq->max_outstandings; |
| buf_size = eq->depth << EQE_SHIFT; |
| |
| eq->qbuf = |
| dma_alloc_coherent(&dev->pdev->dev, WARPPED_BUFSIZE(buf_size), |
| &eq->qbuf_dma_addr, GFP_KERNEL | __GFP_ZERO); |
| if (!eq->qbuf) |
| return -ENOMEM; |
| |
| spin_lock_init(&eq->lock); |
| atomic64_set(&eq->event_num, 0); |
| |
| eq->db = dev->func_bar + ERDMA_REGS_CEQ_DB_BASE_REG; |
| eq->db_record = (u64 *)(eq->qbuf + buf_size); |
| |
| erdma_reg_write32(dev, ERDMA_REGS_CMDQ_EQ_ADDR_H_REG, |
| upper_32_bits(eq->qbuf_dma_addr)); |
| erdma_reg_write32(dev, ERDMA_REGS_CMDQ_EQ_ADDR_L_REG, |
| lower_32_bits(eq->qbuf_dma_addr)); |
| erdma_reg_write32(dev, ERDMA_REGS_CMDQ_EQ_DEPTH_REG, eq->depth); |
| erdma_reg_write64(dev, ERDMA_CMDQ_EQ_DB_HOST_ADDR_REG, |
| eq->qbuf_dma_addr + buf_size); |
| |
| return 0; |
| } |
| |
| int erdma_cmdq_init(struct erdma_dev *dev) |
| { |
| struct erdma_cmdq *cmdq = &dev->cmdq; |
| int err; |
| |
| cmdq->max_outstandings = ERDMA_CMDQ_MAX_OUTSTANDING; |
| cmdq->use_event = false; |
| |
| sema_init(&cmdq->credits, cmdq->max_outstandings); |
| |
| err = erdma_cmdq_wait_res_init(dev, cmdq); |
| if (err) |
| return err; |
| |
| err = erdma_cmdq_sq_init(dev); |
| if (err) |
| return err; |
| |
| err = erdma_cmdq_cq_init(dev); |
| if (err) |
| goto err_destroy_sq; |
| |
| err = erdma_cmdq_eq_init(dev); |
| if (err) |
| goto err_destroy_cq; |
| |
| set_bit(ERDMA_CMDQ_STATE_OK_BIT, &cmdq->state); |
| |
| return 0; |
| |
| err_destroy_cq: |
| dma_free_coherent(&dev->pdev->dev, |
| (cmdq->cq.depth << CQE_SHIFT) + |
| ERDMA_EXTRA_BUFFER_SIZE, |
| cmdq->cq.qbuf, cmdq->cq.qbuf_dma_addr); |
| |
| err_destroy_sq: |
| dma_free_coherent(&dev->pdev->dev, |
| (cmdq->sq.depth << SQEBB_SHIFT) + |
| ERDMA_EXTRA_BUFFER_SIZE, |
| cmdq->sq.qbuf, cmdq->sq.qbuf_dma_addr); |
| |
| return err; |
| } |
| |
| void erdma_finish_cmdq_init(struct erdma_dev *dev) |
| { |
| /* after device init successfully, change cmdq to event mode. */ |
| dev->cmdq.use_event = true; |
| arm_cmdq_cq(&dev->cmdq); |
| } |
| |
| void erdma_cmdq_destroy(struct erdma_dev *dev) |
| { |
| struct erdma_cmdq *cmdq = &dev->cmdq; |
| |
| clear_bit(ERDMA_CMDQ_STATE_OK_BIT, &cmdq->state); |
| |
| dma_free_coherent(&dev->pdev->dev, |
| (cmdq->eq.depth << EQE_SHIFT) + |
| ERDMA_EXTRA_BUFFER_SIZE, |
| cmdq->eq.qbuf, cmdq->eq.qbuf_dma_addr); |
| dma_free_coherent(&dev->pdev->dev, |
| (cmdq->sq.depth << SQEBB_SHIFT) + |
| ERDMA_EXTRA_BUFFER_SIZE, |
| cmdq->sq.qbuf, cmdq->sq.qbuf_dma_addr); |
| dma_free_coherent(&dev->pdev->dev, |
| (cmdq->cq.depth << CQE_SHIFT) + |
| ERDMA_EXTRA_BUFFER_SIZE, |
| cmdq->cq.qbuf, cmdq->cq.qbuf_dma_addr); |
| } |
| |
| static void *get_next_valid_cmdq_cqe(struct erdma_cmdq *cmdq) |
| { |
| __be32 *cqe = get_queue_entry(cmdq->cq.qbuf, cmdq->cq.ci, |
| cmdq->cq.depth, CQE_SHIFT); |
| u32 owner = FIELD_GET(ERDMA_CQE_HDR_OWNER_MASK, |
| be32_to_cpu(READ_ONCE(*cqe))); |
| |
| return owner ^ !!(cmdq->cq.ci & cmdq->cq.depth) ? cqe : NULL; |
| } |
| |
| static void push_cmdq_sqe(struct erdma_cmdq *cmdq, u64 *req, size_t req_len, |
| struct erdma_comp_wait *comp_wait) |
| { |
| __le64 *wqe; |
| u64 hdr = *req; |
| |
| comp_wait->cmd_status = ERDMA_CMD_STATUS_ISSUED; |
| reinit_completion(&comp_wait->wait_event); |
| comp_wait->sq_pi = cmdq->sq.pi; |
| |
| wqe = get_queue_entry(cmdq->sq.qbuf, cmdq->sq.pi, cmdq->sq.depth, |
| SQEBB_SHIFT); |
| memcpy(wqe, req, req_len); |
| |
| cmdq->sq.pi += cmdq->sq.wqebb_cnt; |
| hdr |= FIELD_PREP(ERDMA_CMD_HDR_WQEBB_INDEX_MASK, cmdq->sq.pi) | |
| FIELD_PREP(ERDMA_CMD_HDR_CONTEXT_COOKIE_MASK, |
| comp_wait->ctx_id) | |
| FIELD_PREP(ERDMA_CMD_HDR_WQEBB_CNT_MASK, cmdq->sq.wqebb_cnt - 1); |
| *wqe = cpu_to_le64(hdr); |
| |
| kick_cmdq_db(cmdq); |
| } |
| |
| static int erdma_poll_single_cmd_completion(struct erdma_cmdq *cmdq) |
| { |
| struct erdma_comp_wait *comp_wait; |
| u32 hdr0, sqe_idx; |
| __be32 *cqe; |
| u16 ctx_id; |
| u64 *sqe; |
| |
| cqe = get_next_valid_cmdq_cqe(cmdq); |
| if (!cqe) |
| return -EAGAIN; |
| |
| cmdq->cq.ci++; |
| |
| dma_rmb(); |
| hdr0 = be32_to_cpu(*cqe); |
| sqe_idx = be32_to_cpu(*(cqe + 1)); |
| |
| sqe = get_queue_entry(cmdq->sq.qbuf, sqe_idx, cmdq->sq.depth, |
| SQEBB_SHIFT); |
| ctx_id = FIELD_GET(ERDMA_CMD_HDR_CONTEXT_COOKIE_MASK, *sqe); |
| comp_wait = &cmdq->wait_pool[ctx_id]; |
| if (comp_wait->cmd_status != ERDMA_CMD_STATUS_ISSUED) |
| return -EIO; |
| |
| comp_wait->cmd_status = ERDMA_CMD_STATUS_FINISHED; |
| comp_wait->comp_status = FIELD_GET(ERDMA_CQE_HDR_SYNDROME_MASK, hdr0); |
| cmdq->sq.ci += cmdq->sq.wqebb_cnt; |
| /* Copy 16B comp data after cqe hdr to outer */ |
| be32_to_cpu_array(comp_wait->comp_data, cqe + 2, 4); |
| |
| if (cmdq->use_event) |
| complete(&comp_wait->wait_event); |
| |
| return 0; |
| } |
| |
| static void erdma_polling_cmd_completions(struct erdma_cmdq *cmdq) |
| { |
| unsigned long flags; |
| u16 comp_num; |
| |
| spin_lock_irqsave(&cmdq->cq.lock, flags); |
| |
| /* We must have less than # of max_outstandings |
| * completions at one time. |
| */ |
| for (comp_num = 0; comp_num < cmdq->max_outstandings; comp_num++) |
| if (erdma_poll_single_cmd_completion(cmdq)) |
| break; |
| |
| if (comp_num && cmdq->use_event) |
| arm_cmdq_cq(cmdq); |
| |
| spin_unlock_irqrestore(&cmdq->cq.lock, flags); |
| } |
| |
| void erdma_cmdq_completion_handler(struct erdma_cmdq *cmdq) |
| { |
| int got_event = 0; |
| |
| if (!test_bit(ERDMA_CMDQ_STATE_OK_BIT, &cmdq->state) || |
| !cmdq->use_event) |
| return; |
| |
| while (get_next_valid_eqe(&cmdq->eq)) { |
| cmdq->eq.ci++; |
| got_event++; |
| } |
| |
| if (got_event) { |
| cmdq->cq.cmdsn++; |
| erdma_polling_cmd_completions(cmdq); |
| } |
| |
| notify_eq(&cmdq->eq); |
| } |
| |
| static int erdma_poll_cmd_completion(struct erdma_comp_wait *comp_ctx, |
| struct erdma_cmdq *cmdq, u32 timeout) |
| { |
| unsigned long comp_timeout = jiffies + msecs_to_jiffies(timeout); |
| |
| while (1) { |
| erdma_polling_cmd_completions(cmdq); |
| if (comp_ctx->cmd_status != ERDMA_CMD_STATUS_ISSUED) |
| break; |
| |
| if (time_is_before_jiffies(comp_timeout)) |
| return -ETIME; |
| |
| msleep(20); |
| } |
| |
| return 0; |
| } |
| |
| static int erdma_wait_cmd_completion(struct erdma_comp_wait *comp_ctx, |
| struct erdma_cmdq *cmdq, u32 timeout) |
| { |
| unsigned long flags = 0; |
| |
| wait_for_completion_timeout(&comp_ctx->wait_event, |
| msecs_to_jiffies(timeout)); |
| |
| if (unlikely(comp_ctx->cmd_status != ERDMA_CMD_STATUS_FINISHED)) { |
| spin_lock_irqsave(&cmdq->cq.lock, flags); |
| comp_ctx->cmd_status = ERDMA_CMD_STATUS_TIMEOUT; |
| spin_unlock_irqrestore(&cmdq->cq.lock, flags); |
| return -ETIME; |
| } |
| |
| return 0; |
| } |
| |
| void erdma_cmdq_build_reqhdr(u64 *hdr, u32 mod, u32 op) |
| { |
| *hdr = FIELD_PREP(ERDMA_CMD_HDR_SUB_MOD_MASK, mod) | |
| FIELD_PREP(ERDMA_CMD_HDR_OPCODE_MASK, op); |
| } |
| |
| int erdma_post_cmd_wait(struct erdma_cmdq *cmdq, void *req, u32 req_size, |
| u64 *resp0, u64 *resp1) |
| { |
| struct erdma_comp_wait *comp_wait; |
| int ret; |
| |
| if (!test_bit(ERDMA_CMDQ_STATE_OK_BIT, &cmdq->state)) |
| return -ENODEV; |
| |
| down(&cmdq->credits); |
| |
| comp_wait = get_comp_wait(cmdq); |
| if (IS_ERR(comp_wait)) { |
| clear_bit(ERDMA_CMDQ_STATE_OK_BIT, &cmdq->state); |
| set_bit(ERDMA_CMDQ_STATE_CTX_ERR_BIT, &cmdq->state); |
| up(&cmdq->credits); |
| return PTR_ERR(comp_wait); |
| } |
| |
| spin_lock(&cmdq->sq.lock); |
| push_cmdq_sqe(cmdq, req, req_size, comp_wait); |
| spin_unlock(&cmdq->sq.lock); |
| |
| if (cmdq->use_event) |
| ret = erdma_wait_cmd_completion(comp_wait, cmdq, |
| ERDMA_CMDQ_TIMEOUT_MS); |
| else |
| ret = erdma_poll_cmd_completion(comp_wait, cmdq, |
| ERDMA_CMDQ_TIMEOUT_MS); |
| |
| if (ret) { |
| set_bit(ERDMA_CMDQ_STATE_TIMEOUT_BIT, &cmdq->state); |
| clear_bit(ERDMA_CMDQ_STATE_OK_BIT, &cmdq->state); |
| goto out; |
| } |
| |
| if (comp_wait->comp_status) |
| ret = -EIO; |
| |
| if (resp0 && resp1) { |
| *resp0 = *((u64 *)&comp_wait->comp_data[0]); |
| *resp1 = *((u64 *)&comp_wait->comp_data[2]); |
| } |
| put_comp_wait(cmdq, comp_wait); |
| |
| out: |
| up(&cmdq->credits); |
| |
| return ret; |
| } |