2 * Copyright (c) 2017 Mellanox Technologies. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
34 #include <net/addrconf.h>
35 #include <linux/etherdevice.h>
36 #include <linux/mlx5/vport.h>
38 #include "mlx5_core.h"
40 #include "fpga/conn.h"
/* Constants used by the host-side connection (QP/CQ) to the FPGA. */
/* PKEY value programmed into the FPGA QP context. */
42 #define MLX5_FPGA_PKEY 0xFFFF
43 #define MLX5_FPGA_PKEY_INDEX 0 /* RoCE PKEY 0xFFFF is always at index 0 */
/* Payload size, in bytes, of each receive buffer allocated by this file. */
44 #define MLX5_FPGA_RECV_SIZE 2048
/* Port number used for the QP address path and for GID set/clear calls. */
45 #define MLX5_FPGA_PORT_NUM 1
/* Budget value passed to the CQE processing routine on each invocation. */
46 #define MLX5_FPGA_CQ_BUDGET 64
/*
 * Create DMA mappings for the scatter entries of @buf on the PCI device
 * behind @conn, using the direction stored in buf->dma_dir.
 *
 * sg[0] is mapped first, then sg[1]. If mapping sg[1] fails, the sg[0]
 * mapping is released again. Each mapping failure is logged with the error
 * returned by dma_mapping_error().
 *
 * NOTE(review): declarations, guards, returns and braces between the
 * visible lines are missing from this view, so the exact return values and
 * any condition guarding the sg[1] mapping are not documented here.
 */
48 static int mlx5_fpga_conn_map_buf(struct mlx5_fpga_conn *conn,
49 struct mlx5_fpga_dma_buf *buf)
51 struct device *dma_device;
/* A buffer whose first scatter entry has no data is the unexpected case. */
54 if (unlikely(!buf->sg[0].data))
57 dma_device = &conn->fdev->mdev->pdev->dev;
58 buf->sg[0].dma_addr = dma_map_single(dma_device, buf->sg[0].data,
59 buf->sg[0].size, buf->dma_dir);
60 err = dma_mapping_error(dma_device, buf->sg[0].dma_addr);
62 mlx5_fpga_warn(conn->fdev, "DMA error on sg 0: %d\n", err);
70 buf->sg[1].dma_addr = dma_map_single(dma_device, buf->sg[1].data,
71 buf->sg[1].size, buf->dma_dir);
72 err = dma_mapping_error(dma_device, buf->sg[1].dma_addr);
74 mlx5_fpga_warn(conn->fdev, "DMA error on sg 1: %d\n", err);
/* Roll back the sg[0] mapping so nothing stays mapped on failure. */
75 dma_unmap_single(dma_device, buf->sg[0].dma_addr,
76 buf->sg[0].size, buf->dma_dir);
/*
 * Release the DMA mappings of @buf on the PCI device behind @conn.
 * sg[1] is unmapped before sg[0]; sg[0] is only unmapped when it has data.
 *
 * NOTE(review): any guard on the sg[1] unmap is not visible in this view.
 */
84 static void mlx5_fpga_conn_unmap_buf(struct mlx5_fpga_conn *conn,
85 struct mlx5_fpga_dma_buf *buf)
87 struct device *dma_device;
89 dma_device = &conn->fdev->mdev->pdev->dev;
91 dma_unmap_single(dma_device, buf->sg[1].dma_addr,
92 buf->sg[1].size, buf->dma_dir);
94 if (likely(buf->sg[0].data))
95 dma_unmap_single(dma_device, buf->sg[0].dma_addr,
96 buf->sg[0].size, buf->dma_dir);
/*
 * Post @buf as a receive descriptor on the connection's RQ.
 *
 * The buffer is DMA-mapped, a data segment describing sg[0] is written at
 * the slot selected by the RQ producer counter, the buffer pointer is
 * remembered in rq.bufs[] for completion handling, and the RQ doorbell
 * record is updated.
 *
 * NOTE(review): error returns, the producer-counter increment and the
 * memory barrier implied by the comment below are not visible in this view.
 */
99 static int mlx5_fpga_conn_post_recv(struct mlx5_fpga_conn *conn,
100 struct mlx5_fpga_dma_buf *buf)
102 struct mlx5_wqe_data_seg *data;
106 err = mlx5_fpga_conn_map_buf(conn, buf);
/* RQ full: outstanding entries (pc - cc) reached the ring size; undo map. */
110 if (unlikely(conn->qp.rq.pc - conn->qp.rq.cc >= conn->qp.rq.size)) {
111 mlx5_fpga_conn_unmap_buf(conn, buf);
/* Ring index: producer counter masked by (size - 1). */
115 ix = conn->qp.rq.pc & (conn->qp.rq.size - 1);
116 data = mlx5_wq_cyc_get_wqe(&conn->qp.wq.rq, ix);
/* Descriptor fields are stored big-endian. */
117 data->byte_count = cpu_to_be32(buf->sg[0].size);
118 data->lkey = cpu_to_be32(conn->fdev->conn_res.mkey.key);
119 data->addr = cpu_to_be64(buf->sg[0].dma_addr);
/* Remember the buffer so the completion path can find it by index. */
122 conn->qp.rq.bufs[ix] = buf;
124 /* Make sure that descriptors are written before doorbell record. */
/* Only the low 16 bits of the producer counter go into the doorbell. */
126 *conn->qp.wq.rq.db = cpu_to_be32(conn->qp.rq.pc & 0xffff);
/*
 * Notify hardware about a newly written send WQE: update the SQ doorbell
 * record with the SQ producer counter, then write @wqe to the UAR mapping
 * at MLX5_BF_OFFSET.
 *
 * NOTE(review): the barrier calls that the two comments below refer to are
 * not visible in this view.
 */
131 static void mlx5_fpga_conn_notify_hw(struct mlx5_fpga_conn *conn, void *wqe)
133 /* ensure wqe is visible to device before updating doorbell record */
135 *conn->qp.wq.sq.db = cpu_to_be32(conn->qp.sq.pc);
136 /* Make sure that doorbell record is visible before ringing */
138 mlx5_write64(wqe, conn->fdev->conn_res.uar->map + MLX5_BF_OFFSET);
/*
 * Build a send WQE for @buf at the current SQ producer slot and notify the
 * hardware.
 *
 * The WQE is a control segment followed by data segments, filled from the
 * scatter entries of @buf. The control segment requests a CQ update and
 * encodes the producer counter and the QP number. The buffer is recorded in
 * sq.bufs[] so the completion handler can retrieve it.
 *
 * NOTE(review): the handling of entries without data, the computation of
 * `size`, the opcode operand and the producer-counter increment are on
 * lines missing from this view.
 */
141 static void mlx5_fpga_conn_post_send(struct mlx5_fpga_conn *conn,
142 struct mlx5_fpga_dma_buf *buf)
144 struct mlx5_wqe_ctrl_seg *ctrl;
145 struct mlx5_wqe_data_seg *data;
146 unsigned int ix, sgi;
/* Ring index: producer counter masked by (size - 1). */
149 ix = conn->qp.sq.pc & (conn->qp.sq.size - 1);
151 ctrl = mlx5_wq_cyc_get_wqe(&conn->qp.wq.sq, ix);
/* Data segments start immediately after the control segment. */
152 data = (void *)(ctrl + 1);
154 for (sgi = 0; sgi < ARRAY_SIZE(buf->sg); sgi++) {
155 if (!buf->sg[sgi].data)
157 data->byte_count = cpu_to_be32(buf->sg[sgi].size);
158 data->lkey = cpu_to_be32(conn->fdev->conn_res.mkey.key);
159 data->addr = cpu_to_be64(buf->sg[sgi].dma_addr);
165 ctrl->fm_ce_se = MLX5_WQE_CTRL_CQ_UPDATE;
166 ctrl->opmod_idx_opcode = cpu_to_be32(((conn->qp.sq.pc & 0xffff) << 8) |
168 ctrl->qpn_ds = cpu_to_be32(size | (conn->qp.mqp.qpn << 8));
171 conn->qp.sq.bufs[ix] = buf;
172 mlx5_fpga_conn_notify_hw(conn, ctrl);
/*
 * Send @buf over @conn.
 *
 * The connection's QP must be active. The buffer is marked DMA_TO_DEVICE
 * and DMA-mapped, then, under the SQ spinlock (IRQs saved), it is appended
 * to the backlog list when the SQ is full (pc - cc >= size), or posted to
 * the SQ.
 *
 * NOTE(review): the return statements and the branch structure between the
 * backlog and post paths are on lines missing from this view.
 */
175 int mlx5_fpga_conn_send(struct mlx5_fpga_conn *conn,
176 struct mlx5_fpga_dma_buf *buf)
181 if (!conn->qp.active)
184 buf->dma_dir = DMA_TO_DEVICE;
185 err = mlx5_fpga_conn_map_buf(conn, buf);
189 spin_lock_irqsave(&conn->qp.sq.lock, flags);
/* No free SQ slot: queue the buffer on the backlog list. */
191 if (conn->qp.sq.pc - conn->qp.sq.cc >= conn->qp.sq.size) {
192 list_add_tail(&buf->list, &conn->qp.sq.backlog);
196 mlx5_fpga_conn_post_send(conn, buf);
199 spin_unlock_irqrestore(&conn->qp.sq.lock, flags);
/*
 * Allocate one receive buffer and post it to the RQ.
 *
 * A single zeroed allocation holds the mlx5_fpga_dma_buf header followed by
 * MLX5_FPGA_RECV_SIZE bytes of payload; sg[0] points at that payload.
 *
 * NOTE(review): the allocation passes 0 as the gfp flags argument; confirm
 * this is intended rather than an explicit GFP_* value.
 * NOTE(review): allocation-failure and post-failure handling are on lines
 * missing from this view.
 */
203 static int mlx5_fpga_conn_post_recv_buf(struct mlx5_fpga_conn *conn)
205 struct mlx5_fpga_dma_buf *buf;
208 buf = kzalloc(sizeof(*buf) + MLX5_FPGA_RECV_SIZE, 0);
/* Payload starts right after the buffer header in the same allocation. */
212 buf->sg[0].data = (void *)(buf + 1);
213 buf->sg[0].size = MLX5_FPGA_RECV_SIZE;
214 buf->dma_dir = DMA_FROM_DEVICE;
216 err = mlx5_fpga_conn_post_recv(conn, buf);
/*
 * Create a memory key in protection domain @pdn and store it in @mkey.
 *
 * The mkey context is set to access mode MLX5_MKC_ACCESS_MODE_PA with the
 * lw and lr bits set, length64 set, and the qpn field set to 0xffffff.
 *
 * NOTE(review): allocation-failure handling, freeing of `in` and the return
 * statement are on lines missing from this view.
 */
223 static int mlx5_fpga_conn_create_mkey(struct mlx5_core_dev *mdev, u32 pdn,
224 struct mlx5_core_mkey *mkey)
226 int inlen = MLX5_ST_SZ_BYTES(create_mkey_in);
231 in = kvzalloc(inlen, GFP_KERNEL);
235 mkc = MLX5_ADDR_OF(create_mkey_in, in, memory_key_mkey_entry);
236 MLX5_SET(mkc, mkc, access_mode_1_0, MLX5_MKC_ACCESS_MODE_PA);
237 MLX5_SET(mkc, mkc, lw, 1);
238 MLX5_SET(mkc, mkc, lr, 1);
240 MLX5_SET(mkc, mkc, pd, pdn);
241 MLX5_SET(mkc, mkc, length64, 1);
242 MLX5_SET(mkc, mkc, qpn, 0xffffff);
244 err = mlx5_core_create_mkey(mdev, mkey, in, inlen);
/*
 * Handle a receive completion.
 *
 * The completed buffer is looked up by the CQE's wqe_counter, removed from
 * rq.bufs[], and DMA-unmapped. A non-zero @status or an inactive QP marks
 * the QP inactive. Otherwise sg[0].size is set to the received byte count,
 * the buffer is handed to conn->recv_cb, and afterwards it is restored to
 * MLX5_FPGA_RECV_SIZE and re-posted to the RQ.
 *
 * NOTE(review): the consumer-counter update, the rest of the error branch
 * and the branch structure around the two log calls are on lines missing
 * from this view.
 */
250 static void mlx5_fpga_conn_rq_cqe(struct mlx5_fpga_conn *conn,
251 struct mlx5_cqe64 *cqe, u8 status)
253 struct mlx5_fpga_dma_buf *buf;
256 ix = be16_to_cpu(cqe->wqe_counter) & (conn->qp.rq.size - 1);
257 buf = conn->qp.rq.bufs[ix];
258 conn->qp.rq.bufs[ix] = NULL;
/* Flush errors are not reported at warning level. */
261 if (unlikely(status && (status != MLX5_CQE_SYNDROME_WR_FLUSH_ERR)))
262 mlx5_fpga_warn(conn->fdev, "RQ buf %p on FPGA QP %u completion status %d\n",
263 buf, conn->fpga_qpn, status);
265 mlx5_fpga_dbg(conn->fdev, "RQ buf %p on FPGA QP %u completion status %d\n",
266 buf, conn->fpga_qpn, status);
268 mlx5_fpga_conn_unmap_buf(conn, buf);
270 if (unlikely(status || !conn->qp.active)) {
271 conn->qp.active = false;
/* Expose the actual received length to the receive callback. */
276 buf->sg[0].size = be32_to_cpu(cqe->byte_cnt);
277 mlx5_fpga_dbg(conn->fdev, "Message with %u bytes received successfully\n",
279 conn->recv_cb(conn->cb_arg, buf);
/* Restore the full buffer size before re-posting it. */
281 buf->sg[0].size = MLX5_FPGA_RECV_SIZE;
282 err = mlx5_fpga_conn_post_recv(conn, buf);
284 mlx5_fpga_warn(conn->fdev,
285 "Failed to re-post recv buf: %d\n", err);
/*
 * Handle a send completion.
 *
 * Under the SQ spinlock the completed buffer is looked up by the CQE's
 * wqe_counter and removed from sq.bufs[]; if the backlog is non-empty and
 * the QP is active, the first backlog entry is posted. After unlocking,
 * the completed buffer is DMA-unmapped, its complete() callback (if set) is
 * invoked with @status, and a non-zero @status marks the QP inactive.
 *
 * NOTE(review): the consumer-counter update and the branch structure around
 * the two log calls are on lines missing from this view.
 */
290 static void mlx5_fpga_conn_sq_cqe(struct mlx5_fpga_conn *conn,
291 struct mlx5_cqe64 *cqe, u8 status)
293 struct mlx5_fpga_dma_buf *buf, *nextbuf;
297 spin_lock_irqsave(&conn->qp.sq.lock, flags);
299 ix = be16_to_cpu(cqe->wqe_counter) & (conn->qp.sq.size - 1);
300 buf = conn->qp.sq.bufs[ix];
301 conn->qp.sq.bufs[ix] = NULL;
304 /* Handle backlog still under the spinlock to ensure message post order */
305 if (unlikely(!list_empty(&conn->qp.sq.backlog))) {
306 if (likely(conn->qp.active)) {
307 nextbuf = list_first_entry(&conn->qp.sq.backlog,
308 struct mlx5_fpga_dma_buf, list);
309 list_del(&nextbuf->list);
310 mlx5_fpga_conn_post_send(conn, nextbuf);
314 spin_unlock_irqrestore(&conn->qp.sq.lock, flags);
/* Flush errors are not reported at warning level. */
316 if (unlikely(status && (status != MLX5_CQE_SYNDROME_WR_FLUSH_ERR)))
317 mlx5_fpga_warn(conn->fdev, "SQ buf %p on FPGA QP %u completion status %d\n",
318 buf, conn->fpga_qpn, status);
320 mlx5_fpga_dbg(conn->fdev, "SQ buf %p on FPGA QP %u completion status %d\n",
321 buf, conn->fpga_qpn, status);
323 mlx5_fpga_conn_unmap_buf(conn, buf);
325 if (likely(buf->complete))
326 buf->complete(conn, conn->fdev, buf, status);
328 if (unlikely(status))
329 conn->qp.active = false;
/*
 * Dispatch one CQE by opcode.
 *
 * Error CQEs (MLX5_CQE_REQ_ERR / MLX5_CQE_RESP_ERR) take their status from
 * the error CQE's syndrome field; status otherwise starts as 0. Requester
 * completions go to the SQ handler, responder completions to the RQ
 * handler, and other opcodes are logged as unexpected.
 *
 * NOTE(review): the switch statement, some case labels and the break
 * statements are on lines missing from this view.
 */
332 static void mlx5_fpga_conn_handle_cqe(struct mlx5_fpga_conn *conn,
333 struct mlx5_cqe64 *cqe)
335 u8 opcode, status = 0;
337 opcode = get_cqe_opcode(cqe);
340 case MLX5_CQE_REQ_ERR:
341 status = ((struct mlx5_err_cqe *)cqe)->syndrome;
344 mlx5_fpga_conn_sq_cqe(conn, cqe, status);
347 case MLX5_CQE_RESP_ERR:
348 status = ((struct mlx5_err_cqe *)cqe)->syndrome;
350 case MLX5_CQE_RESP_SEND:
351 mlx5_fpga_conn_rq_cqe(conn, cqe, status);
354 mlx5_fpga_warn(conn->fdev, "Unexpected cqe opcode %u\n",
/*
 * Arm the connection's CQ via mlx5_cq_arm() with MLX5_CQ_DB_REQ_NOT, using
 * the connection resources' UAR mapping and the CQ's current consumer
 * counter.
 */
359 static void mlx5_fpga_conn_arm_cq(struct mlx5_fpga_conn *conn)
361 mlx5_cq_arm(&conn->cq.mcq, MLX5_CQ_DB_REQ_NOT,
362 conn->fdev->conn_res.uar->map, conn->cq.wq.cc);
/*
 * CQ event callback (installed as mcq.event): logs the event number and CQ
 * number at warning level. The owning connection is recovered from the
 * embedded mcq member.
 */
365 static void mlx5_fpga_conn_cq_event(struct mlx5_core_cq *mcq,
366 enum mlx5_event event)
368 struct mlx5_fpga_conn *conn;
370 conn = container_of(mcq, struct mlx5_fpga_conn, cq.mcq);
371 mlx5_fpga_warn(conn->fdev, "CQ event %u on CQ #%u\n", event, mcq->cqn);
/*
 * QP event callback (installed as mqp.event): logs the event number and QP
 * number at warning level. The owning connection is recovered from the
 * embedded mqp member.
 */
374 static void mlx5_fpga_conn_event(struct mlx5_core_qp *mqp, int event)
376 struct mlx5_fpga_conn *conn;
378 conn = container_of(mqp, struct mlx5_fpga_conn, qp.mqp);
379 mlx5_fpga_warn(conn->fdev, "QP event %u on QP #%u\n", event, mqp->qpn);
/*
 * Process completions from the connection's CQ.
 *
 * Visible steps: fetch a CQE, pop it from the CQ work queue, dispatch it,
 * and update the CQ doorbell record; the tasklet may be scheduled for
 * further processing, and the CQ is re-armed at the end.
 *
 * NOTE(review): the second parameter (callers pass MLX5_FPGA_CQ_BUDGET),
 * the loop and the conditions selecting between rescheduling the tasklet
 * and re-arming are on lines missing from this view.
 */
382 static inline void mlx5_fpga_conn_cqes(struct mlx5_fpga_conn *conn,
385 struct mlx5_cqe64 *cqe;
388 cqe = mlx5_cqwq_get_cqe(&conn->cq.wq);
393 mlx5_cqwq_pop(&conn->cq.wq);
394 mlx5_fpga_conn_handle_cqe(conn, cqe);
395 mlx5_cqwq_update_db_record(&conn->cq.wq);
398 tasklet_schedule(&conn->cq.tasklet);
402 mlx5_fpga_dbg(conn->fdev, "Re-arming CQ with cc# %u\n", conn->cq.wq.cc);
403 /* ensure cq space is freed before enabling more cqes */
405 mlx5_fpga_conn_arm_cq(conn);
/*
 * Tasklet body for CQ processing. @data is the connection pointer supplied
 * at tasklet_init() time. Completions are processed with a budget of
 * MLX5_FPGA_CQ_BUDGET; the QP's active flag is checked first.
 *
 * NOTE(review): the statement taken when the QP is inactive is on a line
 * missing from this view.
 */
408 static void mlx5_fpga_conn_cq_tasklet(unsigned long data)
410 struct mlx5_fpga_conn *conn = (void *)data;
412 if (unlikely(!conn->qp.active))
414 mlx5_fpga_conn_cqes(conn, MLX5_FPGA_CQ_BUDGET);
/*
 * CQ completion callback (installed as mcq.comp). Recovers the connection
 * from the embedded mcq member and processes completions with a budget of
 * MLX5_FPGA_CQ_BUDGET; the QP's active flag is checked first.
 *
 * NOTE(review): the statement taken when the QP is inactive is on a line
 * missing from this view.
 */
417 static void mlx5_fpga_conn_cq_complete(struct mlx5_core_cq *mcq,
418 struct mlx5_eqe *eqe)
420 struct mlx5_fpga_conn *conn;
422 conn = container_of(mcq, struct mlx5_fpga_conn, cq.mcq);
423 if (unlikely(!conn->qp.active))
425 mlx5_fpga_conn_cqes(conn, MLX5_FPGA_CQ_BUDGET);
/*
 * Create the completion queue for @conn with at least @cq_size entries
 * (rounded up to a power of two).
 *
 * Steps visible here: create the CQ work queue, mark every CQE as invalid
 * and hardware-owned, build the create_cq command (EQ number, UAR page,
 * page size, doorbell address, page list), create the CQ, then fill in the
 * mcq software fields (doorbells, callbacks, irq, uar) and initialise the
 * CQ tasklet.
 *
 * NOTE(review): error checks, labels, freeing of `in` and return statements
 * are on lines missing from this view; the trailing mlx5_wq_destroy() call
 * presumably belongs to the error-unwind path.
 * NOTE(review): smp_processor_id() selects the completion vector; confirm
 * the calling context makes that call valid.
 */
428 static int mlx5_fpga_conn_create_cq(struct mlx5_fpga_conn *conn, int cq_size)
430 struct mlx5_fpga_device *fdev = conn->fdev;
431 struct mlx5_core_dev *mdev = fdev->mdev;
432 u32 temp_cqc[MLX5_ST_SZ_DW(cqc)] = {0};
433 u32 out[MLX5_ST_SZ_DW(create_cq_out)];
434 struct mlx5_wq_param wqp;
435 struct mlx5_cqe64 *cqe;
442 cq_size = roundup_pow_of_two(cq_size);
/* temp_cqc only carries the size needed to create the work queue. */
443 MLX5_SET(cqc, temp_cqc, log_cq_size, ilog2(cq_size));
445 wqp.buf_numa_node = mdev->priv.numa_node;
446 wqp.db_numa_node = mdev->priv.numa_node;
448 err = mlx5_cqwq_create(mdev, &wqp, temp_cqc, &conn->cq.wq,
/* Initialise every CQE as invalid with the owner bit set. */
453 for (i = 0; i < mlx5_cqwq_get_size(&conn->cq.wq); i++) {
454 cqe = mlx5_cqwq_get_wqe(&conn->cq.wq, i);
455 cqe->op_own = MLX5_CQE_INVALID << 4 | MLX5_CQE_OWNER_MASK;
/* Command buffer: fixed create_cq_in part plus one u64 per buffer page. */
458 inlen = MLX5_ST_SZ_BYTES(create_cq_in) +
459 sizeof(u64) * conn->cq.wq_ctrl.buf.npages;
460 in = kvzalloc(inlen, GFP_KERNEL);
466 err = mlx5_vector2eqn(mdev, smp_processor_id(), &eqn, &irqn);
472 cqc = MLX5_ADDR_OF(create_cq_in, in, cq_context);
473 MLX5_SET(cqc, cqc, log_cq_size, ilog2(cq_size));
474 MLX5_SET(cqc, cqc, c_eqn, eqn);
475 MLX5_SET(cqc, cqc, uar_page, fdev->conn_res.uar->index);
476 MLX5_SET(cqc, cqc, log_page_size, conn->cq.wq_ctrl.buf.page_shift -
477 MLX5_ADAPTER_PAGE_SHIFT);
478 MLX5_SET64(cqc, cqc, dbr_addr, conn->cq.wq_ctrl.db.dma);
480 pas = (__be64 *)MLX5_ADDR_OF(create_cq_in, in, pas);
481 mlx5_fill_page_frag_array(&conn->cq.wq_ctrl.buf, pas);
483 err = mlx5_core_create_cq(mdev, &conn->cq.mcq, in, inlen, out, sizeof(out));
/* Software-side CQ state: doorbell pointers, callbacks, irq and UAR. */
489 conn->cq.mcq.cqe_sz = 64;
490 conn->cq.mcq.set_ci_db = conn->cq.wq_ctrl.db.db;
491 conn->cq.mcq.arm_db = conn->cq.wq_ctrl.db.db + 1;
492 *conn->cq.mcq.set_ci_db = 0;
493 *conn->cq.mcq.arm_db = 0;
494 conn->cq.mcq.vector = 0;
495 conn->cq.mcq.comp = mlx5_fpga_conn_cq_complete;
496 conn->cq.mcq.event = mlx5_fpga_conn_cq_event;
497 conn->cq.mcq.irqn = irqn;
498 conn->cq.mcq.uar = fdev->conn_res.uar;
499 tasklet_init(&conn->cq.tasklet, mlx5_fpga_conn_cq_tasklet,
500 (unsigned long)conn);
502 mlx5_fpga_dbg(fdev, "Created CQ #0x%x\n", conn->cq.mcq.cqn);
507 mlx5_wq_destroy(&conn->cq.wq_ctrl);
/*
 * Tear down the connection's CQ: stop the CQ tasklet, destroy the hardware
 * CQ, then free the CQ work queue.
 *
 * NOTE(review): tasklet_disable() is followed by tasklet_kill(); confirm
 * this cannot wait forever if the tasklet is still scheduled while
 * disabled (mlx5_fpga_conn_destroy() also disables it beforehand).
 */
512 static void mlx5_fpga_conn_destroy_cq(struct mlx5_fpga_conn *conn)
514 tasklet_disable(&conn->cq.tasklet);
515 tasklet_kill(&conn->cq.tasklet);
516 mlx5_core_destroy_cq(conn->fdev->mdev, &conn->cq.mcq);
517 mlx5_wq_destroy(&conn->cq.wq_ctrl);
/*
 * Create the QP work queue for @conn from the sizes encoded in @qpc, with
 * buffer and doorbell memory placed on the device's NUMA node. Returns the
 * result of mlx5_wq_qp_create().
 *
 * NOTE(review): the final argument(s) of the create call are on a line
 * missing from this view.
 */
520 static int mlx5_fpga_conn_create_wq(struct mlx5_fpga_conn *conn, void *qpc)
522 struct mlx5_fpga_device *fdev = conn->fdev;
523 struct mlx5_core_dev *mdev = fdev->mdev;
524 struct mlx5_wq_param wqp;
526 wqp.buf_numa_node = mdev->priv.numa_node;
527 wqp.db_numa_node = mdev->priv.numa_node;
529 return mlx5_wq_qp_create(mdev, &wqp, qpc, &conn->qp.wq,
/*
 * Create the host-side RC QP for @conn.
 *
 * @tx_size and @rx_size are rounded up to powers of two and become the SQ
 * and RQ ring sizes. The function creates the QP work queue, allocates the
 * rq.bufs[] and sq.bufs[] tracking arrays, builds the create_qp command
 * (UAR page, page size, PD, queue sizes, CQ numbers, doorbell address and
 * page list), creates the QP and installs the QP event callback.
 *
 * NOTE(review): error checks, labels, freeing of `in` and return statements
 * are on lines missing from this view; the trailing kvfree() and
 * mlx5_wq_destroy() calls presumably form the error-unwind path.
 */
533 static int mlx5_fpga_conn_create_qp(struct mlx5_fpga_conn *conn,
534 unsigned int tx_size, unsigned int rx_size)
536 struct mlx5_fpga_device *fdev = conn->fdev;
537 struct mlx5_core_dev *mdev = fdev->mdev;
538 u32 temp_qpc[MLX5_ST_SZ_DW(qpc)] = {0};
539 void *in = NULL, *qpc;
544 conn->qp.rq.size = roundup_pow_of_two(rx_size);
547 conn->qp.sq.size = roundup_pow_of_two(tx_size);
/* temp_qpc only carries the geometry needed to create the work queue. */
549 MLX5_SET(qpc, temp_qpc, log_rq_stride, ilog2(MLX5_SEND_WQE_DS) - 4);
550 MLX5_SET(qpc, temp_qpc, log_rq_size, ilog2(conn->qp.rq.size));
551 MLX5_SET(qpc, temp_qpc, log_sq_size, ilog2(conn->qp.sq.size));
552 err = mlx5_fpga_conn_create_wq(conn, temp_qpc);
/* One tracking slot per RQ entry. */
556 conn->qp.rq.bufs = kvcalloc(conn->qp.rq.size,
557 sizeof(conn->qp.rq.bufs[0]),
559 if (!conn->qp.rq.bufs) {
/* One tracking slot per SQ entry. */
564 conn->qp.sq.bufs = kvcalloc(conn->qp.sq.size,
565 sizeof(conn->qp.sq.bufs[0]),
567 if (!conn->qp.sq.bufs) {
/* Command buffer: fixed create_qp_in part plus one pas entry per page. */
572 inlen = MLX5_ST_SZ_BYTES(create_qp_in) +
573 MLX5_FLD_SZ_BYTES(create_qp_in, pas[0]) *
574 conn->qp.wq_ctrl.buf.npages;
575 in = kvzalloc(inlen, GFP_KERNEL);
581 qpc = MLX5_ADDR_OF(create_qp_in, in, qpc);
582 MLX5_SET(qpc, qpc, uar_page, fdev->conn_res.uar->index);
583 MLX5_SET(qpc, qpc, log_page_size,
584 conn->qp.wq_ctrl.buf.page_shift - MLX5_ADAPTER_PAGE_SHIFT);
585 MLX5_SET(qpc, qpc, fre, 1);
586 MLX5_SET(qpc, qpc, rlky, 1);
587 MLX5_SET(qpc, qpc, st, MLX5_QP_ST_RC);
588 MLX5_SET(qpc, qpc, pm_state, MLX5_QP_PM_MIGRATED);
589 MLX5_SET(qpc, qpc, pd, fdev->conn_res.pdn);
590 MLX5_SET(qpc, qpc, log_rq_stride, ilog2(MLX5_SEND_WQE_DS) - 4);
591 MLX5_SET(qpc, qpc, log_rq_size, ilog2(conn->qp.rq.size));
592 MLX5_SET(qpc, qpc, rq_type, MLX5_NON_ZERO_RQ);
593 MLX5_SET(qpc, qpc, log_sq_size, ilog2(conn->qp.sq.size));
/* Send and receive completions share the connection's single CQ. */
594 MLX5_SET(qpc, qpc, cqn_snd, conn->cq.mcq.cqn);
595 MLX5_SET(qpc, qpc, cqn_rcv, conn->cq.mcq.cqn);
596 MLX5_SET64(qpc, qpc, dbr_addr, conn->qp.wq_ctrl.db.dma);
597 if (MLX5_CAP_GEN(mdev, cqe_version) == 1)
598 MLX5_SET(qpc, qpc, user_index, 0xFFFFFF);
600 mlx5_fill_page_frag_array(&conn->qp.wq_ctrl.buf,
601 (__be64 *)MLX5_ADDR_OF(create_qp_in, in, pas));
603 err = mlx5_core_create_qp(mdev, &conn->qp.mqp, in, inlen);
607 conn->qp.mqp.event = mlx5_fpga_conn_event;
608 mlx5_fpga_dbg(fdev, "Created QP #0x%x\n", conn->qp.mqp.qpn);
613 kvfree(conn->qp.sq.bufs);
615 kvfree(conn->qp.rq.bufs);
617 mlx5_wq_destroy(&conn->qp.wq_ctrl);
/*
 * Walk every RQ tracking slot and, for each buffer found, DMA-unmap it,
 * free it with kfree() and clear the slot.
 *
 * NOTE(review): the statement taken for an empty slot is on a line missing
 * from this view.
 */
623 static void mlx5_fpga_conn_free_recv_bufs(struct mlx5_fpga_conn *conn)
627 for (ix = 0; ix < conn->qp.rq.size; ix++) {
628 if (!conn->qp.rq.bufs[ix])
630 mlx5_fpga_conn_unmap_buf(conn, conn->qp.rq.bufs[ix]);
631 kfree(conn->qp.rq.bufs[ix]);
632 conn->qp.rq.bufs[ix] = NULL;
/*
 * Complete all outstanding send buffers with a flush error.
 *
 * Buffers still recorded in sq.bufs[] are removed from their slot and
 * DMA-unmapped; buffers on the backlog list are DMA-unmapped as well. In
 * both cases the buffer's complete() callback is invoked with
 * MLX5_CQE_SYNDROME_WR_FLUSH_ERR.
 *
 * NOTE(review): the checks for empty slots and for a missing complete()
 * callback are on lines missing from this view.
 */
636 static void mlx5_fpga_conn_flush_send_bufs(struct mlx5_fpga_conn *conn)
638 struct mlx5_fpga_dma_buf *buf, *temp;
641 for (ix = 0; ix < conn->qp.sq.size; ix++) {
642 buf = conn->qp.sq.bufs[ix];
645 conn->qp.sq.bufs[ix] = NULL;
646 mlx5_fpga_conn_unmap_buf(conn, buf);
649 buf->complete(conn, conn->fdev, buf, MLX5_CQE_SYNDROME_WR_FLUSH_ERR);
/* The _safe iterator keeps the next entry in `temp` while visiting `buf`. */
651 list_for_each_entry_safe(buf, temp, &conn->qp.sq.backlog, list) {
652 mlx5_fpga_conn_unmap_buf(conn, buf);
655 buf->complete(conn, conn->fdev, buf, MLX5_CQE_SYNDROME_WR_FLUSH_ERR);
/*
 * Destroy the host-side QP of @conn. The hardware QP is destroyed first;
 * then remaining receive buffers are freed, outstanding send buffers are
 * flushed, the tracking arrays are released and the work queue is freed.
 */
659 static void mlx5_fpga_conn_destroy_qp(struct mlx5_fpga_conn *conn)
661 mlx5_core_destroy_qp(conn->fdev->mdev, &conn->qp.mqp);
662 mlx5_fpga_conn_free_recv_bufs(conn);
663 mlx5_fpga_conn_flush_send_bufs(conn);
664 kvfree(conn->qp.sq.bufs);
665 kvfree(conn->qp.rq.bufs);
666 mlx5_wq_destroy(&conn->qp.wq_ctrl);
/*
 * Move the host QP to the RESET state (MLX5_CMD_OP_2RST_QP) with no
 * optional-parameter mask and no QP context. Returns the result of
 * mlx5_core_qp_modify().
 *
 * NOTE(review): the final argument of the modify call is on a line missing
 * from this view.
 */
669 static inline int mlx5_fpga_conn_reset_qp(struct mlx5_fpga_conn *conn)
671 struct mlx5_core_dev *mdev = conn->fdev->mdev;
673 mlx5_fpga_dbg(conn->fdev, "Modifying QP %u to RST\n", conn->qp.mqp.qpn);
675 return mlx5_core_qp_modify(mdev, MLX5_CMD_OP_2RST_QP, 0, NULL,
/*
 * Move the host QP from RESET to INIT (MLX5_CMD_OP_RST2INIT_QP).
 *
 * A temporary QP context is allocated and filled with the service type,
 * path-migration state, pkey index, port number, PD, CQ numbers and
 * doorbell address. A failed modify is logged at warning level.
 *
 * NOTE(review): allocation-failure handling, freeing of `qpc` and the
 * return statement are on lines missing from this view.
 */
679 static inline int mlx5_fpga_conn_init_qp(struct mlx5_fpga_conn *conn)
681 struct mlx5_fpga_device *fdev = conn->fdev;
682 struct mlx5_core_dev *mdev = fdev->mdev;
686 mlx5_fpga_dbg(conn->fdev, "Modifying QP %u to INIT\n", conn->qp.mqp.qpn);
688 qpc = kzalloc(MLX5_ST_SZ_BYTES(qpc), GFP_KERNEL);
694 MLX5_SET(qpc, qpc, st, MLX5_QP_ST_RC);
695 MLX5_SET(qpc, qpc, pm_state, MLX5_QP_PM_MIGRATED);
696 MLX5_SET(qpc, qpc, primary_address_path.pkey_index, MLX5_FPGA_PKEY_INDEX);
697 MLX5_SET(qpc, qpc, primary_address_path.vhca_port_num, MLX5_FPGA_PORT_NUM);
698 MLX5_SET(qpc, qpc, pd, conn->fdev->conn_res.pdn);
699 MLX5_SET(qpc, qpc, cqn_snd, conn->cq.mcq.cqn);
700 MLX5_SET(qpc, qpc, cqn_rcv, conn->cq.mcq.cqn);
701 MLX5_SET64(qpc, qpc, dbr_addr, conn->qp.wq_ctrl.db.dma);
703 err = mlx5_core_qp_modify(mdev, MLX5_CMD_OP_RST2INIT_QP, 0, qpc,
706 mlx5_fpga_warn(fdev, "qp_modify RST2INIT failed: %d\n", err);
/*
 * Move the host QP from INIT to RTR (MLX5_CMD_OP_INIT2RTR_QP).
 *
 * A temporary QP context is allocated and filled with the MTU, maximum
 * message size, the FPGA QP number as remote QPN, the next receive PSN
 * (taken from the FPGA QP context's next_send_psn), and the primary address
 * path: pkey index, port, remote MAC and remote GID/IP copied from the FPGA
 * QP context, UDP source port, source GID index and hop limit. A failed
 * modify is logged at warning level, naming the INIT2RTR transition that
 * was actually attempted.
 *
 * NOTE(review): allocation-failure handling, freeing of `qpc` and the
 * return statement are on lines missing from this view.
 */
715 static inline int mlx5_fpga_conn_rtr_qp(struct mlx5_fpga_conn *conn)
717 struct mlx5_fpga_device *fdev = conn->fdev;
718 struct mlx5_core_dev *mdev = fdev->mdev;
722 mlx5_fpga_dbg(conn->fdev, "QP RTR\n");
724 qpc = kzalloc(MLX5_ST_SZ_BYTES(qpc), GFP_KERNEL);
730 MLX5_SET(qpc, qpc, mtu, MLX5_QPC_MTU_1K_BYTES);
731 MLX5_SET(qpc, qpc, log_msg_max, (u8)MLX5_CAP_GEN(mdev, log_max_msg));
732 MLX5_SET(qpc, qpc, remote_qpn, conn->fpga_qpn);
/* Our next expected receive PSN is the FPGA side's next send PSN. */
733 MLX5_SET(qpc, qpc, next_rcv_psn,
734 MLX5_GET(fpga_qpc, conn->fpga_qpc, next_send_psn));
735 MLX5_SET(qpc, qpc, primary_address_path.pkey_index, MLX5_FPGA_PKEY_INDEX);
736 MLX5_SET(qpc, qpc, primary_address_path.vhca_port_num, MLX5_FPGA_PORT_NUM);
/* Remote MAC of the path is the FPGA's MAC from the FPGA QP context. */
737 ether_addr_copy(MLX5_ADDR_OF(qpc, qpc, primary_address_path.rmac_47_32),
738 MLX5_ADDR_OF(fpga_qpc, conn->fpga_qpc, fpga_mac_47_32));
739 MLX5_SET(qpc, qpc, primary_address_path.udp_sport,
740 MLX5_CAP_ROCE(mdev, r_roce_min_src_udp_port));
741 MLX5_SET(qpc, qpc, primary_address_path.src_addr_index,
742 conn->qp.sgid_index);
743 MLX5_SET(qpc, qpc, primary_address_path.hop_limit, 0);
/* Remote GID/IP of the path is the FPGA's IP from the FPGA QP context. */
744 memcpy(MLX5_ADDR_OF(qpc, qpc, primary_address_path.rgid_rip),
745 MLX5_ADDR_OF(fpga_qpc, conn->fpga_qpc, fpga_ip),
746 MLX5_FLD_SZ_BYTES(qpc, primary_address_path.rgid_rip));
748 err = mlx5_core_qp_modify(mdev, MLX5_CMD_OP_INIT2RTR_QP, 0, qpc,
751 mlx5_fpga_warn(fdev, "qp_modify INIT2RTR failed: %d\n", err);
/*
 * Move the host QP from RTR to RTS (MLX5_CMD_OP_RTR2RTS_QP).
 *
 * A temporary QP context is allocated and filled with the ack request
 * frequency, minimum RNR NAK, ack timeout, retry counters and the next send
 * PSN (taken from the FPGA QP context's next_rcv_psn). The modify is issued
 * with the MLX5_QP_OPTPAR_RNR_TIMEOUT optional-parameter mask. A failed
 * modify is logged at warning level, naming the RTR2RTS transition that was
 * actually attempted.
 *
 * NOTE(review): allocation-failure handling, freeing of `qpc` and the
 * return statement are on lines missing from this view.
 */
760 static inline int mlx5_fpga_conn_rts_qp(struct mlx5_fpga_conn *conn)
762 struct mlx5_fpga_device *fdev = conn->fdev;
763 struct mlx5_core_dev *mdev = fdev->mdev;
768 mlx5_fpga_dbg(conn->fdev, "QP RTS\n");
770 qpc = kzalloc(MLX5_ST_SZ_BYTES(qpc), GFP_KERNEL);
776 MLX5_SET(qpc, qpc, log_ack_req_freq, 8);
777 MLX5_SET(qpc, qpc, min_rnr_nak, 0x12);
778 MLX5_SET(qpc, qpc, primary_address_path.ack_timeout, 0x12); /* ~1.07s */
/* Our next send PSN is the FPGA side's next expected receive PSN. */
779 MLX5_SET(qpc, qpc, next_send_psn,
780 MLX5_GET(fpga_qpc, conn->fpga_qpc, next_rcv_psn));
781 MLX5_SET(qpc, qpc, retry_count, 7);
782 MLX5_SET(qpc, qpc, rnr_retry, 7); /* Infinite retry if RNR NACK */
784 opt_mask = MLX5_QP_OPTPAR_RNR_TIMEOUT;
785 err = mlx5_core_qp_modify(mdev, MLX5_CMD_OP_RTR2RTS_QP, opt_mask, qpc,
788 mlx5_fpga_warn(fdev, "qp_modify RTR2RTS failed: %d\n", err);
/*
 * Bring both ends of the connection up.
 *
 * Order of operations: set the FPGA QP state to ACTIVE, reset the host QP,
 * move it to INIT, mark the connection active, post receive buffers until
 * posting fails, then move the host QP to RTR and to RTS. The tail of the
 * function frees receive buffers and reverts the FPGA QP to INIT.
 *
 * NOTE(review): error checks, gotos, labels and return statements are on
 * lines missing from this view, so which failures reach which part of the
 * unwind tail is not documented here.
 */
797 static int mlx5_fpga_conn_connect(struct mlx5_fpga_conn *conn)
799 struct mlx5_fpga_device *fdev = conn->fdev;
802 MLX5_SET(fpga_qpc, conn->fpga_qpc, state, MLX5_FPGA_QPC_STATE_ACTIVE);
803 err = mlx5_fpga_modify_qp(conn->fdev->mdev, conn->fpga_qpn,
804 MLX5_FPGA_QPC_STATE, &conn->fpga_qpc);
806 mlx5_fpga_err(fdev, "Failed to activate FPGA RC QP: %d\n", err);
810 err = mlx5_fpga_conn_reset_qp(conn);
812 mlx5_fpga_err(fdev, "Failed to change QP state to reset\n");
816 err = mlx5_fpga_conn_init_qp(conn);
818 mlx5_fpga_err(fdev, "Failed to modify QP from RESET to INIT\n");
821 conn->qp.active = true;
/* Keep posting receive buffers until a post reports failure. */
823 while (!mlx5_fpga_conn_post_recv_buf(conn))
826 err = mlx5_fpga_conn_rtr_qp(conn);
828 mlx5_fpga_err(fdev, "Failed to change QP state from INIT to RTR\n");
832 err = mlx5_fpga_conn_rts_qp(conn);
834 mlx5_fpga_err(fdev, "Failed to change QP state from RTR to RTS\n");
840 mlx5_fpga_conn_free_recv_bufs(conn);
842 MLX5_SET(fpga_qpc, conn->fpga_qpc, state, MLX5_FPGA_QPC_STATE_INIT);
843 if (mlx5_fpga_modify_qp(conn->fdev->mdev, conn->fpga_qpn,
844 MLX5_FPGA_QPC_STATE, &conn->fpga_qpc))
845 mlx5_fpga_err(fdev, "Failed to revert FPGA QP to INIT\n");
/*
 * Create a connection to the FPGA and return it, or an ERR_PTR() value
 * (-EINVAL and -ENOMEM are visible here).
 *
 * Visible sequence: allocate the connection, initialise the SQ backlog list
 * and lock, store the receive callback and its argument from @attr, query
 * the local MAC into the FPGA QP context's remote_mac field, derive the
 * remote_ip field from that MAC, reserve and program a RoCE GID, create and
 * arm the CQ (sized (tx_size + rx_size) * 2), create the host QP, fill the
 * FPGA QP context, create the FPGA QP and connect. The tail of the function
 * releases these resources in reverse order.
 *
 * NOTE(review): argument validation, error checks, gotos, labels and return
 * statements are on lines missing from this view.
 * NOTE(review): the multi-line comment that begins "Allow for one cqe" has
 * no visible terminator in this view; no further comments are added after
 * that point to avoid changing how the text is tokenised.
 */
850 struct mlx5_fpga_conn *mlx5_fpga_conn_create(struct mlx5_fpga_device *fdev,
851 struct mlx5_fpga_conn_attr *attr,
852 enum mlx5_ifc_fpga_qp_type qp_type)
854 struct mlx5_fpga_conn *ret, *conn;
855 u8 *remote_mac, *remote_ip;
859 return ERR_PTR(-EINVAL);
861 conn = kzalloc(sizeof(*conn), GFP_KERNEL);
863 return ERR_PTR(-ENOMEM);
866 INIT_LIST_HEAD(&conn->qp.sq.backlog);
868 spin_lock_init(&conn->qp.sq.lock);
870 conn->recv_cb = attr->recv_cb;
871 conn->cb_arg = attr->cb_arg;
/* The host's own MAC is stored as the "remote" MAC of the FPGA QP. */
873 remote_mac = MLX5_ADDR_OF(fpga_qpc, conn->fpga_qpc, remote_mac_47_32);
874 err = mlx5_query_mac_address(fdev->mdev, remote_mac);
876 mlx5_fpga_err(fdev, "Failed to query local MAC: %d\n", err);
881 /* Build Modified EUI-64 IPv6 address from the MAC address */
882 remote_ip = MLX5_ADDR_OF(fpga_qpc, conn->fpga_qpc, remote_ip);
885 addrconf_addr_eui48(&remote_ip[8], remote_mac);
887 err = mlx5_core_reserved_gid_alloc(fdev->mdev, &conn->qp.sgid_index);
889 mlx5_fpga_err(fdev, "Failed to allocate SGID: %d\n", err);
894 err = mlx5_core_roce_gid_set(fdev->mdev, conn->qp.sgid_index,
896 MLX5_ROCE_L3_TYPE_IPV6,
897 remote_ip, remote_mac, true, 0,
900 mlx5_fpga_err(fdev, "Failed to set SGID: %d\n", err);
904 mlx5_fpga_dbg(fdev, "Reserved SGID index %u\n", conn->qp.sgid_index);
906 /* Allow for one cqe per rx/tx wqe, plus one cqe for the next wqe,
907 * created during processing of the cqe
909 err = mlx5_fpga_conn_create_cq(conn,
910 (attr->tx_size + attr->rx_size) * 2);
912 mlx5_fpga_err(fdev, "Failed to create CQ: %d\n", err);
917 mlx5_fpga_conn_arm_cq(conn);
919 err = mlx5_fpga_conn_create_qp(conn, attr->tx_size, attr->rx_size);
921 mlx5_fpga_err(fdev, "Failed to create QP: %d\n", err);
926 MLX5_SET(fpga_qpc, conn->fpga_qpc, state, MLX5_FPGA_QPC_STATE_INIT);
927 MLX5_SET(fpga_qpc, conn->fpga_qpc, qp_type, qp_type);
928 MLX5_SET(fpga_qpc, conn->fpga_qpc, st, MLX5_FPGA_QPC_ST_RC);
929 MLX5_SET(fpga_qpc, conn->fpga_qpc, ether_type, ETH_P_8021Q);
930 MLX5_SET(fpga_qpc, conn->fpga_qpc, vid, 0);
931 MLX5_SET(fpga_qpc, conn->fpga_qpc, next_rcv_psn, 1);
932 MLX5_SET(fpga_qpc, conn->fpga_qpc, next_send_psn, 0);
933 MLX5_SET(fpga_qpc, conn->fpga_qpc, pkey, MLX5_FPGA_PKEY);
934 MLX5_SET(fpga_qpc, conn->fpga_qpc, remote_qpn, conn->qp.mqp.qpn);
935 MLX5_SET(fpga_qpc, conn->fpga_qpc, rnr_retry, 7);
936 MLX5_SET(fpga_qpc, conn->fpga_qpc, retry_count, 7);
938 err = mlx5_fpga_create_qp(fdev->mdev, &conn->fpga_qpc,
941 mlx5_fpga_err(fdev, "Failed to create FPGA RC QP: %d\n", err);
946 err = mlx5_fpga_conn_connect(conn);
952 mlx5_fpga_dbg(fdev, "FPGA QPN is %u\n", conn->fpga_qpn);
957 mlx5_fpga_destroy_qp(conn->fdev->mdev, conn->fpga_qpn);
959 mlx5_fpga_conn_destroy_qp(conn);
961 mlx5_fpga_conn_destroy_cq(conn);
963 mlx5_core_roce_gid_set(fdev->mdev, conn->qp.sgid_index, 0, 0, NULL,
964 NULL, false, 0, MLX5_FPGA_PORT_NUM);
966 mlx5_core_reserved_gid_free(fdev->mdev, conn->qp.sgid_index);
/*
 * Tear down a connection created by mlx5_fpga_conn_create().
 *
 * The connection is first marked inactive, the CQ tasklet is disabled and
 * the CQ's interrupt is synchronised, so completion processing stops. Then
 * the FPGA QP is destroyed, the host QP is moved to the error state
 * (failure is only logged), and the host QP, CQ and reserved GID are
 * released.
 *
 * NOTE(review): the final argument of the 2ERR modify call, its error check
 * and any freeing of `conn` are on lines missing from this view.
 */
973 void mlx5_fpga_conn_destroy(struct mlx5_fpga_conn *conn)
975 struct mlx5_fpga_device *fdev = conn->fdev;
976 struct mlx5_core_dev *mdev = fdev->mdev;
979 conn->qp.active = false;
980 tasklet_disable(&conn->cq.tasklet);
981 synchronize_irq(conn->cq.mcq.irqn);
983 mlx5_fpga_destroy_qp(conn->fdev->mdev, conn->fpga_qpn);
984 err = mlx5_core_qp_modify(mdev, MLX5_CMD_OP_2ERR_QP, 0, NULL,
987 mlx5_fpga_warn(fdev, "qp_modify 2ERR failed: %d\n", err);
988 mlx5_fpga_conn_destroy_qp(conn);
989 mlx5_fpga_conn_destroy_cq(conn);
/* Clear the GID entry before returning the reserved index. */
991 mlx5_core_roce_gid_set(conn->fdev->mdev, conn->qp.sgid_index, 0, 0,
992 NULL, NULL, false, 0, MLX5_FPGA_PORT_NUM);
993 mlx5_core_reserved_gid_free(conn->fdev->mdev, conn->qp.sgid_index);
/*
 * Set up the per-device resources shared by all FPGA connections: enable
 * RoCE on the NIC vport, obtain a UAR page, allocate a protection domain
 * and create the memory key. Each failure is logged; the tail of the
 * function releases the PD, the UAR page and RoCE in reverse order.
 *
 * NOTE(review): most gotos, labels and return statements are on lines
 * missing from this view.
 */
997 int mlx5_fpga_conn_device_init(struct mlx5_fpga_device *fdev)
1001 err = mlx5_nic_vport_enable_roce(fdev->mdev);
1003 mlx5_fpga_err(fdev, "Failed to enable RoCE: %d\n", err);
1007 fdev->conn_res.uar = mlx5_get_uars_page(fdev->mdev);
/* The UAR getter reports failure through an ERR_PTR-encoded pointer. */
1008 if (IS_ERR(fdev->conn_res.uar)) {
1009 err = PTR_ERR(fdev->conn_res.uar);
1010 mlx5_fpga_err(fdev, "get_uars_page failed, %d\n", err);
1013 mlx5_fpga_dbg(fdev, "Allocated UAR index %u\n",
1014 fdev->conn_res.uar->index);
1016 err = mlx5_core_alloc_pd(fdev->mdev, &fdev->conn_res.pdn);
1018 mlx5_fpga_err(fdev, "alloc pd failed, %d\n", err);
1021 mlx5_fpga_dbg(fdev, "Allocated PD %u\n", fdev->conn_res.pdn);
1023 err = mlx5_fpga_conn_create_mkey(fdev->mdev, fdev->conn_res.pdn,
1024 &fdev->conn_res.mkey);
1026 mlx5_fpga_err(fdev, "create mkey failed, %d\n", err);
1027 goto err_dealloc_pd;
1029 mlx5_fpga_dbg(fdev, "Created mkey 0x%x\n", fdev->conn_res.mkey.key);
1034 mlx5_core_dealloc_pd(fdev->mdev, fdev->conn_res.pdn);
1036 mlx5_put_uars_page(fdev->mdev, fdev->conn_res.uar);
1038 mlx5_nic_vport_disable_roce(fdev->mdev);
/*
 * Release the per-device connection resources in the reverse order of
 * mlx5_fpga_conn_device_init(): memory key, protection domain, UAR page,
 * and finally RoCE on the NIC vport.
 */
1043 void mlx5_fpga_conn_device_cleanup(struct mlx5_fpga_device *fdev)
1045 mlx5_core_destroy_mkey(fdev->mdev, &fdev->conn_res.mkey);
1046 mlx5_core_dealloc_pd(fdev->mdev, fdev->conn_res.pdn);
1047 mlx5_put_uars_page(fdev->mdev, fdev->conn_res.uar);
1048 mlx5_nic_vport_disable_roce(fdev->mdev);