ac1d68296b
Convert to the much saner new idr interface. Signed-off-by: Tejun Heo <tj@kernel.org> Reviewed-by: Steve Wise <swise@opengridcomputing.com> Cc: Tom Tucker <tom@opengridcomputing.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
1026 lines
24 KiB
C
1026 lines
24 KiB
C
/*
|
|
* Copyright (c) 2004 Topspin Communications. All rights reserved.
|
|
* Copyright (c) 2005 Cisco Systems. All rights reserved.
|
|
* Copyright (c) 2005 Mellanox Technologies. All rights reserved.
|
|
* Copyright (c) 2004 Voltaire, Inc. All rights reserved.
|
|
* Copyright (c) 2005 Open Grid Computing, Inc. All rights reserved.
|
|
*
|
|
* This software is available to you under a choice of one of two
|
|
* licenses. You may choose to be licensed under the terms of the GNU
|
|
* General Public License (GPL) Version 2, available from the file
|
|
* COPYING in the main directory of this source tree, or the
|
|
* OpenIB.org BSD license below:
|
|
*
|
|
* Redistribution and use in source and binary forms, with or
|
|
* without modification, are permitted provided that the following
|
|
* conditions are met:
|
|
*
|
|
* - Redistributions of source code must retain the above
|
|
* copyright notice, this list of conditions and the following
|
|
* disclaimer.
|
|
*
|
|
* - Redistributions in binary form must reproduce the above
|
|
* copyright notice, this list of conditions and the following
|
|
* disclaimer in the documentation and/or other materials
|
|
* provided with the distribution.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
|
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
|
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
|
|
* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
|
|
* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
|
|
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
* SOFTWARE.
|
|
*
|
|
*/
|
|
|
|
#include <linux/delay.h>
|
|
#include <linux/gfp.h>
|
|
|
|
#include "c2.h"
|
|
#include "c2_vq.h"
|
|
#include "c2_status.h"
|
|
|
|
#define C2_MAX_ORD_PER_QP 128
|
|
#define C2_MAX_IRD_PER_QP 128
|
|
|
|
#define C2_HINT_MAKE(q_index, hint_count) (((q_index) << 16) | hint_count)
|
|
#define C2_HINT_GET_INDEX(hint) (((hint) & 0x7FFF0000) >> 16)
|
|
#define C2_HINT_GET_COUNT(hint) ((hint) & 0x0000FFFF)
|
|
|
|
#define NO_SUPPORT -1
|
|
static const u8 c2_opcode[] = {
|
|
[IB_WR_SEND] = C2_WR_TYPE_SEND,
|
|
[IB_WR_SEND_WITH_IMM] = NO_SUPPORT,
|
|
[IB_WR_RDMA_WRITE] = C2_WR_TYPE_RDMA_WRITE,
|
|
[IB_WR_RDMA_WRITE_WITH_IMM] = NO_SUPPORT,
|
|
[IB_WR_RDMA_READ] = C2_WR_TYPE_RDMA_READ,
|
|
[IB_WR_ATOMIC_CMP_AND_SWP] = NO_SUPPORT,
|
|
[IB_WR_ATOMIC_FETCH_AND_ADD] = NO_SUPPORT,
|
|
};
|
|
|
|
static int to_c2_state(enum ib_qp_state ib_state)
|
|
{
|
|
switch (ib_state) {
|
|
case IB_QPS_RESET:
|
|
return C2_QP_STATE_IDLE;
|
|
case IB_QPS_RTS:
|
|
return C2_QP_STATE_RTS;
|
|
case IB_QPS_SQD:
|
|
return C2_QP_STATE_CLOSING;
|
|
case IB_QPS_SQE:
|
|
return C2_QP_STATE_CLOSING;
|
|
case IB_QPS_ERR:
|
|
return C2_QP_STATE_ERROR;
|
|
default:
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
static int to_ib_state(enum c2_qp_state c2_state)
|
|
{
|
|
switch (c2_state) {
|
|
case C2_QP_STATE_IDLE:
|
|
return IB_QPS_RESET;
|
|
case C2_QP_STATE_CONNECTING:
|
|
return IB_QPS_RTR;
|
|
case C2_QP_STATE_RTS:
|
|
return IB_QPS_RTS;
|
|
case C2_QP_STATE_CLOSING:
|
|
return IB_QPS_SQD;
|
|
case C2_QP_STATE_ERROR:
|
|
return IB_QPS_ERR;
|
|
case C2_QP_STATE_TERMINATE:
|
|
return IB_QPS_SQE;
|
|
default:
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
static const char *to_ib_state_str(int ib_state)
|
|
{
|
|
static const char *state_str[] = {
|
|
"IB_QPS_RESET",
|
|
"IB_QPS_INIT",
|
|
"IB_QPS_RTR",
|
|
"IB_QPS_RTS",
|
|
"IB_QPS_SQD",
|
|
"IB_QPS_SQE",
|
|
"IB_QPS_ERR"
|
|
};
|
|
if (ib_state < IB_QPS_RESET ||
|
|
ib_state > IB_QPS_ERR)
|
|
return "<invalid IB QP state>";
|
|
|
|
ib_state -= IB_QPS_RESET;
|
|
return state_str[ib_state];
|
|
}
|
|
|
|
void c2_set_qp_state(struct c2_qp *qp, int c2_state)
|
|
{
|
|
int new_state = to_ib_state(c2_state);
|
|
|
|
pr_debug("%s: qp[%p] state modify %s --> %s\n",
|
|
__func__,
|
|
qp,
|
|
to_ib_state_str(qp->state),
|
|
to_ib_state_str(new_state));
|
|
qp->state = new_state;
|
|
}
|
|
|
|
#define C2_QP_NO_ATTR_CHANGE 0xFFFFFFFF
|
|
|
|
int c2_qp_modify(struct c2_dev *c2dev, struct c2_qp *qp,
|
|
struct ib_qp_attr *attr, int attr_mask)
|
|
{
|
|
struct c2wr_qp_modify_req wr;
|
|
struct c2wr_qp_modify_rep *reply;
|
|
struct c2_vq_req *vq_req;
|
|
unsigned long flags;
|
|
u8 next_state;
|
|
int err;
|
|
|
|
pr_debug("%s:%d qp=%p, %s --> %s\n",
|
|
__func__, __LINE__,
|
|
qp,
|
|
to_ib_state_str(qp->state),
|
|
to_ib_state_str(attr->qp_state));
|
|
|
|
vq_req = vq_req_alloc(c2dev);
|
|
if (!vq_req)
|
|
return -ENOMEM;
|
|
|
|
c2_wr_set_id(&wr, CCWR_QP_MODIFY);
|
|
wr.hdr.context = (unsigned long) vq_req;
|
|
wr.rnic_handle = c2dev->adapter_handle;
|
|
wr.qp_handle = qp->adapter_handle;
|
|
wr.ord = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
|
|
wr.ird = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
|
|
wr.sq_depth = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
|
|
wr.rq_depth = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
|
|
|
|
if (attr_mask & IB_QP_STATE) {
|
|
/* Ensure the state is valid */
|
|
if (attr->qp_state < 0 || attr->qp_state > IB_QPS_ERR) {
|
|
err = -EINVAL;
|
|
goto bail0;
|
|
}
|
|
|
|
wr.next_qp_state = cpu_to_be32(to_c2_state(attr->qp_state));
|
|
|
|
if (attr->qp_state == IB_QPS_ERR) {
|
|
spin_lock_irqsave(&qp->lock, flags);
|
|
if (qp->cm_id && qp->state == IB_QPS_RTS) {
|
|
pr_debug("Generating CLOSE event for QP-->ERR, "
|
|
"qp=%p, cm_id=%p\n",qp,qp->cm_id);
|
|
/* Generate an CLOSE event */
|
|
vq_req->cm_id = qp->cm_id;
|
|
vq_req->event = IW_CM_EVENT_CLOSE;
|
|
}
|
|
spin_unlock_irqrestore(&qp->lock, flags);
|
|
}
|
|
next_state = attr->qp_state;
|
|
|
|
} else if (attr_mask & IB_QP_CUR_STATE) {
|
|
|
|
if (attr->cur_qp_state != IB_QPS_RTR &&
|
|
attr->cur_qp_state != IB_QPS_RTS &&
|
|
attr->cur_qp_state != IB_QPS_SQD &&
|
|
attr->cur_qp_state != IB_QPS_SQE) {
|
|
err = -EINVAL;
|
|
goto bail0;
|
|
} else
|
|
wr.next_qp_state =
|
|
cpu_to_be32(to_c2_state(attr->cur_qp_state));
|
|
|
|
next_state = attr->cur_qp_state;
|
|
|
|
} else {
|
|
err = 0;
|
|
goto bail0;
|
|
}
|
|
|
|
/* reference the request struct */
|
|
vq_req_get(c2dev, vq_req);
|
|
|
|
err = vq_send_wr(c2dev, (union c2wr *) & wr);
|
|
if (err) {
|
|
vq_req_put(c2dev, vq_req);
|
|
goto bail0;
|
|
}
|
|
|
|
err = vq_wait_for_reply(c2dev, vq_req);
|
|
if (err)
|
|
goto bail0;
|
|
|
|
reply = (struct c2wr_qp_modify_rep *) (unsigned long) vq_req->reply_msg;
|
|
if (!reply) {
|
|
err = -ENOMEM;
|
|
goto bail0;
|
|
}
|
|
|
|
err = c2_errno(reply);
|
|
if (!err)
|
|
qp->state = next_state;
|
|
#ifdef DEBUG
|
|
else
|
|
pr_debug("%s: c2_errno=%d\n", __func__, err);
|
|
#endif
|
|
/*
|
|
* If we're going to error and generating the event here, then
|
|
* we need to remove the reference because there will be no
|
|
* close event generated by the adapter
|
|
*/
|
|
spin_lock_irqsave(&qp->lock, flags);
|
|
if (vq_req->event==IW_CM_EVENT_CLOSE && qp->cm_id) {
|
|
qp->cm_id->rem_ref(qp->cm_id);
|
|
qp->cm_id = NULL;
|
|
}
|
|
spin_unlock_irqrestore(&qp->lock, flags);
|
|
|
|
vq_repbuf_free(c2dev, reply);
|
|
bail0:
|
|
vq_req_free(c2dev, vq_req);
|
|
|
|
pr_debug("%s:%d qp=%p, cur_state=%s\n",
|
|
__func__, __LINE__,
|
|
qp,
|
|
to_ib_state_str(qp->state));
|
|
return err;
|
|
}
|
|
|
|
int c2_qp_set_read_limits(struct c2_dev *c2dev, struct c2_qp *qp,
|
|
int ord, int ird)
|
|
{
|
|
struct c2wr_qp_modify_req wr;
|
|
struct c2wr_qp_modify_rep *reply;
|
|
struct c2_vq_req *vq_req;
|
|
int err;
|
|
|
|
vq_req = vq_req_alloc(c2dev);
|
|
if (!vq_req)
|
|
return -ENOMEM;
|
|
|
|
c2_wr_set_id(&wr, CCWR_QP_MODIFY);
|
|
wr.hdr.context = (unsigned long) vq_req;
|
|
wr.rnic_handle = c2dev->adapter_handle;
|
|
wr.qp_handle = qp->adapter_handle;
|
|
wr.ord = cpu_to_be32(ord);
|
|
wr.ird = cpu_to_be32(ird);
|
|
wr.sq_depth = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
|
|
wr.rq_depth = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
|
|
wr.next_qp_state = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
|
|
|
|
/* reference the request struct */
|
|
vq_req_get(c2dev, vq_req);
|
|
|
|
err = vq_send_wr(c2dev, (union c2wr *) & wr);
|
|
if (err) {
|
|
vq_req_put(c2dev, vq_req);
|
|
goto bail0;
|
|
}
|
|
|
|
err = vq_wait_for_reply(c2dev, vq_req);
|
|
if (err)
|
|
goto bail0;
|
|
|
|
reply = (struct c2wr_qp_modify_rep *) (unsigned long)
|
|
vq_req->reply_msg;
|
|
if (!reply) {
|
|
err = -ENOMEM;
|
|
goto bail0;
|
|
}
|
|
|
|
err = c2_errno(reply);
|
|
vq_repbuf_free(c2dev, reply);
|
|
bail0:
|
|
vq_req_free(c2dev, vq_req);
|
|
return err;
|
|
}
|
|
|
|
static int destroy_qp(struct c2_dev *c2dev, struct c2_qp *qp)
|
|
{
|
|
struct c2_vq_req *vq_req;
|
|
struct c2wr_qp_destroy_req wr;
|
|
struct c2wr_qp_destroy_rep *reply;
|
|
unsigned long flags;
|
|
int err;
|
|
|
|
/*
|
|
* Allocate a verb request message
|
|
*/
|
|
vq_req = vq_req_alloc(c2dev);
|
|
if (!vq_req) {
|
|
return -ENOMEM;
|
|
}
|
|
|
|
/*
|
|
* Initialize the WR
|
|
*/
|
|
c2_wr_set_id(&wr, CCWR_QP_DESTROY);
|
|
wr.hdr.context = (unsigned long) vq_req;
|
|
wr.rnic_handle = c2dev->adapter_handle;
|
|
wr.qp_handle = qp->adapter_handle;
|
|
|
|
/*
|
|
* reference the request struct. dereferenced in the int handler.
|
|
*/
|
|
vq_req_get(c2dev, vq_req);
|
|
|
|
spin_lock_irqsave(&qp->lock, flags);
|
|
if (qp->cm_id && qp->state == IB_QPS_RTS) {
|
|
pr_debug("destroy_qp: generating CLOSE event for QP-->ERR, "
|
|
"qp=%p, cm_id=%p\n",qp,qp->cm_id);
|
|
/* Generate an CLOSE event */
|
|
vq_req->qp = qp;
|
|
vq_req->cm_id = qp->cm_id;
|
|
vq_req->event = IW_CM_EVENT_CLOSE;
|
|
}
|
|
spin_unlock_irqrestore(&qp->lock, flags);
|
|
|
|
/*
|
|
* Send WR to adapter
|
|
*/
|
|
err = vq_send_wr(c2dev, (union c2wr *) & wr);
|
|
if (err) {
|
|
vq_req_put(c2dev, vq_req);
|
|
goto bail0;
|
|
}
|
|
|
|
/*
|
|
* Wait for reply from adapter
|
|
*/
|
|
err = vq_wait_for_reply(c2dev, vq_req);
|
|
if (err) {
|
|
goto bail0;
|
|
}
|
|
|
|
/*
|
|
* Process reply
|
|
*/
|
|
reply = (struct c2wr_qp_destroy_rep *) (unsigned long) (vq_req->reply_msg);
|
|
if (!reply) {
|
|
err = -ENOMEM;
|
|
goto bail0;
|
|
}
|
|
|
|
spin_lock_irqsave(&qp->lock, flags);
|
|
if (qp->cm_id) {
|
|
qp->cm_id->rem_ref(qp->cm_id);
|
|
qp->cm_id = NULL;
|
|
}
|
|
spin_unlock_irqrestore(&qp->lock, flags);
|
|
|
|
vq_repbuf_free(c2dev, reply);
|
|
bail0:
|
|
vq_req_free(c2dev, vq_req);
|
|
return err;
|
|
}
|
|
|
|
static int c2_alloc_qpn(struct c2_dev *c2dev, struct c2_qp *qp)
|
|
{
|
|
int ret;
|
|
|
|
idr_preload(GFP_KERNEL);
|
|
spin_lock_irq(&c2dev->qp_table.lock);
|
|
|
|
ret = idr_alloc(&c2dev->qp_table.idr, qp, c2dev->qp_table.last++, 0,
|
|
GFP_NOWAIT);
|
|
if (ret >= 0)
|
|
qp->qpn = ret;
|
|
|
|
spin_unlock_irq(&c2dev->qp_table.lock);
|
|
idr_preload_end();
|
|
return ret < 0 ? ret : 0;
|
|
}
|
|
|
|
static void c2_free_qpn(struct c2_dev *c2dev, int qpn)
|
|
{
|
|
spin_lock_irq(&c2dev->qp_table.lock);
|
|
idr_remove(&c2dev->qp_table.idr, qpn);
|
|
spin_unlock_irq(&c2dev->qp_table.lock);
|
|
}
|
|
|
|
struct c2_qp *c2_find_qpn(struct c2_dev *c2dev, int qpn)
|
|
{
|
|
unsigned long flags;
|
|
struct c2_qp *qp;
|
|
|
|
spin_lock_irqsave(&c2dev->qp_table.lock, flags);
|
|
qp = idr_find(&c2dev->qp_table.idr, qpn);
|
|
spin_unlock_irqrestore(&c2dev->qp_table.lock, flags);
|
|
return qp;
|
|
}
|
|
|
|
int c2_alloc_qp(struct c2_dev *c2dev,
|
|
struct c2_pd *pd,
|
|
struct ib_qp_init_attr *qp_attrs, struct c2_qp *qp)
|
|
{
|
|
struct c2wr_qp_create_req wr;
|
|
struct c2wr_qp_create_rep *reply;
|
|
struct c2_vq_req *vq_req;
|
|
struct c2_cq *send_cq = to_c2cq(qp_attrs->send_cq);
|
|
struct c2_cq *recv_cq = to_c2cq(qp_attrs->recv_cq);
|
|
unsigned long peer_pa;
|
|
u32 q_size, msg_size, mmap_size;
|
|
void __iomem *mmap;
|
|
int err;
|
|
|
|
err = c2_alloc_qpn(c2dev, qp);
|
|
if (err)
|
|
return err;
|
|
qp->ibqp.qp_num = qp->qpn;
|
|
qp->ibqp.qp_type = IB_QPT_RC;
|
|
|
|
/* Allocate the SQ and RQ shared pointers */
|
|
qp->sq_mq.shared = c2_alloc_mqsp(c2dev, c2dev->kern_mqsp_pool,
|
|
&qp->sq_mq.shared_dma, GFP_KERNEL);
|
|
if (!qp->sq_mq.shared) {
|
|
err = -ENOMEM;
|
|
goto bail0;
|
|
}
|
|
|
|
qp->rq_mq.shared = c2_alloc_mqsp(c2dev, c2dev->kern_mqsp_pool,
|
|
&qp->rq_mq.shared_dma, GFP_KERNEL);
|
|
if (!qp->rq_mq.shared) {
|
|
err = -ENOMEM;
|
|
goto bail1;
|
|
}
|
|
|
|
/* Allocate the verbs request */
|
|
vq_req = vq_req_alloc(c2dev);
|
|
if (vq_req == NULL) {
|
|
err = -ENOMEM;
|
|
goto bail2;
|
|
}
|
|
|
|
/* Initialize the work request */
|
|
memset(&wr, 0, sizeof(wr));
|
|
c2_wr_set_id(&wr, CCWR_QP_CREATE);
|
|
wr.hdr.context = (unsigned long) vq_req;
|
|
wr.rnic_handle = c2dev->adapter_handle;
|
|
wr.sq_cq_handle = send_cq->adapter_handle;
|
|
wr.rq_cq_handle = recv_cq->adapter_handle;
|
|
wr.sq_depth = cpu_to_be32(qp_attrs->cap.max_send_wr + 1);
|
|
wr.rq_depth = cpu_to_be32(qp_attrs->cap.max_recv_wr + 1);
|
|
wr.srq_handle = 0;
|
|
wr.flags = cpu_to_be32(QP_RDMA_READ | QP_RDMA_WRITE | QP_MW_BIND |
|
|
QP_ZERO_STAG | QP_RDMA_READ_RESPONSE);
|
|
wr.send_sgl_depth = cpu_to_be32(qp_attrs->cap.max_send_sge);
|
|
wr.recv_sgl_depth = cpu_to_be32(qp_attrs->cap.max_recv_sge);
|
|
wr.rdma_write_sgl_depth = cpu_to_be32(qp_attrs->cap.max_send_sge);
|
|
wr.shared_sq_ht = cpu_to_be64(qp->sq_mq.shared_dma);
|
|
wr.shared_rq_ht = cpu_to_be64(qp->rq_mq.shared_dma);
|
|
wr.ord = cpu_to_be32(C2_MAX_ORD_PER_QP);
|
|
wr.ird = cpu_to_be32(C2_MAX_IRD_PER_QP);
|
|
wr.pd_id = pd->pd_id;
|
|
wr.user_context = (unsigned long) qp;
|
|
|
|
vq_req_get(c2dev, vq_req);
|
|
|
|
/* Send the WR to the adapter */
|
|
err = vq_send_wr(c2dev, (union c2wr *) & wr);
|
|
if (err) {
|
|
vq_req_put(c2dev, vq_req);
|
|
goto bail3;
|
|
}
|
|
|
|
/* Wait for the verb reply */
|
|
err = vq_wait_for_reply(c2dev, vq_req);
|
|
if (err) {
|
|
goto bail3;
|
|
}
|
|
|
|
/* Process the reply */
|
|
reply = (struct c2wr_qp_create_rep *) (unsigned long) (vq_req->reply_msg);
|
|
if (!reply) {
|
|
err = -ENOMEM;
|
|
goto bail3;
|
|
}
|
|
|
|
if ((err = c2_wr_get_result(reply)) != 0) {
|
|
goto bail4;
|
|
}
|
|
|
|
/* Fill in the kernel QP struct */
|
|
atomic_set(&qp->refcount, 1);
|
|
qp->adapter_handle = reply->qp_handle;
|
|
qp->state = IB_QPS_RESET;
|
|
qp->send_sgl_depth = qp_attrs->cap.max_send_sge;
|
|
qp->rdma_write_sgl_depth = qp_attrs->cap.max_send_sge;
|
|
qp->recv_sgl_depth = qp_attrs->cap.max_recv_sge;
|
|
init_waitqueue_head(&qp->wait);
|
|
|
|
/* Initialize the SQ MQ */
|
|
q_size = be32_to_cpu(reply->sq_depth);
|
|
msg_size = be32_to_cpu(reply->sq_msg_size);
|
|
peer_pa = c2dev->pa + be32_to_cpu(reply->sq_mq_start);
|
|
mmap_size = PAGE_ALIGN(sizeof(struct c2_mq_shared) + msg_size * q_size);
|
|
mmap = ioremap_nocache(peer_pa, mmap_size);
|
|
if (!mmap) {
|
|
err = -ENOMEM;
|
|
goto bail5;
|
|
}
|
|
|
|
c2_mq_req_init(&qp->sq_mq,
|
|
be32_to_cpu(reply->sq_mq_index),
|
|
q_size,
|
|
msg_size,
|
|
mmap + sizeof(struct c2_mq_shared), /* pool start */
|
|
mmap, /* peer */
|
|
C2_MQ_ADAPTER_TARGET);
|
|
|
|
/* Initialize the RQ mq */
|
|
q_size = be32_to_cpu(reply->rq_depth);
|
|
msg_size = be32_to_cpu(reply->rq_msg_size);
|
|
peer_pa = c2dev->pa + be32_to_cpu(reply->rq_mq_start);
|
|
mmap_size = PAGE_ALIGN(sizeof(struct c2_mq_shared) + msg_size * q_size);
|
|
mmap = ioremap_nocache(peer_pa, mmap_size);
|
|
if (!mmap) {
|
|
err = -ENOMEM;
|
|
goto bail6;
|
|
}
|
|
|
|
c2_mq_req_init(&qp->rq_mq,
|
|
be32_to_cpu(reply->rq_mq_index),
|
|
q_size,
|
|
msg_size,
|
|
mmap + sizeof(struct c2_mq_shared), /* pool start */
|
|
mmap, /* peer */
|
|
C2_MQ_ADAPTER_TARGET);
|
|
|
|
vq_repbuf_free(c2dev, reply);
|
|
vq_req_free(c2dev, vq_req);
|
|
|
|
return 0;
|
|
|
|
bail6:
|
|
iounmap(qp->sq_mq.peer);
|
|
bail5:
|
|
destroy_qp(c2dev, qp);
|
|
bail4:
|
|
vq_repbuf_free(c2dev, reply);
|
|
bail3:
|
|
vq_req_free(c2dev, vq_req);
|
|
bail2:
|
|
c2_free_mqsp(qp->rq_mq.shared);
|
|
bail1:
|
|
c2_free_mqsp(qp->sq_mq.shared);
|
|
bail0:
|
|
c2_free_qpn(c2dev, qp->qpn);
|
|
return err;
|
|
}
|
|
|
|
static inline void c2_lock_cqs(struct c2_cq *send_cq, struct c2_cq *recv_cq)
|
|
{
|
|
if (send_cq == recv_cq)
|
|
spin_lock_irq(&send_cq->lock);
|
|
else if (send_cq > recv_cq) {
|
|
spin_lock_irq(&send_cq->lock);
|
|
spin_lock_nested(&recv_cq->lock, SINGLE_DEPTH_NESTING);
|
|
} else {
|
|
spin_lock_irq(&recv_cq->lock);
|
|
spin_lock_nested(&send_cq->lock, SINGLE_DEPTH_NESTING);
|
|
}
|
|
}
|
|
|
|
static inline void c2_unlock_cqs(struct c2_cq *send_cq, struct c2_cq *recv_cq)
|
|
{
|
|
if (send_cq == recv_cq)
|
|
spin_unlock_irq(&send_cq->lock);
|
|
else if (send_cq > recv_cq) {
|
|
spin_unlock(&recv_cq->lock);
|
|
spin_unlock_irq(&send_cq->lock);
|
|
} else {
|
|
spin_unlock(&send_cq->lock);
|
|
spin_unlock_irq(&recv_cq->lock);
|
|
}
|
|
}
|
|
|
|
void c2_free_qp(struct c2_dev *c2dev, struct c2_qp *qp)
|
|
{
|
|
struct c2_cq *send_cq;
|
|
struct c2_cq *recv_cq;
|
|
|
|
send_cq = to_c2cq(qp->ibqp.send_cq);
|
|
recv_cq = to_c2cq(qp->ibqp.recv_cq);
|
|
|
|
/*
|
|
* Lock CQs here, so that CQ polling code can do QP lookup
|
|
* without taking a lock.
|
|
*/
|
|
c2_lock_cqs(send_cq, recv_cq);
|
|
c2_free_qpn(c2dev, qp->qpn);
|
|
c2_unlock_cqs(send_cq, recv_cq);
|
|
|
|
/*
|
|
* Destroy qp in the rnic...
|
|
*/
|
|
destroy_qp(c2dev, qp);
|
|
|
|
/*
|
|
* Mark any unreaped CQEs as null and void.
|
|
*/
|
|
c2_cq_clean(c2dev, qp, send_cq->cqn);
|
|
if (send_cq != recv_cq)
|
|
c2_cq_clean(c2dev, qp, recv_cq->cqn);
|
|
/*
|
|
* Unmap the MQs and return the shared pointers
|
|
* to the message pool.
|
|
*/
|
|
iounmap(qp->sq_mq.peer);
|
|
iounmap(qp->rq_mq.peer);
|
|
c2_free_mqsp(qp->sq_mq.shared);
|
|
c2_free_mqsp(qp->rq_mq.shared);
|
|
|
|
atomic_dec(&qp->refcount);
|
|
wait_event(qp->wait, !atomic_read(&qp->refcount));
|
|
}
|
|
|
|
/*
|
|
* Function: move_sgl
|
|
*
|
|
* Description:
|
|
* Move an SGL from the user's work request struct into a CCIL Work Request
|
|
* message, swapping to WR byte order and ensure the total length doesn't
|
|
* overflow.
|
|
*
|
|
* IN:
|
|
* dst - ptr to CCIL Work Request message SGL memory.
|
|
* src - ptr to the consumers SGL memory.
|
|
*
|
|
* OUT: none
|
|
*
|
|
* Return:
|
|
* CCIL status codes.
|
|
*/
|
|
static int
|
|
move_sgl(struct c2_data_addr * dst, struct ib_sge *src, int count, u32 * p_len,
|
|
u8 * actual_count)
|
|
{
|
|
u32 tot = 0; /* running total */
|
|
u8 acount = 0; /* running total non-0 len sge's */
|
|
|
|
while (count > 0) {
|
|
/*
|
|
* If the addition of this SGE causes the
|
|
* total SGL length to exceed 2^32-1, then
|
|
* fail-n-bail.
|
|
*
|
|
* If the current total plus the next element length
|
|
* wraps, then it will go negative and be less than the
|
|
* current total...
|
|
*/
|
|
if ((tot + src->length) < tot) {
|
|
return -EINVAL;
|
|
}
|
|
/*
|
|
* Bug: 1456 (as well as 1498 & 1643)
|
|
* Skip over any sge's supplied with len=0
|
|
*/
|
|
if (src->length) {
|
|
tot += src->length;
|
|
dst->stag = cpu_to_be32(src->lkey);
|
|
dst->to = cpu_to_be64(src->addr);
|
|
dst->length = cpu_to_be32(src->length);
|
|
dst++;
|
|
acount++;
|
|
}
|
|
src++;
|
|
count--;
|
|
}
|
|
|
|
if (acount == 0) {
|
|
/*
|
|
* Bug: 1476 (as well as 1498, 1456 and 1643)
|
|
* Setup the SGL in the WR to make it easier for the RNIC.
|
|
* This way, the FW doesn't have to deal with special cases.
|
|
* Setting length=0 should be sufficient.
|
|
*/
|
|
dst->stag = 0;
|
|
dst->to = 0;
|
|
dst->length = 0;
|
|
}
|
|
|
|
*p_len = tot;
|
|
*actual_count = acount;
|
|
return 0;
|
|
}
|
|
|
|
/*
|
|
* Function: c2_activity (private function)
|
|
*
|
|
* Description:
|
|
* Post an mq index to the host->adapter activity fifo.
|
|
*
|
|
* IN:
|
|
* c2dev - ptr to c2dev structure
|
|
* mq_index - mq index to post
|
|
* shared - value most recently written to shared
|
|
*
|
|
* OUT:
|
|
*
|
|
* Return:
|
|
* none
|
|
*/
|
|
static inline void c2_activity(struct c2_dev *c2dev, u32 mq_index, u16 shared)
|
|
{
|
|
/*
|
|
* First read the register to see if the FIFO is full, and if so,
|
|
* spin until it's not. This isn't perfect -- there is no
|
|
* synchronization among the clients of the register, but in
|
|
* practice it prevents multiple CPU from hammering the bus
|
|
* with PCI RETRY. Note that when this does happen, the card
|
|
* cannot get on the bus and the card and system hang in a
|
|
* deadlock -- thus the need for this code. [TOT]
|
|
*/
|
|
while (readl(c2dev->regs + PCI_BAR0_ADAPTER_HINT) & 0x80000000)
|
|
udelay(10);
|
|
|
|
__raw_writel(C2_HINT_MAKE(mq_index, shared),
|
|
c2dev->regs + PCI_BAR0_ADAPTER_HINT);
|
|
}
|
|
|
|
/*
|
|
* Function: qp_wr_post
|
|
*
|
|
* Description:
|
|
* This in-line function allocates a MQ msg, then moves the host-copy of
|
|
* the completed WR into msg. Then it posts the message.
|
|
*
|
|
* IN:
|
|
* q - ptr to user MQ.
|
|
* wr - ptr to host-copy of the WR.
|
|
* qp - ptr to user qp
|
|
* size - Number of bytes to post. Assumed to be divisible by 4.
|
|
*
|
|
* OUT: none
|
|
*
|
|
* Return:
|
|
* CCIL status codes.
|
|
*/
|
|
static int qp_wr_post(struct c2_mq *q, union c2wr * wr, struct c2_qp *qp, u32 size)
|
|
{
|
|
union c2wr *msg;
|
|
|
|
msg = c2_mq_alloc(q);
|
|
if (msg == NULL) {
|
|
return -EINVAL;
|
|
}
|
|
#ifdef CCMSGMAGIC
|
|
((c2wr_hdr_t *) wr)->magic = cpu_to_be32(CCWR_MAGIC);
|
|
#endif
|
|
|
|
/*
|
|
* Since all header fields in the WR are the same as the
|
|
* CQE, set the following so the adapter need not.
|
|
*/
|
|
c2_wr_set_result(wr, CCERR_PENDING);
|
|
|
|
/*
|
|
* Copy the wr down to the adapter
|
|
*/
|
|
memcpy((void *) msg, (void *) wr, size);
|
|
|
|
c2_mq_produce(q);
|
|
return 0;
|
|
}
|
|
|
|
|
|
int c2_post_send(struct ib_qp *ibqp, struct ib_send_wr *ib_wr,
|
|
struct ib_send_wr **bad_wr)
|
|
{
|
|
struct c2_dev *c2dev = to_c2dev(ibqp->device);
|
|
struct c2_qp *qp = to_c2qp(ibqp);
|
|
union c2wr wr;
|
|
unsigned long lock_flags;
|
|
int err = 0;
|
|
|
|
u32 flags;
|
|
u32 tot_len;
|
|
u8 actual_sge_count;
|
|
u32 msg_size;
|
|
|
|
if (qp->state > IB_QPS_RTS) {
|
|
err = -EINVAL;
|
|
goto out;
|
|
}
|
|
|
|
while (ib_wr) {
|
|
|
|
flags = 0;
|
|
wr.sqwr.sq_hdr.user_hdr.hdr.context = ib_wr->wr_id;
|
|
if (ib_wr->send_flags & IB_SEND_SIGNALED) {
|
|
flags |= SQ_SIGNALED;
|
|
}
|
|
|
|
switch (ib_wr->opcode) {
|
|
case IB_WR_SEND:
|
|
case IB_WR_SEND_WITH_INV:
|
|
if (ib_wr->opcode == IB_WR_SEND) {
|
|
if (ib_wr->send_flags & IB_SEND_SOLICITED)
|
|
c2_wr_set_id(&wr, C2_WR_TYPE_SEND_SE);
|
|
else
|
|
c2_wr_set_id(&wr, C2_WR_TYPE_SEND);
|
|
wr.sqwr.send.remote_stag = 0;
|
|
} else {
|
|
if (ib_wr->send_flags & IB_SEND_SOLICITED)
|
|
c2_wr_set_id(&wr, C2_WR_TYPE_SEND_SE_INV);
|
|
else
|
|
c2_wr_set_id(&wr, C2_WR_TYPE_SEND_INV);
|
|
wr.sqwr.send.remote_stag =
|
|
cpu_to_be32(ib_wr->ex.invalidate_rkey);
|
|
}
|
|
|
|
msg_size = sizeof(struct c2wr_send_req) +
|
|
sizeof(struct c2_data_addr) * ib_wr->num_sge;
|
|
if (ib_wr->num_sge > qp->send_sgl_depth) {
|
|
err = -EINVAL;
|
|
break;
|
|
}
|
|
if (ib_wr->send_flags & IB_SEND_FENCE) {
|
|
flags |= SQ_READ_FENCE;
|
|
}
|
|
err = move_sgl((struct c2_data_addr *) & (wr.sqwr.send.data),
|
|
ib_wr->sg_list,
|
|
ib_wr->num_sge,
|
|
&tot_len, &actual_sge_count);
|
|
wr.sqwr.send.sge_len = cpu_to_be32(tot_len);
|
|
c2_wr_set_sge_count(&wr, actual_sge_count);
|
|
break;
|
|
case IB_WR_RDMA_WRITE:
|
|
c2_wr_set_id(&wr, C2_WR_TYPE_RDMA_WRITE);
|
|
msg_size = sizeof(struct c2wr_rdma_write_req) +
|
|
(sizeof(struct c2_data_addr) * ib_wr->num_sge);
|
|
if (ib_wr->num_sge > qp->rdma_write_sgl_depth) {
|
|
err = -EINVAL;
|
|
break;
|
|
}
|
|
if (ib_wr->send_flags & IB_SEND_FENCE) {
|
|
flags |= SQ_READ_FENCE;
|
|
}
|
|
wr.sqwr.rdma_write.remote_stag =
|
|
cpu_to_be32(ib_wr->wr.rdma.rkey);
|
|
wr.sqwr.rdma_write.remote_to =
|
|
cpu_to_be64(ib_wr->wr.rdma.remote_addr);
|
|
err = move_sgl((struct c2_data_addr *)
|
|
& (wr.sqwr.rdma_write.data),
|
|
ib_wr->sg_list,
|
|
ib_wr->num_sge,
|
|
&tot_len, &actual_sge_count);
|
|
wr.sqwr.rdma_write.sge_len = cpu_to_be32(tot_len);
|
|
c2_wr_set_sge_count(&wr, actual_sge_count);
|
|
break;
|
|
case IB_WR_RDMA_READ:
|
|
c2_wr_set_id(&wr, C2_WR_TYPE_RDMA_READ);
|
|
msg_size = sizeof(struct c2wr_rdma_read_req);
|
|
|
|
/* IWarp only suppots 1 sge for RDMA reads */
|
|
if (ib_wr->num_sge > 1) {
|
|
err = -EINVAL;
|
|
break;
|
|
}
|
|
|
|
/*
|
|
* Move the local and remote stag/to/len into the WR.
|
|
*/
|
|
wr.sqwr.rdma_read.local_stag =
|
|
cpu_to_be32(ib_wr->sg_list->lkey);
|
|
wr.sqwr.rdma_read.local_to =
|
|
cpu_to_be64(ib_wr->sg_list->addr);
|
|
wr.sqwr.rdma_read.remote_stag =
|
|
cpu_to_be32(ib_wr->wr.rdma.rkey);
|
|
wr.sqwr.rdma_read.remote_to =
|
|
cpu_to_be64(ib_wr->wr.rdma.remote_addr);
|
|
wr.sqwr.rdma_read.length =
|
|
cpu_to_be32(ib_wr->sg_list->length);
|
|
break;
|
|
default:
|
|
/* error */
|
|
msg_size = 0;
|
|
err = -EINVAL;
|
|
break;
|
|
}
|
|
|
|
/*
|
|
* If we had an error on the last wr build, then
|
|
* break out. Possible errors include bogus WR
|
|
* type, and a bogus SGL length...
|
|
*/
|
|
if (err) {
|
|
break;
|
|
}
|
|
|
|
/*
|
|
* Store flags
|
|
*/
|
|
c2_wr_set_flags(&wr, flags);
|
|
|
|
/*
|
|
* Post the puppy!
|
|
*/
|
|
spin_lock_irqsave(&qp->lock, lock_flags);
|
|
err = qp_wr_post(&qp->sq_mq, &wr, qp, msg_size);
|
|
if (err) {
|
|
spin_unlock_irqrestore(&qp->lock, lock_flags);
|
|
break;
|
|
}
|
|
|
|
/*
|
|
* Enqueue mq index to activity FIFO.
|
|
*/
|
|
c2_activity(c2dev, qp->sq_mq.index, qp->sq_mq.hint_count);
|
|
spin_unlock_irqrestore(&qp->lock, lock_flags);
|
|
|
|
ib_wr = ib_wr->next;
|
|
}
|
|
|
|
out:
|
|
if (err)
|
|
*bad_wr = ib_wr;
|
|
return err;
|
|
}
|
|
|
|
int c2_post_receive(struct ib_qp *ibqp, struct ib_recv_wr *ib_wr,
|
|
struct ib_recv_wr **bad_wr)
|
|
{
|
|
struct c2_dev *c2dev = to_c2dev(ibqp->device);
|
|
struct c2_qp *qp = to_c2qp(ibqp);
|
|
union c2wr wr;
|
|
unsigned long lock_flags;
|
|
int err = 0;
|
|
|
|
if (qp->state > IB_QPS_RTS) {
|
|
err = -EINVAL;
|
|
goto out;
|
|
}
|
|
|
|
/*
|
|
* Try and post each work request
|
|
*/
|
|
while (ib_wr) {
|
|
u32 tot_len;
|
|
u8 actual_sge_count;
|
|
|
|
if (ib_wr->num_sge > qp->recv_sgl_depth) {
|
|
err = -EINVAL;
|
|
break;
|
|
}
|
|
|
|
/*
|
|
* Create local host-copy of the WR
|
|
*/
|
|
wr.rqwr.rq_hdr.user_hdr.hdr.context = ib_wr->wr_id;
|
|
c2_wr_set_id(&wr, CCWR_RECV);
|
|
c2_wr_set_flags(&wr, 0);
|
|
|
|
/* sge_count is limited to eight bits. */
|
|
BUG_ON(ib_wr->num_sge >= 256);
|
|
err = move_sgl((struct c2_data_addr *) & (wr.rqwr.data),
|
|
ib_wr->sg_list,
|
|
ib_wr->num_sge, &tot_len, &actual_sge_count);
|
|
c2_wr_set_sge_count(&wr, actual_sge_count);
|
|
|
|
/*
|
|
* If we had an error on the last wr build, then
|
|
* break out. Possible errors include bogus WR
|
|
* type, and a bogus SGL length...
|
|
*/
|
|
if (err) {
|
|
break;
|
|
}
|
|
|
|
spin_lock_irqsave(&qp->lock, lock_flags);
|
|
err = qp_wr_post(&qp->rq_mq, &wr, qp, qp->rq_mq.msg_size);
|
|
if (err) {
|
|
spin_unlock_irqrestore(&qp->lock, lock_flags);
|
|
break;
|
|
}
|
|
|
|
/*
|
|
* Enqueue mq index to activity FIFO
|
|
*/
|
|
c2_activity(c2dev, qp->rq_mq.index, qp->rq_mq.hint_count);
|
|
spin_unlock_irqrestore(&qp->lock, lock_flags);
|
|
|
|
ib_wr = ib_wr->next;
|
|
}
|
|
|
|
out:
|
|
if (err)
|
|
*bad_wr = ib_wr;
|
|
return err;
|
|
}
|
|
|
|
void c2_init_qp_table(struct c2_dev *c2dev)
|
|
{
|
|
spin_lock_init(&c2dev->qp_table.lock);
|
|
idr_init(&c2dev->qp_table.idr);
|
|
}
|
|
|
|
void c2_cleanup_qp_table(struct c2_dev *c2dev)
|
|
{
|
|
idr_destroy(&c2dev->qp_table.idr);
|
|
}
|