@@ -58,7 +58,7 @@ typedef struct ibv_context *ib_hca_handle_t;
typedef ib_hca_handle_t dapl_ibal_ca_t;
/* QP info to exchange, wire protocol version for these CM's */
-#define DCM_VER 6
+#define DCM_VER 7
/* CM private data areas, same for all operations */
#define DCM_MAX_PDATA_SIZE 118
@@ -98,7 +98,8 @@ typedef struct _ib_cm_msg
uint16_t p_size;
uint32_t s_id; /* src pid */
uint32_t d_id; /* dst pid */
- uint8_t resv[6];
+ uint8_t rd_in; /* max inbound RDMA reads (atomic_rd_in), set from ep_attr.max_rdma_read_in */
+ uint8_t resv[5];
union dcm_addr saddr;
union dcm_addr daddr;
union dcm_addr saddr_alt;
@@ -442,11 +442,12 @@ dapls_modify_qp_state(IN ib_qp_handle_t qp_handle,
case IBV_QPS_RTR:
dapl_dbg_log(DAPL_DBG_TYPE_EP,
" QPS_RTR: type %d qpn 0x%x gid %p (%d) lid 0x%x"
- " port %d ep %p qp_state %d \n",
+ " port %d ep %p qp_state %d rd_atomic %d\n",
qp_handle->qp_type, ntohl(qpn), gid,
ia_ptr->hca_ptr->ib_trans.global,
ntohs(lid), ia_ptr->hca_ptr->port_num,
- ep_ptr, ep_ptr->qp_state);
+ ep_ptr, ep_ptr->qp_state,
+ ep_ptr->param.ep_attr.max_rdma_read_in);
mask |= IBV_QP_AV |
IBV_QP_PATH_MTU |
@@ -530,6 +530,9 @@ static void dapli_socket_connected(dp_ib_cm_handle_t cm_ptr, int err)
cm_ptr->state = DCM_REP_PENDING;
dapl_os_unlock(&cm_ptr->lock);
+ /* set max rdma inbound requests */
+ cm_ptr->msg.rd_in = ep_ptr->param.ep_attr.max_rdma_read_in;
+
/* send qp info and pdata to remote peer */
exp = sizeof(ib_cm_msg_t) - DCM_MAX_PDATA_SIZE;
iov[0].iov_base = (void *)&cm_ptr->msg;
@@ -798,6 +801,10 @@ static void dapli_socket_connect_rtu(dp_ib_cm_handle_t cm_ptr)
goto bail;
}
+ /* rdma_out, initiator, cannot exceed remote rdma_in max */
+ ep_ptr->param.ep_attr.max_rdma_read_out =
+ DAPL_MIN(ep_ptr->param.ep_attr.max_rdma_read_out, cm_ptr->msg.rd_in);
+
/* modify QP to RTR and then to RTS with remote info */
dapl_os_lock(&ep_ptr->header.lock);
if (dapls_modify_qp_state(ep_ptr->qp_handle,
@@ -1196,6 +1203,9 @@ dapli_socket_accept_usr(DAPL_EP * ep_ptr,
goto bail;
}
#endif
+ /* rdma_out, initiator, cannot exceed remote rdma_in max */
+ ep_ptr->param.ep_attr.max_rdma_read_out =
+ DAPL_MIN(ep_ptr->param.ep_attr.max_rdma_read_out, cm_ptr->msg.rd_in);
/* modify QP to RTR and then to RTS with remote info already read */
dapl_os_lock(&ep_ptr->header.lock);
@@ -1235,6 +1245,7 @@ dapli_socket_accept_usr(DAPL_EP * ep_ptr,
/* send our QP info, IA address, pdata. Don't overwrite dst data */
local.ver = htons(DCM_VER);
local.op = htons(DCM_REP);
+ local.rd_in = ep_ptr->param.ep_attr.max_rdma_read_in;
local.saddr.ib.qpn = htonl(ep_ptr->qp_handle->qp_num);
local.saddr.ib.qp_type = ep_ptr->qp_handle->qp_type;
local.saddr.ib.lid = ia_ptr->hca_ptr->ib_trans.lid;
@@ -1080,6 +1080,10 @@ static void ucm_connect_rtu(dp_ib_cm_handle_t cm, ib_cm_msg_t *msg)
}
dapl_os_unlock(&cm->lock);
+ /* initiator rdma_out is capped by peer rd_in; NOTE(review): dapls_ib_connect stores the local max_rdma_read_in in cm->msg.rd_in - confirm it holds the peer's value here */
+ cm->ep->param.ep_attr.max_rdma_read_out =
+ DAPL_MIN(cm->ep->param.ep_attr.max_rdma_read_out, cm->msg.rd_in);
+
/* modify QP to RTR and then to RTS with remote info */
dapl_os_lock(&cm->ep->header.lock);
if (dapls_modify_qp_state(cm->ep->qp_handle,
@@ -1232,6 +1236,7 @@ static void ucm_accept(ib_cm_srvc_handle_t cm, ib_cm_msg_t *msg)
acm->msg.sqpn = cm->msg.sqpn;
acm->msg.p_size = msg->p_size;
acm->msg.d_id = msg->s_id;
+ acm->msg.rd_in = msg->rd_in;
/* CR saddr is CM daddr info, need EP for local saddr */
dapl_os_memcpy(&acm->msg.daddr, &msg->saddr, sizeof(union dcm_addr));
@@ -1510,6 +1515,10 @@ dapli_accept_usr(DAPL_EP *ep, DAPL_CR *cr, DAT_COUNT p_size, DAT_PVOID p_data)
}
#endif
+ /* rdma_out, initiator, cannot exceed remote rdma_in max */
+ ep->param.ep_attr.max_rdma_read_out =
+ DAPL_MIN(ep->param.ep_attr.max_rdma_read_out, cm->msg.rd_in);
+
/* modify QP to RTR and then to RTS with remote info already read */
dapl_os_lock(&ep->header.lock);
if (dapls_modify_qp_state(ep->qp_handle,
@@ -1544,6 +1553,7 @@ dapli_accept_usr(DAPL_EP *ep, DAPL_CR *cr, DAT_COUNT p_size, DAT_PVOID p_data)
/* setup local QP info and type from EP, copy pdata, for reply */
cm->msg.op = htons(DCM_REP);
+ cm->msg.rd_in = ep->param.ep_attr.max_rdma_read_in;
cm->msg.saddr.ib.qpn = htonl(ep->qp_handle->qp_num);
cm->msg.saddr.ib.qp_type = ep->qp_handle->qp_type;
cm->msg.saddr.ib.lid = cm->hca->ib_trans.addr.ib.lid;
@@ -1626,6 +1636,9 @@ dapls_ib_connect(IN DAT_EP_HANDLE ep_handle,
cm->msg.dqpn = cm->msg.daddr.ib.qpn;
cm->msg.daddr.ib.qpn = 0; /* don't have a remote qpn until reply */
+ /* set max rdma inbound requests */
+ cm->msg.rd_in = ep->param.ep_attr.max_rdma_read_in;
+
if (p_size) {
cm->msg.p_size = htons(p_size);
dapl_os_memcpy(&cm->msg.p_data, p_data, p_size);