new file mode 100644
@@ -0,0 +1,244 @@
+/*
+ * InfiniBand Transport Layer
+ *
+ * Copyright (c) 2014 - 2017 ProfitBricks GmbH. All rights reserved.
+ * Authors: Fabian Holler < mail@fholler.de>
+ * Jack Wang <jinpu.wang@profitbricks.com>
+ * Kleber Souza <kleber.souza@profitbricks.com>
+ * Danil Kipnis <danil.kipnis@profitbricks.com>
+ * Roman Pen <roman.penyaev@profitbricks.com>
+ * Milind Dumbare <Milind.dumbare@gmail.com>
+ *
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions, and the following disclaimer,
+ * without modification.
+ * 2. Redistributions in binary form must reproduce at minimum a disclaimer
+ * substantially similar to the "NO WARRANTY" disclaimer below
+ * ("Disclaimer") and any redistribution must be conditioned upon
+ * including a substantially similar Disclaimer requirement for further
+ * binary redistribution.
+ * 3. Neither the names of the above-listed copyright holders nor the names
+ * of any contributors may be used to endorse or promote products derived
+ * from this software without specific prior written permission.
+ *
+ * Alternatively, this software may be distributed under the terms of the
+ * GNU General Public License ("GPL") version 2 as published by the Free
+ * Software Foundation.
+ *
+ * NO WARRANTY
+ * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+ * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+ * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTIBILITY AND FITNESS FOR
+ * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+ * HOLDERS OR CONTRIBUTORS BE LIABLE FOR SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
+ * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
+ * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
+ * POSSIBILITY OF SUCH DAMAGES.
+ *
+ */
+
+#if !defined(IBTRS_CLT_INTERNAL_H)
+#define IBTRS_CLT_INTERNAL_H
+
+#include <rdma/ibtrs.h>
+
+enum ssm_state {
+ _SSM_STATE_MIN,
+ SSM_STATE_IDLE,
+ SSM_STATE_IDLE_RECONNECT,
+ SSM_STATE_WF_INFO,
+ SSM_STATE_WF_INFO_RECONNECT,
+ SSM_STATE_OPEN,
+ SSM_STATE_OPEN_RECONNECT,
+ SSM_STATE_CONNECTED,
+ SSM_STATE_RECONNECT,
+ SSM_STATE_RECONNECT_IMM,
+ SSM_STATE_CLOSE_DESTROY,
+ SSM_STATE_CLOSE_RECONNECT,
+ SSM_STATE_CLOSE_RECONNECT_IMM,
+ SSM_STATE_DISCONNECTED,
+ SSM_STATE_DESTROYED,
+ _SSM_STATE_MAX
+};
+
+enum ibtrs_fast_reg {
+ IBTRS_FAST_MEM_NONE,
+ IBTRS_FAST_MEM_FR,
+ IBTRS_FAST_MEM_FMR
+};
+
+struct ibtrs_stats_reconnects {
+ u32 successful_cnt;
+ u32 fail_cnt;
+};
+
+struct ibtrs_stats_wc_comp {
+ u32 max_wc_cnt;
+ u32 cnt;
+ u64 total_cnt;
+};
+
+struct ibtrs_stats_cpu_migration {
+ atomic_t *from;
+ int *to;
+};
+
+struct ibtrs_clt_stats_rdma_stats {
+ u64 cnt_read;
+ u64 size_total_read;
+ u64 cnt_write;
+ u64 size_total_write;
+
+ u16 inflight;
+};
+
+#define MIN_LOG_SG 2
+#define MAX_LOG_SG 5
+#define MAX_LIN_SG BIT(MIN_LOG_SG)
+#define SG_DISTR_LEN (MAX_LOG_SG - MIN_LOG_SG + MAX_LIN_SG + 1)
+
+struct ibtrs_clt_stats_rdma_lat_entry {
+ u64 read;
+ u64 write;
+};
+
+#define MAX_LOG_LATENCY 16
+#define MIN_LOG_LATENCY 0
+
+struct ibtrs_clt_stats_user_ib_msgs {
+ u32 recv_msg_cnt;
+ u32 sent_msg_cnt;
+ u64 recv_size;
+ u64 sent_size;
+};
+
+struct ibtrs_clt_stats {
+ struct ibtrs_stats_cpu_migration cpu_migr;
+ struct ibtrs_clt_stats_rdma_stats *rdma_stats;
+ u64 *sg_list_total;
+ u64 **sg_list_distr;
+ struct ibtrs_stats_reconnects reconnects;
+ struct ibtrs_clt_stats_rdma_lat_entry **rdma_lat_distr;
+ struct ibtrs_clt_stats_rdma_lat_entry *rdma_lat_max;
+ struct ibtrs_clt_stats_user_ib_msgs user_ib_msgs;
+ struct ibtrs_stats_wc_comp *wc_comp;
+};
+
+struct ibtrs_session {
+ struct list_head list; /* global session list */
+ wait_queue_head_t wait_q;
+ enum ssm_state state;
+ struct ibtrs_con *con;
+ struct ib_session ib_sess;
+ struct ib_device *ib_device;
+ struct ibtrs_iu *rdma_info_iu;
+ struct ibtrs_iu *sess_info_iu;
+ struct ibtrs_iu *dummy_rx_iu;
+ struct ibtrs_iu **usr_rx_ring;
+ struct ibtrs_iu **io_tx_ius;
+
+ spinlock_t u_msg_ius_lock ____cacheline_aligned;
+ struct list_head u_msg_ius_list;
+
+ struct rdma_req *reqs;
+ struct ib_fmr_pool *fmr_pool;
+ atomic_t ib_sess_initialized;
+ bool io_bufs_initialized;
+ size_t pdu_sz;
+ void *priv;
+ struct workqueue_struct *sm_wq;
+ struct workqueue_struct *msg_wq;
+ struct delayed_work heartbeat_dwork;
+ u32 heartbeat_timeout_srv_ms;
+ struct delayed_work reconnect_dwork;
+ struct ibtrs_heartbeat heartbeat;
+ atomic_t refcount;
+ u8 active_cnt;
+ bool enable_rdma_lat;
+ u8 ver;
+ u8 connected_cnt;
+ u32 retry_cnt;
+ s16 max_reconnect_attempts;
+ u8 reconnect_delay_sec;
+ void *tags;
+ unsigned long *tags_map;
+ wait_queue_head_t tags_wait;
+ u64 *srv_rdma_addr;
+ u32 srv_rdma_buf_rkey;
+ u32 max_io_size;
+ u32 max_req_size;
+ u32 chunk_size;
+ u32 max_desc;
+ u32 queue_depth;
+ u16 user_queue_depth;
+ enum ibtrs_fast_reg fast_reg_mode;
+ u64 mr_page_mask;
+ u32 mr_page_size;
+ u32 mr_max_size;
+ u32 max_pages_per_mr;
+ int max_sge;
+ struct sockaddr_storage peer_addr;
+ struct sockaddr_storage self_addr;
+ struct completion *destroy_completion;
+ struct kobject kobj;
+ struct kobject kobj_stats;
+ char addr[IBTRS_ADDRLEN];
+ char hostname[MAXHOSTNAMELEN];
+ struct ibtrs_clt_stats stats;
+ wait_queue_head_t mu_iu_wait_q;
+ wait_queue_head_t mu_buf_wait_q;
+ atomic_t peer_usr_msg_bufs;
+ struct completion *ib_sess_destroy_completion;
+};
+
+#define TAG_SIZE(sess) (sizeof(struct ibtrs_tag) + (sess)->pdu_sz)
+#define GET_TAG(sess, idx) ((sess)->tags + TAG_SIZE(sess) * idx)
+
+/**
+ * ibtrs_clt_reconnect() - Reconnect the session
+ * @sess: Session handler
+ */
+int ibtrs_clt_reconnect(struct ibtrs_session *sess);
+
+void ibtrs_clt_set_max_reconnect_attempts(struct ibtrs_session *sess,
+ s16 value);
+
+s16 ibtrs_clt_get_max_reconnect_attempts(const struct ibtrs_session *sess);
+int ibtrs_clt_get_user_queue_depth(struct ibtrs_session *sess);
+int ibtrs_clt_set_user_queue_depth(struct ibtrs_session *sess, u16 queue_depth);
+int ibtrs_clt_reset_sg_list_distr_stats(struct ibtrs_session *sess,
+ bool enable);
+int ibtrs_clt_stats_sg_list_distr_to_str(struct ibtrs_session *sess,
+ char *buf, size_t len);
+int ibtrs_clt_reset_rdma_lat_distr_stats(struct ibtrs_session *sess,
+ bool enable);
+ssize_t ibtrs_clt_stats_rdma_lat_distr_to_str(struct ibtrs_session *sess,
+ char *page, size_t len);
+int ibtrs_clt_reset_cpu_migr_stats(struct ibtrs_session *sess, bool enable);
+int ibtrs_clt_stats_migration_cnt_to_str(struct ibtrs_session *sess, char *buf,
+ size_t len);
+int ibtrs_clt_reset_reconnects_stat(struct ibtrs_session *sess, bool enable);
+int ibtrs_clt_stats_reconnects_to_str(struct ibtrs_session *sess, char *buf,
+ size_t len);
+int ibtrs_clt_reset_user_ib_msgs_stats(struct ibtrs_session *sess, bool enable);
+int ibtrs_clt_stats_user_ib_msgs_to_str(struct ibtrs_session *sess, char *buf,
+ size_t len);
+int ibtrs_clt_reset_wc_comp_stats(struct ibtrs_session *sess, bool enable);
+int ibtrs_clt_stats_wc_completion_to_str(struct ibtrs_session *sess, char *buf,
+ size_t len);
+int ibtrs_clt_reset_rdma_stats(struct ibtrs_session *sess, bool enable);
+ssize_t ibtrs_clt_stats_rdma_to_str(struct ibtrs_session *sess,
+ char *page, size_t len);
+bool ibtrs_clt_sess_is_connected(const struct ibtrs_session *sess);
+int ibtrs_clt_reset_all_stats(struct ibtrs_session *sess, bool enable);
+ssize_t ibtrs_clt_reset_all_help(struct ibtrs_session *sess,
+ char *page, size_t len);
+
+#endif