summaryrefslogtreecommitdiff
path: root/source4/cluster/ctdb/ib/ibwrapper_internal.h
blob: 9c6bfab519ecbc167a151e612653dced2959a977 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
/*
 * Unix SMB/CIFS implementation.
 * Wrap Infiniband calls.
 *
 * Copyright (C) Sven Oehme <oehmes@de.ibm.com> 2006
 *
 * Major code contributions by Peter Somogyi <psomogyi@gamax.hu>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

/*
 * Numeric options for the Infiniband wrapper.
 *
 * NOTE(review): this header does not document the fields; the notes below
 * are read off the field names and should be confirmed against the code
 * that fills this structure in.
 */
struct ibw_opts {
	/* presumably the maximum number of send work requests - confirm */
	uint32_t max_send_wr;
	/* presumably the maximum number of receive work requests - confirm */
	uint32_t max_recv_wr;
	/* presumably the size of one receive buffer - confirm */
	uint32_t recv_bufsize;
	/* NOTE(review): meaning of the threshold is not visible here - confirm */
	uint32_t recv_threshold;
};

/*
 * Bookkeeping record for one work request (wr).
 *
 * A record carries two independent pairs of list links, so it can sit on
 * one of the wr lists and on the queue at the same time.
 */
struct ibw_wr {
	/* Initialized in ibw_init_memory, once per connection. */
	char *buf;
	/* Position in the wr_index list; the same value is used as the wr id. */
	int wr_id;

	/* Buffer allocated specially for a "large" message. */
	char *buf_large;
	/* presumably the memory region registered for buf_large - confirm */
	struct ibv_mr *mr_large;
	/* Reference count that lets ibw_wc_send know when to release. */
	int ref_cnt;

	/* Set at ibw_send; may differ from the buffers above. */
	char *queued_msg;
	/* Counted instead of adding the same record to the queue again. */
	int queued_ref_cnt;
	/* The last value wins while queued_ref_cnt > 0; otherwise the plain message size. */
	uint32_t queued_rlen;

	/* Links used in wr_list_avail or wr_list_used, or in extra_sent or extra_avail. */
	struct ibw_wr *next;
	struct ibw_wr *prev;

	/* Links used in the queue. */
	struct ibw_wr *qnext;
	struct ibw_wr *qprev;
};

/*
 * Private state of a wrapper context: the event context, a copy of the
 * options, the server cm id with its event channel, and the two callbacks
 * described at ibw_init.
 */
struct ibw_ctx_priv {
	struct event_context *ectx;

	struct ibw_opts opts;

	/* Server cm id. */
	struct rdma_cm_id *cm_id;

	struct rdma_event_channel *cm_channel;
	/* presumably the fd event watching cm_channel - confirm */
	struct fd_event *cm_channel_event;

	/* Connection state callback; see ibw_init. */
	ibw_connstate_fn_t connstate_func;
	/* Receive callback; see ibw_init. */
	ibw_receive_fn_t receive_func;

	/* Result of sysconf, used for memalign. */
	long pagesize;
};

/*
 * State of one message part: a talloc'ed buffer together with its
 * allocated size, the length of the part, and the amount to read.
 */
struct ibw_part {
	/* Memory buffer obtained from talloc. */
	char *buf;
	/* Allocated size of buf; it only ever grows. */
	uint32_t bufsize;
	/* Length of the message part. */
	uint32_t len;
	/*
	 * Either 4, or the uint32_t value found at the start of buf once
	 * len >= sizeof(uint32_t).
	 */
	uint32_t to_read;
};

/*
 * Private state of a single connection: verbs channel, cm id, completion
 * queue, the send side (buffer, wr lists, queue) and the receive side
 * (ring buffer and the message part being assembled).
 */
struct ibw_conn_priv {
	struct ibv_comp_channel *verbs_channel;
	/* presumably the fd event watching verbs_channel - confirm */
	struct fd_event *verbs_channel_event;

	/* The client's cm id. */
	struct rdma_cm_id *cm_id;
	struct ibv_pd *pd;
	int is_accepted;

	/* Completion queue; the qp itself lives in cm_id. */
	struct ibv_cq *cq;

	/* Send buffer of max_send_wr * avg_send_size bytes. */
	char *buf_send;
	struct ibv_mr *mr_send;
	struct ibw_wr *wr_list_avail;
	struct ibw_wr *wr_list_used;
	/* Array [0..(qsize-1)] of (ibw_wr *). */
	struct ibw_wr **wr_index;
	/* Number of send wrs in the CQ. */
	int wr_sent;

	struct ibw_wr *extra_sent;
	struct ibw_wr *extra_avail;
	/* Largest wr_id in the queue. */
	int extra_max;

	struct ibw_wr *queue;

	/* Receive ring buffer of max_recv_wr * avg_recv_size bytes. */
	char *buf_recv;
	struct ibv_mr *mr_recv;
	/* Index of the next receive buffer when refilling. */
	int recv_index;
	struct ibw_part part;
};

/*
 * Unlink element p from a doubly linked list.  The element does not have
 * to be on the list.
 *
 *   list  - lvalue holding the list head; updated when p is the head
 *   p     - element to unlink
 *   prev  - name of the "previous" link member
 *   next  - name of the "next" link member
 *
 * list and p are expanded more than once, so pass expressions without
 * side effects.  The links of p are reset to NULL afterwards, unless p
 * compares equal to list at that point (e.g. when the same lvalue was
 * passed for both arguments).
 */
#define DLIST_REMOVE2(list, p, prev, next) \
do { \
	if ((list) != (p)) { \
		if ((p)->prev != NULL) { \
			(p)->prev->next = (p)->next; \
		} \
		if ((p)->next != NULL) { \
			(p)->next->prev = (p)->prev; \
		} \
	} else { \
		(list) = (p)->next; \
		if ((list) != NULL) { \
			(list)->prev = NULL; \
		} \
	} \
	if ((list) != (p)) { \
		(p)->prev = NULL; \
		(p)->next = NULL; \
	} \
} while (0)

/*
 * Append element p at the end of a doubly linked list.
 *
 *   list  - lvalue holding the list head; set to p when the list is empty
 *   p     - element to append
 *   type  - pointer type of the elements, used for the internal cursor
 *   prev  - name of the "previous" link member
 *   next  - name of the "next" link member
 *
 * The tail is located by walking the list from the head.  list and p are
 * expanded more than once, so pass expressions without side effects.
 *
 * The internal cursor has a deliberately unusual name: a plain "tmp"
 * would shadow a caller variable of the same name used in list or p.
 */
#define DLIST_ADD_END2(list, p, type, prev, next) \
do { \
		if (!(list)) { \
			(list) = (p); \
			(p)->next = (p)->prev = NULL; \
		} else { \
			type dlist_add_end2_tail_; \
			for (dlist_add_end2_tail_ = (list); \
			     dlist_add_end2_tail_->next; \
			     dlist_add_end2_tail_ = dlist_add_end2_tail_->next) ; \
			dlist_add_end2_tail_->next = (p); \
			(p)->next = NULL; \
			(p)->prev = dlist_add_end2_tail_; \
		} \
} while (0)