Blame view

net/rds/iw.c 8.78 KB
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
  /*
   * Copyright (c) 2006 Oracle.  All rights reserved.
   *
   * This software is available to you under a choice of one of two
   * licenses.  You may choose to be licensed under the terms of the GNU
   * General Public License (GPL) Version 2, available from the file
   * COPYING in the main directory of this source tree, or the
   * OpenIB.org BSD license below:
   *
   *     Redistribution and use in source and binary forms, with or
   *     without modification, are permitted provided that the following
   *     conditions are met:
   *
   *      - Redistributions of source code must retain the above
   *        copyright notice, this list of conditions and the following
   *        disclaimer.
   *
   *      - Redistributions in binary form must reproduce the above
   *        copyright notice, this list of conditions and the following
   *        disclaimer in the documentation and/or other materials
   *        provided with the distribution.
   *
   * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
   * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
   * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
   * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
   * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
   * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
   * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
   * SOFTWARE.
   *
   */
  #include <linux/kernel.h>
  #include <linux/in.h>
  #include <linux/if.h>
  #include <linux/netdevice.h>
  #include <linux/inetdevice.h>
  #include <linux/if_arp.h>
  #include <linux/delay.h>
5a0e3ad6a   Tejun Heo   include cleanup: ...
40
  #include <linux/slab.h>
3a9a231d9   Paul Gortmaker   net: Fix files ex...
41
  #include <linux/module.h>
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
42
43
44
45
46
47
48
49
50
51
52
53
54
  
  #include "rds.h"
  #include "iw.h"
  
  unsigned int fastreg_pool_size = RDS_FASTREG_POOL_SIZE;
  unsigned int fastreg_message_size = RDS_FASTREG_SIZE + 1; /* +1 allows for unaligned MRs */
  
  module_param(fastreg_pool_size, int, 0444);
  MODULE_PARM_DESC(fastreg_pool_size, " Max number of fastreg MRs per device");
  module_param(fastreg_message_size, int, 0444);
  MODULE_PARM_DESC(fastreg_message_size, " Max size of a RDMA transfer (fastreg MRs)");
  
  struct list_head rds_iw_devices;
745cbccac   Andy Grover   RDS: Rewrite conn...
55
  /*
   * Lock and list for iw_nodev_conns.
   * NOTE(review): presumably these are connections not currently attached
   * to any rds_iw_device -- confirm against the users of this list.
   *
   * NOTE: if also grabbing iwdev lock, grab this first
   */
  DEFINE_SPINLOCK(iw_nodev_conns_lock);
  LIST_HEAD(iw_nodev_conns);
ff51bf841   stephen hemminger   rds: make local f...
58
  static void rds_iw_add_one(struct ib_device *device)
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
  {
  	struct rds_iw_device *rds_iwdev;
  	struct ib_device_attr *dev_attr;
  
  	/* Only handle iwarp devices */
  	if (device->node_type != RDMA_NODE_RNIC)
  		return;
  
  	dev_attr = kmalloc(sizeof *dev_attr, GFP_KERNEL);
  	if (!dev_attr)
  		return;
  
  	if (ib_query_device(device, dev_attr)) {
  		rdsdebug("Query device failed for %s
  ", device->name);
  		goto free_attr;
  	}
  
  	rds_iwdev = kmalloc(sizeof *rds_iwdev, GFP_KERNEL);
  	if (!rds_iwdev)
  		goto free_attr;
  
  	spin_lock_init(&rds_iwdev->spinlock);
  
  	rds_iwdev->dma_local_lkey = !!(dev_attr->device_cap_flags & IB_DEVICE_LOCAL_DMA_LKEY);
  	rds_iwdev->max_wrs = dev_attr->max_qp_wr;
  	rds_iwdev->max_sge = min(dev_attr->max_sge, RDS_IW_MAX_SGE);
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
86
87
88
89
90
91
  	rds_iwdev->dev = device;
  	rds_iwdev->pd = ib_alloc_pd(device);
  	if (IS_ERR(rds_iwdev->pd))
  		goto free_dev;
  
  	if (!rds_iwdev->dma_local_lkey) {
ed9e352a3   Andy Grover   RDS/IW: Remove de...
92
93
94
95
  		rds_iwdev->mr = ib_get_dma_mr(rds_iwdev->pd,
  					IB_ACCESS_REMOTE_READ |
  					IB_ACCESS_REMOTE_WRITE |
  					IB_ACCESS_LOCAL_WRITE);
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
  		if (IS_ERR(rds_iwdev->mr))
  			goto err_pd;
  	} else
  		rds_iwdev->mr = NULL;
  
  	rds_iwdev->mr_pool = rds_iw_create_mr_pool(rds_iwdev);
  	if (IS_ERR(rds_iwdev->mr_pool)) {
  		rds_iwdev->mr_pool = NULL;
  		goto err_mr;
  	}
  
  	INIT_LIST_HEAD(&rds_iwdev->cm_id_list);
  	INIT_LIST_HEAD(&rds_iwdev->conn_list);
  	list_add_tail(&rds_iwdev->list, &rds_iw_devices);
  
  	ib_set_client_data(device, &rds_iw_client, rds_iwdev);
  
  	goto free_attr;
  
  err_mr:
  	if (rds_iwdev->mr)
  		ib_dereg_mr(rds_iwdev->mr);
  err_pd:
  	ib_dealloc_pd(rds_iwdev->pd);
  free_dev:
  	kfree(rds_iwdev);
  free_attr:
  	kfree(dev_attr);
  }
ff51bf841   stephen hemminger   rds: make local f...
125
  static void rds_iw_remove_one(struct ib_device *device)
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
126
127
128
129
130
131
132
133
134
135
136
137
138
139
  {
  	struct rds_iw_device *rds_iwdev;
  	struct rds_iw_cm_id *i_cm_id, *next;
  
  	rds_iwdev = ib_get_client_data(device, &rds_iw_client);
  	if (!rds_iwdev)
  		return;
  
  	spin_lock_irq(&rds_iwdev->spinlock);
  	list_for_each_entry_safe(i_cm_id, next, &rds_iwdev->cm_id_list, list) {
  		list_del(&i_cm_id->list);
  		kfree(i_cm_id);
  	}
  	spin_unlock_irq(&rds_iwdev->spinlock);
745cbccac   Andy Grover   RDS: Rewrite conn...
140
  	rds_iw_destroy_conns(rds_iwdev);
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
  
  	if (rds_iwdev->mr_pool)
  		rds_iw_destroy_mr_pool(rds_iwdev->mr_pool);
  
  	if (rds_iwdev->mr)
  		ib_dereg_mr(rds_iwdev->mr);
  
  	while (ib_dealloc_pd(rds_iwdev->pd)) {
  		rdsdebug("Failed to dealloc pd %p
  ", rds_iwdev->pd);
  		msleep(1);
  	}
  
  	list_del(&rds_iwdev->list);
  	kfree(rds_iwdev);
  }
  
  /*
   * Client descriptor registered by rds_iw_init() and unregistered by
   * rds_iw_exit(); it routes device add/remove events to the two callbacks
   * above and is the key under which per-device data is stored.
   */
  struct ib_client rds_iw_client = {
  	.name	= "rds_iw",
  	.add	= rds_iw_add_one,
  	.remove	= rds_iw_remove_one,
  };
  
  static int rds_iw_conn_info_visitor(struct rds_connection *conn,
  				    void *buffer)
  {
  	struct rds_info_rdma_connection *iinfo = buffer;
  	struct rds_iw_connection *ic;
  
  	/* We will only ever look at IB transports */
  	if (conn->c_trans != &rds_iw_transport)
  		return 0;
  
  	iinfo->src_addr = conn->c_laddr;
  	iinfo->dst_addr = conn->c_faddr;
  
  	memset(&iinfo->src_gid, 0, sizeof(iinfo->src_gid));
  	memset(&iinfo->dst_gid, 0, sizeof(iinfo->dst_gid));
  	if (rds_conn_state(conn) == RDS_CONN_UP) {
  		struct rds_iw_device *rds_iwdev;
  		struct rdma_dev_addr *dev_addr;
  
  		ic = conn->c_transport_data;
  		dev_addr = &ic->i_cm_id->route.addr.dev_addr;
6f8372b69   Sean Hefty   RDMA/cm: fix loop...
185
186
  		rdma_addr_get_sgid(dev_addr, (union ib_gid *) &iinfo->src_gid);
  		rdma_addr_get_dgid(dev_addr, (union ib_gid *) &iinfo->dst_gid);
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
  
  		rds_iwdev = ib_get_client_data(ic->i_cm_id->device, &rds_iw_client);
  		iinfo->max_send_wr = ic->i_send_ring.w_nr;
  		iinfo->max_recv_wr = ic->i_recv_ring.w_nr;
  		iinfo->max_send_sge = rds_iwdev->max_sge;
  		rds_iw_get_mr_info(rds_iwdev, iinfo);
  	}
  	return 1;
  }
  
  static void rds_iw_ic_info(struct socket *sock, unsigned int len,
  			   struct rds_info_iterator *iter,
  			   struct rds_info_lengths *lens)
  {
  	rds_for_each_conn_info(sock, len, iter, lens,
  				rds_iw_conn_info_visitor,
  				sizeof(struct rds_info_rdma_connection));
  }
  
  
  /*
   * Early RDS/IB was built to only bind to an address if there is an IPoIB
   * device with that address set.
   *
   * If it were me, I'd advocate for something more flexible.  Sending and
   * receiving should be device-agnostic.  Transports would try and maintain
   * connections between peers who have messages queued.  Userspace would be
   * allowed to influence which paths have priority.  We could call userspace
   * asserting this policy "routing".
   *
   * rds_iw_laddr_check() decides whether local address @addr can be used
   * with this transport by binding a throw-away RDMA CM ID to it.
   *
   * Returns 0 when the bind succeeds and the ID ends up attached to a device
   * of type RDMA_NODE_RNIC, -EADDRNOTAVAIL when the bind fails, no device is
   * attached, or the device is not an RNIC, and the rdma_create_id() error
   * code when the ID cannot be created.
   */
  static int rds_iw_laddr_check(__be32 addr)
  {
  	int ret;
  	struct rdma_cm_id *cm_id;
  	struct sockaddr_in sin;

  	/* Create a CMA ID and try to bind it. This catches both
  	 * IB and iWARP capable NICs.
  	 */
  	cm_id = rdma_create_id(NULL, NULL, RDMA_PS_TCP, IB_QPT_RC);
  	if (IS_ERR(cm_id))
  		return PTR_ERR(cm_id);

  	memset(&sin, 0, sizeof(sin));
  	sin.sin_family = AF_INET;
  	sin.sin_addr.s_addr = addr;

  	/* rdma_bind_addr will only succeed for IB & iWARP devices */
  	ret = rdma_bind_addr(cm_id, (struct sockaddr *)&sin);
  	/* due to this, we will claim to support IB devices unless we
  	   check node_type. */
  	/*
  	 * A successful bind does not guarantee that a device was attached to
  	 * the ID (the debug print below already allows for a NULL device), so
  	 * test the pointer before reading node_type.
  	 */
  	if (ret || !cm_id->device ||
  	    cm_id->device->node_type != RDMA_NODE_RNIC)
  		ret = -EADDRNOTAVAIL;

  	rdsdebug("addr %pI4 ret %d node type %d\n",
  		&addr, ret,
  		cm_id->device ? cm_id->device->node_type : -1);

  	rdma_destroy_id(cm_id);

  	return ret;
  }
  
  void rds_iw_exit(void)
  {
  	rds_info_deregister_func(RDS_INFO_IWARP_CONNECTIONS, rds_iw_ic_info);
745cbccac   Andy Grover   RDS: Rewrite conn...
254
  	rds_iw_destroy_nodev_conns();
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
255
256
257
258
259
260
261
262
263
264
  	ib_unregister_client(&rds_iw_client);
  	rds_iw_sysctl_exit();
  	rds_iw_recv_exit();
  	rds_trans_unregister(&rds_iw_transport);
  }
  
  struct rds_transport rds_iw_transport = {
  	.laddr_check		= rds_iw_laddr_check,
  	.xmit_complete		= rds_iw_xmit_complete,
  	.xmit			= rds_iw_xmit,
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
265
266
267
268
269
270
271
  	.xmit_rdma		= rds_iw_xmit_rdma,
  	.recv			= rds_iw_recv,
  	.conn_alloc		= rds_iw_conn_alloc,
  	.conn_free		= rds_iw_conn_free,
  	.conn_connect		= rds_iw_conn_connect,
  	.conn_shutdown		= rds_iw_conn_shutdown,
  	.inc_copy_to_user	= rds_iw_inc_copy_to_user,
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
272
273
274
275
276
277
278
279
280
281
282
283
  	.inc_free		= rds_iw_inc_free,
  	.cm_initiate_connect	= rds_iw_cm_initiate_connect,
  	.cm_handle_connect	= rds_iw_cm_handle_connect,
  	.cm_connect_complete	= rds_iw_cm_connect_complete,
  	.stats_info_copy	= rds_iw_stats_info_copy,
  	.exit			= rds_iw_exit,
  	.get_mr			= rds_iw_get_mr,
  	.sync_mr		= rds_iw_sync_mr,
  	.free_mr		= rds_iw_free_mr,
  	.flush_mrs		= rds_iw_flush_mrs,
  	.t_owner		= THIS_MODULE,
  	.t_name			= "iwarp",
335776bd6   Andy Grover   RDS: Track transp...
284
  	.t_type			= RDS_TRANS_IWARP,
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
285
286
  	.t_prefer_loopback	= 1,
  };
ef87b7ea3   Zach Brown   RDS: remove __ini...
287
  int rds_iw_init(void)
fcd8b7c0e   Andy Grover   RDS: Add iWARP su...
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
  {
  	int ret;
  
  	INIT_LIST_HEAD(&rds_iw_devices);
  
  	ret = ib_register_client(&rds_iw_client);
  	if (ret)
  		goto out;
  
  	ret = rds_iw_sysctl_init();
  	if (ret)
  		goto out_ibreg;
  
  	ret = rds_iw_recv_init();
  	if (ret)
  		goto out_sysctl;
  
  	ret = rds_trans_register(&rds_iw_transport);
  	if (ret)
  		goto out_recv;
  
  	rds_info_register_func(RDS_INFO_IWARP_CONNECTIONS, rds_iw_ic_info);
  
  	goto out;
  
  out_recv:
  	rds_iw_recv_exit();
  out_sysctl:
  	rds_iw_sysctl_exit();
  out_ibreg:
  	ib_unregister_client(&rds_iw_client);
  out:
  	return ret;
  }
  
  /*
   * NOTE(review): the file header offers a choice of GPL v2 or the
   * OpenIB.org BSD license, while the module declares "GPL" only --
   * confirm this is intentional.
   */
  MODULE_LICENSE("GPL");