\"Talpey, Thomas\f58851e2007-09-10 13:50:12 -04001/*
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -04002 * Copyright (c) 2003-2007 Network Appliance, Inc. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the BSD-type
8 * license below:
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 *
14 * Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 *
17 * Redistributions in binary form must reproduce the above
18 * copyright notice, this list of conditions and the following
19 * disclaimer in the documentation and/or other materials provided
20 * with the distribution.
21 *
22 * Neither the name of the Network Appliance, Inc. nor the names of
23 * its contributors may be used to endorse or promote products
24 * derived from this software without specific prior written
25 * permission.
26 *
27 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
28 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
29 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
30 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
31 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
32 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
33 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
34 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
35 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
36 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
37 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
\"Talpey, Thomas\f58851e2007-09-10 13:50:12 -040038 */
39
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -040040/*
41 * verbs.c
42 *
43 * Encapsulates the major functions managing:
44 * o adapters
45 * o endpoints
46 * o connections
47 * o buffer memory
48 */

#include <linux/interrupt.h>
#include <linux/slab.h>
#include <linux/prefetch.h>
#include <linux/sunrpc/addr.h>
#include <asm/bitops.h>
#include <linux/module.h> /* try_module_get()/module_put() */

#include "xprt_rdma.h"

/*
 * Globals/Macros
 */

#if IS_ENABLED(CONFIG_SUNRPC_DEBUG)
# define RPCDBG_FACILITY	RPCDBG_TRANS
#endif

/*
 * internal functions
 */

static struct workqueue_struct *rpcrdma_receive_wq;

int
rpcrdma_alloc_wq(void)
{
	struct workqueue_struct *recv_wq;

	recv_wq = alloc_workqueue("xprtrdma_receive",
				  WQ_MEM_RECLAIM | WQ_UNBOUND | WQ_HIGHPRI,
				  0);
	if (!recv_wq)
		return -ENOMEM;

	rpcrdma_receive_wq = recv_wq;
	return 0;
}

void
rpcrdma_destroy_wq(void)
{
	struct workqueue_struct *wq;

	if (rpcrdma_receive_wq) {
		wq = rpcrdma_receive_wq;
		rpcrdma_receive_wq = NULL;
		destroy_workqueue(wq);
	}
}

static void
rpcrdma_qp_async_error_upcall(struct ib_event *event, void *context)
{
	struct rpcrdma_ep *ep = context;

	pr_err("RPC:       %s: %s on device %s ep %p\n",
	       __func__, ib_event_msg(event->event),
	       event->device->name, context);
	if (ep->rep_connected == 1) {
		ep->rep_connected = -EIO;
		rpcrdma_conn_func(ep);
		wake_up_all(&ep->rep_connect_wait);
	}
}

/**
 * rpcrdma_wc_send - Invoked by RDMA provider for each polled Send WC
 * @cq:	completion queue (ignored)
 * @wc:	completed WR
 *
 */
static void
rpcrdma_wc_send(struct ib_cq *cq, struct ib_wc *wc)
{
	/* WARNING: Only wr_cqe and status are reliable at this point */
	if (wc->status != IB_WC_SUCCESS && wc->status != IB_WC_WR_FLUSH_ERR)
		pr_err("rpcrdma: Send: %s (%u/0x%x)\n",
		       ib_wc_status_msg(wc->status),
		       wc->status, wc->vendor_err);
}

static void
rpcrdma_receive_worker(struct work_struct *work)
{
	struct rpcrdma_rep *rep =
			container_of(work, struct rpcrdma_rep, rr_work);

	rpcrdma_reply_handler(rep);
}

/* Perform basic sanity checking to avoid using garbage
 * to update the credit grant value.
 */
static void
rpcrdma_update_granted_credits(struct rpcrdma_rep *rep)
{
	struct rpcrdma_msg *rmsgp = rdmab_to_msg(rep->rr_rdmabuf);
	struct rpcrdma_buffer *buffer = &rep->rr_rxprt->rx_buf;
	u32 credits;

	if (rep->rr_len < RPCRDMA_HDRLEN_ERR)
		return;

	credits = be32_to_cpu(rmsgp->rm_credit);
	if (credits == 0)
		credits = 1;	/* don't deadlock */
	else if (credits > buffer->rb_max_requests)
		credits = buffer->rb_max_requests;

	atomic_set(&buffer->rb_credits, credits);
}

/**
 * rpcrdma_receive_wc - Invoked by RDMA provider for each polled Receive WC
 * @cq:	completion queue (ignored)
 * @wc:	completed WR
 *
 */
static void
rpcrdma_receive_wc(struct ib_cq *cq, struct ib_wc *wc)
{
	struct ib_cqe *cqe = wc->wr_cqe;
	struct rpcrdma_rep *rep = container_of(cqe, struct rpcrdma_rep,
					       rr_cqe);

	/* WARNING: Only wr_id and status are reliable at this point */
	if (wc->status != IB_WC_SUCCESS)
		goto out_fail;

	/* status == SUCCESS means all fields in wc are trustworthy */
	if (wc->opcode != IB_WC_RECV)
		return;

	dprintk("RPC:       %s: rep %p opcode 'recv', length %u: success\n",
		__func__, rep, wc->byte_len);

	rep->rr_len = wc->byte_len;
	ib_dma_sync_single_for_cpu(rep->rr_device,
				   rdmab_addr(rep->rr_rdmabuf),
				   rep->rr_len, DMA_FROM_DEVICE);

	rpcrdma_update_granted_credits(rep);

out_schedule:
	queue_work(rpcrdma_receive_wq, &rep->rr_work);
	return;

out_fail:
	if (wc->status != IB_WC_WR_FLUSH_ERR)
		pr_err("rpcrdma: Recv: %s (%u/0x%x)\n",
		       ib_wc_status_msg(wc->status),
		       wc->status, wc->vendor_err);
	rep->rr_len = RPCRDMA_BAD_LEN;
	goto out_schedule;
}

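/* Connection manager (CM) event handler.
 *
 * Editorial note on ep->rep_connected, as used throughout this file:
 * 0 means not yet connected, 1 means connected, and a negative errno
 * records a failed or torn-down connection. Waiters on
 * rep_connect_wait are woken whenever the value changes.
 */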
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400206static int
207rpcrdma_conn_upcall(struct rdma_cm_id *id, struct rdma_cm_event *event)
208{
209 struct rpcrdma_xprt *xprt = id->context;
210 struct rpcrdma_ia *ia = &xprt->rx_ia;
211 struct rpcrdma_ep *ep = &xprt->rx_ep;
Jeff Laytonf895b252014-11-17 16:58:04 -0500212#if IS_ENABLED(CONFIG_SUNRPC_DEBUG)
Chuck Lever0dd39ca2015-03-30 14:33:43 -0400213 struct sockaddr *sap = (struct sockaddr *)&ep->rep_remote_addr;
Ingo Molnarff0db042008-11-25 16:58:42 -0800214#endif
Chuck Leverce1ab9a2015-01-21 11:03:35 -0500215 struct ib_qp_attr *attr = &ia->ri_qp_attr;
216 struct ib_qp_init_attr *iattr = &ia->ri_qp_init_attr;
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400217 int connstate = 0;
218
219 switch (event->event) {
220 case RDMA_CM_EVENT_ADDR_RESOLVED:
221 case RDMA_CM_EVENT_ROUTE_RESOLVED:
Tom Talpey5675add2008-10-09 15:01:41 -0400222 ia->ri_async_rc = 0;
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400223 complete(&ia->ri_done);
224 break;
225 case RDMA_CM_EVENT_ADDR_ERROR:
226 ia->ri_async_rc = -EHOSTUNREACH;
227 dprintk("RPC: %s: CM address resolution error, ep 0x%p\n",
228 __func__, ep);
229 complete(&ia->ri_done);
230 break;
231 case RDMA_CM_EVENT_ROUTE_ERROR:
232 ia->ri_async_rc = -ENETUNREACH;
233 dprintk("RPC: %s: CM route resolution error, ep 0x%p\n",
234 __func__, ep);
235 complete(&ia->ri_done);
236 break;
237 case RDMA_CM_EVENT_ESTABLISHED:
238 connstate = 1;
Chuck Leverce1ab9a2015-01-21 11:03:35 -0500239 ib_query_qp(ia->ri_id->qp, attr,
240 IB_QP_MAX_QP_RD_ATOMIC | IB_QP_MAX_DEST_RD_ATOMIC,
241 iattr);
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400242 dprintk("RPC: %s: %d responder resources"
243 " (%d initiator)\n",
Chuck Leverce1ab9a2015-01-21 11:03:35 -0500244 __func__, attr->max_dest_rd_atomic,
245 attr->max_rd_atomic);
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400246 goto connected;
247 case RDMA_CM_EVENT_CONNECT_ERROR:
248 connstate = -ENOTCONN;
249 goto connected;
250 case RDMA_CM_EVENT_UNREACHABLE:
251 connstate = -ENETDOWN;
252 goto connected;
253 case RDMA_CM_EVENT_REJECTED:
254 connstate = -ECONNREFUSED;
255 goto connected;
256 case RDMA_CM_EVENT_DISCONNECTED:
257 connstate = -ECONNABORTED;
258 goto connected;
259 case RDMA_CM_EVENT_DEVICE_REMOVAL:
260 connstate = -ENODEV;
261connected:
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400262 dprintk("RPC: %s: %sconnected\n",
263 __func__, connstate > 0 ? "" : "dis");
Chuck Lever23826c72016-03-04 11:28:27 -0500264 atomic_set(&xprt->rx_buf.rb_credits, 1);
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400265 ep->rep_connected = connstate;
Chuck Leverafadc462015-01-21 11:03:11 -0500266 rpcrdma_conn_func(ep);
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400267 wake_up_all(&ep->rep_connect_wait);
Chuck Lever8079fb72014-07-29 17:26:12 -0400268 /*FALLTHROUGH*/
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400269 default:
Chuck Lever0dd39ca2015-03-30 14:33:43 -0400270 dprintk("RPC: %s: %pIS:%u (ep 0x%p): %s\n",
271 __func__, sap, rpc_get_port(sap), ep,
Sagi Grimberg76357c72015-05-18 13:40:32 +0300272 rdma_event_msg(event->event));
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400273 break;
274 }
275
Jeff Laytonf895b252014-11-17 16:58:04 -0500276#if IS_ENABLED(CONFIG_SUNRPC_DEBUG)
Tom Talpeyb3cd8d42008-10-09 15:02:02 -0400277 if (connstate == 1) {
Chuck Leverce1ab9a2015-01-21 11:03:35 -0500278 int ird = attr->max_dest_rd_atomic;
Tom Talpeyb3cd8d42008-10-09 15:02:02 -0400279 int tird = ep->rep_remote_cma.responder_resources;
Chuck Lever0dd39ca2015-03-30 14:33:43 -0400280
Chuck Levera0ce85f2015-03-30 14:34:21 -0400281 pr_info("rpcrdma: connection to %pIS:%u on %s, memreg '%s', %d credits, %d responders%s\n",
Chuck Lever0dd39ca2015-03-30 14:33:43 -0400282 sap, rpc_get_port(sap),
Chuck Lever89e0d1122015-05-26 11:51:56 -0400283 ia->ri_device->name,
Chuck Levera0ce85f2015-03-30 14:34:21 -0400284 ia->ri_ops->ro_displayname,
Tom Talpeyb3cd8d42008-10-09 15:02:02 -0400285 xprt->rx_buf.rb_max_requests,
286 ird, ird < 4 && ird < tird / 2 ? " (low!)" : "");
287 } else if (connstate < 0) {
Chuck Lever0dd39ca2015-03-30 14:33:43 -0400288 pr_info("rpcrdma: connection to %pIS:%u closed (%d)\n",
289 sap, rpc_get_port(sap), connstate);
Tom Talpeyb3cd8d42008-10-09 15:02:02 -0400290 }
291#endif
292
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400293 return 0;
294}
295
Devesh Sharmad0f36c42015-08-03 13:05:04 -0400296static void rpcrdma_destroy_id(struct rdma_cm_id *id)
297{
298 if (id) {
299 module_put(id->device->owner);
300 rdma_destroy_id(id);
301 }
302}
303
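/* Create an RDMA CM ID for this transport. Address and then route
 * resolution are each started asynchronously and awaited via the
 * ri_done completion; ri_async_rc is primed with -ETIMEDOUT so that a
 * resolution step that never completes is reported as a timeout.
 */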
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400304static struct rdma_cm_id *
305rpcrdma_create_id(struct rpcrdma_xprt *xprt,
306 struct rpcrdma_ia *ia, struct sockaddr *addr)
307{
308 struct rdma_cm_id *id;
309 int rc;
310
Tom Talpey1a954052008-10-09 15:01:31 -0400311 init_completion(&ia->ri_done);
312
Guy Shapirofa201052015-10-22 15:20:10 +0300313 id = rdma_create_id(&init_net, rpcrdma_conn_upcall, xprt, RDMA_PS_TCP,
314 IB_QPT_RC);
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400315 if (IS_ERR(id)) {
316 rc = PTR_ERR(id);
317 dprintk("RPC: %s: rdma_create_id() failed %i\n",
318 __func__, rc);
319 return id;
320 }
321
Tom Talpey5675add2008-10-09 15:01:41 -0400322 ia->ri_async_rc = -ETIMEDOUT;
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400323 rc = rdma_resolve_addr(id, NULL, addr, RDMA_RESOLVE_TIMEOUT);
324 if (rc) {
325 dprintk("RPC: %s: rdma_resolve_addr() failed %i\n",
326 __func__, rc);
327 goto out;
328 }
Tom Talpey5675add2008-10-09 15:01:41 -0400329 wait_for_completion_interruptible_timeout(&ia->ri_done,
330 msecs_to_jiffies(RDMA_RESOLVE_TIMEOUT) + 1);
Devesh Sharmad0f36c42015-08-03 13:05:04 -0400331
332 /* FIXME:
333 * Until xprtrdma supports DEVICE_REMOVAL, the provider must
334 * be pinned while there are active NFS/RDMA mounts to prevent
335 * hangs and crashes at umount time.
336 */
337 if (!ia->ri_async_rc && !try_module_get(id->device->owner)) {
338 dprintk("RPC: %s: Failed to get device module\n",
339 __func__);
340 ia->ri_async_rc = -ENODEV;
341 }
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400342 rc = ia->ri_async_rc;
343 if (rc)
344 goto out;
345
Tom Talpey5675add2008-10-09 15:01:41 -0400346 ia->ri_async_rc = -ETIMEDOUT;
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400347 rc = rdma_resolve_route(id, RDMA_RESOLVE_TIMEOUT);
348 if (rc) {
349 dprintk("RPC: %s: rdma_resolve_route() failed %i\n",
350 __func__, rc);
Devesh Sharmad0f36c42015-08-03 13:05:04 -0400351 goto put;
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400352 }
Tom Talpey5675add2008-10-09 15:01:41 -0400353 wait_for_completion_interruptible_timeout(&ia->ri_done,
354 msecs_to_jiffies(RDMA_RESOLVE_TIMEOUT) + 1);
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400355 rc = ia->ri_async_rc;
356 if (rc)
Devesh Sharmad0f36c42015-08-03 13:05:04 -0400357 goto put;
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400358
359 return id;
Devesh Sharmad0f36c42015-08-03 13:05:04 -0400360put:
361 module_put(id->device->owner);
\"Talpey, Thomas\c56c65f2007-09-10 13:51:18 -0400362out:
363 rdma_destroy_id(id);
364 return ERR_PTR(rc);
365}
366
/*
 * Exported functions.
 */

/*
 * Open and initialize an Interface Adapter.
 *  o initializes fields of struct rpcrdma_ia, including
 *    interface and provider attributes and protection zone.
 */
int
rpcrdma_ia_open(struct rpcrdma_xprt *xprt, struct sockaddr *addr, int memreg)
{
	struct rpcrdma_ia *ia = &xprt->rx_ia;
	int rc;

	ia->ri_id = rpcrdma_create_id(xprt, ia, addr);
	if (IS_ERR(ia->ri_id)) {
		rc = PTR_ERR(ia->ri_id);
		goto out1;
	}
	ia->ri_device = ia->ri_id->device;

	ia->ri_pd = ib_alloc_pd(ia->ri_device);
	if (IS_ERR(ia->ri_pd)) {
		rc = PTR_ERR(ia->ri_pd);
		pr_err("rpcrdma: ib_alloc_pd() returned %d\n", rc);
		goto out2;
	}

	switch (memreg) {
	case RPCRDMA_FRMR:
		if (frwr_is_supported(ia)) {
			ia->ri_ops = &rpcrdma_frwr_memreg_ops;
			break;
		}
		/*FALLTHROUGH*/
	case RPCRDMA_MTHCAFMR:
		if (fmr_is_supported(ia)) {
			ia->ri_ops = &rpcrdma_fmr_memreg_ops;
			break;
		}
		/*FALLTHROUGH*/
	default:
		pr_err("rpcrdma: Unsupported memory registration mode: %d\n",
		       memreg);
		rc = -EINVAL;
		goto out3;
	}

	return 0;

out3:
	ib_dealloc_pd(ia->ri_pd);
	ia->ri_pd = NULL;
out2:
	rpcrdma_destroy_id(ia->ri_id);
	ia->ri_id = NULL;
out1:
	return rc;
}

/*
 * Clean up/close an IA.
 *   o if event handles and PD have been initialized, free them.
 *   o close the IA
 */
void
rpcrdma_ia_close(struct rpcrdma_ia *ia)
{
	dprintk("RPC:       %s: entering\n", __func__);
	if (ia->ri_id != NULL && !IS_ERR(ia->ri_id)) {
		if (ia->ri_id->qp)
			rdma_destroy_qp(ia->ri_id);
		rpcrdma_destroy_id(ia->ri_id);
		ia->ri_id = NULL;
	}

	/* If the pd is still busy, xprtrdma missed freeing a resource */
	if (ia->ri_pd && !IS_ERR(ia->ri_pd))
		ib_dealloc_pd(ia->ri_pd);
}

/*
 * Create unconnected endpoint.
 */
int
rpcrdma_ep_create(struct rpcrdma_ep *ep, struct rpcrdma_ia *ia,
				struct rpcrdma_create_data_internal *cdata)
{
	struct ib_cq *sendcq, *recvcq;
	unsigned int max_qp_wr;
	int rc;

	if (ia->ri_device->attrs.max_sge < RPCRDMA_MAX_IOVS) {
		dprintk("RPC:       %s: insufficient sge's available\n",
			__func__);
		return -ENOMEM;
	}

	if (ia->ri_device->attrs.max_qp_wr <= RPCRDMA_BACKWARD_WRS) {
		dprintk("RPC:       %s: insufficient wqe's available\n",
			__func__);
		return -ENOMEM;
	}
	max_qp_wr = ia->ri_device->attrs.max_qp_wr - RPCRDMA_BACKWARD_WRS - 1;

	/* check provider's send/recv wr limits */
	if (cdata->max_requests > max_qp_wr)
		cdata->max_requests = max_qp_wr;

	ep->rep_attr.event_handler = rpcrdma_qp_async_error_upcall;
	ep->rep_attr.qp_context = ep;
	ep->rep_attr.srq = NULL;
	ep->rep_attr.cap.max_send_wr = cdata->max_requests;
	ep->rep_attr.cap.max_send_wr += RPCRDMA_BACKWARD_WRS;
	ep->rep_attr.cap.max_send_wr += 1; /* drain cqe */
	rc = ia->ri_ops->ro_open(ia, ep, cdata);
	if (rc)
		return rc;
	ep->rep_attr.cap.max_recv_wr = cdata->max_requests;
	ep->rep_attr.cap.max_recv_wr += RPCRDMA_BACKWARD_WRS;
	ep->rep_attr.cap.max_recv_wr += 1; /* drain cqe */
	ep->rep_attr.cap.max_send_sge = RPCRDMA_MAX_IOVS;
	ep->rep_attr.cap.max_recv_sge = 1;
	ep->rep_attr.cap.max_inline_data = 0;
	ep->rep_attr.sq_sig_type = IB_SIGNAL_REQ_WR;
	ep->rep_attr.qp_type = IB_QPT_RC;
	ep->rep_attr.port_num = ~0;

	dprintk("RPC:       %s: requested max: dtos: send %d recv %d; "
		"iovs: send %d recv %d\n",
		__func__,
		ep->rep_attr.cap.max_send_wr,
		ep->rep_attr.cap.max_recv_wr,
		ep->rep_attr.cap.max_send_sge,
		ep->rep_attr.cap.max_recv_sge);

	/* set trigger for requesting send completion */
	ep->rep_cqinit = ep->rep_attr.cap.max_send_wr/2 - 1;
	if (ep->rep_cqinit <= 2)
		ep->rep_cqinit = 0;	/* always signal? */
	INIT_CQCOUNT(ep);
	init_waitqueue_head(&ep->rep_connect_wait);
	INIT_DELAYED_WORK(&ep->rep_connect_worker, rpcrdma_connect_worker);

	sendcq = ib_alloc_cq(ia->ri_device, NULL,
			     ep->rep_attr.cap.max_send_wr + 1,
			     0, IB_POLL_SOFTIRQ);
	if (IS_ERR(sendcq)) {
		rc = PTR_ERR(sendcq);
		dprintk("RPC:       %s: failed to create send CQ: %i\n",
			__func__, rc);
		goto out1;
	}

	recvcq = ib_alloc_cq(ia->ri_device, NULL,
			     ep->rep_attr.cap.max_recv_wr + 1,
			     0, IB_POLL_SOFTIRQ);
	if (IS_ERR(recvcq)) {
		rc = PTR_ERR(recvcq);
		dprintk("RPC:       %s: failed to create recv CQ: %i\n",
			__func__, rc);
		goto out2;
	}

	ep->rep_attr.send_cq = sendcq;
	ep->rep_attr.recv_cq = recvcq;

	/* Initialize cma parameters */
	memset(&ep->rep_remote_cma, 0, sizeof(ep->rep_remote_cma));

	/* RPC/RDMA does not use private data */
	ep->rep_remote_cma.private_data = NULL;
	ep->rep_remote_cma.private_data_len = 0;

	/* Client offers RDMA Read but does not initiate */
	ep->rep_remote_cma.initiator_depth = 0;
	if (ia->ri_device->attrs.max_qp_rd_atom > 32)	/* arbitrary but <= 255 */
		ep->rep_remote_cma.responder_resources = 32;
	else
		ep->rep_remote_cma.responder_resources =
					ia->ri_device->attrs.max_qp_rd_atom;

	/* Limit transport retries so client can detect server
	 * GID changes quickly. RPC layer handles re-establishing
	 * transport connection and retransmission.
	 */
	ep->rep_remote_cma.retry_count = 6;

	/* RPC-over-RDMA handles its own flow control. In addition,
	 * make all RNR NAKs visible so we know that RPC-over-RDMA
	 * flow control is working correctly (no NAKs should be seen).
	 */
	ep->rep_remote_cma.flow_control = 0;
	ep->rep_remote_cma.rnr_retry_count = 0;

	return 0;

out2:
	ib_free_cq(sendcq);
out1:
	return rc;
}

/*
 * rpcrdma_ep_destroy
 *
 * Disconnect and destroy endpoint. After this, the only
 * valid operations on the ep are to free it (if dynamically
 * allocated) or re-create it.
 */
void
rpcrdma_ep_destroy(struct rpcrdma_ep *ep, struct rpcrdma_ia *ia)
{
	dprintk("RPC:       %s: entering, connected is %d\n",
		__func__, ep->rep_connected);

	cancel_delayed_work_sync(&ep->rep_connect_worker);

	if (ia->ri_id->qp) {
		rpcrdma_ep_disconnect(ep, ia);
		rdma_destroy_qp(ia->ri_id);
		ia->ri_id->qp = NULL;
	}

	ib_free_cq(ep->rep_attr.recv_cq);
	ib_free_cq(ep->rep_attr.send_cq);
}

/*
 * Connect unconnected endpoint.
 */
int
rpcrdma_ep_connect(struct rpcrdma_ep *ep, struct rpcrdma_ia *ia)
{
	struct rdma_cm_id *id, *old;
	int rc = 0;
	int retry_count = 0;

	if (ep->rep_connected != 0) {
		struct rpcrdma_xprt *xprt;
retry:
		dprintk("RPC:       %s: reconnecting...\n", __func__);

		rpcrdma_ep_disconnect(ep, ia);

		xprt = container_of(ia, struct rpcrdma_xprt, rx_ia);
		id = rpcrdma_create_id(xprt, ia,
				(struct sockaddr *)&xprt->rx_data.addr);
		if (IS_ERR(id)) {
			rc = -EHOSTUNREACH;
			goto out;
		}
		/* TEMP TEMP TEMP - fail if new device:
		 * Deregister/remarshal *all* requests!
		 * Close and recreate adapter, pd, etc!
		 * Re-determine all attributes still sane!
		 * More stuff I haven't thought of!
		 * Rrrgh!
		 */
		if (ia->ri_device != id->device) {
			printk("RPC:       %s: can't reconnect on "
				"different device!\n", __func__);
			rpcrdma_destroy_id(id);
			rc = -ENETUNREACH;
			goto out;
		}
		/* END TEMP */
		rc = rdma_create_qp(id, ia->ri_pd, &ep->rep_attr);
		if (rc) {
			dprintk("RPC:       %s: rdma_create_qp failed %i\n",
				__func__, rc);
			rpcrdma_destroy_id(id);
			rc = -ENETUNREACH;
			goto out;
		}

		old = ia->ri_id;
		ia->ri_id = id;

		rdma_destroy_qp(old);
		rpcrdma_destroy_id(old);
	} else {
		dprintk("RPC:       %s: connecting...\n", __func__);
		rc = rdma_create_qp(ia->ri_id, ia->ri_pd, &ep->rep_attr);
		if (rc) {
			dprintk("RPC:       %s: rdma_create_qp failed %i\n",
				__func__, rc);
			/* do not update ep->rep_connected */
			return -ENETUNREACH;
		}
	}

	ep->rep_connected = 0;

	rc = rdma_connect(ia->ri_id, &ep->rep_remote_cma);
	if (rc) {
		dprintk("RPC:       %s: rdma_connect() failed with %i\n",
				__func__, rc);
		goto out;
	}

	wait_event_interruptible(ep->rep_connect_wait, ep->rep_connected != 0);

	/*
	 * Check state. A non-peer reject indicates no listener
	 * (ECONNREFUSED), which may be a transient state. All
	 * others indicate a transport condition which has already
	 * undergone a best-effort recovery attempt.
	 */
	if (ep->rep_connected == -ECONNREFUSED &&
	    ++retry_count <= RDMA_CONNECT_RETRY_MAX) {
		dprintk("RPC:       %s: non-peer_reject, retry\n", __func__);
		goto retry;
	}
	if (ep->rep_connected <= 0) {
		/* Sometimes, the only way to reliably connect to remote
		 * CMs is to use same nonzero values for ORD and IRD. */
		if (retry_count++ <= RDMA_CONNECT_RETRY_MAX + 1 &&
		    (ep->rep_remote_cma.responder_resources == 0 ||
		     ep->rep_remote_cma.initiator_depth !=
				ep->rep_remote_cma.responder_resources)) {
			if (ep->rep_remote_cma.responder_resources == 0)
				ep->rep_remote_cma.responder_resources = 1;
			ep->rep_remote_cma.initiator_depth =
				ep->rep_remote_cma.responder_resources;
			goto retry;
		}
		rc = ep->rep_connected;
	} else {
		struct rpcrdma_xprt *r_xprt;
		unsigned int extras;

		dprintk("RPC:       %s: connected\n", __func__);

		r_xprt = container_of(ia, struct rpcrdma_xprt, rx_ia);
		extras = r_xprt->rx_buf.rb_bc_srv_max_requests;

		if (extras) {
			rc = rpcrdma_ep_post_extra_recv(r_xprt, extras);
			if (rc) {
				pr_warn("%s: rpcrdma_ep_post_extra_recv: %i\n",
					__func__, rc);
				rc = 0;
			}
		}
	}

out:
	if (rc)
		ep->rep_connected = rc;
	return rc;
}

/*
 * rpcrdma_ep_disconnect
 *
 * This is separate from destroy to facilitate the ability
 * to reconnect without recreating the endpoint.
 *
 * This call is not reentrant, and must not be made in parallel
 * on the same endpoint.
 */
void
rpcrdma_ep_disconnect(struct rpcrdma_ep *ep, struct rpcrdma_ia *ia)
{
	int rc;

	rc = rdma_disconnect(ia->ri_id);
	if (!rc) {
		/* returns without wait if not connected */
		wait_event_interruptible(ep->rep_connect_wait,
							ep->rep_connected != 1);
		dprintk("RPC:       %s: after wait, %sconnected\n", __func__,
			(ep->rep_connected == 1) ? "still " : "dis");
	} else {
		dprintk("RPC:       %s: rdma_disconnect %i\n", __func__, rc);
		ep->rep_connected = rc;
	}

	ib_drain_qp(ia->ri_id->qp);
}

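/* MRs that the registration code marks as stale (see
 * rpcrdma_defer_mr_recovery below) are queued on rb_stale_mrs and
 * reset here in the background via the registration mode's
 * ro_recover_mr method.
 */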
static void
rpcrdma_mr_recovery_worker(struct work_struct *work)
{
	struct rpcrdma_buffer *buf = container_of(work, struct rpcrdma_buffer,
						  rb_recovery_worker.work);
	struct rpcrdma_mw *mw;

	spin_lock(&buf->rb_recovery_lock);
	while (!list_empty(&buf->rb_stale_mrs)) {
		mw = list_first_entry(&buf->rb_stale_mrs,
				      struct rpcrdma_mw, mw_list);
		list_del_init(&mw->mw_list);
		spin_unlock(&buf->rb_recovery_lock);

		dprintk("RPC:       %s: recovering MR %p\n", __func__, mw);
		mw->mw_xprt->rx_ia.ri_ops->ro_recover_mr(mw);

		spin_lock(&buf->rb_recovery_lock);
	}
	spin_unlock(&buf->rb_recovery_lock);
}

void
rpcrdma_defer_mr_recovery(struct rpcrdma_mw *mw)
{
	struct rpcrdma_xprt *r_xprt = mw->mw_xprt;
	struct rpcrdma_buffer *buf = &r_xprt->rx_buf;

	spin_lock(&buf->rb_recovery_lock);
	list_add(&mw->mw_list, &buf->rb_stale_mrs);
	spin_unlock(&buf->rb_recovery_lock);

	schedule_delayed_work(&buf->rb_recovery_worker, 0);
}

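/* Grow the MR pool. MRs are created in batches of up to 32; a short
 * batch (because allocation or ro_init_mr failed) is not treated as
 * an error, since rpcrdma_get_mw() kicks rb_refresh_worker to try
 * again when the pool runs dry.
 */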
static void
rpcrdma_create_mrs(struct rpcrdma_xprt *r_xprt)
{
	struct rpcrdma_buffer *buf = &r_xprt->rx_buf;
	struct rpcrdma_ia *ia = &r_xprt->rx_ia;
	unsigned int count;
	LIST_HEAD(free);
	LIST_HEAD(all);

	for (count = 0; count < 32; count++) {
		struct rpcrdma_mw *mw;
		int rc;

		mw = kzalloc(sizeof(*mw), GFP_KERNEL);
		if (!mw)
			break;

		rc = ia->ri_ops->ro_init_mr(ia, mw);
		if (rc) {
			kfree(mw);
			break;
		}

		mw->mw_xprt = r_xprt;

		list_add(&mw->mw_list, &free);
		list_add(&mw->mw_all, &all);
	}

	spin_lock(&buf->rb_mwlock);
	list_splice(&free, &buf->rb_mws);
	list_splice(&all, &buf->rb_all);
	r_xprt->rx_stats.mrs_allocated += count;
	spin_unlock(&buf->rb_mwlock);

	dprintk("RPC:       %s: created %u MRs\n", __func__, count);
}

static void
rpcrdma_mr_refresh_worker(struct work_struct *work)
{
	struct rpcrdma_buffer *buf = container_of(work, struct rpcrdma_buffer,
						  rb_refresh_worker.work);
	struct rpcrdma_xprt *r_xprt = container_of(buf, struct rpcrdma_xprt,
						   rx_buf);

	rpcrdma_create_mrs(r_xprt);
}

struct rpcrdma_req *
rpcrdma_create_req(struct rpcrdma_xprt *r_xprt)
{
	struct rpcrdma_buffer *buffer = &r_xprt->rx_buf;
	struct rpcrdma_req *req;

	req = kzalloc(sizeof(*req), GFP_KERNEL);
	if (req == NULL)
		return ERR_PTR(-ENOMEM);

	INIT_LIST_HEAD(&req->rl_free);
	spin_lock(&buffer->rb_reqslock);
	list_add(&req->rl_all, &buffer->rb_allreqs);
	spin_unlock(&buffer->rb_reqslock);
	req->rl_cqe.done = rpcrdma_wc_send;
	req->rl_buffer = &r_xprt->rx_buf;
	INIT_LIST_HEAD(&req->rl_registered);
	return req;
}

struct rpcrdma_rep *
rpcrdma_create_rep(struct rpcrdma_xprt *r_xprt)
{
	struct rpcrdma_create_data_internal *cdata = &r_xprt->rx_data;
	struct rpcrdma_ia *ia = &r_xprt->rx_ia;
	struct rpcrdma_rep *rep;
	int rc;

	rc = -ENOMEM;
	rep = kzalloc(sizeof(*rep), GFP_KERNEL);
	if (rep == NULL)
		goto out;

	rep->rr_rdmabuf = rpcrdma_alloc_regbuf(ia, cdata->inline_rsize,
					       GFP_KERNEL);
	if (IS_ERR(rep->rr_rdmabuf)) {
		rc = PTR_ERR(rep->rr_rdmabuf);
		goto out_free;
	}

	rep->rr_device = ia->ri_device;
	rep->rr_cqe.done = rpcrdma_receive_wc;
	rep->rr_rxprt = r_xprt;
	INIT_WORK(&rep->rr_work, rpcrdma_receive_worker);
	return rep;

out_free:
	kfree(rep);
out:
	return ERR_PTR(rc);
}

int
rpcrdma_buffer_create(struct rpcrdma_xprt *r_xprt)
{
	struct rpcrdma_buffer *buf = &r_xprt->rx_buf;
	int i, rc;

	buf->rb_max_requests = r_xprt->rx_data.max_requests;
	buf->rb_bc_srv_max_requests = 0;
	atomic_set(&buf->rb_credits, 1);
	spin_lock_init(&buf->rb_mwlock);
	spin_lock_init(&buf->rb_lock);
	spin_lock_init(&buf->rb_recovery_lock);
	INIT_LIST_HEAD(&buf->rb_mws);
	INIT_LIST_HEAD(&buf->rb_all);
	INIT_LIST_HEAD(&buf->rb_stale_mrs);
	INIT_DELAYED_WORK(&buf->rb_refresh_worker,
			  rpcrdma_mr_refresh_worker);
	INIT_DELAYED_WORK(&buf->rb_recovery_worker,
			  rpcrdma_mr_recovery_worker);

	rpcrdma_create_mrs(r_xprt);

	INIT_LIST_HEAD(&buf->rb_send_bufs);
	INIT_LIST_HEAD(&buf->rb_allreqs);
	spin_lock_init(&buf->rb_reqslock);
	for (i = 0; i < buf->rb_max_requests; i++) {
		struct rpcrdma_req *req;

		req = rpcrdma_create_req(r_xprt);
		if (IS_ERR(req)) {
			dprintk("RPC:       %s: request buffer %d alloc"
				" failed\n", __func__, i);
			rc = PTR_ERR(req);
			goto out;
		}
		req->rl_backchannel = false;
		list_add(&req->rl_free, &buf->rb_send_bufs);
	}

	INIT_LIST_HEAD(&buf->rb_recv_bufs);
	for (i = 0; i < buf->rb_max_requests + 2; i++) {
		struct rpcrdma_rep *rep;

		rep = rpcrdma_create_rep(r_xprt);
		if (IS_ERR(rep)) {
			dprintk("RPC:       %s: reply buffer %d alloc failed\n",
				__func__, i);
			rc = PTR_ERR(rep);
			goto out;
		}
		list_add(&rep->rr_list, &buf->rb_recv_bufs);
	}

	return 0;
out:
	rpcrdma_buffer_destroy(buf);
	return rc;
}

static struct rpcrdma_req *
rpcrdma_buffer_get_req_locked(struct rpcrdma_buffer *buf)
{
	struct rpcrdma_req *req;

	req = list_first_entry(&buf->rb_send_bufs,
			       struct rpcrdma_req, rl_free);
	list_del(&req->rl_free);
	return req;
}

static struct rpcrdma_rep *
rpcrdma_buffer_get_rep_locked(struct rpcrdma_buffer *buf)
{
	struct rpcrdma_rep *rep;

	rep = list_first_entry(&buf->rb_recv_bufs,
			       struct rpcrdma_rep, rr_list);
	list_del(&rep->rr_list);
	return rep;
}

static void
rpcrdma_destroy_rep(struct rpcrdma_ia *ia, struct rpcrdma_rep *rep)
{
	rpcrdma_free_regbuf(ia, rep->rr_rdmabuf);
	kfree(rep);
}

void
rpcrdma_destroy_req(struct rpcrdma_ia *ia, struct rpcrdma_req *req)
{
	rpcrdma_free_regbuf(ia, req->rl_sendbuf);
	rpcrdma_free_regbuf(ia, req->rl_rdmabuf);
	kfree(req);
}

static void
rpcrdma_destroy_mrs(struct rpcrdma_buffer *buf)
{
	struct rpcrdma_xprt *r_xprt = container_of(buf, struct rpcrdma_xprt,
						   rx_buf);
	struct rpcrdma_ia *ia = rdmab_to_ia(buf);
	struct rpcrdma_mw *mw;
	unsigned int count;

	count = 0;
	spin_lock(&buf->rb_mwlock);
	while (!list_empty(&buf->rb_all)) {
		mw = list_entry(buf->rb_all.next, struct rpcrdma_mw, mw_all);
		list_del(&mw->mw_all);

		spin_unlock(&buf->rb_mwlock);
		ia->ri_ops->ro_release_mr(mw);
		count++;
		spin_lock(&buf->rb_mwlock);
	}
	spin_unlock(&buf->rb_mwlock);
	r_xprt->rx_stats.mrs_allocated = 0;

	dprintk("RPC:       %s: released %u MRs\n", __func__, count);
}

void
rpcrdma_buffer_destroy(struct rpcrdma_buffer *buf)
{
	struct rpcrdma_ia *ia = rdmab_to_ia(buf);

	cancel_delayed_work_sync(&buf->rb_recovery_worker);

	while (!list_empty(&buf->rb_recv_bufs)) {
		struct rpcrdma_rep *rep;

		rep = rpcrdma_buffer_get_rep_locked(buf);
		rpcrdma_destroy_rep(ia, rep);
	}

	spin_lock(&buf->rb_reqslock);
	while (!list_empty(&buf->rb_allreqs)) {
		struct rpcrdma_req *req;

		req = list_first_entry(&buf->rb_allreqs,
				       struct rpcrdma_req, rl_all);
		list_del(&req->rl_all);

		spin_unlock(&buf->rb_reqslock);
		rpcrdma_destroy_req(ia, req);
		spin_lock(&buf->rb_reqslock);
	}
	spin_unlock(&buf->rb_reqslock);

	rpcrdma_destroy_mrs(buf);
}

struct rpcrdma_mw *
rpcrdma_get_mw(struct rpcrdma_xprt *r_xprt)
{
	struct rpcrdma_buffer *buf = &r_xprt->rx_buf;
	struct rpcrdma_mw *mw = NULL;

	spin_lock(&buf->rb_mwlock);
	if (!list_empty(&buf->rb_mws)) {
		mw = list_first_entry(&buf->rb_mws,
				      struct rpcrdma_mw, mw_list);
		list_del_init(&mw->mw_list);
	}
	spin_unlock(&buf->rb_mwlock);

	if (!mw)
		goto out_nomws;
	return mw;

out_nomws:
	dprintk("RPC:       %s: no MWs available\n", __func__);
	schedule_delayed_work(&buf->rb_refresh_worker, 0);

	/* Allow the reply handler and refresh worker to run */
	cond_resched();

	return NULL;
}

void
rpcrdma_put_mw(struct rpcrdma_xprt *r_xprt, struct rpcrdma_mw *mw)
{
	struct rpcrdma_buffer *buf = &r_xprt->rx_buf;

	spin_lock(&buf->rb_mwlock);
	list_add_tail(&mw->mw_list, &buf->rb_mws);
	spin_unlock(&buf->rb_mwlock);
}

/*
 * Get a set of request/reply buffers.
 *
 * Reply buffer (if available) is attached to send buffer upon return.
 */
struct rpcrdma_req *
rpcrdma_buffer_get(struct rpcrdma_buffer *buffers)
{
	struct rpcrdma_req *req;

	spin_lock(&buffers->rb_lock);
	if (list_empty(&buffers->rb_send_bufs))
		goto out_reqbuf;
	req = rpcrdma_buffer_get_req_locked(buffers);
	if (list_empty(&buffers->rb_recv_bufs))
		goto out_repbuf;
	req->rl_reply = rpcrdma_buffer_get_rep_locked(buffers);
	spin_unlock(&buffers->rb_lock);
	return req;

out_reqbuf:
	spin_unlock(&buffers->rb_lock);
	pr_warn("RPC:       %s: out of request buffers\n", __func__);
	return NULL;
out_repbuf:
	spin_unlock(&buffers->rb_lock);
	pr_warn("RPC:       %s: out of reply buffers\n", __func__);
	req->rl_reply = NULL;
	return req;
}

/*
 * Put request/reply buffers back into the pool. If a reply buffer is
 * still attached to the request, it is returned to the pool as well.
 */
void
rpcrdma_buffer_put(struct rpcrdma_req *req)
{
	struct rpcrdma_buffer *buffers = req->rl_buffer;
	struct rpcrdma_rep *rep = req->rl_reply;

	req->rl_niovs = 0;
	req->rl_reply = NULL;

	spin_lock(&buffers->rb_lock);
	list_add_tail(&req->rl_free, &buffers->rb_send_bufs);
	if (rep)
		list_add_tail(&rep->rr_list, &buffers->rb_recv_bufs);
	spin_unlock(&buffers->rb_lock);
}

/*
 * Recover reply buffers from pool.
 * This happens when recovering from disconnect.
 */
void
rpcrdma_recv_buffer_get(struct rpcrdma_req *req)
{
	struct rpcrdma_buffer *buffers = req->rl_buffer;

	spin_lock(&buffers->rb_lock);
	if (!list_empty(&buffers->rb_recv_bufs))
		req->rl_reply = rpcrdma_buffer_get_rep_locked(buffers);
	spin_unlock(&buffers->rb_lock);
}

/*
 * Put reply buffers back into pool when not attached to
 * request. This happens in error conditions.
 */
void
rpcrdma_recv_buffer_put(struct rpcrdma_rep *rep)
{
	struct rpcrdma_buffer *buffers = &rep->rr_rxprt->rx_buf;

	spin_lock(&buffers->rb_lock);
	list_add_tail(&rep->rr_list, &buffers->rb_recv_bufs);
	spin_unlock(&buffers->rb_lock);
}

/*
 * Wrappers for internal-use kmalloc memory registration, used by buffer code.
 */

/**
 * rpcrdma_alloc_regbuf - kmalloc and register memory for SEND/RECV buffers
 * @ia: controlling rpcrdma_ia
 * @size: size of buffer to be allocated, in bytes
 * @flags: GFP flags
 *
 * Returns pointer to private header of an area of internally
 * registered memory, or an ERR_PTR. The registered buffer follows
 * the end of the private header.
 *
 * xprtrdma uses a regbuf for posting an outgoing RDMA SEND, or for
 * receiving the payload of RDMA RECV operations. regbufs are not
 * used for RDMA READ/WRITE operations, thus are registered only for
 * LOCAL access.
 */
struct rpcrdma_regbuf *
rpcrdma_alloc_regbuf(struct rpcrdma_ia *ia, size_t size, gfp_t flags)
{
	struct rpcrdma_regbuf *rb;
	struct ib_sge *iov;

	rb = kmalloc(sizeof(*rb) + size, flags);
	if (rb == NULL)
		goto out;

	iov = &rb->rg_iov;
	iov->addr = ib_dma_map_single(ia->ri_device,
				      (void *)rb->rg_base, size,
				      DMA_BIDIRECTIONAL);
	if (ib_dma_mapping_error(ia->ri_device, iov->addr))
		goto out_free;

	iov->length = size;
	iov->lkey = ia->ri_pd->local_dma_lkey;
	rb->rg_size = size;
	rb->rg_owner = NULL;
	return rb;

out_free:
	kfree(rb);
out:
	return ERR_PTR(-ENOMEM);
}

/**
 * rpcrdma_free_regbuf - deregister and free registered buffer
 * @ia: controlling rpcrdma_ia
 * @rb: regbuf to be deregistered and freed
 */
void
rpcrdma_free_regbuf(struct rpcrdma_ia *ia, struct rpcrdma_regbuf *rb)
{
	struct ib_sge *iov;

	if (!rb)
		return;

	iov = &rb->rg_iov;
	ib_dma_unmap_single(ia->ri_device,
			    iov->addr, iov->length, DMA_BIDIRECTIONAL);
	kfree(rb);
}

/*
 * Prepost any receive buffer, then post send.
 *
 * Receive buffer is donated to hardware, reclaimed upon recv completion.
 */
int
rpcrdma_ep_post(struct rpcrdma_ia *ia,
		struct rpcrdma_ep *ep,
		struct rpcrdma_req *req)
{
	struct ib_device *device = ia->ri_device;
	struct ib_send_wr send_wr, *send_wr_fail;
	struct rpcrdma_rep *rep = req->rl_reply;
	struct ib_sge *iov = req->rl_send_iov;
	int i, rc;

	if (rep) {
		rc = rpcrdma_ep_post_recv(ia, ep, rep);
		if (rc)
			return rc;
		req->rl_reply = NULL;
	}

	send_wr.next = NULL;
	send_wr.wr_cqe = &req->rl_cqe;
	send_wr.sg_list = iov;
	send_wr.num_sge = req->rl_niovs;
	send_wr.opcode = IB_WR_SEND;

	for (i = 0; i < send_wr.num_sge; i++)
		ib_dma_sync_single_for_device(device, iov[i].addr,
					      iov[i].length, DMA_TO_DEVICE);
	dprintk("RPC:       %s: posting %d s/g entries\n",
		__func__, send_wr.num_sge);

	if (DECR_CQCOUNT(ep) > 0)
		send_wr.send_flags = 0;
	else { /* Provider must take a send completion every now and then */
		INIT_CQCOUNT(ep);
		send_wr.send_flags = IB_SEND_SIGNALED;
	}

	rc = ib_post_send(ia->ri_id->qp, &send_wr, &send_wr_fail);
	if (rc)
		goto out_postsend_err;
	return 0;

out_postsend_err:
	pr_err("rpcrdma: RDMA Send ib_post_send returned %i\n", rc);
	return -ENOTCONN;
}

/*
 * (Re)post a receive buffer.
 */
int
rpcrdma_ep_post_recv(struct rpcrdma_ia *ia,
		     struct rpcrdma_ep *ep,
		     struct rpcrdma_rep *rep)
{
	struct ib_recv_wr recv_wr, *recv_wr_fail;
	int rc;

	recv_wr.next = NULL;
	recv_wr.wr_cqe = &rep->rr_cqe;
	recv_wr.sg_list = &rep->rr_rdmabuf->rg_iov;
	recv_wr.num_sge = 1;

	ib_dma_sync_single_for_cpu(ia->ri_device,
				   rdmab_addr(rep->rr_rdmabuf),
				   rdmab_length(rep->rr_rdmabuf),
				   DMA_BIDIRECTIONAL);

	rc = ib_post_recv(ia->ri_id->qp, &recv_wr, &recv_wr_fail);
	if (rc)
		goto out_postrecv;
	return 0;

out_postrecv:
	pr_err("rpcrdma: ib_post_recv returned %i\n", rc);
	return -ENOTCONN;
}

/**
 * rpcrdma_ep_post_extra_recv - Post buffers for incoming backchannel requests
 * @r_xprt: transport associated with these backchannel resources
 * @count: minimum number of incoming requests expected
 *
 * Returns zero if all requested buffers were posted, or a negative errno.
 */
int
rpcrdma_ep_post_extra_recv(struct rpcrdma_xprt *r_xprt, unsigned int count)
{
	struct rpcrdma_buffer *buffers = &r_xprt->rx_buf;
	struct rpcrdma_ia *ia = &r_xprt->rx_ia;
	struct rpcrdma_ep *ep = &r_xprt->rx_ep;
	struct rpcrdma_rep *rep;
	int rc;

	while (count--) {
		spin_lock(&buffers->rb_lock);
		if (list_empty(&buffers->rb_recv_bufs))
			goto out_reqbuf;
		rep = rpcrdma_buffer_get_rep_locked(buffers);
		spin_unlock(&buffers->rb_lock);

		rc = rpcrdma_ep_post_recv(ia, ep, rep);
		if (rc)
			goto out_rc;
	}

	return 0;

out_reqbuf:
	spin_unlock(&buffers->rb_lock);
	pr_warn("%s: no extra receive buffers\n", __func__);
	return -ENOMEM;

out_rc:
	rpcrdma_recv_buffer_put(rep);
	return rc;
}