SUNRPC: Generalize the RPC buffer allocation API

author Chuck Lever <chuck.lever@oracle.com>

Thu, 15 Sep 2016 14:55:20 +0000 (10:55 -0400)

committer Anna Schumaker <Anna.Schumaker@Netapp.com>

Mon, 19 Sep 2016 17:08:37 +0000 (13:08 -0400)
author Chuck Lever <chuck.lever@oracle.com>
Thu, 15 Sep 2016 14:55:20 +0000 (10:55 -0400)
committer Anna Schumaker <Anna.Schumaker@Netapp.com>
Mon, 19 Sep 2016 17:08:37 +0000 (13:08 -0400)
diff --git a/include/linux/sunrpc/sched.h b/include/linux/sunrpc/sched.h

index 817af0b4385ea384026b7f35e296e94211796974..38d4c1b378f2c6bf26d34796fdba07310b2258aa 100644 (file)
--- a/include/linux/sunrpc/sched.h
+++ b/include/linux/sunrpc/sched.h
@@ -239,7 +239,7 @@ struct rpc_task *rpc_wake_up_first(struct rpc_wait_queue *,
                                         void *);
  void           rpc_wake_up_status(struct rpc_wait_queue *, int);
  void           rpc_delay(struct rpc_task *, unsigned long);
-void *         rpc_malloc(struct rpc_task *, size_t);
+int            rpc_malloc(struct rpc_task *);
  void           rpc_free(void *);
  int            rpciod_up(void);
  void           rpciod_down(void);
diff --git a/include/linux/sunrpc/xprt.h b/include/linux/sunrpc/xprt.h

index 6f1d41b559a3f07280558b986c232233fcbe2910..c01f468fb374cc239743e2288a29795e3b7e34bf 100644 (file)
--- a/include/linux/sunrpc/xprt.h
+++ b/include/linux/sunrpc/xprt.h
@@ -127,7 +127,7 @@ struct rpc_xprt_ops {
         void            (*rpcbind)(struct rpc_task *task);
         void            (*set_port)(struct rpc_xprt *xprt, unsigned short port);
         void            (*connect)(struct rpc_xprt *xprt, struct rpc_task *task);
-       void *          (*buf_alloc)(struct rpc_task *task, size_t size);
+       int             (*buf_alloc)(struct rpc_task *task);
         void            (*buf_free)(void *buffer);
         int             (*send_request)(struct rpc_task *task);
         void            (*set_retrans_timeout)(struct rpc_task *task);
diff --git a/net/sunrpc/clnt.c b/net/sunrpc/clnt.c

index 6481986be7a71d3c6598027837c097780ce603e7..5499fda0c1f3dfbd02811b11e710d2a940168392 100644 (file)
--- a/net/sunrpc/clnt.c
+++ b/net/sunrpc/clnt.c
@@ -1691,6 +1691,7 @@ call_allocate(struct rpc_task *task)
         struct rpc_rqst *req = task->tk_rqstp;
         struct rpc_xprt *xprt = req->rq_xprt;
         struct rpc_procinfo *proc = task->tk_msg.rpc_proc;
+       int status;
  
         dprint_status(task);
  
@@ -1716,11 +1717,14 @@ call_allocate(struct rpc_task *task)
         req->rq_rcvsize = RPC_REPHDRSIZE + slack + proc->p_replen;
         req->rq_rcvsize <<= 2;
  
-       req->rq_buffer = xprt->ops->buf_alloc(task,
-                                       req->rq_callsize + req->rq_rcvsize);
-       if (req->rq_buffer != NULL)
-               return;
+       status = xprt->ops->buf_alloc(task);
         xprt_inject_disconnect(xprt);
+       if (status == 0)
+               return;
+       if (status != -ENOMEM) {
+               rpc_exit(task, status);
+               return;
+       }
  
         dprintk("RPC: %5u rpc_buffer allocation failed\n", task->tk_pid);
  
diff --git a/net/sunrpc/sched.c b/net/sunrpc/sched.c

index 9ae588511aafd9470736a4ff24a498c941b7ece3..b964d40b259bfdd91b52fddff933ddeba86d1265 100644 (file)
--- a/net/sunrpc/sched.c
+++ b/net/sunrpc/sched.c
@@ -849,14 +849,17 @@ static void rpc_async_schedule(struct work_struct *work)
  }
  
  /**
- * rpc_malloc - allocate an RPC buffer
- * @task: RPC task that will use this buffer
- * @size: requested byte size
+ * rpc_malloc - allocate RPC buffer resources
+ * @task: RPC task
+ *
+ * A single memory region is allocated, which is split between the
+ * RPC call and RPC reply that this task is being used for. When
+ * this RPC is retired, the memory is released by calling rpc_free.
   *
   * To prevent rpciod from hanging, this allocator never sleeps,
- * returning NULL and suppressing warning if the request cannot be serviced
- * immediately.
- * The caller can arrange to sleep in a way that is safe for rpciod.
+ * returning -ENOMEM and suppressing warnings if the request cannot
+ * be serviced immediately. The caller can arrange to sleep in a
+ * way that is safe for rpciod.
   *
   * Most requests are 'small' (under 2KiB) and can be serviced from a
   * mempool, ensuring that NFS reads and writes can always proceed,
@@ -865,8 +868,10 @@ static void rpc_async_schedule(struct work_struct *work)
   * In order to avoid memory starvation triggering more writebacks of
   * NFS requests, we avoid using GFP_KERNEL.
   */
-void *rpc_malloc(struct rpc_task *task, size_t size)
+int rpc_malloc(struct rpc_task *task)
  {
+       struct rpc_rqst *rqst = task->tk_rqstp;
+       size_t size = rqst->rq_callsize + rqst->rq_rcvsize;
         struct rpc_buffer *buf;
         gfp_t gfp = GFP_NOIO | __GFP_NOWARN;
  
@@ -880,12 +885,13 @@ void *rpc_malloc(struct rpc_task *task, size_t size)
                 buf = kmalloc(size, gfp);
  
         if (!buf)
-               return NULL;
+               return -ENOMEM;
  
         buf->len = size;
         dprintk("RPC: %5u allocated buffer of size %zu at %p\n",
                         task->tk_pid, size, buf);
-       return &buf->data;
+       rqst->rq_buffer = buf->data;
+       return 0;
  }
  EXPORT_SYMBOL_GPL(rpc_malloc);
  
diff --git a/net/sunrpc/xprtrdma/svc_rdma_backchannel.c b/net/sunrpc/xprtrdma/svc_rdma_backchannel.c

index a2a7519b0f23575d3b7e891973c5026634fe0537..124688ba67e5d4679456694da8fab39975920c30 100644 (file)
--- a/net/sunrpc/xprtrdma/svc_rdma_backchannel.c
+++ b/net/sunrpc/xprtrdma/svc_rdma_backchannel.c
@@ -159,29 +159,30 @@ out_unmap:
  /* Server-side transport endpoint wants a whole page for its send
   * buffer. The client RPC code constructs the RPC header in this
   * buffer before it invokes ->send_request.
- *
- * Returns NULL if there was a temporary allocation failure.
   */
-static void *
-xprt_rdma_bc_allocate(struct rpc_task *task, size_t size)
+static int
+xprt_rdma_bc_allocate(struct rpc_task *task)
  {
         struct rpc_rqst *rqst = task->tk_rqstp;
         struct svc_xprt *sxprt = rqst->rq_xprt->bc_xprt;
+       size_t size = rqst->rq_callsize;
         struct svcxprt_rdma *rdma;
         struct page *page;
  
         rdma = container_of(sxprt, struct svcxprt_rdma, sc_xprt);
  
-       /* Prevent an infinite loop: try to make this case work */
-       if (size > PAGE_SIZE)
+       if (size > PAGE_SIZE) {
                 WARN_ONCE(1, "svcrdma: large bc buffer request (size %zu)\n",
                           size);
+               return -EINVAL;
+       }
  
         page = alloc_page(RPCRDMA_DEF_GFP);
         if (!page)
-               return NULL;
+               return -ENOMEM;
  
-       return page_address(page);
+       rqst->rq_buffer = page_address(page);
+       return 0;
  }
  
  static void
diff --git a/net/sunrpc/xprtrdma/transport.c b/net/sunrpc/xprtrdma/transport.c

index be95eced0726741624351427e6f8f42b1570aa2d..daa7d4d43fd83113bcecb92e0482e481724892cd 100644 (file)
--- a/net/sunrpc/xprtrdma/transport.c
+++ b/net/sunrpc/xprtrdma/transport.c
@@ -477,7 +477,15 @@ xprt_rdma_connect(struct rpc_xprt *xprt, struct rpc_task *task)
         }
  }
  
-/*
+/**
+ * xprt_rdma_allocate - allocate transport resources for an RPC
+ * @task: RPC task
+ *
+ * Return values:
+ *        0:   Success; rq_buffer points to RPC buffer to use
+ *  -ENOMEM:   Out of memory, call again later
+ *     -EIO:   A permanent error occurred, do not retry
+ *
   * The RDMA allocate/free functions need the task structure as a place
   * to hide the struct rpcrdma_req, which is necessary for the actual send/recv
   * sequence.
@@ -486,11 +494,12 @@ xprt_rdma_connect(struct rpc_xprt *xprt, struct rpc_task *task)
   * (rq_send_buf and rq_rcv_buf are both part of a single contiguous buffer).
   * We may register rq_rcv_buf when using reply chunks.
   */
-static void *
-xprt_rdma_allocate(struct rpc_task *task, size_t size)
+static int
+xprt_rdma_allocate(struct rpc_task *task)
  {
-       struct rpc_xprt *xprt = task->tk_rqstp->rq_xprt;
-       struct rpcrdma_xprt *r_xprt = rpcx_to_rdmax(xprt);
+       struct rpc_rqst *rqst = task->tk_rqstp;
+       size_t size = rqst->rq_callsize + rqst->rq_rcvsize;
+       struct rpcrdma_xprt *r_xprt = rpcx_to_rdmax(rqst->rq_xprt);
         struct rpcrdma_regbuf *rb;
         struct rpcrdma_req *req;
         size_t min_size;
@@ -498,7 +507,7 @@ xprt_rdma_allocate(struct rpc_task *task, size_t size)
  
         req = rpcrdma_buffer_get(&r_xprt->rx_buf);
         if (req == NULL)
-               return NULL;
+               return -ENOMEM;
  
         flags = RPCRDMA_DEF_GFP;
         if (RPC_IS_SWAPPER(task))
@@ -515,7 +524,8 @@ out:
         dprintk("RPC:       %s: size %zd, request 0x%p\n", __func__, size, req);
         req->rl_connect_cookie = 0;     /* our reserved value */
         req->rl_task = task;
-       return req->rl_sendbuf->rg_base;
+       rqst->rq_buffer = req->rl_sendbuf->rg_base;
+       return 0;
  
  out_rdmabuf:
         min_size = r_xprt->rx_data.inline_wsize;
@@ -558,7 +568,7 @@ out_sendbuf:
  
  out_fail:
         rpcrdma_buffer_put(req);
-       return NULL;
+       return -ENOMEM;
  }
  
  /*
diff --git a/net/sunrpc/xprtsock.c b/net/sunrpc/xprtsock.c

index bf168838a0296e9387de33ad5afabb3bdf3b35f0..bd30b4b18d726ad4a9090d718688f914000c6eef 100644 (file)
--- a/net/sunrpc/xprtsock.c
+++ b/net/sunrpc/xprtsock.c
@@ -2533,23 +2533,28 @@ static void xs_tcp_print_stats(struct rpc_xprt *xprt, struct seq_file *seq)
   * we allocate pages instead doing a kmalloc like rpc_malloc is because we want
   * to use the server side send routines.
   */
-static void *bc_malloc(struct rpc_task *task, size_t size)
+static int bc_malloc(struct rpc_task *task)
  {
+       struct rpc_rqst *rqst = task->tk_rqstp;
+       size_t size = rqst->rq_callsize;
         struct page *page;
         struct rpc_buffer *buf;
  
-       WARN_ON_ONCE(size > PAGE_SIZE - sizeof(struct rpc_buffer));
-       if (size > PAGE_SIZE - sizeof(struct rpc_buffer))
-               return NULL;
+       if (size > PAGE_SIZE - sizeof(struct rpc_buffer)) {
+               WARN_ONCE(1, "xprtsock: large bc buffer request (size %zu)\n",
+                         size);
+               return -EINVAL;
+       }
  
         page = alloc_page(GFP_KERNEL);
         if (!page)
-               return NULL;
+               return -ENOMEM;
  
         buf = page_address(page);
         buf->len = PAGE_SIZE;
  
-       return buf->data;
+       rqst->rq_buffer = buf->data;
+       return 0;
  }
  
  /*
author	Chuck Lever <chuck.lever@oracle.com>
	Thu, 15 Sep 2016 14:55:20 +0000 (10:55 -0400)
committer	Anna Schumaker <Anna.Schumaker@Netapp.com>
	Mon, 19 Sep 2016 17:08:37 +0000 (13:08 -0400)
include/linux/sunrpc/sched.h		patch \| blob \| blame \| history
include/linux/sunrpc/xprt.h		patch \| blob \| blame \| history
net/sunrpc/clnt.c		patch \| blob \| blame \| history
net/sunrpc/sched.c		patch \| blob \| blame \| history
net/sunrpc/xprtrdma/svc_rdma_backchannel.c		patch \| blob \| blame \| history
net/sunrpc/xprtrdma/transport.c		patch \| blob \| blame \| history
net/sunrpc/xprtsock.c		patch \| blob \| blame \| history