2 * Copyright (c) 2005-2006 Network Appliance, Inc. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the BSD-type
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
14 * Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
17 * Redistributions in binary form must reproduce the above
18 * copyright notice, this list of conditions and the following
19 * disclaimer in the documentation and/or other materials provided
20 * with the distribution.
22 * Neither the name of the Network Appliance, Inc. nor the names of
23 * its contributors may be used to endorse or promote products
24 * derived from this software without specific prior written
27 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
28 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
29 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
30 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
31 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
32 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
33 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
34 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
35 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
36 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
37 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
39 * Author: Tom Tucker <tom@opengridcomputing.com>
41 #include <linux/module.h>
42 #include <linux/init.h>
44 #include <linux/sysctl.h>
45 #include <linux/sunrpc/clnt.h>
46 #include <linux/sunrpc/sched.h>
47 #include <linux/sunrpc/svc_rdma.h>
49 #define RPCDBG_FACILITY RPCDBG_SVCXPRT
/*
 * Tunables for the server-side RPC/RDMA transport, followed by the
 * bounds that this file's sysctl table passes to proc_dointvec_minmax
 * through .extra1/.extra2.
 */
51 /* RPC/RDMA parameters */
/* Default is RPCRDMA_ORD; exported by the sysctl table as "max_outbound_read_requests". */
52 unsigned int svcrdma_ord
= RPCRDMA_ORD
;
/*
 * NOTE(review): no reference to min_ord/max_ord is visible in this view;
 * presumably they bound svcrdma_ord -- confirm against the sysctl table.
 */
53 static unsigned int min_ord
= 1;
54 static unsigned int max_ord
= 4096;
/* Default is RPCRDMA_MAX_REQUESTS; exported by the sysctl table as "max_requests". */
55 unsigned int svcrdma_max_requests
= RPCRDMA_MAX_REQUESTS
;
/* Lower and upper bound attached to the "max_requests" sysctl entry. */
56 static unsigned int min_max_requests
= 4;
57 static unsigned int max_max_requests
= 16384;
/* Default is RPCRDMA_MAX_REQ_SIZE; exported by the sysctl table as "max_req_size". */
58 unsigned int svcrdma_max_req_size
= RPCRDMA_MAX_REQ_SIZE
;
/* Lower and upper bound attached to the "max_req_size" sysctl entry. */
59 static unsigned int min_max_inline
= 4096;
60 static unsigned int max_max_inline
= 65536;
/*
 * Statistics counters. Each one is published by an identically named
 * entry in svcrdma_parm_table whose handler is read_reset_stat().
 * The code that increments them is not part of this file view.
 */
62 atomic_t rdma_stat_recv
;
63 atomic_t rdma_stat_read
;
64 atomic_t rdma_stat_write
;
65 atomic_t rdma_stat_sq_starve
;
66 atomic_t rdma_stat_rq_starve
;
67 atomic_t rdma_stat_rq_poll
;
68 atomic_t rdma_stat_rq_prod
;
69 atomic_t rdma_stat_sq_poll
;
70 atomic_t rdma_stat_sq_prod
;
/*
 * Slab caches created in svc_rdma_init() and destroyed in
 * svc_rdma_cleanup(). The map cache is sized for
 * struct svc_rdma_req_map, the context cache for
 * struct svc_rdma_op_ctxt.
 */
72 /* Temporary NFS request map and context caches */
73 struct kmem_cache
*svc_rdma_map_cachep
;
74 struct kmem_cache
*svc_rdma_ctxt_cachep
;
77 * This function implements reading and resetting an atomic_t stat
78 * variable through read/write to a proc file. Any write to the file
79 * resets the associated statistic to zero. Any read returns its
/*
 * read_reset_stat - sysctl handler used by the rdma_stat_* table entries.
 *
 * table->data is interpreted as a pointer to the atomic_t counter.
 * On the read path visible here the counter is formatted as "%d\n"
 * into str_buf (snprintf bounded to 32 bytes), the length is then
 * recomputed with strlen(), and the text is copied to the user buffer
 * with copy_to_user().
 *
 * NOTE(review): several lines of this function are missing from this
 * view (rest of the signature, the write path, length clamping).
 *
 * NOTE(review): `data` is set to &str_buf[*ppos], but the
 * copy_to_user() call below passes `str_buf`. From what is visible, a
 * read at a non-zero *ppos would copy from the start of the buffer
 * rather than from the requested offset. Confirm `data` has no other
 * use, then pass `data` to copy_to_user().
 */
82 static int read_reset_stat(ctl_table
*table
, int write
,
83 struct file
*filp
, void __user
*buffer
, size_t *lenp
,
/* The sysctl entry's data pointer is the counter to report. */
86 atomic_t
*stat
= (atomic_t
*)table
->data
;
/* Render the current counter value as decimal text plus newline. */
96 int len
= snprintf(str_buf
, 32, "%d\n", atomic_read(stat
));
99 len
= strlen(str_buf
);
/* Start of the not-yet-read portion of the text for this file offset. */
104 data
= &str_buf
[*ppos
];
/* NOTE(review): copies from str_buf, not from data -- see header note. */
108 if (len
&& copy_to_user(buffer
, str_buf
, len
))
/*
 * Handle returned by register_sysctl_table() in svc_rdma_init().
 * svc_rdma_cleanup() unregisters it and resets it to NULL; init only
 * registers when it is currently NULL.
 */
116 static struct ctl_table_header
*svcrdma_table_header
;
/*
 * Leaf sysctl entries for the transport: three bounded integer
 * tunables handled by proc_dointvec_minmax, followed by nine
 * statistics counters handled by read_reset_stat().
 *
 * NOTE(review): entry delimiters and some fields (for example any
 * .mode lines) are not visible in this view.
 */
117 static ctl_table svcrdma_parm_table
[] = {
/* svcrdma_max_requests, bounded by min_max_requests..max_max_requests. */
119 .procname
= "max_requests",
120 .data
= &svcrdma_max_requests
,
121 .maxlen
= sizeof(unsigned int),
123 .proc_handler
= &proc_dointvec_minmax
,
124 .strategy
= &sysctl_intvec
,
125 .extra1
= &min_max_requests
,
126 .extra2
= &max_max_requests
/* svcrdma_max_req_size, bounded by min_max_inline..max_max_inline. */
129 .procname
= "max_req_size",
130 .data
= &svcrdma_max_req_size
,
131 .maxlen
= sizeof(unsigned int),
133 .proc_handler
= &proc_dointvec_minmax
,
134 .strategy
= &sysctl_intvec
,
135 .extra1
= &min_max_inline
,
136 .extra2
= &max_max_inline
/*
 * svcrdma_ord.
 * NOTE(review): no .extra1/.extra2 bounds are visible for this entry
 * in this view; presumably min_ord/max_ord -- confirm.
 */
139 .procname
= "max_outbound_read_requests",
140 .data
= &svcrdma_ord
,
141 .maxlen
= sizeof(unsigned int),
143 .proc_handler
= &proc_dointvec_minmax
,
144 .strategy
= &sysctl_intvec
,
/* Statistics counters: each entry points at one atomic_t. */
150 .procname
= "rdma_stat_read",
151 .data
= &rdma_stat_read
,
152 .maxlen
= sizeof(atomic_t
),
154 .proc_handler
= &read_reset_stat
,
157 .procname
= "rdma_stat_recv",
158 .data
= &rdma_stat_recv
,
159 .maxlen
= sizeof(atomic_t
),
161 .proc_handler
= &read_reset_stat
,
164 .procname
= "rdma_stat_write",
165 .data
= &rdma_stat_write
,
166 .maxlen
= sizeof(atomic_t
),
168 .proc_handler
= &read_reset_stat
,
171 .procname
= "rdma_stat_sq_starve",
172 .data
= &rdma_stat_sq_starve
,
173 .maxlen
= sizeof(atomic_t
),
175 .proc_handler
= &read_reset_stat
,
178 .procname
= "rdma_stat_rq_starve",
179 .data
= &rdma_stat_rq_starve
,
180 .maxlen
= sizeof(atomic_t
),
182 .proc_handler
= &read_reset_stat
,
185 .procname
= "rdma_stat_rq_poll",
186 .data
= &rdma_stat_rq_poll
,
187 .maxlen
= sizeof(atomic_t
),
189 .proc_handler
= &read_reset_stat
,
192 .procname
= "rdma_stat_rq_prod",
193 .data
= &rdma_stat_rq_prod
,
194 .maxlen
= sizeof(atomic_t
),
196 .proc_handler
= &read_reset_stat
,
199 .procname
= "rdma_stat_sq_poll",
200 .data
= &rdma_stat_sq_poll
,
201 .maxlen
= sizeof(atomic_t
),
203 .proc_handler
= &read_reset_stat
,
206 .procname
= "rdma_stat_sq_prod",
207 .data
= &rdma_stat_sq_prod
,
208 .maxlen
= sizeof(atomic_t
),
210 .proc_handler
= &read_reset_stat
,
/*
 * Intermediate sysctl level: a single "svc_rdma" entry whose children
 * are the leaf entries in svcrdma_parm_table.
 */
217 static ctl_table svcrdma_table
[] = {
219 .procname
= "svc_rdma",
221 .child
= svcrdma_parm_table
/*
 * Top sysctl level handed to register_sysctl_table() in
 * svc_rdma_init(): a "sunrpc" entry (ctl_name CTL_SUNRPC) whose child
 * is svcrdma_table. The tunables therefore presumably appear under
 * sunrpc/svc_rdma/ in the sysctl tree -- confirm on a running system.
 */
228 static ctl_table svcrdma_root_table
[] = {
230 .ctl_name
= CTL_SUNRPC
,
231 .procname
= "sunrpc",
233 .child
= svcrdma_table
/*
 * svc_rdma_cleanup - module exit handler (registered via module_exit).
 *
 * In order: flushes scheduled work, unregisters the sysctl table if
 * one is registered, unregisters the svc_rdma transport class, then
 * destroys the map and context slab caches.
 */
240 void svc_rdma_cleanup(void)
242 dprintk("SVCRDMA Module Removed, deregister RPC RDMA transport\n");
/* NOTE(review): presumably waits for outstanding deferred work before teardown -- confirm. */
243 flush_scheduled_work();
/* Only unregister when a table is registered; clear the handle afterwards. */
244 if (svcrdma_table_header
) {
245 unregister_sysctl_table(svcrdma_table_header
);
246 svcrdma_table_header
= NULL
;
248 svc_unreg_xprt_class(&svc_rdma_class
);
/* Release both caches created in svc_rdma_init(). */
249 kmem_cache_destroy(svc_rdma_map_cachep
);
250 kmem_cache_destroy(svc_rdma_ctxt_cachep
);
/*
 * svc_rdma_init - module init handler (registered via module_init).
 *
 * Logs the current tunables through dprintk, registers the sysctl
 * table if it is not already registered, creates the request-map and
 * context slab caches, and registers the svc_rdma transport class.
 *
 * NOTE(review): the return statements, goto targets and error labels
 * are not visible in this view. The two calls at the end appear to be
 * the unwind path: destroy the map cache, then unregister the sysctl
 * table.
 *
 * NOTE(review): the visible unwind path does not reset
 * svcrdma_table_header to NULL after unregistering, unlike
 * svc_rdma_cleanup() -- confirm against the full source.
 */
253 int svc_rdma_init(void)
255 dprintk("SVCRDMA Module Init, register RPC RDMA transport\n");
256 dprintk("\tsvcrdma_ord : %d\n", svcrdma_ord
);
257 dprintk("\tmax_requests : %d\n", svcrdma_max_requests
);
/* sq_depth is reported as max_requests scaled by RPCRDMA_SQ_DEPTH_MULT. */
258 dprintk("\tsq_depth : %d\n",
259 svcrdma_max_requests
* RPCRDMA_SQ_DEPTH_MULT
);
260 dprintk("\tmax_inline : %d\n", svcrdma_max_req_size
);
/* Register the sysctl hierarchy only once. */
261 if (!svcrdma_table_header
)
262 svcrdma_table_header
=
263 register_sysctl_table(svcrdma_root_table
);
265 /* Create the temporary map cache */
266 svc_rdma_map_cachep
= kmem_cache_create("svc_rdma_map_cache",
267 sizeof(struct svc_rdma_req_map
),
271 if (!svc_rdma_map_cachep
) {
272 printk(KERN_INFO
"Could not allocate map cache.\n");
276 /* Create the temporary context cache */
277 svc_rdma_ctxt_cachep
=
278 kmem_cache_create("svc_rdma_ctxt_cache",
279 sizeof(struct svc_rdma_op_ctxt
),
283 if (!svc_rdma_ctxt_cachep
) {
284 printk(KERN_INFO
"Could not allocate WR ctxt cache.\n");
288 /* Register RDMA with the SVC transport switch */
289 svc_reg_xprt_class(&svc_rdma_class
);
/* Unwind (see header note): release the map cache, then the sysctl table. */
292 kmem_cache_destroy(svc_rdma_map_cachep
);
294 unregister_sysctl_table(svcrdma_table_header
);
/*
 * Module metadata and entry points: svc_rdma_init() is the module
 * init handler and svc_rdma_cleanup() the module exit handler.
 */
297 MODULE_AUTHOR("Tom Tucker <tom@opengridcomputing.com>");
298 MODULE_DESCRIPTION("SVC RDMA Transport");
299 MODULE_LICENSE("Dual BSD/GPL");
300 module_init(svc_rdma_init
);
301 module_exit(svc_rdma_cleanup
);