Loading...
1/*
2 * Copyright (c) 2005-2006 Network Appliance, Inc. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the BSD-type
8 * license below:
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 *
14 * Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 *
17 * Redistributions in binary form must reproduce the above
18 * copyright notice, this list of conditions and the following
19 * disclaimer in the documentation and/or other materials provided
20 * with the distribution.
21 *
22 * Neither the name of the Network Appliance, Inc. nor the names of
23 * its contributors may be used to endorse or promote products
24 * derived from this software without specific prior written
25 * permission.
26 *
27 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
28 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
29 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
30 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
31 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
32 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
33 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
34 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
35 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
36 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
37 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
38 *
39 * Author: Tom Tucker <tom@opengridcomputing.com>
40 */
41
42#include <linux/slab.h>
43#include <linux/fs.h>
44#include <linux/sysctl.h>
45#include <linux/workqueue.h>
46#include <linux/sunrpc/clnt.h>
47#include <linux/sunrpc/sched.h>
48#include <linux/sunrpc/svc_rdma.h>
49#include "xprt_rdma.h"
50
51#define RPCDBG_FACILITY RPCDBG_SVCXPRT
52
53/* RPC/RDMA parameters */
54unsigned int svcrdma_ord = RPCRDMA_ORD;
55static unsigned int min_ord = 1;
56static unsigned int max_ord = 4096;
57unsigned int svcrdma_max_requests = RPCRDMA_MAX_REQUESTS;
58unsigned int svcrdma_max_bc_requests = RPCRDMA_MAX_BC_REQUESTS;
59static unsigned int min_max_requests = 4;
60static unsigned int max_max_requests = 16384;
61unsigned int svcrdma_max_req_size = RPCRDMA_MAX_REQ_SIZE;
62static unsigned int min_max_inline = 4096;
63static unsigned int max_max_inline = 65536;
64
65atomic_t rdma_stat_recv;
66atomic_t rdma_stat_read;
67atomic_t rdma_stat_write;
68atomic_t rdma_stat_sq_starve;
69atomic_t rdma_stat_rq_starve;
70atomic_t rdma_stat_rq_poll;
71atomic_t rdma_stat_rq_prod;
72atomic_t rdma_stat_sq_poll;
73atomic_t rdma_stat_sq_prod;
74
75struct workqueue_struct *svc_rdma_wq;
76
77/*
78 * This function implements reading and resetting an atomic_t stat
79 * variable through read/write to a proc file. Any write to the file
80 * resets the associated statistic to zero. Any read returns it's
81 * current value.
82 */
83static int read_reset_stat(struct ctl_table *table, int write,
84 void __user *buffer, size_t *lenp,
85 loff_t *ppos)
86{
87 atomic_t *stat = (atomic_t *)table->data;
88
89 if (!stat)
90 return -EINVAL;
91
92 if (write)
93 atomic_set(stat, 0);
94 else {
95 char str_buf[32];
96 char *data;
97 int len = snprintf(str_buf, 32, "%d\n", atomic_read(stat));
98 if (len >= 32)
99 return -EFAULT;
100 len = strlen(str_buf);
101 if (*ppos > len) {
102 *lenp = 0;
103 return 0;
104 }
105 data = &str_buf[*ppos];
106 len -= *ppos;
107 if (len > *lenp)
108 len = *lenp;
109 if (len && copy_to_user(buffer, str_buf, len))
110 return -EFAULT;
111 *lenp = len;
112 *ppos += len;
113 }
114 return 0;
115}
116
117static struct ctl_table_header *svcrdma_table_header;
118static struct ctl_table svcrdma_parm_table[] = {
119 {
120 .procname = "max_requests",
121 .data = &svcrdma_max_requests,
122 .maxlen = sizeof(unsigned int),
123 .mode = 0644,
124 .proc_handler = proc_dointvec_minmax,
125 .extra1 = &min_max_requests,
126 .extra2 = &max_max_requests
127 },
128 {
129 .procname = "max_req_size",
130 .data = &svcrdma_max_req_size,
131 .maxlen = sizeof(unsigned int),
132 .mode = 0644,
133 .proc_handler = proc_dointvec_minmax,
134 .extra1 = &min_max_inline,
135 .extra2 = &max_max_inline
136 },
137 {
138 .procname = "max_outbound_read_requests",
139 .data = &svcrdma_ord,
140 .maxlen = sizeof(unsigned int),
141 .mode = 0644,
142 .proc_handler = proc_dointvec_minmax,
143 .extra1 = &min_ord,
144 .extra2 = &max_ord,
145 },
146
147 {
148 .procname = "rdma_stat_read",
149 .data = &rdma_stat_read,
150 .maxlen = sizeof(atomic_t),
151 .mode = 0644,
152 .proc_handler = read_reset_stat,
153 },
154 {
155 .procname = "rdma_stat_recv",
156 .data = &rdma_stat_recv,
157 .maxlen = sizeof(atomic_t),
158 .mode = 0644,
159 .proc_handler = read_reset_stat,
160 },
161 {
162 .procname = "rdma_stat_write",
163 .data = &rdma_stat_write,
164 .maxlen = sizeof(atomic_t),
165 .mode = 0644,
166 .proc_handler = read_reset_stat,
167 },
168 {
169 .procname = "rdma_stat_sq_starve",
170 .data = &rdma_stat_sq_starve,
171 .maxlen = sizeof(atomic_t),
172 .mode = 0644,
173 .proc_handler = read_reset_stat,
174 },
175 {
176 .procname = "rdma_stat_rq_starve",
177 .data = &rdma_stat_rq_starve,
178 .maxlen = sizeof(atomic_t),
179 .mode = 0644,
180 .proc_handler = read_reset_stat,
181 },
182 {
183 .procname = "rdma_stat_rq_poll",
184 .data = &rdma_stat_rq_poll,
185 .maxlen = sizeof(atomic_t),
186 .mode = 0644,
187 .proc_handler = read_reset_stat,
188 },
189 {
190 .procname = "rdma_stat_rq_prod",
191 .data = &rdma_stat_rq_prod,
192 .maxlen = sizeof(atomic_t),
193 .mode = 0644,
194 .proc_handler = read_reset_stat,
195 },
196 {
197 .procname = "rdma_stat_sq_poll",
198 .data = &rdma_stat_sq_poll,
199 .maxlen = sizeof(atomic_t),
200 .mode = 0644,
201 .proc_handler = read_reset_stat,
202 },
203 {
204 .procname = "rdma_stat_sq_prod",
205 .data = &rdma_stat_sq_prod,
206 .maxlen = sizeof(atomic_t),
207 .mode = 0644,
208 .proc_handler = read_reset_stat,
209 },
210 { },
211};
212
213static struct ctl_table svcrdma_table[] = {
214 {
215 .procname = "svc_rdma",
216 .mode = 0555,
217 .child = svcrdma_parm_table
218 },
219 { },
220};
221
222static struct ctl_table svcrdma_root_table[] = {
223 {
224 .procname = "sunrpc",
225 .mode = 0555,
226 .child = svcrdma_table
227 },
228 { },
229};
230
231void svc_rdma_cleanup(void)
232{
233 dprintk("SVCRDMA Module Removed, deregister RPC RDMA transport\n");
234 destroy_workqueue(svc_rdma_wq);
235 if (svcrdma_table_header) {
236 unregister_sysctl_table(svcrdma_table_header);
237 svcrdma_table_header = NULL;
238 }
239#if defined(CONFIG_SUNRPC_BACKCHANNEL)
240 svc_unreg_xprt_class(&svc_rdma_bc_class);
241#endif
242 svc_unreg_xprt_class(&svc_rdma_class);
243}
244
245int svc_rdma_init(void)
246{
247 dprintk("SVCRDMA Module Init, register RPC RDMA transport\n");
248 dprintk("\tsvcrdma_ord : %d\n", svcrdma_ord);
249 dprintk("\tmax_requests : %u\n", svcrdma_max_requests);
250 dprintk("\tsq_depth : %u\n",
251 svcrdma_max_requests * RPCRDMA_SQ_DEPTH_MULT);
252 dprintk("\tmax_bc_requests : %u\n", svcrdma_max_bc_requests);
253 dprintk("\tmax_inline : %d\n", svcrdma_max_req_size);
254
255 svc_rdma_wq = alloc_workqueue("svc_rdma", 0, 0);
256 if (!svc_rdma_wq)
257 return -ENOMEM;
258
259 if (!svcrdma_table_header)
260 svcrdma_table_header =
261 register_sysctl_table(svcrdma_root_table);
262
263 /* Register RDMA with the SVC transport switch */
264 svc_reg_xprt_class(&svc_rdma_class);
265#if defined(CONFIG_SUNRPC_BACKCHANNEL)
266 svc_reg_xprt_class(&svc_rdma_bc_class);
267#endif
268 return 0;
269}
1// SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause
2/*
3 * Copyright (c) 2015-2018 Oracle. All rights reserved.
4 * Copyright (c) 2005-2006 Network Appliance, Inc. All rights reserved.
5 *
6 * This software is available to you under a choice of one of two
7 * licenses. You may choose to be licensed under the terms of the GNU
8 * General Public License (GPL) Version 2, available from the file
9 * COPYING in the main directory of this source tree, or the BSD-type
10 * license below:
11 *
12 * Redistribution and use in source and binary forms, with or without
13 * modification, are permitted provided that the following conditions
14 * are met:
15 *
16 * Redistributions of source code must retain the above copyright
17 * notice, this list of conditions and the following disclaimer.
18 *
19 * Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials provided
22 * with the distribution.
23 *
24 * Neither the name of the Network Appliance, Inc. nor the names of
25 * its contributors may be used to endorse or promote products
26 * derived from this software without specific prior written
27 * permission.
28 *
29 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
30 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
31 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
32 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
33 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
34 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
35 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
36 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
37 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
38 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
39 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
40 *
41 * Author: Tom Tucker <tom@opengridcomputing.com>
42 */
43
44#include <linux/slab.h>
45#include <linux/fs.h>
46#include <linux/sysctl.h>
47#include <linux/workqueue.h>
48#include <linux/sunrpc/clnt.h>
49#include <linux/sunrpc/sched.h>
50#include <linux/sunrpc/svc_rdma.h>
51
52#define RPCDBG_FACILITY RPCDBG_SVCXPRT
53
54/* RPC/RDMA parameters */
55unsigned int svcrdma_ord = 16; /* historical default */
56static unsigned int min_ord = 1;
57static unsigned int max_ord = 255;
58unsigned int svcrdma_max_requests = RPCRDMA_MAX_REQUESTS;
59unsigned int svcrdma_max_bc_requests = RPCRDMA_MAX_BC_REQUESTS;
60static unsigned int min_max_requests = 4;
61static unsigned int max_max_requests = 16384;
62unsigned int svcrdma_max_req_size = RPCRDMA_DEF_INLINE_THRESH;
63static unsigned int min_max_inline = RPCRDMA_DEF_INLINE_THRESH;
64static unsigned int max_max_inline = RPCRDMA_MAX_INLINE_THRESH;
65static unsigned int svcrdma_stat_unused;
66static unsigned int zero;
67
68struct percpu_counter svcrdma_stat_read;
69struct percpu_counter svcrdma_stat_recv;
70struct percpu_counter svcrdma_stat_sq_starve;
71struct percpu_counter svcrdma_stat_write;
72
/* Size constant used for the counter sysctl entries (.maxlen) */
enum { SVCRDMA_COUNTER_BUFSIZ = sizeof(unsigned long long) };
76
77static int svcrdma_counter_handler(struct ctl_table *table, int write,
78 void *buffer, size_t *lenp, loff_t *ppos)
79{
80 struct percpu_counter *stat = (struct percpu_counter *)table->data;
81 char tmp[SVCRDMA_COUNTER_BUFSIZ + 1];
82 int len;
83
84 if (write) {
85 percpu_counter_set(stat, 0);
86 return 0;
87 }
88
89 len = snprintf(tmp, SVCRDMA_COUNTER_BUFSIZ, "%lld\n",
90 percpu_counter_sum_positive(stat));
91 if (len >= SVCRDMA_COUNTER_BUFSIZ)
92 return -EFAULT;
93 len = strlen(tmp);
94 if (*ppos > len) {
95 *lenp = 0;
96 return 0;
97 }
98 len -= *ppos;
99 if (len > *lenp)
100 len = *lenp;
101 if (len)
102 memcpy(buffer, tmp, len);
103 *lenp = len;
104 *ppos += len;
105
106 return 0;
107}
108
109static struct ctl_table_header *svcrdma_table_header;
110static struct ctl_table svcrdma_parm_table[] = {
111 {
112 .procname = "max_requests",
113 .data = &svcrdma_max_requests,
114 .maxlen = sizeof(unsigned int),
115 .mode = 0644,
116 .proc_handler = proc_dointvec_minmax,
117 .extra1 = &min_max_requests,
118 .extra2 = &max_max_requests
119 },
120 {
121 .procname = "max_req_size",
122 .data = &svcrdma_max_req_size,
123 .maxlen = sizeof(unsigned int),
124 .mode = 0644,
125 .proc_handler = proc_dointvec_minmax,
126 .extra1 = &min_max_inline,
127 .extra2 = &max_max_inline
128 },
129 {
130 .procname = "max_outbound_read_requests",
131 .data = &svcrdma_ord,
132 .maxlen = sizeof(unsigned int),
133 .mode = 0644,
134 .proc_handler = proc_dointvec_minmax,
135 .extra1 = &min_ord,
136 .extra2 = &max_ord,
137 },
138
139 {
140 .procname = "rdma_stat_read",
141 .data = &svcrdma_stat_read,
142 .maxlen = SVCRDMA_COUNTER_BUFSIZ,
143 .mode = 0644,
144 .proc_handler = svcrdma_counter_handler,
145 },
146 {
147 .procname = "rdma_stat_recv",
148 .data = &svcrdma_stat_recv,
149 .maxlen = SVCRDMA_COUNTER_BUFSIZ,
150 .mode = 0644,
151 .proc_handler = svcrdma_counter_handler,
152 },
153 {
154 .procname = "rdma_stat_write",
155 .data = &svcrdma_stat_write,
156 .maxlen = SVCRDMA_COUNTER_BUFSIZ,
157 .mode = 0644,
158 .proc_handler = svcrdma_counter_handler,
159 },
160 {
161 .procname = "rdma_stat_sq_starve",
162 .data = &svcrdma_stat_sq_starve,
163 .maxlen = SVCRDMA_COUNTER_BUFSIZ,
164 .mode = 0644,
165 .proc_handler = svcrdma_counter_handler,
166 },
167 {
168 .procname = "rdma_stat_rq_starve",
169 .data = &svcrdma_stat_unused,
170 .maxlen = sizeof(unsigned int),
171 .mode = 0644,
172 .proc_handler = proc_dointvec_minmax,
173 .extra1 = &zero,
174 .extra2 = &zero,
175 },
176 {
177 .procname = "rdma_stat_rq_poll",
178 .data = &svcrdma_stat_unused,
179 .maxlen = sizeof(unsigned int),
180 .mode = 0644,
181 .proc_handler = proc_dointvec_minmax,
182 .extra1 = &zero,
183 .extra2 = &zero,
184 },
185 {
186 .procname = "rdma_stat_rq_prod",
187 .data = &svcrdma_stat_unused,
188 .maxlen = sizeof(unsigned int),
189 .mode = 0644,
190 .proc_handler = proc_dointvec_minmax,
191 .extra1 = &zero,
192 .extra2 = &zero,
193 },
194 {
195 .procname = "rdma_stat_sq_poll",
196 .data = &svcrdma_stat_unused,
197 .maxlen = sizeof(unsigned int),
198 .mode = 0644,
199 .proc_handler = proc_dointvec_minmax,
200 .extra1 = &zero,
201 .extra2 = &zero,
202 },
203 {
204 .procname = "rdma_stat_sq_prod",
205 .data = &svcrdma_stat_unused,
206 .maxlen = sizeof(unsigned int),
207 .mode = 0644,
208 .proc_handler = proc_dointvec_minmax,
209 .extra1 = &zero,
210 .extra2 = &zero,
211 },
212 { },
213};
214
215static struct ctl_table svcrdma_table[] = {
216 {
217 .procname = "svc_rdma",
218 .mode = 0555,
219 .child = svcrdma_parm_table
220 },
221 { },
222};
223
224static struct ctl_table svcrdma_root_table[] = {
225 {
226 .procname = "sunrpc",
227 .mode = 0555,
228 .child = svcrdma_table
229 },
230 { },
231};
232
233static void svc_rdma_proc_cleanup(void)
234{
235 if (!svcrdma_table_header)
236 return;
237 unregister_sysctl_table(svcrdma_table_header);
238 svcrdma_table_header = NULL;
239
240 percpu_counter_destroy(&svcrdma_stat_write);
241 percpu_counter_destroy(&svcrdma_stat_sq_starve);
242 percpu_counter_destroy(&svcrdma_stat_recv);
243 percpu_counter_destroy(&svcrdma_stat_read);
244}
245
246static int svc_rdma_proc_init(void)
247{
248 int rc;
249
250 if (svcrdma_table_header)
251 return 0;
252
253 rc = percpu_counter_init(&svcrdma_stat_read, 0, GFP_KERNEL);
254 if (rc)
255 goto out_err;
256 rc = percpu_counter_init(&svcrdma_stat_recv, 0, GFP_KERNEL);
257 if (rc)
258 goto out_err;
259 rc = percpu_counter_init(&svcrdma_stat_sq_starve, 0, GFP_KERNEL);
260 if (rc)
261 goto out_err;
262 rc = percpu_counter_init(&svcrdma_stat_write, 0, GFP_KERNEL);
263 if (rc)
264 goto out_err;
265
266 svcrdma_table_header = register_sysctl_table(svcrdma_root_table);
267 return 0;
268
269out_err:
270 percpu_counter_destroy(&svcrdma_stat_sq_starve);
271 percpu_counter_destroy(&svcrdma_stat_recv);
272 percpu_counter_destroy(&svcrdma_stat_read);
273 return rc;
274}
275
276void svc_rdma_cleanup(void)
277{
278 dprintk("SVCRDMA Module Removed, deregister RPC RDMA transport\n");
279 svc_unreg_xprt_class(&svc_rdma_class);
280 svc_rdma_proc_cleanup();
281}
282
283int svc_rdma_init(void)
284{
285 int rc;
286
287 dprintk("SVCRDMA Module Init, register RPC RDMA transport\n");
288 dprintk("\tsvcrdma_ord : %d\n", svcrdma_ord);
289 dprintk("\tmax_requests : %u\n", svcrdma_max_requests);
290 dprintk("\tmax_bc_requests : %u\n", svcrdma_max_bc_requests);
291 dprintk("\tmax_inline : %d\n", svcrdma_max_req_size);
292
293 rc = svc_rdma_proc_init();
294 if (rc)
295 return rc;
296
297 /* Register RDMA with the SVC transport switch */
298 svc_reg_xprt_class(&svc_rdma_class);
299 return 0;
300}