// SPDX-License-Identifier: GPL-2.0
/*
 *  Shared Memory Communications over RDMA (SMC-R) and RoCE
 *
 *  smc_sysctl.c: sysctl interface to SMC subsystem.
 *
 *  Copyright (c) 2022, Alibaba Inc.
 *
 *  Author: Tony Lu <tonylu@linux.alibaba.com>
 *
 */
12462791bbSDust Li
13462791bbSDust Li #include <linux/init.h>
14462791bbSDust Li #include <linux/sysctl.h>
15462791bbSDust Li #include <net/net_namespace.h>
16462791bbSDust Li
1712bbb0d1SDust Li #include "smc.h"
184bc5008eSWen Gu #include "smc_core.h"
1977eee325SWen Gu #include "smc_llc.h"
20462791bbSDust Li #include "smc_sysctl.h"
21462791bbSDust Li
220227f058STony Lu static int min_sndbuf = SMC_BUF_MIN_SIZE;
230227f058STony Lu static int min_rcvbuf = SMC_BUF_MIN_SIZE;
24833bac7eSGerd Bayer static int max_sndbuf = INT_MAX / 2;
25833bac7eSGerd Bayer static int max_rcvbuf = INT_MAX / 2;
26833bac7eSGerd Bayer static const int net_smc_wmem_init = (64 * 1024);
27833bac7eSGerd Bayer static const int net_smc_rmem_init = (64 * 1024);
28f8e80fc4SGuangguan Wang static int links_per_lgr_min = SMC_LINKS_ADD_LNK_MIN;
29f8e80fc4SGuangguan Wang static int links_per_lgr_max = SMC_LINKS_ADD_LNK_MAX;
301f2c9dd7SGuangguan Wang static int conns_per_lgr_min = SMC_CONN_PER_LGR_MIN;
311f2c9dd7SGuangguan Wang static int conns_per_lgr_max = SMC_CONN_PER_LGR_MAX;
320227f058STony Lu
33462791bbSDust Li static struct ctl_table smc_table[] = {
3412bbb0d1SDust Li {
3512bbb0d1SDust Li .procname = "autocorking_size",
3612bbb0d1SDust Li .data = &init_net.smc.sysctl_autocorking_size,
3712bbb0d1SDust Li .maxlen = sizeof(unsigned int),
3812bbb0d1SDust Li .mode = 0644,
3912bbb0d1SDust Li .proc_handler = proc_douintvec,
4012bbb0d1SDust Li },
414bc5008eSWen Gu {
424bc5008eSWen Gu .procname = "smcr_buf_type",
434bc5008eSWen Gu .data = &init_net.smc.sysctl_smcr_buf_type,
444bc5008eSWen Gu .maxlen = sizeof(unsigned int),
454bc5008eSWen Gu .mode = 0644,
464bc5008eSWen Gu .proc_handler = proc_douintvec_minmax,
474bc5008eSWen Gu .extra1 = SYSCTL_ZERO,
484bc5008eSWen Gu .extra2 = SYSCTL_TWO,
494bc5008eSWen Gu },
5077eee325SWen Gu {
5177eee325SWen Gu .procname = "smcr_testlink_time",
5277eee325SWen Gu .data = &init_net.smc.sysctl_smcr_testlink_time,
5377eee325SWen Gu .maxlen = sizeof(int),
5477eee325SWen Gu .mode = 0644,
5577eee325SWen Gu .proc_handler = proc_dointvec_jiffies,
5677eee325SWen Gu },
570227f058STony Lu {
580227f058STony Lu .procname = "wmem",
590227f058STony Lu .data = &init_net.smc.sysctl_wmem,
600227f058STony Lu .maxlen = sizeof(int),
610227f058STony Lu .mode = 0644,
620227f058STony Lu .proc_handler = proc_dointvec_minmax,
630227f058STony Lu .extra1 = &min_sndbuf,
64833bac7eSGerd Bayer .extra2 = &max_sndbuf,
650227f058STony Lu },
660227f058STony Lu {
670227f058STony Lu .procname = "rmem",
680227f058STony Lu .data = &init_net.smc.sysctl_rmem,
690227f058STony Lu .maxlen = sizeof(int),
700227f058STony Lu .mode = 0644,
710227f058STony Lu .proc_handler = proc_dointvec_minmax,
720227f058STony Lu .extra1 = &min_rcvbuf,
73833bac7eSGerd Bayer .extra2 = &max_rcvbuf,
740227f058STony Lu },
75f8e80fc4SGuangguan Wang {
76f8e80fc4SGuangguan Wang .procname = "smcr_max_links_per_lgr",
77f8e80fc4SGuangguan Wang .data = &init_net.smc.sysctl_max_links_per_lgr,
78f8e80fc4SGuangguan Wang .maxlen = sizeof(int),
79f8e80fc4SGuangguan Wang .mode = 0644,
80f8e80fc4SGuangguan Wang .proc_handler = proc_dointvec_minmax,
81f8e80fc4SGuangguan Wang .extra1 = &links_per_lgr_min,
82f8e80fc4SGuangguan Wang .extra2 = &links_per_lgr_max,
83f8e80fc4SGuangguan Wang },
841f2c9dd7SGuangguan Wang {
851f2c9dd7SGuangguan Wang .procname = "smcr_max_conns_per_lgr",
861f2c9dd7SGuangguan Wang .data = &init_net.smc.sysctl_max_conns_per_lgr,
871f2c9dd7SGuangguan Wang .maxlen = sizeof(int),
881f2c9dd7SGuangguan Wang .mode = 0644,
891f2c9dd7SGuangguan Wang .proc_handler = proc_dointvec_minmax,
901f2c9dd7SGuangguan Wang .extra1 = &conns_per_lgr_min,
911f2c9dd7SGuangguan Wang .extra2 = &conns_per_lgr_max,
921f2c9dd7SGuangguan Wang },
93*f8406a2fSD. Wythe {
94*f8406a2fSD. Wythe .procname = "limit_smc_hs",
95*f8406a2fSD. Wythe .data = &init_net.smc.limit_smc_hs,
96*f8406a2fSD. Wythe .maxlen = sizeof(int),
97*f8406a2fSD. Wythe .mode = 0644,
98*f8406a2fSD. Wythe .proc_handler = proc_dointvec_minmax,
99*f8406a2fSD. Wythe .extra1 = SYSCTL_ZERO,
100*f8406a2fSD. Wythe .extra2 = SYSCTL_ONE,
101*f8406a2fSD. Wythe },
102462791bbSDust Li };
103462791bbSDust Li
smc_sysctl_net_init(struct net * net)1047de8eb0dSDust Li int __net_init smc_sysctl_net_init(struct net *net)
105462791bbSDust Li {
10673dbd8cfSJoel Granados size_t table_size = ARRAY_SIZE(smc_table);
107462791bbSDust Li struct ctl_table *table;
108462791bbSDust Li
109462791bbSDust Li table = smc_table;
110462791bbSDust Li if (!net_eq(net, &init_net)) {
111462791bbSDust Li int i;
112462791bbSDust Li
113462791bbSDust Li table = kmemdup(table, sizeof(smc_table), GFP_KERNEL);
114462791bbSDust Li if (!table)
115462791bbSDust Li goto err_alloc;
116462791bbSDust Li
11773dbd8cfSJoel Granados for (i = 0; i < table_size; i++)
118462791bbSDust Li table[i].data += (void *)net - (void *)&init_net;
119462791bbSDust Li }
120462791bbSDust Li
121c899710fSJoel Granados net->smc.smc_hdr = register_net_sysctl_sz(net, "net/smc", table,
12273dbd8cfSJoel Granados table_size);
123462791bbSDust Li if (!net->smc.smc_hdr)
124462791bbSDust Li goto err_reg;
125462791bbSDust Li
12612bbb0d1SDust Li net->smc.sysctl_autocorking_size = SMC_AUTOCORKING_DEFAULT_SIZE;
1274bc5008eSWen Gu net->smc.sysctl_smcr_buf_type = SMCR_PHYS_CONT_BUFS;
12877eee325SWen Gu net->smc.sysctl_smcr_testlink_time = SMC_LLC_TESTLINK_DEFAULT_TIME;
129833bac7eSGerd Bayer WRITE_ONCE(net->smc.sysctl_wmem, net_smc_wmem_init);
130833bac7eSGerd Bayer WRITE_ONCE(net->smc.sysctl_rmem, net_smc_rmem_init);
131f8e80fc4SGuangguan Wang net->smc.sysctl_max_links_per_lgr = SMC_LINKS_PER_LGR_MAX_PREFER;
1321f2c9dd7SGuangguan Wang net->smc.sysctl_max_conns_per_lgr = SMC_CONN_PER_LGR_PREFER;
133*f8406a2fSD. Wythe /* disable handshake limitation by default */
134*f8406a2fSD. Wythe net->smc.limit_smc_hs = 0;
13512bbb0d1SDust Li
136462791bbSDust Li return 0;
137462791bbSDust Li
138462791bbSDust Li err_reg:
139462791bbSDust Li if (!net_eq(net, &init_net))
140462791bbSDust Li kfree(table);
141462791bbSDust Li err_alloc:
142462791bbSDust Li return -ENOMEM;
143462791bbSDust Li }
144462791bbSDust Li
smc_sysctl_net_exit(struct net * net)1457de8eb0dSDust Li void __net_exit smc_sysctl_net_exit(struct net *net)
146462791bbSDust Li {
147bfa858f2SThomas Weißschuh const struct ctl_table *table;
1485ae6acf1SEric Dumazet
1495ae6acf1SEric Dumazet table = net->smc.smc_hdr->ctl_table_arg;
150462791bbSDust Li unregister_net_sysctl_table(net->smc.smc_hdr);
1515ae6acf1SEric Dumazet if (!net_eq(net, &init_net))
1525ae6acf1SEric Dumazet kfree(table);
153462791bbSDust Li }
154