xref: /linux/include/net/netns/ipv4.h (revision 0e50474fa514822e9d990874e554bf8043a201d7)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 /*
3  * ipv4 in net namespaces
4  */
5 
6 #ifndef __NETNS_IPV4_H__
7 #define __NETNS_IPV4_H__
8 
9 #include <linux/uidgid.h>
10 #include <net/inet_frag.h>
11 #include <linux/rcupdate.h>
12 #include <linux/seqlock.h>
13 #include <linux/siphash.h>
14 
15 struct ctl_table_header;
16 struct ipv4_devconf;
17 struct fib_rules_ops;
18 struct hlist_head;
19 struct fib_table;
20 struct sock;
/*
 * A low/high pair packed into a single 32-bit word, plus a boolean flag.
 *
 * NOTE(review): by its name this describes the local port range; `warned`
 * looks like a one-shot "already reported" marker, but nothing in this
 * header shows who sets or reads it - confirm against the users.
 */
21 struct local_ports {
22 	u32		range;	/* high << 16 | low */
23 	bool		warned;
24 };
25 
/*
 * Two kernel GID values stored next to a seqlock.
 *
 * NOTE(review): presumably range[0] and range[1] are the low and high
 * bounds of a GID range and `lock` lets readers obtain a consistent
 * pair while a writer updates both - confirm against the accessors.
 */
26 struct ping_group_range {
27 	seqlock_t	lock;
28 	kgid_t		range[2];
29 };
30 
31 struct inet_hashinfo;
32 
/*
 * Groups a reference count, a pointer to an inet_hashinfo and an integer
 * tunable.
 *
 * `hashinfo` carries ____cacheline_aligned_in_smp, so it and the member
 * after it are placed on a different cache line from tw_refcount; the
 * comment below gives the reason (tw_refcount is written often).
 *
 * NOTE(review): sysctl_max_tw_buckets is, by its name, the sysctl-set
 * limit on time-wait buckets - confirm against the sysctl table.
 */
33 struct inet_timewait_death_row {
34 	refcount_t		tw_refcount;
35 
36 	/* Padding to avoid false sharing, tw_refcount can be often written */
37 	struct inet_hashinfo 	*hashinfo ____cacheline_aligned_in_smp;
38 	int			sysctl_max_tw_buckets;
39 };
40 
41 struct tcp_fastopen_context;
42 
43 #ifdef CONFIG_IP_ROUTE_MULTIPATH
/*
 * Pair of 32-bit seed values; the type is only defined when
 * CONFIG_IP_ROUTE_MULTIPATH is enabled.
 *
 * NOTE(review): presumably user_seed is the value supplied through the
 * sysctl and mp_seed the value actually used by the multipath hash -
 * confirm against the sysctl handler.
 */
44 struct sysctl_fib_multipath_hash_seed {
45 	u32 user_seed;
46 	u32 mp_seed;
47 };
48 #endif
49 
/*
 * An RCU-annotated socket pointer paired with an hlist head.
 *
 * NOTE(review): the relationship between `sk` and the entries on `list`
 * is not visible from this header - confirm against the UDP tunnel GRO
 * code before relying on any invariant between them.
 */
50 struct udp_tunnel_gro {
51 	struct sock __rcu *sk;	/* __rcu: dereference via the RCU accessors */
52 	struct hlist_head list;
53 };
54 
/*
 * IPv4 state kept per network namespace.
 *
 * Layout overview:
 *  - Three cacheline groups come first (netns_ipv4_read_tx,
 *    netns_ipv4_read_txrx, netns_ipv4_read_rx). Each is bracketed by
 *    __cacheline_group_begin()/__cacheline_group_end() and holds the
 *    fields that the comments below mark as read-only on the TX, TX+RX
 *    and RX hot paths respectively.
 *  - The remainder mixes pointers, locks, counters and tunables.
 *    Members named sysctl_* are presumably the backing storage for the
 *    matching per-namespace sysctls - confirm against the sysctl tables.
 *  - Members inside #ifdef/#if blocks exist only when that CONFIG_*
 *    option is enabled, so the size of the struct and the offsets of
 *    later members depend on the kernel configuration.
 *
 * Member order determines the memory layout; do not reorder fields
 * without also updating the cacheline document referenced below.
 */
55 struct netns_ipv4 {
56 	/* Cacheline organization can be found documented in
57 	 * Documentation/networking/net_cachelines/netns_ipv4_sysctl.rst.
58 	 * Please update the document when adding new fields.
59 	 */
60 
61 	/* TX readonly hotpath cache lines */
62 	__cacheline_group_begin(netns_ipv4_read_tx);
63 	u8 sysctl_tcp_early_retrans;
64 	u8 sysctl_tcp_tso_win_divisor;
65 	u8 sysctl_tcp_tso_rtt_log;
66 	u8 sysctl_tcp_autocorking;
67 	int sysctl_tcp_min_snd_mss;
68 	unsigned int sysctl_tcp_notsent_lowat;
69 	int sysctl_tcp_limit_output_bytes;
70 	int sysctl_tcp_min_rtt_wlen;
71 	int sysctl_tcp_wmem[3];
72 	u8 sysctl_ip_fwd_use_pmtu;
73 	__cacheline_group_end(netns_ipv4_read_tx);
74 
75 	/* TXRX readonly hotpath cache lines */
76 	__cacheline_group_begin(netns_ipv4_read_txrx);
77 	u8 sysctl_tcp_moderate_rcvbuf;
78 	__cacheline_group_end(netns_ipv4_read_txrx);
79 
80 	/* RX readonly hotpath cache line */
81 	__cacheline_group_begin(netns_ipv4_read_rx);
82 	u8 sysctl_ip_early_demux;
83 	u8 sysctl_tcp_early_demux;
84 	u8 sysctl_tcp_l3mdev_accept;
85 	/* 3 bytes hole, try to pack */
86 	int sysctl_tcp_reordering;
87 	int sysctl_tcp_rmem[3];
88 	__cacheline_group_end(netns_ipv4_read_rx);
89 
90 	struct inet_timewait_death_row tcp_death_row;
91 	struct udp_table *udp_table;
92 
93 #if IS_ENABLED(CONFIG_NET_UDP_TUNNEL)
94 	/* Not in a pernet subsys because need to be available at GRO stage */
95 	struct udp_tunnel_gro udp_tunnel_gro[2];	/* NOTE(review): meaning of the two slots is not shown here - confirm */
96 #endif /* CONFIG_NET_UDP_TUNNEL */
97 
98 #ifdef CONFIG_SYSCTL
99 	struct ctl_table_header	*forw_hdr;
100 	struct ctl_table_header	*frags_hdr;
101 	struct ctl_table_header	*ipv4_hdr;
102 	struct ctl_table_header *route_hdr;
103 	struct ctl_table_header *xfrm4_hdr;
104 #endif /* CONFIG_SYSCTL */
105 	struct ipv4_devconf	*devconf_all;
106 	struct ipv4_devconf	*devconf_dflt;
107 	struct ip_ra_chain __rcu *ra_chain;
108 	struct mutex		ra_mutex;	/* NOTE(review): presumably serializes ra_chain updates - confirm */
109 #ifdef CONFIG_IP_MULTIPLE_TABLES
110 	struct fib_rules_ops	*rules_ops;
111 	struct fib_table __rcu	*fib_main;
112 	struct fib_table __rcu	*fib_default;
113 	unsigned int		fib_rules_require_fldissect;
114 	bool			fib_has_custom_rules;
115 #endif /* CONFIG_IP_MULTIPLE_TABLES */
116 	bool			fib_has_custom_local_routes;
117 	bool			fib_offload_disabled;
118 	u8			sysctl_tcp_shrink_window;
119 #ifdef CONFIG_IP_ROUTE_CLASSID
120 	atomic_t		fib_num_tclassid_users;
121 #endif /* CONFIG_IP_ROUTE_CLASSID */
122 	struct hlist_head	*fib_table_hash;
123 	struct sock		*fibnl;
124 	struct hlist_head	*fib_info_hash;
125 	unsigned int		fib_info_hash_bits;
126 	unsigned int		fib_info_cnt;
127 
128 	struct sock		*mc_autojoin_sk;
129 
130 	struct inet_peer_base	*peers;
131 	struct fqdir		*fqdir;
132 
133 	u8 sysctl_icmp_echo_ignore_all;
134 	u8 sysctl_icmp_echo_enable_probe;
135 	u8 sysctl_icmp_echo_ignore_broadcasts;
136 	u8 sysctl_icmp_ignore_bogus_error_responses;
137 	u8 sysctl_icmp_errors_use_inbound_ifaddr;
138 	u8 sysctl_icmp_errors_extension_mask;
139 	int sysctl_icmp_ratelimit;
140 	int sysctl_icmp_ratemask;
141 	int sysctl_icmp_msgs_per_sec;
142 	int sysctl_icmp_msgs_burst;
143 	atomic_t icmp_global_credit;
144 	u32 icmp_global_stamp;
145 	u32 ip_rt_min_pmtu;
146 	int ip_rt_mtu_expires;
147 	int ip_rt_min_advmss;
148 
149 	struct local_ports ip_local_ports;
150 
151 	u8 sysctl_tcp_ecn;
152 	u8 sysctl_tcp_ecn_option;
153 	u8 sysctl_tcp_ecn_option_beacon;
154 	u8 sysctl_tcp_ecn_fallback;
155 
156 	u8 sysctl_ip_default_ttl;
157 	u8 sysctl_ip_no_pmtu_disc;
158 	u8 sysctl_ip_fwd_update_priority;
159 	u8 sysctl_ip_nonlocal_bind;
160 	u8 sysctl_ip_autobind_reuse;
161 	/* Shall we try to damage output packets if routing dev changes? */
162 	u8 sysctl_ip_dynaddr;
163 #ifdef CONFIG_NET_L3_MASTER_DEV
164 	u8 sysctl_raw_l3mdev_accept;
165 #endif /* CONFIG_NET_L3_MASTER_DEV */
166 	u8 sysctl_udp_early_demux;
167 
168 	u8 sysctl_nexthop_compat_mode;
169 
170 	u8 sysctl_fwmark_reflect;
171 	u8 sysctl_tcp_fwmark_accept;
172 	u8 sysctl_tcp_mtu_probing;
173 	int sysctl_tcp_mtu_probe_floor;
174 	int sysctl_tcp_base_mss;
175 	int sysctl_tcp_probe_threshold;
176 	u32 sysctl_tcp_probe_interval;
177 
178 	int sysctl_tcp_keepalive_time;
179 	int sysctl_tcp_keepalive_intvl;
180 	u8 sysctl_tcp_keepalive_probes;
181 
182 	u8 sysctl_tcp_syn_retries;
183 	u8 sysctl_tcp_synack_retries;
184 	u8 sysctl_tcp_syncookies;
185 	u8 sysctl_tcp_migrate_req;
186 	u8 sysctl_tcp_comp_sack_nr;
187 	u8 sysctl_tcp_backlog_ack_defer;
188 	u8 sysctl_tcp_pingpong_thresh;
189 
190 	u8 sysctl_tcp_retries1;
191 	u8 sysctl_tcp_retries2;
192 	u8 sysctl_tcp_orphan_retries;
193 	u8 sysctl_tcp_tw_reuse;
194 	unsigned int sysctl_tcp_tw_reuse_delay;
195 	int sysctl_tcp_fin_timeout;
196 	u8 sysctl_tcp_sack;
197 	u8 sysctl_tcp_window_scaling;
198 	u8 sysctl_tcp_timestamps;
199 	int sysctl_tcp_rto_min_us;
200 	int sysctl_tcp_rto_max_ms;
201 	u8 sysctl_tcp_recovery;
202 	u8 sysctl_tcp_thin_linear_timeouts;
203 	u8 sysctl_tcp_slow_start_after_idle;
204 	u8 sysctl_tcp_retrans_collapse;
205 	u8 sysctl_tcp_stdurg;
206 	u8 sysctl_tcp_rfc1337;
207 	u8 sysctl_tcp_abort_on_overflow;
208 	u8 sysctl_tcp_fack; /* obsolete */
209 	int sysctl_tcp_max_reordering;
210 	int sysctl_tcp_adv_win_scale; /* obsolete */
211 	u8 sysctl_tcp_dsack;
212 	u8 sysctl_tcp_app_win;
213 	u8 sysctl_tcp_frto;
214 	u8 sysctl_tcp_nometrics_save;
215 	u8 sysctl_tcp_no_ssthresh_metrics_save;
216 	u8 sysctl_tcp_workaround_signed_windows;
217 	int sysctl_tcp_challenge_ack_limit;
218 	u8 sysctl_tcp_min_tso_segs;
219 	u8 sysctl_tcp_reflect_tos;
220 	int sysctl_tcp_invalid_ratelimit;
221 	int sysctl_tcp_pacing_ss_ratio;
222 	int sysctl_tcp_pacing_ca_ratio;
223 	unsigned int sysctl_tcp_child_ehash_entries;
224 	unsigned long sysctl_tcp_comp_sack_delay_ns;
225 	unsigned long sysctl_tcp_comp_sack_slack_ns;
226 	int sysctl_max_syn_backlog;
227 	int sysctl_tcp_fastopen;
228 	const struct tcp_congestion_ops __rcu  *tcp_congestion_control;
229 	struct tcp_fastopen_context __rcu *tcp_fastopen_ctx;
230 	unsigned int sysctl_tcp_fastopen_blackhole_timeout;
231 	atomic_t tfo_active_disable_times;
232 	unsigned long tfo_active_disable_stamp;
233 	u32 tcp_challenge_timestamp;
234 	u32 tcp_challenge_count;
235 	u8 sysctl_tcp_plb_enabled;
236 	u8 sysctl_tcp_plb_idle_rehash_rounds;
237 	u8 sysctl_tcp_plb_rehash_rounds;
238 	u8 sysctl_tcp_plb_suspend_rto_sec;
239 	int sysctl_tcp_plb_cong_thresh;
240 
241 	int sysctl_udp_wmem_min;
242 	int sysctl_udp_rmem_min;
243 
244 	u8 sysctl_fib_notify_on_flag_change;
245 	u8 sysctl_tcp_syn_linear_timeouts;
246 
247 #ifdef CONFIG_NET_L3_MASTER_DEV
248 	u8 sysctl_udp_l3mdev_accept;
249 #endif /* CONFIG_NET_L3_MASTER_DEV */
250 
251 	u8 sysctl_igmp_llm_reports;
252 	int sysctl_igmp_max_memberships;
253 	int sysctl_igmp_max_msf;
254 	int sysctl_igmp_qrv;
255 
256 	struct ping_group_range ping_group_range;
257 	u16			ping_port_rover;
258 
259 	atomic_t dev_addr_genid;
260 
261 	unsigned int sysctl_udp_child_hash_entries;
262 
263 #ifdef CONFIG_SYSCTL
264 	unsigned long *sysctl_local_reserved_ports;
265 	int sysctl_ip_prot_sock;
266 #endif /* CONFIG_SYSCTL */
267 
268 #ifdef CONFIG_IP_MROUTE
269 #ifndef CONFIG_IP_MROUTE_MULTIPLE_TABLES
270 	struct mr_table		*mrt;	/* the only table when multiple tables are not configured */
271 #else /* CONFIG_IP_MROUTE_MULTIPLE_TABLES */
272 	struct list_head	mr_tables;
273 	struct fib_rules_ops	*mr_rules_ops;
274 #endif /* CONFIG_IP_MROUTE_MULTIPLE_TABLES */
275 #endif /* CONFIG_IP_MROUTE */
276 #ifdef CONFIG_IP_ROUTE_MULTIPATH
277 	struct sysctl_fib_multipath_hash_seed sysctl_fib_multipath_hash_seed;
278 	u32 sysctl_fib_multipath_hash_fields;
279 	u8 sysctl_fib_multipath_use_neigh;
280 	u8 sysctl_fib_multipath_hash_policy;
281 #endif /* CONFIG_IP_ROUTE_MULTIPATH */
282 
283 	struct fib_notifier_ops	*notifier_ops;
284 	unsigned int	fib_seq;	/* writes protected by rtnl_mutex */
285 
286 	struct fib_notifier_ops	*ipmr_notifier_ops;
287 	unsigned int	ipmr_seq;	/* protected by rtnl_mutex */
288 
289 	atomic_t	rt_genid;
290 	siphash_key_t	ip_id_key;
291 	struct hlist_head	*inet_addr_lst;
292 	struct delayed_work	addr_chk_work;
293 };
294 
295 #endif
296