xref: /linux/include/net/netns/ipv4.h (revision 69050f8d6d075dc01af7a5f2f550a8067510366f)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 /*
3  * ipv4 in net namespaces
4  */
5 
6 #ifndef __NETNS_IPV4_H__
7 #define __NETNS_IPV4_H__
8 
9 #include <linux/uidgid.h>
10 #include <net/inet_frag.h>
11 #include <linux/rcupdate.h>
12 #include <linux/seqlock.h>
13 #include <linux/siphash.h>
14 
15 struct ctl_table_header;
16 struct ipv4_devconf;
17 struct fib_rules_ops;
18 struct hlist_head;
19 struct fib_table;
20 struct sock;
/*
 * Local port range state, embedded in struct netns_ipv4 as ip_local_ports.
 *
 * The high and low values share the single u32 'range': high occupies the
 * upper 16 bits and low the lower 16 bits.
 *
 * NOTE(review): 'warned' looks like a "warning already emitted" latch --
 * confirm against the code that sets it.
 */
21 struct local_ports {
22 	u32		range;	/* high << 16 | low */
23 	bool		warned;
24 };
25 
/*
 * Two group IDs plus a seqlock, embedded in struct netns_ipv4 as
 * ping_group_range.
 *
 * NOTE(review): presumably range[0]/range[1] are the lower/upper bound and
 * 'lock' lets readers observe both as a consistent pair -- confirm against
 * the users of this struct.
 */
26 struct ping_group_range {
27 	seqlock_t	lock;
28 	kgid_t		range[2];
29 };
30 
31 struct inet_hashinfo;
32 
/*
 * Time-wait bookkeeping, embedded by value in struct netns_ipv4 as
 * tcp_death_row.
 *
 * tw_refcount is kept apart from the remaining members: 'hashinfo' carries
 * ____cacheline_aligned_in_smp so that it, and sysctl_max_tw_buckets after
 * it, start on a different cache line than the frequently written refcount.
 */
33 struct inet_timewait_death_row {
34 	refcount_t		tw_refcount;
35 
36 	/* Padding to avoid false sharing, tw_refcount can be often written */
37 	struct inet_hashinfo 	*hashinfo ____cacheline_aligned_in_smp;
38 	int			sysctl_max_tw_buckets;
39 };
40 
41 struct tcp_fastopen_context;
42 
43 #ifdef CONFIG_IP_ROUTE_MULTIPATH
/*
 * Pair of 32-bit seed values, only defined when CONFIG_IP_ROUTE_MULTIPATH is
 * set. Embedded in struct netns_ipv4 under the same config guard.
 *
 * NOTE(review): presumably user_seed is the value supplied through sysctl and
 * mp_seed the value actually fed to the multipath hash -- confirm.
 */
44 struct sysctl_fib_multipath_hash_seed {
45 	u32 user_seed;
46 	u32 mp_seed;
47 };
48 #endif
49 
/*
 * An RCU-annotated socket pointer together with an hlist head.
 * struct netns_ipv4 holds an array of two of these when
 * CONFIG_NET_UDP_TUNNEL is enabled.
 */
50 struct udp_tunnel_gro {
51 	struct sock __rcu *sk;
52 	struct hlist_head list;
53 };
54 
/*
 * IPv4 state kept per network namespace.
 *
 * The struct opens with cacheline groups for fields read on the TX and RX
 * hot paths and an aligned group for the ICMP rate limiter; the rest holds
 * FIB, ICMP, routing, TCP, UDP, IGMP, ping and multicast-routing state and
 * sysctl values. Several members only exist under the config options that
 * guard them, so the layout depends on the kernel configuration.
 */
55 struct netns_ipv4 {
56 	/* Cacheline organization can be found documented in
57 	 * Documentation/networking/net_cachelines/netns_ipv4_sysctl.rst.
58 	 * Please update the document when adding new fields.
59 	 */
60 
61 	/* TX readonly hotpath cache lines */
62 	__cacheline_group_begin(netns_ipv4_read_tx);
63 	u8 sysctl_tcp_early_retrans;
64 	u8 sysctl_tcp_tso_win_divisor;
65 	u8 sysctl_tcp_tso_rtt_log;
66 	u8 sysctl_tcp_autocorking;
67 	int sysctl_tcp_min_snd_mss;
68 	unsigned int sysctl_tcp_notsent_lowat;
69 	int sysctl_tcp_limit_output_bytes;
70 	int sysctl_tcp_min_rtt_wlen;
71 	int sysctl_tcp_wmem[3];
72 	u8 sysctl_ip_fwd_use_pmtu;
73 	__cacheline_group_end(netns_ipv4_read_tx);
74 
75 	/* TXRX readonly hotpath cache lines */
76 	__cacheline_group_begin(netns_ipv4_read_txrx);
	/* No members are currently placed in this group. */
77 	__cacheline_group_end(netns_ipv4_read_txrx);
78 
79 	/* RX readonly hotpath cache line */
80 	__cacheline_group_begin(netns_ipv4_read_rx);
81 	u8 sysctl_tcp_moderate_rcvbuf;
82 	u8 sysctl_ip_early_demux;
83 	u8 sysctl_tcp_early_demux;
84 	u8 sysctl_tcp_l3mdev_accept;
85 	/* 3 bytes hole, try to pack */
86 	int sysctl_tcp_reordering;
87 	int sysctl_tcp_rmem[3];
88 	int sysctl_tcp_rcvbuf_low_rtt;
89 	__cacheline_group_end(netns_ipv4_read_rx);
90 
91 	/* ICMP rate limiter hot cache line. */
92 	__cacheline_group_begin_aligned(icmp);
93 	atomic_t	icmp_global_credit;
94 	u32		icmp_global_stamp;
95 	__cacheline_group_end_aligned(icmp);
96 
	/* Embedded by value; see struct inet_timewait_death_row. */
97 	struct inet_timewait_death_row tcp_death_row;
98 	struct udp_table *udp_table;
99 
100 #if IS_ENABLED(CONFIG_NET_UDP_TUNNEL)
101 	/* Not in a pernet subsys because need to be available at GRO stage */
	/* NOTE(review): two slots, presumably one per address family -- confirm. */
102 	struct udp_tunnel_gro udp_tunnel_gro[2];
103 #endif
104 
105 #ifdef CONFIG_SYSCTL
106 	struct ctl_table_header	*forw_hdr;
107 	struct ctl_table_header	*frags_hdr;
108 	struct ctl_table_header	*ipv4_hdr;
109 	struct ctl_table_header *route_hdr;
110 	struct ctl_table_header *xfrm4_hdr;
111 #endif
112 	struct ipv4_devconf	*devconf_all;
113 	struct ipv4_devconf	*devconf_dflt;
114 	struct ip_ra_chain __rcu *ra_chain;
115 	struct mutex		ra_mutex;
116 #ifdef CONFIG_IP_MULTIPLE_TABLES
117 	struct fib_rules_ops	*rules_ops;
118 	struct fib_table __rcu	*fib_main;
119 	struct fib_table __rcu	*fib_default;
120 	unsigned int		fib_rules_require_fldissect;
121 	bool			fib_has_custom_rules;
122 #endif
123 	bool			fib_has_custom_local_routes;
124 	bool			fib_offload_disabled;
125 	u8			sysctl_tcp_shrink_window;
126 #ifdef CONFIG_IP_ROUTE_CLASSID
127 	atomic_t		fib_num_tclassid_users;
128 #endif
129 	struct hlist_head	*fib_table_hash;
130 	struct sock		*fibnl;
131 	struct hlist_head	*fib_info_hash;
132 	unsigned int		fib_info_hash_bits;
133 	unsigned int		fib_info_cnt;
134 
135 	struct sock		*mc_autojoin_sk;
136 
137 	struct inet_peer_base	*peers;
138 	struct fqdir		*fqdir;
139 
	/* ICMP sysctl values. */
140 	u8 sysctl_icmp_echo_ignore_all;
141 	u8 sysctl_icmp_echo_enable_probe;
142 	u8 sysctl_icmp_echo_ignore_broadcasts;
143 	u8 sysctl_icmp_ignore_bogus_error_responses;
144 	u8 sysctl_icmp_errors_use_inbound_ifaddr;
145 	u8 sysctl_icmp_errors_extension_mask;
146 	int sysctl_icmp_ratelimit;
147 	int sysctl_icmp_ratemask;
148 	int sysctl_icmp_msgs_per_sec;
149 	int sysctl_icmp_msgs_burst;
150 
151 	u32 ip_rt_min_pmtu;
152 	int ip_rt_mtu_expires;
153 	int ip_rt_min_advmss;
154 
155 	struct local_ports ip_local_ports;
156 
157 	u8 sysctl_tcp_ecn;
158 	u8 sysctl_tcp_ecn_option;
159 	u8 sysctl_tcp_ecn_option_beacon;
160 	u8 sysctl_tcp_ecn_fallback;
161 
162 	u8 sysctl_ip_default_ttl;
163 	u8 sysctl_ip_no_pmtu_disc;
164 	u8 sysctl_ip_fwd_update_priority;
165 	u8 sysctl_ip_nonlocal_bind;
166 	u8 sysctl_ip_autobind_reuse;
167 	/* Shall we try to damage output packets if routing dev changes? */
168 	u8 sysctl_ip_dynaddr;
169 #ifdef CONFIG_NET_L3_MASTER_DEV
170 	u8 sysctl_raw_l3mdev_accept;
171 #endif
172 	u8 sysctl_udp_early_demux;
173 
174 	u8 sysctl_nexthop_compat_mode;
175 
176 	u8 sysctl_fwmark_reflect;
177 	u8 sysctl_tcp_fwmark_accept;
178 	u8 sysctl_tcp_mtu_probing;
179 	int sysctl_tcp_mtu_probe_floor;
180 	int sysctl_tcp_base_mss;
181 	int sysctl_tcp_probe_threshold;
182 	u32 sysctl_tcp_probe_interval;
183 
184 	int sysctl_tcp_keepalive_time;
185 	int sysctl_tcp_keepalive_intvl;
186 	u8 sysctl_tcp_keepalive_probes;
187 
188 	u8 sysctl_tcp_syn_retries;
189 	u8 sysctl_tcp_synack_retries;
190 	u8 sysctl_tcp_syncookies;
191 	u8 sysctl_tcp_migrate_req;
192 	u8 sysctl_tcp_comp_sack_nr;
193 	u8 sysctl_tcp_backlog_ack_defer;
194 	u8 sysctl_tcp_pingpong_thresh;
195 
196 	u8 sysctl_tcp_retries1;
197 	u8 sysctl_tcp_retries2;
198 	u8 sysctl_tcp_orphan_retries;
199 	u8 sysctl_tcp_tw_reuse;
200 	unsigned int sysctl_tcp_tw_reuse_delay;
201 	int sysctl_tcp_fin_timeout;
202 	u8 sysctl_tcp_sack;
203 	u8 sysctl_tcp_window_scaling;
204 	u8 sysctl_tcp_timestamps;
205 	int sysctl_tcp_rto_min_us;
206 	int sysctl_tcp_rto_max_ms;
207 	u8 sysctl_tcp_recovery;
208 	u8 sysctl_tcp_thin_linear_timeouts;
209 	u8 sysctl_tcp_slow_start_after_idle;
210 	u8 sysctl_tcp_retrans_collapse;
211 	u8 sysctl_tcp_stdurg;
212 	u8 sysctl_tcp_rfc1337;
213 	u8 sysctl_tcp_abort_on_overflow;
214 	u8 sysctl_tcp_fack; /* obsolete */
215 	int sysctl_tcp_max_reordering;
216 	int sysctl_tcp_adv_win_scale; /* obsolete */
217 	u8 sysctl_tcp_dsack;
218 	u8 sysctl_tcp_app_win;
219 	u8 sysctl_tcp_frto;
220 	u8 sysctl_tcp_nometrics_save;
221 	u8 sysctl_tcp_no_ssthresh_metrics_save;
222 	u8 sysctl_tcp_workaround_signed_windows;
223 	int sysctl_tcp_challenge_ack_limit;
224 	u8 sysctl_tcp_min_tso_segs;
225 	u8 sysctl_tcp_reflect_tos;
226 	int sysctl_tcp_invalid_ratelimit;
227 	int sysctl_tcp_pacing_ss_ratio;
228 	int sysctl_tcp_pacing_ca_ratio;
229 	unsigned int sysctl_tcp_child_ehash_entries;
230 	int sysctl_tcp_comp_sack_rtt_percent;
231 	unsigned long sysctl_tcp_comp_sack_delay_ns;
232 	unsigned long sysctl_tcp_comp_sack_slack_ns;
233 	int sysctl_max_syn_backlog;
234 	int sysctl_tcp_fastopen;
235 	const struct tcp_congestion_ops __rcu  *tcp_congestion_control;
236 	struct tcp_fastopen_context __rcu *tcp_fastopen_ctx;
237 	unsigned int sysctl_tcp_fastopen_blackhole_timeout;
238 	atomic_t tfo_active_disable_times;
239 	unsigned long tfo_active_disable_stamp;
240 	u32 tcp_challenge_timestamp;
241 	u32 tcp_challenge_count;
242 	u8 sysctl_tcp_plb_enabled;
243 	u8 sysctl_tcp_plb_idle_rehash_rounds;
244 	u8 sysctl_tcp_plb_rehash_rounds;
245 	u8 sysctl_tcp_plb_suspend_rto_sec;
246 	int sysctl_tcp_plb_cong_thresh;
247 
248 	int sysctl_udp_wmem_min;
249 	int sysctl_udp_rmem_min;
250 
251 	u8 sysctl_fib_notify_on_flag_change;
252 	u8 sysctl_tcp_syn_linear_timeouts;
253 
254 #ifdef CONFIG_NET_L3_MASTER_DEV
255 	u8 sysctl_udp_l3mdev_accept;
256 #endif
257 
258 	u8 sysctl_igmp_llm_reports;
259 	int sysctl_igmp_max_memberships;
260 	int sysctl_igmp_max_msf;
261 	int sysctl_igmp_qrv;
262 
263 	struct ping_group_range ping_group_range;
264 	u16			ping_port_rover;
265 
266 	atomic_t dev_addr_genid;
267 
268 	unsigned int sysctl_udp_child_hash_entries;
269 
270 #ifdef CONFIG_SYSCTL
271 	unsigned long *sysctl_local_reserved_ports;
272 	int sysctl_ip_prot_sock;
273 #endif
274 
	/*
	 * With CONFIG_IP_MROUTE_MULTIPLE_TABLES unset a single mr_table
	 * pointer is kept; otherwise a list head plus a fib_rules_ops pointer.
	 */
275 #ifdef CONFIG_IP_MROUTE
276 #ifndef CONFIG_IP_MROUTE_MULTIPLE_TABLES
277 	struct mr_table		*mrt;
278 #else
279 	struct list_head	mr_tables;
280 	struct fib_rules_ops	*mr_rules_ops;
281 #endif
282 #endif
	/*
	 * Same config guard as the definition of
	 * struct sysctl_fib_multipath_hash_seed.
	 */
283 #ifdef CONFIG_IP_ROUTE_MULTIPATH
284 	struct sysctl_fib_multipath_hash_seed sysctl_fib_multipath_hash_seed;
285 	u32 sysctl_fib_multipath_hash_fields;
286 	u8 sysctl_fib_multipath_use_neigh;
287 	u8 sysctl_fib_multipath_hash_policy;
288 #endif
289 
290 	struct fib_notifier_ops	*notifier_ops;
291 	unsigned int	fib_seq;	/* writes protected by rtnl_mutex */
292 
293 	struct fib_notifier_ops	*ipmr_notifier_ops;
294 	unsigned int	ipmr_seq;	/* protected by rtnl_mutex */
295 
296 	atomic_t	rt_genid;
297 	siphash_key_t	ip_id_key;
298 	struct hlist_head	*inet_addr_lst;
299 	struct delayed_work	addr_chk_work;
300 };
301 
302 #endif
303