1 /* SPDX-License-Identifier: GPL-2.0 */
2 /*
3  * ipv4 in net namespaces
4  */
5 
6 #ifndef __NETNS_IPV4_H__
7 #define __NETNS_IPV4_H__
8 
9 #include <linux/uidgid.h>
10 #include <net/inet_frag.h>
11 #include <linux/rcupdate.h>
12 #include <linux/seqlock.h>
13 #include <linux/siphash.h>
14 
/* Forward declarations of types referenced by the structures below. */
struct ctl_table_header;
struct ipv4_devconf;
struct fib_rules_ops;
struct hlist_head;
struct fib_table;
struct sock;
/*
 * Local port range, embedded in struct netns_ipv4 as ip_local_ports.
 *
 * Both bounds are packed into the single 32-bit @range word so the pair
 * can be handled as one value.
 */
struct local_ports {
	u32		range;	/* high << 16 | low */
	/* NOTE(review): presumably records that a warning about the range
	 * was already emitted - confirm against the users of this field.
	 */
	bool		warned;
};
25 
/*
 * A pair of group IDs together with a seqlock, embedded in
 * struct netns_ipv4 as ping_group_range.
 *
 * NOTE(review): presumably @lock serialises updates of @range and
 * range[0]/range[1] are the low/high bounds - confirm against the
 * readers and writers of this structure.
 */
struct ping_group_range {
	seqlock_t	lock;
	kgid_t		range[2];
};
30 
/* Only used through a pointer in struct inet_timewait_death_row. */
struct inet_hashinfo;

/*
 * Time-wait bookkeeping, embedded in struct netns_ipv4 as tcp_death_row.
 *
 * The frequently written reference count is kept apart from the other
 * members: @hashinfo carries ____cacheline_aligned_in_smp, so it and
 * everything after it start on a separate cache line on SMP builds.
 */
struct inet_timewait_death_row {
	refcount_t		tw_refcount;

	/* Padding to avoid false sharing, tw_refcount can be often written */
	struct inet_hashinfo 	*hashinfo ____cacheline_aligned_in_smp;
	/* NOTE(review): presumably the upper bound on time-wait buckets
	 * configured through sysctl - confirm against the sysctl table.
	 */
	int			sysctl_max_tw_buckets;
};
40 
/* Only used through an __rcu pointer in struct netns_ipv4. */
struct tcp_fastopen_context;
42 
#ifdef CONFIG_IP_ROUTE_MULTIPATH
/*
 * Pair of 32-bit seeds, embedded in struct netns_ipv4 as
 * sysctl_fib_multipath_hash_seed. Only defined when
 * CONFIG_IP_ROUTE_MULTIPATH is enabled.
 *
 * NOTE(review): presumably @user_seed is the value supplied through
 * sysctl and @mp_seed the seed actually fed to the multipath hash -
 * confirm against the sysctl handler.
 */
struct sysctl_fib_multipath_hash_seed {
	u32 user_seed;
	u32 mp_seed;
};
#endif
49 
/*
 * UDP tunnel GRO state: an RCU-managed socket pointer plus a hash-list head.
 *
 * struct netns_ipv4 holds an array of two of these when
 * CONFIG_NET_UDP_TUNNEL is enabled.
 * NOTE(review): the meaning of the two array slots (possibly one per
 * address family) and the element type linked on @list are not visible
 * here - confirm against the UDP tunnel code.
 */
struct udp_tunnel_gro {
	struct sock __rcu *sk;
	struct hlist_head list;
};
54 
/*
 * IPv4 state kept per network namespace.
 *
 * The leading members are gathered into three
 * __cacheline_group_begin()/__cacheline_group_end() sections
 * (netns_ipv4_read_tx, netns_ipv4_read_txrx, netns_ipv4_read_rx); the
 * remaining members follow without group markers. Several sub-sections
 * only exist when the CONFIG_* option guarding them is enabled, so the
 * layout of this structure depends on the kernel configuration.
 *
 * Member order matters for the cacheline grouping: do not reorder fields
 * without updating the document referenced below.
 */
struct netns_ipv4 {
	/* Cacheline organization can be found documented in
	 * Documentation/networking/net_cachelines/netns_ipv4_sysctl.rst.
	 * Please update the document when adding new fields.
	 */

	/* TX readonly hotpath cache lines */
	__cacheline_group_begin(netns_ipv4_read_tx);
	u8 sysctl_tcp_early_retrans;
	u8 sysctl_tcp_tso_win_divisor;
	u8 sysctl_tcp_tso_rtt_log;
	u8 sysctl_tcp_autocorking;
	int sysctl_tcp_min_snd_mss;
	unsigned int sysctl_tcp_notsent_lowat;
	int sysctl_tcp_limit_output_bytes;
	int sysctl_tcp_min_rtt_wlen;
	int sysctl_tcp_wmem[3];
	u8 sysctl_ip_fwd_use_pmtu;
	__cacheline_group_end(netns_ipv4_read_tx);

	/* TXRX readonly hotpath cache lines */
	__cacheline_group_begin(netns_ipv4_read_txrx);
	u8 sysctl_tcp_moderate_rcvbuf;
	__cacheline_group_end(netns_ipv4_read_txrx);

	/* RX readonly hotpath cache line */
	__cacheline_group_begin(netns_ipv4_read_rx);
	u8 sysctl_ip_early_demux;
	u8 sysctl_tcp_early_demux;
	u8 sysctl_tcp_l3mdev_accept;
	/* 3 bytes hole, try to pack */
	int sysctl_tcp_reordering;
	int sysctl_tcp_rmem[3];
	__cacheline_group_end(netns_ipv4_read_rx);

	/* Embedded by value; see struct inet_timewait_death_row. */
	struct inet_timewait_death_row tcp_death_row;
	struct udp_table *udp_table;

#if IS_ENABLED(CONFIG_NET_UDP_TUNNEL)
	/* Not in a pernet subsys because need to be available at GRO stage */
	struct udp_tunnel_gro udp_tunnel_gro[2];
#endif

	/* Table header pointers; only present with CONFIG_SYSCTL. */
#ifdef CONFIG_SYSCTL
	struct ctl_table_header	*forw_hdr;
	struct ctl_table_header	*frags_hdr;
	struct ctl_table_header	*ipv4_hdr;
	struct ctl_table_header *route_hdr;
	struct ctl_table_header *xfrm4_hdr;
#endif
	struct ipv4_devconf	*devconf_all;
	struct ipv4_devconf	*devconf_dflt;
	struct ip_ra_chain __rcu *ra_chain;
	struct mutex		ra_mutex;
	/* FIB rules and table pointers; only with CONFIG_IP_MULTIPLE_TABLES. */
#ifdef CONFIG_IP_MULTIPLE_TABLES
	struct fib_rules_ops	*rules_ops;
	struct fib_table __rcu	*fib_main;
	struct fib_table __rcu	*fib_default;
	unsigned int		fib_rules_require_fldissect;
	bool			fib_has_custom_rules;
#endif
	bool			fib_has_custom_local_routes;
	bool			fib_offload_disabled;
	u8			sysctl_tcp_shrink_window;
#ifdef CONFIG_IP_ROUTE_CLASSID
	atomic_t		fib_num_tclassid_users;
#endif
	struct hlist_head	*fib_table_hash;
	struct sock		*fibnl;
	struct hlist_head	*fib_info_hash;
	unsigned int		fib_info_hash_bits;
	unsigned int		fib_info_cnt;

	struct sock		*mc_autojoin_sk;

	struct inet_peer_base	*peers;
	struct fqdir		*fqdir;

	/* ICMP knobs followed by the icmp_global_* credit/stamp state. */
	u8 sysctl_icmp_echo_ignore_all;
	u8 sysctl_icmp_echo_enable_probe;
	u8 sysctl_icmp_echo_ignore_broadcasts;
	u8 sysctl_icmp_ignore_bogus_error_responses;
	u8 sysctl_icmp_errors_use_inbound_ifaddr;
	int sysctl_icmp_ratelimit;
	int sysctl_icmp_ratemask;
	int sysctl_icmp_msgs_per_sec;
	int sysctl_icmp_msgs_burst;
	atomic_t icmp_global_credit;
	u32 icmp_global_stamp;
	u32 ip_rt_min_pmtu;
	int ip_rt_mtu_expires;
	int ip_rt_min_advmss;

	/* Packed low/high pair; see struct local_ports. */
	struct local_ports ip_local_ports;

	u8 sysctl_tcp_ecn;
	u8 sysctl_tcp_ecn_fallback;

	u8 sysctl_ip_default_ttl;
	u8 sysctl_ip_no_pmtu_disc;
	u8 sysctl_ip_fwd_update_priority;
	u8 sysctl_ip_nonlocal_bind;
	u8 sysctl_ip_autobind_reuse;
	/* Shall we try to damage output packets if routing dev changes? */
	u8 sysctl_ip_dynaddr;
#ifdef CONFIG_NET_L3_MASTER_DEV
	u8 sysctl_raw_l3mdev_accept;
#endif
	u8 sysctl_udp_early_demux;

	u8 sysctl_nexthop_compat_mode;

	u8 sysctl_fwmark_reflect;
	u8 sysctl_tcp_fwmark_accept;
	u8 sysctl_tcp_mtu_probing;
	int sysctl_tcp_mtu_probe_floor;
	int sysctl_tcp_base_mss;
	int sysctl_tcp_probe_threshold;
	u32 sysctl_tcp_probe_interval;

	/* TCP keepalive knobs. */
	int sysctl_tcp_keepalive_time;
	int sysctl_tcp_keepalive_intvl;
	u8 sysctl_tcp_keepalive_probes;

	u8 sysctl_tcp_syn_retries;
	u8 sysctl_tcp_synack_retries;
	u8 sysctl_tcp_syncookies;
	u8 sysctl_tcp_migrate_req;
	u8 sysctl_tcp_comp_sack_nr;
	u8 sysctl_tcp_backlog_ack_defer;
	u8 sysctl_tcp_pingpong_thresh;

	u8 sysctl_tcp_retries1;
	u8 sysctl_tcp_retries2;
	u8 sysctl_tcp_orphan_retries;
	u8 sysctl_tcp_tw_reuse;
	unsigned int sysctl_tcp_tw_reuse_delay;
	int sysctl_tcp_fin_timeout;
	u8 sysctl_tcp_sack;
	u8 sysctl_tcp_window_scaling;
	u8 sysctl_tcp_timestamps;
	int sysctl_tcp_rto_min_us;
	int sysctl_tcp_rto_max_ms;
	u8 sysctl_tcp_recovery;
	u8 sysctl_tcp_thin_linear_timeouts;
	u8 sysctl_tcp_slow_start_after_idle;
	u8 sysctl_tcp_retrans_collapse;
	u8 sysctl_tcp_stdurg;
	u8 sysctl_tcp_rfc1337;
	u8 sysctl_tcp_abort_on_overflow;
	u8 sysctl_tcp_fack; /* obsolete */
	int sysctl_tcp_max_reordering;
	int sysctl_tcp_adv_win_scale; /* obsolete */
	u8 sysctl_tcp_dsack;
	u8 sysctl_tcp_app_win;
	u8 sysctl_tcp_frto;
	u8 sysctl_tcp_nometrics_save;
	u8 sysctl_tcp_no_ssthresh_metrics_save;
	u8 sysctl_tcp_workaround_signed_windows;
	int sysctl_tcp_challenge_ack_limit;
	u8 sysctl_tcp_min_tso_segs;
	u8 sysctl_tcp_reflect_tos;
	int sysctl_tcp_invalid_ratelimit;
	int sysctl_tcp_pacing_ss_ratio;
	int sysctl_tcp_pacing_ca_ratio;
	unsigned int sysctl_tcp_child_ehash_entries;
	unsigned long sysctl_tcp_comp_sack_delay_ns;
	unsigned long sysctl_tcp_comp_sack_slack_ns;
	int sysctl_max_syn_backlog;
	int sysctl_tcp_fastopen;
	const struct tcp_congestion_ops __rcu  *tcp_congestion_control;
	struct tcp_fastopen_context __rcu *tcp_fastopen_ctx;
	unsigned int sysctl_tcp_fastopen_blackhole_timeout;
	atomic_t tfo_active_disable_times;
	unsigned long tfo_active_disable_stamp;
	u32 tcp_challenge_timestamp;
	u32 tcp_challenge_count;
	u8 sysctl_tcp_plb_enabled;
	u8 sysctl_tcp_plb_idle_rehash_rounds;
	u8 sysctl_tcp_plb_rehash_rounds;
	u8 sysctl_tcp_plb_suspend_rto_sec;
	int sysctl_tcp_plb_cong_thresh;

	/* UDP wmem/rmem minimum knobs. */
	int sysctl_udp_wmem_min;
	int sysctl_udp_rmem_min;

	u8 sysctl_fib_notify_on_flag_change;
	u8 sysctl_tcp_syn_linear_timeouts;

#ifdef CONFIG_NET_L3_MASTER_DEV
	u8 sysctl_udp_l3mdev_accept;
#endif

	/* IGMP knobs. */
	u8 sysctl_igmp_llm_reports;
	int sysctl_igmp_max_memberships;
	int sysctl_igmp_max_msf;
	int sysctl_igmp_qrv;

	/* Seqlock plus two group IDs; see struct ping_group_range. */
	struct ping_group_range ping_group_range;

	atomic_t dev_addr_genid;

	unsigned int sysctl_udp_child_hash_entries;

#ifdef CONFIG_SYSCTL
	unsigned long *sysctl_local_reserved_ports;
	int sysctl_ip_prot_sock;
#endif

	/* Multicast routing state; only with CONFIG_IP_MROUTE. A single
	 * table pointer is used unless CONFIG_IP_MROUTE_MULTIPLE_TABLES is
	 * set, in which case a list of tables plus rules ops is kept instead.
	 */
#ifdef CONFIG_IP_MROUTE
#ifndef CONFIG_IP_MROUTE_MULTIPLE_TABLES
	struct mr_table		*mrt;
#else
	struct list_head	mr_tables;
	struct fib_rules_ops	*mr_rules_ops;
#endif
#endif
	/* Multipath hash configuration; only with CONFIG_IP_ROUTE_MULTIPATH. */
#ifdef CONFIG_IP_ROUTE_MULTIPATH
	struct sysctl_fib_multipath_hash_seed sysctl_fib_multipath_hash_seed;
	u32 sysctl_fib_multipath_hash_fields;
	u8 sysctl_fib_multipath_use_neigh;
	u8 sysctl_fib_multipath_hash_policy;
#endif

	struct fib_notifier_ops	*notifier_ops;
	unsigned int	fib_seq;	/* writes protected by rtnl_mutex */

	struct fib_notifier_ops	*ipmr_notifier_ops;
	unsigned int	ipmr_seq;	/* protected by rtnl_mutex */

	atomic_t	rt_genid;
	siphash_key_t	ip_id_key;
	struct hlist_head	*inet_addr_lst;
	struct delayed_work	addr_chk_work;
};
290 
291 #endif
292