]>
Commit | Line | Data |
---|---|---|
b2441318 | 1 | // SPDX-License-Identifier: GPL-2.0 |
1da177e4 LT |
2 | /* |
3 | * INET An implementation of the TCP/IP protocol suite for the LINUX | |
4 | * operating system. INET is implemented using the BSD Socket | |
5 | * interface as the means of communication with the user level. | |
6 | * | |
7 | * The IP to API glue. | |
e905a9ed | 8 | * |
1da177e4 LT |
9 | * Authors: see ip.c |
10 | * | |
11 | * Fixes: | |
12 | * Many : Split from ip.c , see ip.c for history. | |
13 | * Martin Mares : TOS setting fixed. | |
e905a9ed | 14 | * Alan Cox : Fixed a couple of oopses in Martin's |
1da177e4 LT |
15 | * TOS tweaks. |
16 | * Mike McLagan : Routing by source | |
17 | */ | |
18 | ||
1da177e4 LT |
19 | #include <linux/module.h> |
20 | #include <linux/types.h> | |
21 | #include <linux/mm.h> | |
1da177e4 LT |
22 | #include <linux/skbuff.h> |
23 | #include <linux/ip.h> | |
24 | #include <linux/icmp.h> | |
14c85021 | 25 | #include <linux/inetdevice.h> |
1da177e4 | 26 | #include <linux/netdevice.h> |
5a0e3ad6 | 27 | #include <linux/slab.h> |
1da177e4 LT |
28 | #include <net/sock.h> |
29 | #include <net/ip.h> | |
30 | #include <net/icmp.h> | |
d83d8461 | 31 | #include <net/tcp_states.h> |
1da177e4 LT |
32 | #include <linux/udp.h> |
33 | #include <linux/igmp.h> | |
34 | #include <linux/netfilter.h> | |
35 | #include <linux/route.h> | |
36 | #include <linux/mroute.h> | |
2c67e9ac | 37 | #include <net/inet_ecn.h> |
1da177e4 LT |
38 | #include <net/route.h> |
39 | #include <net/xfrm.h> | |
dae50295 | 40 | #include <net/compat.h> |
ad6f939a | 41 | #include <net/checksum.h> |
dfd56b8b | 42 | #if IS_ENABLED(CONFIG_IPV6) |
1da177e4 LT |
43 | #include <net/transp_v6.h> |
44 | #endif | |
35ebf65e | 45 | #include <net/ip_fib.h> |
1da177e4 LT |
46 | |
47 | #include <linux/errqueue.h> | |
7c0f6ba6 | 48 | #include <linux/uaccess.h> |
1da177e4 | 49 | |
d2ba09c1 AS |
50 | #include <linux/bpfilter.h> |
51 | ||
1da177e4 LT |
52 | /* |
53 | * SOL_IP control messages. | |
54 | */ | |
55 | ||
56 | static void ip_cmsg_recv_pktinfo(struct msghdr *msg, struct sk_buff *skb) | |
57 | { | |
d826eb14 | 58 | struct in_pktinfo info = *PKTINFO_SKB_CB(skb); |
1da177e4 | 59 | |
eddc9ec5 | 60 | info.ipi_addr.s_addr = ip_hdr(skb)->daddr; |
1da177e4 LT |
61 | |
62 | put_cmsg(msg, SOL_IP, IP_PKTINFO, sizeof(info), &info); | |
63 | } | |
64 | ||
65 | static void ip_cmsg_recv_ttl(struct msghdr *msg, struct sk_buff *skb) | |
66 | { | |
eddc9ec5 | 67 | int ttl = ip_hdr(skb)->ttl; |
1da177e4 LT |
68 | put_cmsg(msg, SOL_IP, IP_TTL, sizeof(int), &ttl); |
69 | } | |
70 | ||
71 | static void ip_cmsg_recv_tos(struct msghdr *msg, struct sk_buff *skb) | |
72 | { | |
eddc9ec5 | 73 | put_cmsg(msg, SOL_IP, IP_TOS, 1, &ip_hdr(skb)->tos); |
1da177e4 LT |
74 | } |
75 | ||
76 | static void ip_cmsg_recv_opts(struct msghdr *msg, struct sk_buff *skb) | |
77 | { | |
78 | if (IPCB(skb)->opt.optlen == 0) | |
79 | return; | |
80 | ||
eddc9ec5 ACM |
81 | put_cmsg(msg, SOL_IP, IP_RECVOPTS, IPCB(skb)->opt.optlen, |
82 | ip_hdr(skb) + 1); | |
1da177e4 LT |
83 | } |
84 | ||
85 | ||
91ed1e66 PA |
86 | static void ip_cmsg_recv_retopts(struct net *net, struct msghdr *msg, |
87 | struct sk_buff *skb) | |
1da177e4 LT |
88 | { |
89 | unsigned char optbuf[sizeof(struct ip_options) + 40]; | |
5e73ea1a | 90 | struct ip_options *opt = (struct ip_options *)optbuf; |
1da177e4 LT |
91 | |
92 | if (IPCB(skb)->opt.optlen == 0) | |
93 | return; | |
94 | ||
91ed1e66 | 95 | if (ip_options_echo(net, opt, skb)) { |
1da177e4 LT |
96 | msg->msg_flags |= MSG_CTRUNC; |
97 | return; | |
98 | } | |
99 | ip_options_undo(opt); | |
100 | ||
101 | put_cmsg(msg, SOL_IP, IP_RETOPTS, opt->optlen, opt->__data); | |
102 | } | |
103 | ||
70ecc248 WB |
104 | static void ip_cmsg_recv_fragsize(struct msghdr *msg, struct sk_buff *skb) |
105 | { | |
106 | int val; | |
107 | ||
108 | if (IPCB(skb)->frag_max_size == 0) | |
109 | return; | |
110 | ||
111 | val = IPCB(skb)->frag_max_size; | |
112 | put_cmsg(msg, SOL_IP, IP_RECVFRAGSIZE, sizeof(val), &val); | |
113 | } | |
114 | ||
ad6f939a | 115 | static void ip_cmsg_recv_checksum(struct msghdr *msg, struct sk_buff *skb, |
10df8e61 | 116 | int tlen, int offset) |
ad6f939a TH |
117 | { |
118 | __wsum csum = skb->csum; | |
119 | ||
120 | if (skb->ip_summed != CHECKSUM_COMPLETE) | |
121 | return; | |
122 | ||
ca4ef457 PA |
123 | if (offset != 0) { |
124 | int tend_off = skb_transport_offset(skb) + tlen; | |
125 | csum = csum_sub(csum, skb_checksum(skb, tend_off, offset, 0)); | |
126 | } | |
ad6f939a TH |
127 | |
128 | put_cmsg(msg, SOL_IP, IP_CHECKSUM, sizeof(__wsum), &csum); | |
129 | } | |
130 | ||
2c7946a7 CZ |
131 | static void ip_cmsg_recv_security(struct msghdr *msg, struct sk_buff *skb) |
132 | { | |
133 | char *secdata; | |
dc49c1f9 | 134 | u32 seclen, secid; |
2c7946a7 CZ |
135 | int err; |
136 | ||
dc49c1f9 CZ |
137 | err = security_socket_getpeersec_dgram(NULL, skb, &secid); |
138 | if (err) | |
139 | return; | |
140 | ||
141 | err = security_secid_to_secctx(secid, &secdata, &seclen); | |
2c7946a7 CZ |
142 | if (err) |
143 | return; | |
144 | ||
145 | put_cmsg(msg, SOL_IP, SCM_SECURITY, seclen, secdata); | |
dc49c1f9 | 146 | security_release_secctx(secdata, seclen); |
2c7946a7 CZ |
147 | } |
148 | ||
21d1a161 | 149 | static void ip_cmsg_recv_dstaddr(struct msghdr *msg, struct sk_buff *skb) |
e8b2dfe9 | 150 | { |
4a06fa67 | 151 | __be16 _ports[2], *ports; |
e8b2dfe9 | 152 | struct sockaddr_in sin; |
e8b2dfe9 BS |
153 | |
154 | /* All current transport protocols have the port numbers in the | |
155 | * first four bytes of the transport header and this function is | |
156 | * written with this assumption in mind. | |
157 | */ | |
4a06fa67 WB |
158 | ports = skb_header_pointer(skb, skb_transport_offset(skb), |
159 | sizeof(_ports), &_ports); | |
160 | if (!ports) | |
161 | return; | |
e8b2dfe9 BS |
162 | |
163 | sin.sin_family = AF_INET; | |
64199fc0 | 164 | sin.sin_addr.s_addr = ip_hdr(skb)->daddr; |
e8b2dfe9 BS |
165 | sin.sin_port = ports[1]; |
166 | memset(sin.sin_zero, 0, sizeof(sin.sin_zero)); | |
167 | ||
168 | put_cmsg(msg, SOL_IP, IP_ORIGDSTADDR, sizeof(sin), &sin); | |
169 | } | |
1da177e4 | 170 | |
ad959036 PA |
171 | void ip_cmsg_recv_offset(struct msghdr *msg, struct sock *sk, |
172 | struct sk_buff *skb, int tlen, int offset) | |
1da177e4 | 173 | { |
ad959036 | 174 | struct inet_sock *inet = inet_sk(sk); |
95c96174 | 175 | unsigned int flags = inet->cmsg_flags; |
1da177e4 LT |
176 | |
177 | /* Ordered by supposed usage frequency */ | |
c44d13d6 | 178 | if (flags & IP_CMSG_PKTINFO) { |
1da177e4 | 179 | ip_cmsg_recv_pktinfo(msg, skb); |
1da177e4 | 180 | |
c44d13d6 TH |
181 | flags &= ~IP_CMSG_PKTINFO; |
182 | if (!flags) | |
183 | return; | |
184 | } | |
185 | ||
186 | if (flags & IP_CMSG_TTL) { | |
1da177e4 | 187 | ip_cmsg_recv_ttl(msg, skb); |
1da177e4 | 188 | |
c44d13d6 TH |
189 | flags &= ~IP_CMSG_TTL; |
190 | if (!flags) | |
191 | return; | |
192 | } | |
193 | ||
194 | if (flags & IP_CMSG_TOS) { | |
1da177e4 | 195 | ip_cmsg_recv_tos(msg, skb); |
1da177e4 | 196 | |
c44d13d6 TH |
197 | flags &= ~IP_CMSG_TOS; |
198 | if (!flags) | |
199 | return; | |
200 | } | |
201 | ||
202 | if (flags & IP_CMSG_RECVOPTS) { | |
1da177e4 | 203 | ip_cmsg_recv_opts(msg, skb); |
1da177e4 | 204 | |
c44d13d6 TH |
205 | flags &= ~IP_CMSG_RECVOPTS; |
206 | if (!flags) | |
207 | return; | |
208 | } | |
209 | ||
210 | if (flags & IP_CMSG_RETOPTS) { | |
91ed1e66 | 211 | ip_cmsg_recv_retopts(sock_net(sk), msg, skb); |
2c7946a7 | 212 | |
c44d13d6 TH |
213 | flags &= ~IP_CMSG_RETOPTS; |
214 | if (!flags) | |
215 | return; | |
216 | } | |
217 | ||
218 | if (flags & IP_CMSG_PASSSEC) { | |
2c7946a7 | 219 | ip_cmsg_recv_security(msg, skb); |
e8b2dfe9 | 220 | |
c44d13d6 TH |
221 | flags &= ~IP_CMSG_PASSSEC; |
222 | if (!flags) | |
223 | return; | |
224 | } | |
225 | ||
ad6f939a | 226 | if (flags & IP_CMSG_ORIGDSTADDR) { |
e8b2dfe9 BS |
227 | ip_cmsg_recv_dstaddr(msg, skb); |
228 | ||
ad6f939a TH |
229 | flags &= ~IP_CMSG_ORIGDSTADDR; |
230 | if (!flags) | |
231 | return; | |
232 | } | |
233 | ||
234 | if (flags & IP_CMSG_CHECKSUM) | |
10df8e61 | 235 | ip_cmsg_recv_checksum(msg, skb, tlen, offset); |
70ecc248 WB |
236 | |
237 | if (flags & IP_CMSG_RECVFRAGSIZE) | |
238 | ip_cmsg_recv_fragsize(msg, skb); | |
1da177e4 | 239 | } |
5961de9f | 240 | EXPORT_SYMBOL(ip_cmsg_recv_offset); |
1da177e4 | 241 | |
24025c46 | 242 | int ip_cmsg_send(struct sock *sk, struct msghdr *msg, struct ipcm_cookie *ipc, |
c8e6ad08 | 243 | bool allow_ipv6) |
1da177e4 | 244 | { |
f02db315 | 245 | int err, val; |
1da177e4 | 246 | struct cmsghdr *cmsg; |
24025c46 | 247 | struct net *net = sock_net(sk); |
1da177e4 | 248 | |
f95b414e | 249 | for_each_cmsghdr(cmsg, msg) { |
1da177e4 LT |
250 | if (!CMSG_OK(msg, cmsg)) |
251 | return -EINVAL; | |
5337b5b7 | 252 | #if IS_ENABLED(CONFIG_IPV6) |
c8e6ad08 HFS |
253 | if (allow_ipv6 && |
254 | cmsg->cmsg_level == SOL_IPV6 && | |
255 | cmsg->cmsg_type == IPV6_PKTINFO) { | |
256 | struct in6_pktinfo *src_info; | |
257 | ||
258 | if (cmsg->cmsg_len < CMSG_LEN(sizeof(*src_info))) | |
259 | return -EINVAL; | |
260 | src_info = (struct in6_pktinfo *)CMSG_DATA(cmsg); | |
261 | if (!ipv6_addr_v4mapped(&src_info->ipi6_addr)) | |
262 | return -EINVAL; | |
1cbec076 DA |
263 | if (src_info->ipi6_ifindex) |
264 | ipc->oif = src_info->ipi6_ifindex; | |
c8e6ad08 HFS |
265 | ipc->addr = src_info->ipi6_addr.s6_addr32[3]; |
266 | continue; | |
267 | } | |
268 | #endif | |
24025c46 | 269 | if (cmsg->cmsg_level == SOL_SOCKET) { |
2632616b ED |
270 | err = __sock_cmsg_send(sk, msg, cmsg, &ipc->sockc); |
271 | if (err) | |
272 | return err; | |
24025c46 SHY |
273 | continue; |
274 | } | |
275 | ||
1da177e4 LT |
276 | if (cmsg->cmsg_level != SOL_IP) |
277 | continue; | |
278 | switch (cmsg->cmsg_type) { | |
279 | case IP_RETOPTS: | |
1ff8cebf | 280 | err = cmsg->cmsg_len - sizeof(struct cmsghdr); |
91948309 ED |
281 | |
282 | /* Our caller is responsible for freeing ipc->opt */ | |
de40a3e8 CH |
283 | err = ip_options_get(net, &ipc->opt, |
284 | KERNEL_SOCKPTR(CMSG_DATA(cmsg)), | |
4d52cfbe | 285 | err < 40 ? err : 40); |
1da177e4 LT |
286 | if (err) |
287 | return err; | |
288 | break; | |
289 | case IP_PKTINFO: | |
290 | { | |
291 | struct in_pktinfo *info; | |
292 | if (cmsg->cmsg_len != CMSG_LEN(sizeof(struct in_pktinfo))) | |
293 | return -EINVAL; | |
294 | info = (struct in_pktinfo *)CMSG_DATA(cmsg); | |
1cbec076 DA |
295 | if (info->ipi_ifindex) |
296 | ipc->oif = info->ipi_ifindex; | |
1da177e4 LT |
297 | ipc->addr = info->ipi_spec_dst.s_addr; |
298 | break; | |
299 | } | |
f02db315 FF |
300 | case IP_TTL: |
301 | if (cmsg->cmsg_len != CMSG_LEN(sizeof(int))) | |
302 | return -EINVAL; | |
303 | val = *(int *)CMSG_DATA(cmsg); | |
304 | if (val < 1 || val > 255) | |
305 | return -EINVAL; | |
306 | ipc->ttl = val; | |
307 | break; | |
308 | case IP_TOS: | |
e895cdce ED |
309 | if (cmsg->cmsg_len == CMSG_LEN(sizeof(int))) |
310 | val = *(int *)CMSG_DATA(cmsg); | |
311 | else if (cmsg->cmsg_len == CMSG_LEN(sizeof(u8))) | |
312 | val = *(u8 *)CMSG_DATA(cmsg); | |
313 | else | |
f02db315 | 314 | return -EINVAL; |
f02db315 FF |
315 | if (val < 0 || val > 255) |
316 | return -EINVAL; | |
317 | ipc->tos = val; | |
318 | ipc->priority = rt_tos2priority(ipc->tos); | |
319 | break; | |
320 | ||
1da177e4 LT |
321 | default: |
322 | return -EINVAL; | |
323 | } | |
324 | } | |
325 | return 0; | |
326 | } | |
327 | ||
592fcb9d | 328 | static void ip_ra_destroy_rcu(struct rcu_head *head) |
66018506 | 329 | { |
592fcb9d ED |
330 | struct ip_ra_chain *ra = container_of(head, struct ip_ra_chain, rcu); |
331 | ||
332 | sock_put(ra->saved_sk); | |
333 | kfree(ra); | |
66018506 | 334 | } |
1da177e4 | 335 | |
4d52cfbe ED |
336 | int ip_ra_control(struct sock *sk, unsigned char on, |
337 | void (*destructor)(struct sock *)) | |
1da177e4 | 338 | { |
43a951e9 ED |
339 | struct ip_ra_chain *ra, *new_ra; |
340 | struct ip_ra_chain __rcu **rap; | |
5796ef75 | 341 | struct net *net = sock_net(sk); |
1da177e4 | 342 | |
c720c7e8 | 343 | if (sk->sk_type != SOCK_RAW || inet_sk(sk)->inet_num == IPPROTO_RAW) |
1da177e4 LT |
344 | return -EINVAL; |
345 | ||
346 | new_ra = on ? kmalloc(sizeof(*new_ra), GFP_KERNEL) : NULL; | |
425aa0e1 GZ |
347 | if (on && !new_ra) |
348 | return -ENOMEM; | |
1da177e4 | 349 | |
d9ff3049 | 350 | mutex_lock(&net->ipv4.ra_mutex); |
5796ef75 | 351 | for (rap = &net->ipv4.ra_chain; |
76d3e153 | 352 | (ra = rcu_dereference_protected(*rap, |
d9ff3049 | 353 | lockdep_is_held(&net->ipv4.ra_mutex))) != NULL; |
43a951e9 | 354 | rap = &ra->next) { |
1da177e4 LT |
355 | if (ra->sk == sk) { |
356 | if (on) { | |
d9ff3049 | 357 | mutex_unlock(&net->ipv4.ra_mutex); |
a51482bd | 358 | kfree(new_ra); |
1da177e4 LT |
359 | return -EADDRINUSE; |
360 | } | |
592fcb9d ED |
361 | /* dont let ip_call_ra_chain() use sk again */ |
362 | ra->sk = NULL; | |
8e380f00 | 363 | RCU_INIT_POINTER(*rap, ra->next); |
d9ff3049 | 364 | mutex_unlock(&net->ipv4.ra_mutex); |
1da177e4 LT |
365 | |
366 | if (ra->destructor) | |
367 | ra->destructor(sk); | |
592fcb9d ED |
368 | /* |
369 | * Delay sock_put(sk) and kfree(ra) after one rcu grace | |
370 | * period. This guarantee ip_call_ra_chain() dont need | |
371 | * to mess with socket refcounts. | |
372 | */ | |
373 | ra->saved_sk = sk; | |
374 | call_rcu(&ra->rcu, ip_ra_destroy_rcu); | |
1da177e4 LT |
375 | return 0; |
376 | } | |
377 | } | |
76d3e153 | 378 | if (!new_ra) { |
d9ff3049 | 379 | mutex_unlock(&net->ipv4.ra_mutex); |
1da177e4 | 380 | return -ENOBUFS; |
76d3e153 | 381 | } |
1da177e4 LT |
382 | new_ra->sk = sk; |
383 | new_ra->destructor = destructor; | |
384 | ||
8e380f00 | 385 | RCU_INIT_POINTER(new_ra->next, ra); |
66018506 | 386 | rcu_assign_pointer(*rap, new_ra); |
1da177e4 | 387 | sock_hold(sk); |
d9ff3049 | 388 | mutex_unlock(&net->ipv4.ra_mutex); |
1da177e4 LT |
389 | |
390 | return 0; | |
391 | } | |
392 | ||
178c49d9 WB |
393 | static void ipv4_icmp_error_rfc4884(const struct sk_buff *skb, |
394 | struct sock_ee_data_rfc4884 *out) | |
395 | { | |
396 | switch (icmp_hdr(skb)->type) { | |
397 | case ICMP_DEST_UNREACH: | |
398 | case ICMP_TIME_EXCEEDED: | |
399 | case ICMP_PARAMETERPROB: | |
400 | ip_icmp_error_rfc4884(skb, out, sizeof(struct icmphdr), | |
401 | icmp_hdr(skb)->un.reserved[1] * 4); | |
402 | } | |
403 | } | |
404 | ||
e905a9ed | 405 | void ip_icmp_error(struct sock *sk, struct sk_buff *skb, int err, |
35986b32 | 406 | __be16 port, u32 info, u8 *payload) |
1da177e4 | 407 | { |
1da177e4 LT |
408 | struct sock_exterr_skb *serr; |
409 | ||
1da177e4 LT |
410 | skb = skb_clone(skb, GFP_ATOMIC); |
411 | if (!skb) | |
412 | return; | |
413 | ||
e905a9ed | 414 | serr = SKB_EXT_ERR(skb); |
1da177e4 LT |
415 | serr->ee.ee_errno = err; |
416 | serr->ee.ee_origin = SO_EE_ORIGIN_ICMP; | |
88c7664f ACM |
417 | serr->ee.ee_type = icmp_hdr(skb)->type; |
418 | serr->ee.ee_code = icmp_hdr(skb)->code; | |
1da177e4 LT |
419 | serr->ee.ee_pad = 0; |
420 | serr->ee.ee_info = info; | |
421 | serr->ee.ee_data = 0; | |
88c7664f | 422 | serr->addr_offset = (u8 *)&(((struct iphdr *)(icmp_hdr(skb) + 1))->daddr) - |
d56f90a7 | 423 | skb_network_header(skb); |
1da177e4 LT |
424 | serr->port = port; |
425 | ||
00db4124 | 426 | if (skb_pull(skb, payload - skb->data)) { |
eba75c58 | 427 | if (inet_sk(sk)->recverr_rfc4884) |
178c49d9 | 428 | ipv4_icmp_error_rfc4884(skb, &serr->ee.ee_rfc4884); |
eba75c58 | 429 | |
bd82393c ACM |
430 | skb_reset_transport_header(skb); |
431 | if (sock_queue_err_skb(sk, skb) == 0) | |
432 | return; | |
433 | } | |
434 | kfree_skb(skb); | |
1da177e4 LT |
435 | } |
436 | ||
0579016e | 437 | void ip_local_error(struct sock *sk, int err, __be32 daddr, __be16 port, u32 info) |
1da177e4 LT |
438 | { |
439 | struct inet_sock *inet = inet_sk(sk); | |
440 | struct sock_exterr_skb *serr; | |
441 | struct iphdr *iph; | |
442 | struct sk_buff *skb; | |
443 | ||
444 | if (!inet->recverr) | |
445 | return; | |
446 | ||
447 | skb = alloc_skb(sizeof(struct iphdr), GFP_ATOMIC); | |
448 | if (!skb) | |
449 | return; | |
450 | ||
2ca9e6f2 ACM |
451 | skb_put(skb, sizeof(struct iphdr)); |
452 | skb_reset_network_header(skb); | |
eddc9ec5 | 453 | iph = ip_hdr(skb); |
1da177e4 LT |
454 | iph->daddr = daddr; |
455 | ||
e905a9ed | 456 | serr = SKB_EXT_ERR(skb); |
1da177e4 LT |
457 | serr->ee.ee_errno = err; |
458 | serr->ee.ee_origin = SO_EE_ORIGIN_LOCAL; | |
e905a9ed | 459 | serr->ee.ee_type = 0; |
1da177e4 LT |
460 | serr->ee.ee_code = 0; |
461 | serr->ee.ee_pad = 0; | |
462 | serr->ee.ee_info = info; | |
463 | serr->ee.ee_data = 0; | |
d56f90a7 | 464 | serr->addr_offset = (u8 *)&iph->daddr - skb_network_header(skb); |
1da177e4 LT |
465 | serr->port = port; |
466 | ||
27a884dc | 467 | __skb_pull(skb, skb_tail_pointer(skb) - skb->data); |
bd82393c | 468 | skb_reset_transport_header(skb); |
1da177e4 LT |
469 | |
470 | if (sock_queue_err_skb(sk, skb)) | |
471 | kfree_skb(skb); | |
472 | } | |
473 | ||
34b99df4 JA |
474 | /* For some errors we have valid addr_offset even with zero payload and |
475 | * zero port. Also, addr_offset should be supported if port is set. | |
476 | */ | |
477 | static inline bool ipv4_datagram_support_addr(struct sock_exterr_skb *serr) | |
478 | { | |
479 | return serr->ee.ee_origin == SO_EE_ORIGIN_ICMP || | |
480 | serr->ee.ee_origin == SO_EE_ORIGIN_LOCAL || serr->port; | |
481 | } | |
482 | ||
c247f053 WB |
483 | /* IPv4 supports cmsg on all imcp errors and some timestamps |
484 | * | |
485 | * Timestamp code paths do not initialize the fields expected by cmsg: | |
486 | * the PKTINFO fields in skb->cb[]. Fill those in here. | |
487 | */ | |
488 | static bool ipv4_datagram_support_cmsg(const struct sock *sk, | |
489 | struct sk_buff *skb, | |
490 | int ee_origin) | |
829ae9d6 | 491 | { |
c247f053 WB |
492 | struct in_pktinfo *info; |
493 | ||
494 | if (ee_origin == SO_EE_ORIGIN_ICMP) | |
495 | return true; | |
829ae9d6 | 496 | |
c247f053 WB |
497 | if (ee_origin == SO_EE_ORIGIN_LOCAL) |
498 | return false; | |
499 | ||
500 | /* Support IP_PKTINFO on tstamp packets if requested, to correlate | |
1862d620 | 501 | * timestamp with egress dev. Not possible for packets without iif |
c247f053 WB |
502 | * or without payload (SOF_TIMESTAMPING_OPT_TSONLY). |
503 | */ | |
1862d620 WB |
504 | info = PKTINFO_SKB_CB(skb); |
505 | if (!(sk->sk_tsflags & SOF_TIMESTAMPING_OPT_CMSG) || | |
506 | !info->ipi_ifindex) | |
829ae9d6 WB |
507 | return false; |
508 | ||
509 | info->ipi_spec_dst.s_addr = ip_hdr(skb)->saddr; | |
829ae9d6 WB |
510 | return true; |
511 | } | |
512 | ||
e905a9ed | 513 | /* |
1da177e4 LT |
514 | * Handle MSG_ERRQUEUE |
515 | */ | |
85fbaa75 | 516 | int ip_recv_error(struct sock *sk, struct msghdr *msg, int len, int *addr_len) |
1da177e4 LT |
517 | { |
518 | struct sock_exterr_skb *serr; | |
364a9e93 | 519 | struct sk_buff *skb; |
342dfc30 | 520 | DECLARE_SOCKADDR(struct sockaddr_in *, sin, msg->msg_name); |
1da177e4 LT |
521 | struct { |
522 | struct sock_extended_err ee; | |
523 | struct sockaddr_in offender; | |
524 | } errhdr; | |
525 | int err; | |
526 | int copied; | |
527 | ||
528 | err = -EAGAIN; | |
364a9e93 | 529 | skb = sock_dequeue_err_skb(sk); |
51456b29 | 530 | if (!skb) |
1da177e4 LT |
531 | goto out; |
532 | ||
533 | copied = skb->len; | |
534 | if (copied > len) { | |
535 | msg->msg_flags |= MSG_TRUNC; | |
536 | copied = len; | |
537 | } | |
51f3d02b | 538 | err = skb_copy_datagram_msg(skb, 0, msg, copied); |
960a2628 ED |
539 | if (unlikely(err)) { |
540 | kfree_skb(skb); | |
541 | return err; | |
542 | } | |
1da177e4 LT |
543 | sock_recv_timestamp(msg, sk, skb); |
544 | ||
545 | serr = SKB_EXT_ERR(skb); | |
546 | ||
34b99df4 | 547 | if (sin && ipv4_datagram_support_addr(serr)) { |
1da177e4 | 548 | sin->sin_family = AF_INET; |
d56f90a7 ACM |
549 | sin->sin_addr.s_addr = *(__be32 *)(skb_network_header(skb) + |
550 | serr->addr_offset); | |
1da177e4 LT |
551 | sin->sin_port = serr->port; |
552 | memset(&sin->sin_zero, 0, sizeof(sin->sin_zero)); | |
85fbaa75 | 553 | *addr_len = sizeof(*sin); |
1da177e4 LT |
554 | } |
555 | ||
556 | memcpy(&errhdr.ee, &serr->ee, sizeof(struct sock_extended_err)); | |
557 | sin = &errhdr.offender; | |
f812116b | 558 | memset(sin, 0, sizeof(*sin)); |
829ae9d6 | 559 | |
c247f053 | 560 | if (ipv4_datagram_support_cmsg(sk, skb, serr->ee.ee_origin)) { |
1da177e4 | 561 | sin->sin_family = AF_INET; |
eddc9ec5 | 562 | sin->sin_addr.s_addr = ip_hdr(skb)->saddr; |
f812116b | 563 | if (inet_sk(sk)->cmsg_flags) |
1da177e4 LT |
564 | ip_cmsg_recv(msg, skb); |
565 | } | |
566 | ||
567 | put_cmsg(msg, SOL_IP, IP_RECVERR, sizeof(errhdr), &errhdr); | |
568 | ||
569 | /* Now we could try to dump offended packet options */ | |
570 | ||
571 | msg->msg_flags |= MSG_ERRQUEUE; | |
572 | err = copied; | |
573 | ||
960a2628 | 574 | consume_skb(skb); |
1da177e4 LT |
575 | out: |
576 | return err; | |
577 | } | |
578 | ||
4f47d5d5 | 579 | void __ip_sock_set_tos(struct sock *sk, int val) |
6ebf71ba CH |
580 | { |
581 | if (sk->sk_type == SOCK_STREAM) { | |
582 | val &= ~INET_ECN_MASK; | |
583 | val |= inet_sk(sk)->tos & INET_ECN_MASK; | |
584 | } | |
585 | if (inet_sk(sk)->tos != val) { | |
586 | inet_sk(sk)->tos = val; | |
587 | sk->sk_priority = rt_tos2priority(val); | |
588 | sk_dst_reset(sk); | |
589 | } | |
590 | } | |
591 | ||
/* Set the socket's TOS to @val while holding the socket lock. */
void ip_sock_set_tos(struct sock *sk, int val)
{
	lock_sock(sk);

	__ip_sock_set_tos(sk, val);

	release_sock(sk);
}
EXPORT_SYMBOL(ip_sock_set_tos);
1da177e4 | 599 | |
c4e446bf CH |
600 | void ip_sock_set_freebind(struct sock *sk) |
601 | { | |
602 | lock_sock(sk); | |
603 | inet_sk(sk)->freebind = true; | |
604 | release_sock(sk); | |
605 | } | |
606 | EXPORT_SYMBOL(ip_sock_set_freebind); | |
607 | ||
db45c0ef CH |
608 | void ip_sock_set_recverr(struct sock *sk) |
609 | { | |
610 | lock_sock(sk); | |
611 | inet_sk(sk)->recverr = true; | |
612 | release_sock(sk); | |
613 | } | |
614 | EXPORT_SYMBOL(ip_sock_set_recverr); | |
615 | ||
2de569bd CH |
616 | int ip_sock_set_mtu_discover(struct sock *sk, int val) |
617 | { | |
618 | if (val < IP_PMTUDISC_DONT || val > IP_PMTUDISC_OMIT) | |
619 | return -EINVAL; | |
620 | lock_sock(sk); | |
621 | inet_sk(sk)->pmtudisc = val; | |
622 | release_sock(sk); | |
623 | return 0; | |
624 | } | |
625 | EXPORT_SYMBOL(ip_sock_set_mtu_discover); | |
626 | ||
c1f9ec57 CH |
627 | void ip_sock_set_pktinfo(struct sock *sk) |
628 | { | |
629 | lock_sock(sk); | |
630 | inet_sk(sk)->cmsg_flags |= IP_CMSG_PKTINFO; | |
631 | release_sock(sk); | |
632 | } | |
633 | EXPORT_SYMBOL(ip_sock_set_pktinfo); | |
634 | ||
1da177e4 | 635 | /* |
4d52cfbe ED |
636 | * Socket option code for IP. This is the end of the line after any |
637 | * TCP,UDP etc options on an IP socket. | |
1da177e4 | 638 | */ |
baf606d9 MRL |
639 | static bool setsockopt_needs_rtnl(int optname) |
640 | { | |
641 | switch (optname) { | |
642 | case IP_ADD_MEMBERSHIP: | |
643 | case IP_ADD_SOURCE_MEMBERSHIP: | |
54ff9ef3 | 644 | case IP_BLOCK_SOURCE: |
baf606d9 | 645 | case IP_DROP_MEMBERSHIP: |
54ff9ef3 MRL |
646 | case IP_DROP_SOURCE_MEMBERSHIP: |
647 | case IP_MSFILTER: | |
648 | case IP_UNBLOCK_SOURCE: | |
649 | case MCAST_BLOCK_SOURCE: | |
650 | case MCAST_MSFILTER: | |
baf606d9 | 651 | case MCAST_JOIN_GROUP: |
54ff9ef3 | 652 | case MCAST_JOIN_SOURCE_GROUP: |
baf606d9 | 653 | case MCAST_LEAVE_GROUP: |
54ff9ef3 MRL |
654 | case MCAST_LEAVE_SOURCE_GROUP: |
655 | case MCAST_UNBLOCK_SOURCE: | |
baf606d9 MRL |
656 | return true; |
657 | } | |
658 | return false; | |
659 | } | |
1da177e4 | 660 | |
e986d4da AV |
661 | static int set_mcast_msfilter(struct sock *sk, int ifindex, |
662 | int numsrc, int fmode, | |
663 | struct sockaddr_storage *group, | |
664 | struct sockaddr_storage *list) | |
665 | { | |
e986d4da AV |
666 | struct ip_msfilter *msf; |
667 | struct sockaddr_in *psin; | |
668 | int err, i; | |
669 | ||
4167a960 | 670 | msf = kmalloc(IP_MSFILTER_SIZE(numsrc), GFP_KERNEL); |
e986d4da AV |
671 | if (!msf) |
672 | return -ENOBUFS; | |
673 | ||
674 | psin = (struct sockaddr_in *)group; | |
675 | if (psin->sin_family != AF_INET) | |
676 | goto Eaddrnotavail; | |
677 | msf->imsf_multiaddr = psin->sin_addr.s_addr; | |
678 | msf->imsf_interface = 0; | |
679 | msf->imsf_fmode = fmode; | |
680 | msf->imsf_numsrc = numsrc; | |
681 | for (i = 0; i < numsrc; ++i) { | |
682 | psin = (struct sockaddr_in *)&list[i]; | |
683 | ||
684 | if (psin->sin_family != AF_INET) | |
685 | goto Eaddrnotavail; | |
2d3e5caf | 686 | msf->imsf_slist_flex[i] = psin->sin_addr.s_addr; |
e986d4da AV |
687 | } |
688 | err = ip_mc_msfilter(sk, msf, ifindex); | |
689 | kfree(msf); | |
690 | return err; | |
691 | ||
692 | Eaddrnotavail: | |
693 | kfree(msf); | |
694 | return -EADDRNOTAVAIL; | |
695 | } | |
696 | ||
89654c5f CH |
697 | static int copy_group_source_from_sockptr(struct group_source_req *greqs, |
698 | sockptr_t optval, int optlen) | |
b6238c04 CH |
699 | { |
700 | if (in_compat_syscall()) { | |
701 | struct compat_group_source_req gr32; | |
702 | ||
703 | if (optlen != sizeof(gr32)) | |
704 | return -EINVAL; | |
89654c5f | 705 | if (copy_from_sockptr(&gr32, optval, sizeof(gr32))) |
b6238c04 CH |
706 | return -EFAULT; |
707 | greqs->gsr_interface = gr32.gsr_interface; | |
708 | greqs->gsr_group = gr32.gsr_group; | |
709 | greqs->gsr_source = gr32.gsr_source; | |
710 | } else { | |
711 | if (optlen != sizeof(*greqs)) | |
712 | return -EINVAL; | |
89654c5f | 713 | if (copy_from_sockptr(greqs, optval, sizeof(*greqs))) |
b6238c04 CH |
714 | return -EFAULT; |
715 | } | |
716 | ||
717 | return 0; | |
718 | } | |
719 | ||
2bbf8c1e | 720 | static int do_mcast_group_source(struct sock *sk, int optname, |
89654c5f | 721 | sockptr_t optval, int optlen) |
2bbf8c1e | 722 | { |
b6238c04 | 723 | struct group_source_req greqs; |
2bbf8c1e AV |
724 | struct ip_mreq_source mreqs; |
725 | struct sockaddr_in *psin; | |
726 | int omode, add, err; | |
727 | ||
89654c5f | 728 | err = copy_group_source_from_sockptr(&greqs, optval, optlen); |
b6238c04 CH |
729 | if (err) |
730 | return err; | |
731 | ||
732 | if (greqs.gsr_group.ss_family != AF_INET || | |
733 | greqs.gsr_source.ss_family != AF_INET) | |
2bbf8c1e AV |
734 | return -EADDRNOTAVAIL; |
735 | ||
b6238c04 | 736 | psin = (struct sockaddr_in *)&greqs.gsr_group; |
2bbf8c1e | 737 | mreqs.imr_multiaddr = psin->sin_addr.s_addr; |
b6238c04 | 738 | psin = (struct sockaddr_in *)&greqs.gsr_source; |
2bbf8c1e AV |
739 | mreqs.imr_sourceaddr = psin->sin_addr.s_addr; |
740 | mreqs.imr_interface = 0; /* use index for mc_source */ | |
741 | ||
742 | if (optname == MCAST_BLOCK_SOURCE) { | |
743 | omode = MCAST_EXCLUDE; | |
744 | add = 1; | |
745 | } else if (optname == MCAST_UNBLOCK_SOURCE) { | |
746 | omode = MCAST_EXCLUDE; | |
747 | add = 0; | |
748 | } else if (optname == MCAST_JOIN_SOURCE_GROUP) { | |
749 | struct ip_mreqn mreq; | |
750 | ||
b6238c04 | 751 | psin = (struct sockaddr_in *)&greqs.gsr_group; |
2bbf8c1e AV |
752 | mreq.imr_multiaddr = psin->sin_addr; |
753 | mreq.imr_address.s_addr = 0; | |
b6238c04 | 754 | mreq.imr_ifindex = greqs.gsr_interface; |
2bbf8c1e AV |
755 | err = ip_mc_join_group_ssm(sk, &mreq, MCAST_INCLUDE); |
756 | if (err && err != -EADDRINUSE) | |
757 | return err; | |
b6238c04 | 758 | greqs.gsr_interface = mreq.imr_ifindex; |
2bbf8c1e AV |
759 | omode = MCAST_INCLUDE; |
760 | add = 1; | |
761 | } else /* MCAST_LEAVE_SOURCE_GROUP */ { | |
762 | omode = MCAST_INCLUDE; | |
763 | add = 0; | |
764 | } | |
b6238c04 | 765 | return ip_mc_source(add, omode, sk, &mreqs, greqs.gsr_interface); |
2bbf8c1e AV |
766 | } |
767 | ||
89654c5f | 768 | static int ip_set_mcast_msfilter(struct sock *sk, sockptr_t optval, int optlen) |
d62c38f6 CH |
769 | { |
770 | struct group_filter *gsf = NULL; | |
771 | int err; | |
772 | ||
773 | if (optlen < GROUP_FILTER_SIZE(0)) | |
774 | return -EINVAL; | |
7de6d09f | 775 | if (optlen > READ_ONCE(sysctl_optmem_max)) |
d62c38f6 CH |
776 | return -ENOBUFS; |
777 | ||
89654c5f | 778 | gsf = memdup_sockptr(optval, optlen); |
d62c38f6 CH |
779 | if (IS_ERR(gsf)) |
780 | return PTR_ERR(gsf); | |
781 | ||
782 | /* numsrc >= (4G-140)/128 overflow in 32 bits */ | |
783 | err = -ENOBUFS; | |
784 | if (gsf->gf_numsrc >= 0x1ffffff || | |
6ae0f2e5 | 785 | gsf->gf_numsrc > READ_ONCE(sock_net(sk)->ipv4.sysctl_igmp_max_msf)) |
d62c38f6 CH |
786 | goto out_free_gsf; |
787 | ||
788 | err = -EINVAL; | |
789 | if (GROUP_FILTER_SIZE(gsf->gf_numsrc) > optlen) | |
790 | goto out_free_gsf; | |
791 | ||
792 | err = set_mcast_msfilter(sk, gsf->gf_interface, gsf->gf_numsrc, | |
db243b79 GS |
793 | gsf->gf_fmode, &gsf->gf_group, |
794 | gsf->gf_slist_flex); | |
d62c38f6 CH |
795 | out_free_gsf: |
796 | kfree(gsf); | |
797 | return err; | |
798 | } | |
799 | ||
89654c5f | 800 | static int compat_ip_set_mcast_msfilter(struct sock *sk, sockptr_t optval, |
d62c38f6 CH |
801 | int optlen) |
802 | { | |
db243b79 | 803 | const int size0 = offsetof(struct compat_group_filter, gf_slist_flex); |
d62c38f6 CH |
804 | struct compat_group_filter *gf32; |
805 | unsigned int n; | |
806 | void *p; | |
807 | int err; | |
808 | ||
809 | if (optlen < size0) | |
810 | return -EINVAL; | |
7de6d09f | 811 | if (optlen > READ_ONCE(sysctl_optmem_max) - 4) |
d62c38f6 CH |
812 | return -ENOBUFS; |
813 | ||
814 | p = kmalloc(optlen + 4, GFP_KERNEL); | |
815 | if (!p) | |
816 | return -ENOMEM; | |
db243b79 | 817 | gf32 = p + 4; /* we want ->gf_group and ->gf_slist_flex aligned */ |
d62c38f6 CH |
818 | |
819 | err = -EFAULT; | |
89654c5f | 820 | if (copy_from_sockptr(gf32, optval, optlen)) |
d62c38f6 CH |
821 | goto out_free_gsf; |
822 | ||
823 | /* numsrc >= (4G-140)/128 overflow in 32 bits */ | |
824 | n = gf32->gf_numsrc; | |
825 | err = -ENOBUFS; | |
826 | if (n >= 0x1ffffff) | |
827 | goto out_free_gsf; | |
828 | ||
829 | err = -EINVAL; | |
db243b79 | 830 | if (offsetof(struct compat_group_filter, gf_slist_flex[n]) > optlen) |
d62c38f6 CH |
831 | goto out_free_gsf; |
832 | ||
d62c38f6 CH |
833 | /* numsrc >= (4G-140)/128 overflow in 32 bits */ |
834 | err = -ENOBUFS; | |
6ae0f2e5 | 835 | if (n > READ_ONCE(sock_net(sk)->ipv4.sysctl_igmp_max_msf)) |
b6238c04 | 836 | goto out_free_gsf; |
d62c38f6 | 837 | err = set_mcast_msfilter(sk, gf32->gf_interface, n, gf32->gf_fmode, |
db243b79 | 838 | &gf32->gf_group, gf32->gf_slist_flex); |
d62c38f6 CH |
839 | out_free_gsf: |
840 | kfree(p); | |
841 | return err; | |
842 | } | |
d62c38f6 | 843 | |
02caad7c | 844 | static int ip_mcast_join_leave(struct sock *sk, int optname, |
89654c5f | 845 | sockptr_t optval, int optlen) |
02caad7c CH |
846 | { |
847 | struct ip_mreqn mreq = { }; | |
848 | struct sockaddr_in *psin; | |
849 | struct group_req greq; | |
850 | ||
851 | if (optlen < sizeof(struct group_req)) | |
852 | return -EINVAL; | |
89654c5f | 853 | if (copy_from_sockptr(&greq, optval, sizeof(greq))) |
02caad7c CH |
854 | return -EFAULT; |
855 | ||
856 | psin = (struct sockaddr_in *)&greq.gr_group; | |
857 | if (psin->sin_family != AF_INET) | |
858 | return -EINVAL; | |
859 | mreq.imr_multiaddr = psin->sin_addr; | |
860 | mreq.imr_ifindex = greq.gr_interface; | |
861 | if (optname == MCAST_JOIN_GROUP) | |
862 | return ip_mc_join_group(sk, &mreq); | |
863 | return ip_mc_leave_group(sk, &mreq); | |
864 | } | |
865 | ||
02caad7c | 866 | static int compat_ip_mcast_join_leave(struct sock *sk, int optname, |
89654c5f | 867 | sockptr_t optval, int optlen) |
02caad7c CH |
868 | { |
869 | struct compat_group_req greq; | |
870 | struct ip_mreqn mreq = { }; | |
871 | struct sockaddr_in *psin; | |
02caad7c CH |
872 | |
873 | if (optlen < sizeof(struct compat_group_req)) | |
874 | return -EINVAL; | |
89654c5f | 875 | if (copy_from_sockptr(&greq, optval, sizeof(greq))) |
02caad7c CH |
876 | return -EFAULT; |
877 | ||
878 | psin = (struct sockaddr_in *)&greq.gr_group; | |
879 | if (psin->sin_family != AF_INET) | |
880 | return -EINVAL; | |
881 | mreq.imr_multiaddr = psin->sin_addr; | |
882 | mreq.imr_ifindex = greq.gr_interface; | |
883 | ||
02caad7c | 884 | if (optname == MCAST_JOIN_GROUP) |
b6238c04 CH |
885 | return ip_mc_join_group(sk, &mreq); |
886 | return ip_mc_leave_group(sk, &mreq); | |
02caad7c | 887 | } |
02caad7c | 888 | |
/* Static key, initially false.  do_ip_setsockopt() enables it when an
 * IP_MINTTL request carries a non-zero value.
 */
DEFINE_STATIC_KEY_FALSE(ip4_min_ttl);
890 | ||
89654c5f CH |
891 | static int do_ip_setsockopt(struct sock *sk, int level, int optname, |
892 | sockptr_t optval, unsigned int optlen) | |
1da177e4 LT |
893 | { |
894 | struct inet_sock *inet = inet_sk(sk); | |
166b6b2d | 895 | struct net *net = sock_net(sk); |
09cb105e | 896 | int val = 0, err; |
baf606d9 | 897 | bool needs_rtnl = setsockopt_needs_rtnl(optname); |
1da177e4 | 898 | |
0c9f79be XW |
899 | switch (optname) { |
900 | case IP_PKTINFO: | |
901 | case IP_RECVTTL: | |
902 | case IP_RECVOPTS: | |
903 | case IP_RECVTOS: | |
904 | case IP_RETOPTS: | |
905 | case IP_TOS: | |
906 | case IP_TTL: | |
907 | case IP_HDRINCL: | |
908 | case IP_MTU_DISCOVER: | |
909 | case IP_RECVERR: | |
910 | case IP_ROUTER_ALERT: | |
911 | case IP_FREEBIND: | |
912 | case IP_PASSSEC: | |
913 | case IP_TRANSPARENT: | |
914 | case IP_MINTTL: | |
915 | case IP_NODEFRAG: | |
90c337da | 916 | case IP_BIND_ADDRESS_NO_PORT: |
0c9f79be XW |
917 | case IP_UNICAST_IF: |
918 | case IP_MULTICAST_TTL: | |
919 | case IP_MULTICAST_ALL: | |
920 | case IP_MULTICAST_LOOP: | |
921 | case IP_RECVORIGDSTADDR: | |
ad6f939a | 922 | case IP_CHECKSUM: |
70ecc248 | 923 | case IP_RECVFRAGSIZE: |
eba75c58 | 924 | case IP_RECVERR_RFC4884: |
1da177e4 | 925 | if (optlen >= sizeof(int)) { |
89654c5f | 926 | if (copy_from_sockptr(&val, optval, sizeof(val))) |
1da177e4 LT |
927 | return -EFAULT; |
928 | } else if (optlen >= sizeof(char)) { | |
929 | unsigned char ucval; | |
930 | ||
89654c5f | 931 | if (copy_from_sockptr(&ucval, optval, sizeof(ucval))) |
1da177e4 LT |
932 | return -EFAULT; |
933 | val = (int) ucval; | |
934 | } | |
935 | } | |
936 | ||
937 | /* If optlen==0, it is equivalent to val == 0 */ | |
938 | ||
0526947f KT |
939 | if (optname == IP_ROUTER_ALERT) |
940 | return ip_ra_control(sk, val ? 1 : 0, NULL); | |
6a9fb947 | 941 | if (ip_mroute_opt(optname)) |
89654c5f | 942 | return ip_mroute_setsockopt(sk, optname, optval, optlen); |
1da177e4 LT |
943 | |
944 | err = 0; | |
baf606d9 MRL |
945 | if (needs_rtnl) |
946 | rtnl_lock(); | |
1da177e4 LT |
947 | lock_sock(sk); |
948 | ||
949 | switch (optname) { | |
132adf54 SH |
950 | case IP_OPTIONS: |
951 | { | |
f6d8bd05 ED |
952 | struct ip_options_rcu *old, *opt = NULL; |
953 | ||
65a1c4ff | 954 | if (optlen > 40) |
132adf54 | 955 | goto e_inval; |
89654c5f | 956 | err = ip_options_get(sock_net(sk), &opt, optval, optlen); |
132adf54 SH |
957 | if (err) |
958 | break; | |
f6d8bd05 | 959 | old = rcu_dereference_protected(inet->inet_opt, |
1e1d04e6 | 960 | lockdep_sock_is_held(sk)); |
132adf54 SH |
961 | if (inet->is_icsk) { |
962 | struct inet_connection_sock *icsk = inet_csk(sk); | |
dfd56b8b | 963 | #if IS_ENABLED(CONFIG_IPV6) |
132adf54 SH |
964 | if (sk->sk_family == PF_INET || |
965 | (!((1 << sk->sk_state) & | |
966 | (TCPF_LISTEN | TCPF_CLOSE)) && | |
c720c7e8 | 967 | inet->inet_daddr != LOOPBACK4_IPV6)) { |
1da177e4 | 968 | #endif |
f6d8bd05 ED |
969 | if (old) |
970 | icsk->icsk_ext_hdr_len -= old->opt.optlen; | |
132adf54 | 971 | if (opt) |
f6d8bd05 | 972 | icsk->icsk_ext_hdr_len += opt->opt.optlen; |
132adf54 | 973 | icsk->icsk_sync_mss(sk, icsk->icsk_pmtu_cookie); |
dfd56b8b | 974 | #if IS_ENABLED(CONFIG_IPV6) |
1da177e4 | 975 | } |
132adf54 | 976 | #endif |
1da177e4 | 977 | } |
f6d8bd05 ED |
978 | rcu_assign_pointer(inet->inet_opt, opt); |
979 | if (old) | |
605b4afe | 980 | kfree_rcu(old, rcu); |
132adf54 SH |
981 | break; |
982 | } | |
983 | case IP_PKTINFO: | |
984 | if (val) | |
985 | inet->cmsg_flags |= IP_CMSG_PKTINFO; | |
986 | else | |
987 | inet->cmsg_flags &= ~IP_CMSG_PKTINFO; | |
988 | break; | |
989 | case IP_RECVTTL: | |
990 | if (val) | |
991 | inet->cmsg_flags |= IP_CMSG_TTL; | |
992 | else | |
993 | inet->cmsg_flags &= ~IP_CMSG_TTL; | |
994 | break; | |
995 | case IP_RECVTOS: | |
996 | if (val) | |
997 | inet->cmsg_flags |= IP_CMSG_TOS; | |
998 | else | |
999 | inet->cmsg_flags &= ~IP_CMSG_TOS; | |
1000 | break; | |
1001 | case IP_RECVOPTS: | |
1002 | if (val) | |
1003 | inet->cmsg_flags |= IP_CMSG_RECVOPTS; | |
1004 | else | |
1005 | inet->cmsg_flags &= ~IP_CMSG_RECVOPTS; | |
1006 | break; | |
1007 | case IP_RETOPTS: | |
1008 | if (val) | |
1009 | inet->cmsg_flags |= IP_CMSG_RETOPTS; | |
1010 | else | |
1011 | inet->cmsg_flags &= ~IP_CMSG_RETOPTS; | |
1012 | break; | |
1013 | case IP_PASSSEC: | |
1014 | if (val) | |
1015 | inet->cmsg_flags |= IP_CMSG_PASSSEC; | |
1016 | else | |
1017 | inet->cmsg_flags &= ~IP_CMSG_PASSSEC; | |
1018 | break; | |
e8b2dfe9 BS |
1019 | case IP_RECVORIGDSTADDR: |
1020 | if (val) | |
1021 | inet->cmsg_flags |= IP_CMSG_ORIGDSTADDR; | |
1022 | else | |
1023 | inet->cmsg_flags &= ~IP_CMSG_ORIGDSTADDR; | |
1024 | break; | |
ad6f939a TH |
1025 | case IP_CHECKSUM: |
1026 | if (val) { | |
1027 | if (!(inet->cmsg_flags & IP_CMSG_CHECKSUM)) { | |
1028 | inet_inc_convert_csum(sk); | |
1029 | inet->cmsg_flags |= IP_CMSG_CHECKSUM; | |
1030 | } | |
1031 | } else { | |
1032 | if (inet->cmsg_flags & IP_CMSG_CHECKSUM) { | |
1033 | inet_dec_convert_csum(sk); | |
1034 | inet->cmsg_flags &= ~IP_CMSG_CHECKSUM; | |
1035 | } | |
1036 | } | |
1037 | break; | |
70ecc248 WB |
1038 | case IP_RECVFRAGSIZE: |
1039 | if (sk->sk_type != SOCK_RAW && sk->sk_type != SOCK_DGRAM) | |
1040 | goto e_inval; | |
1041 | if (val) | |
1042 | inet->cmsg_flags |= IP_CMSG_RECVFRAGSIZE; | |
1043 | else | |
1044 | inet->cmsg_flags &= ~IP_CMSG_RECVFRAGSIZE; | |
1045 | break; | |
132adf54 | 1046 | case IP_TOS: /* This sets both TOS and Precedence */ |
6ebf71ba | 1047 | __ip_sock_set_tos(sk, val); |
132adf54 SH |
1048 | break; |
1049 | case IP_TTL: | |
4d52cfbe | 1050 | if (optlen < 1) |
132adf54 | 1051 | goto e_inval; |
c9be4a5c | 1052 | if (val != -1 && (val < 1 || val > 255)) |
132adf54 SH |
1053 | goto e_inval; |
1054 | inet->uc_ttl = val; | |
1055 | break; | |
1056 | case IP_HDRINCL: | |
1057 | if (sk->sk_type != SOCK_RAW) { | |
1058 | err = -ENOPROTOOPT; | |
2c7946a7 | 1059 | break; |
132adf54 SH |
1060 | } |
1061 | inet->hdrincl = val ? 1 : 0; | |
1062 | break; | |
7b2ff18e JO |
1063 | case IP_NODEFRAG: |
1064 | if (sk->sk_type != SOCK_RAW) { | |
1065 | err = -ENOPROTOOPT; | |
1066 | break; | |
1067 | } | |
1068 | inet->nodefrag = val ? 1 : 0; | |
1069 | break; | |
90c337da ED |
1070 | case IP_BIND_ADDRESS_NO_PORT: |
1071 | inet->bind_address_no_port = val ? 1 : 0; | |
1072 | break; | |
132adf54 | 1073 | case IP_MTU_DISCOVER: |
1b346576 | 1074 | if (val < IP_PMTUDISC_DONT || val > IP_PMTUDISC_OMIT) |
132adf54 SH |
1075 | goto e_inval; |
1076 | inet->pmtudisc = val; | |
1077 | break; | |
1078 | case IP_RECVERR: | |
1079 | inet->recverr = !!val; | |
1080 | if (!val) | |
1081 | skb_queue_purge(&sk->sk_error_queue); | |
1082 | break; | |
eba75c58 WB |
1083 | case IP_RECVERR_RFC4884: |
1084 | if (val < 0 || val > 1) | |
1085 | goto e_inval; | |
1086 | inet->recverr_rfc4884 = !!val; | |
1087 | break; | |
132adf54 SH |
1088 | case IP_MULTICAST_TTL: |
1089 | if (sk->sk_type == SOCK_STREAM) | |
1090 | goto e_inval; | |
4d52cfbe | 1091 | if (optlen < 1) |
132adf54 | 1092 | goto e_inval; |
09cb105e | 1093 | if (val == -1) |
132adf54 SH |
1094 | val = 1; |
1095 | if (val < 0 || val > 255) | |
1096 | goto e_inval; | |
1097 | inet->mc_ttl = val; | |
1098 | break; | |
1099 | case IP_MULTICAST_LOOP: | |
4d52cfbe | 1100 | if (optlen < 1) |
132adf54 SH |
1101 | goto e_inval; |
1102 | inet->mc_loop = !!val; | |
1103 | break; | |
76e21053 EH |
1104 | case IP_UNICAST_IF: |
1105 | { | |
1106 | struct net_device *dev = NULL; | |
1107 | int ifindex; | |
9515a2e0 | 1108 | int midx; |
76e21053 EH |
1109 | |
1110 | if (optlen != sizeof(int)) | |
1111 | goto e_inval; | |
1112 | ||
1113 | ifindex = (__force int)ntohl((__force __be32)val); | |
1114 | if (ifindex == 0) { | |
1115 | inet->uc_index = 0; | |
1116 | err = 0; | |
1117 | break; | |
1118 | } | |
1119 | ||
1120 | dev = dev_get_by_index(sock_net(sk), ifindex); | |
1121 | err = -EADDRNOTAVAIL; | |
1122 | if (!dev) | |
1123 | break; | |
9515a2e0 DA |
1124 | |
1125 | midx = l3mdev_master_ifindex(dev); | |
76e21053 EH |
1126 | dev_put(dev); |
1127 | ||
1128 | err = -EINVAL; | |
fdf1923b | 1129 | if (sk->sk_bound_dev_if && midx != sk->sk_bound_dev_if) |
76e21053 EH |
1130 | break; |
1131 | ||
1132 | inet->uc_index = ifindex; | |
1133 | err = 0; | |
1134 | break; | |
1135 | } | |
132adf54 SH |
1136 | case IP_MULTICAST_IF: |
1137 | { | |
1138 | struct ip_mreqn mreq; | |
1139 | struct net_device *dev = NULL; | |
7bb387c5 | 1140 | int midx; |
132adf54 SH |
1141 | |
1142 | if (sk->sk_type == SOCK_STREAM) | |
1143 | goto e_inval; | |
1144 | /* | |
1145 | * Check the arguments are allowable | |
1146 | */ | |
1147 | ||
0915921b SW |
1148 | if (optlen < sizeof(struct in_addr)) |
1149 | goto e_inval; | |
1150 | ||
132adf54 SH |
1151 | err = -EFAULT; |
1152 | if (optlen >= sizeof(struct ip_mreqn)) { | |
89654c5f | 1153 | if (copy_from_sockptr(&mreq, optval, sizeof(mreq))) |
1da177e4 | 1154 | break; |
132adf54 SH |
1155 | } else { |
1156 | memset(&mreq, 0, sizeof(mreq)); | |
3a084ddb | 1157 | if (optlen >= sizeof(struct ip_mreq)) { |
89654c5f CH |
1158 | if (copy_from_sockptr(&mreq, optval, |
1159 | sizeof(struct ip_mreq))) | |
3a084ddb JP |
1160 | break; |
1161 | } else if (optlen >= sizeof(struct in_addr)) { | |
89654c5f CH |
1162 | if (copy_from_sockptr(&mreq.imr_address, optval, |
1163 | sizeof(struct in_addr))) | |
3a084ddb JP |
1164 | break; |
1165 | } | |
132adf54 SH |
1166 | } |
1167 | ||
1168 | if (!mreq.imr_ifindex) { | |
e6f1cebf | 1169 | if (mreq.imr_address.s_addr == htonl(INADDR_ANY)) { |
132adf54 SH |
1170 | inet->mc_index = 0; |
1171 | inet->mc_addr = 0; | |
1172 | err = 0; | |
1da177e4 LT |
1173 | break; |
1174 | } | |
3b1e0a65 | 1175 | dev = ip_dev_find(sock_net(sk), mreq.imr_address.s_addr); |
55b80503 | 1176 | if (dev) |
132adf54 | 1177 | mreq.imr_ifindex = dev->ifindex; |
132adf54 | 1178 | } else |
55b80503 | 1179 | dev = dev_get_by_index(sock_net(sk), mreq.imr_ifindex); |
1da177e4 | 1180 | |
1da177e4 | 1181 | |
132adf54 SH |
1182 | err = -EADDRNOTAVAIL; |
1183 | if (!dev) | |
1184 | break; | |
7bb387c5 DA |
1185 | |
1186 | midx = l3mdev_master_ifindex(dev); | |
1187 | ||
55b80503 | 1188 | dev_put(dev); |
132adf54 SH |
1189 | |
1190 | err = -EINVAL; | |
1191 | if (sk->sk_bound_dev_if && | |
7bb387c5 | 1192 | mreq.imr_ifindex != sk->sk_bound_dev_if && |
fdf1923b | 1193 | midx != sk->sk_bound_dev_if) |
132adf54 | 1194 | break; |
1da177e4 | 1195 | |
132adf54 SH |
1196 | inet->mc_index = mreq.imr_ifindex; |
1197 | inet->mc_addr = mreq.imr_address.s_addr; | |
1198 | err = 0; | |
1199 | break; | |
1200 | } | |
1da177e4 | 1201 | |
132adf54 SH |
1202 | case IP_ADD_MEMBERSHIP: |
1203 | case IP_DROP_MEMBERSHIP: | |
1204 | { | |
1205 | struct ip_mreqn mreq; | |
1da177e4 | 1206 | |
a96fb49b FL |
1207 | err = -EPROTO; |
1208 | if (inet_sk(sk)->is_icsk) | |
1209 | break; | |
1210 | ||
132adf54 SH |
1211 | if (optlen < sizeof(struct ip_mreq)) |
1212 | goto e_inval; | |
1213 | err = -EFAULT; | |
1214 | if (optlen >= sizeof(struct ip_mreqn)) { | |
89654c5f | 1215 | if (copy_from_sockptr(&mreq, optval, sizeof(mreq))) |
1da177e4 | 1216 | break; |
132adf54 SH |
1217 | } else { |
1218 | memset(&mreq, 0, sizeof(mreq)); | |
89654c5f CH |
1219 | if (copy_from_sockptr(&mreq, optval, |
1220 | sizeof(struct ip_mreq))) | |
1da177e4 | 1221 | break; |
132adf54 | 1222 | } |
1da177e4 | 1223 | |
132adf54 | 1224 | if (optname == IP_ADD_MEMBERSHIP) |
54ff9ef3 | 1225 | err = ip_mc_join_group(sk, &mreq); |
132adf54 | 1226 | else |
54ff9ef3 | 1227 | err = ip_mc_leave_group(sk, &mreq); |
132adf54 SH |
1228 | break; |
1229 | } | |
1230 | case IP_MSFILTER: | |
1231 | { | |
132adf54 SH |
1232 | struct ip_msfilter *msf; |
1233 | ||
4167a960 | 1234 | if (optlen < IP_MSFILTER_SIZE(0)) |
132adf54 | 1235 | goto e_inval; |
7de6d09f | 1236 | if (optlen > READ_ONCE(sysctl_optmem_max)) { |
132adf54 | 1237 | err = -ENOBUFS; |
1da177e4 LT |
1238 | break; |
1239 | } | |
89654c5f | 1240 | msf = memdup_sockptr(optval, optlen); |
a2c841d9 AV |
1241 | if (IS_ERR(msf)) { |
1242 | err = PTR_ERR(msf); | |
132adf54 SH |
1243 | break; |
1244 | } | |
1245 | /* numsrc >= (1G-4) overflow in 32 bits */ | |
1246 | if (msf->imsf_numsrc >= 0x3ffffffcU || | |
6ae0f2e5 | 1247 | msf->imsf_numsrc > READ_ONCE(net->ipv4.sysctl_igmp_max_msf)) { |
132adf54 SH |
1248 | kfree(msf); |
1249 | err = -ENOBUFS; | |
1250 | break; | |
1251 | } | |
4167a960 | 1252 | if (IP_MSFILTER_SIZE(msf->imsf_numsrc) > optlen) { |
132adf54 SH |
1253 | kfree(msf); |
1254 | err = -EINVAL; | |
1255 | break; | |
1256 | } | |
1257 | err = ip_mc_msfilter(sk, msf, 0); | |
1258 | kfree(msf); | |
1259 | break; | |
1260 | } | |
1261 | case IP_BLOCK_SOURCE: | |
1262 | case IP_UNBLOCK_SOURCE: | |
1263 | case IP_ADD_SOURCE_MEMBERSHIP: | |
1264 | case IP_DROP_SOURCE_MEMBERSHIP: | |
1265 | { | |
1266 | struct ip_mreq_source mreqs; | |
1267 | int omode, add; | |
1da177e4 | 1268 | |
132adf54 SH |
1269 | if (optlen != sizeof(struct ip_mreq_source)) |
1270 | goto e_inval; | |
89654c5f | 1271 | if (copy_from_sockptr(&mreqs, optval, sizeof(mreqs))) { |
1da177e4 | 1272 | err = -EFAULT; |
1da177e4 LT |
1273 | break; |
1274 | } | |
132adf54 SH |
1275 | if (optname == IP_BLOCK_SOURCE) { |
1276 | omode = MCAST_EXCLUDE; | |
1277 | add = 1; | |
1278 | } else if (optname == IP_UNBLOCK_SOURCE) { | |
1279 | omode = MCAST_EXCLUDE; | |
1280 | add = 0; | |
1281 | } else if (optname == IP_ADD_SOURCE_MEMBERSHIP) { | |
1282 | struct ip_mreqn mreq; | |
1da177e4 | 1283 | |
132adf54 SH |
1284 | mreq.imr_multiaddr.s_addr = mreqs.imr_multiaddr; |
1285 | mreq.imr_address.s_addr = mreqs.imr_interface; | |
1286 | mreq.imr_ifindex = 0; | |
6e2059b5 | 1287 | err = ip_mc_join_group_ssm(sk, &mreq, MCAST_INCLUDE); |
132adf54 | 1288 | if (err && err != -EADDRINUSE) |
1da177e4 | 1289 | break; |
132adf54 SH |
1290 | omode = MCAST_INCLUDE; |
1291 | add = 1; | |
1292 | } else /* IP_DROP_SOURCE_MEMBERSHIP */ { | |
1293 | omode = MCAST_INCLUDE; | |
1294 | add = 0; | |
1295 | } | |
1296 | err = ip_mc_source(add, omode, sk, &mreqs, 0); | |
1297 | break; | |
1298 | } | |
1299 | case MCAST_JOIN_GROUP: | |
1300 | case MCAST_LEAVE_GROUP: | |
b6238c04 CH |
1301 | if (in_compat_syscall()) |
1302 | err = compat_ip_mcast_join_leave(sk, optname, optval, | |
1303 | optlen); | |
1304 | else | |
1305 | err = ip_mcast_join_leave(sk, optname, optval, optlen); | |
132adf54 | 1306 | break; |
132adf54 SH |
1307 | case MCAST_JOIN_SOURCE_GROUP: |
1308 | case MCAST_LEAVE_SOURCE_GROUP: | |
1309 | case MCAST_BLOCK_SOURCE: | |
1310 | case MCAST_UNBLOCK_SOURCE: | |
b6238c04 | 1311 | err = do_mcast_group_source(sk, optname, optval, optlen); |
132adf54 | 1312 | break; |
132adf54 | 1313 | case MCAST_MSFILTER: |
b6238c04 CH |
1314 | if (in_compat_syscall()) |
1315 | err = compat_ip_set_mcast_msfilter(sk, optval, optlen); | |
1316 | else | |
1317 | err = ip_set_mcast_msfilter(sk, optval, optlen); | |
132adf54 | 1318 | break; |
f771bef9 NS |
1319 | case IP_MULTICAST_ALL: |
1320 | if (optlen < 1) | |
1321 | goto e_inval; | |
1322 | if (val != 0 && val != 1) | |
1323 | goto e_inval; | |
1324 | inet->mc_all = val; | |
1325 | break; | |
132adf54 SH |
1326 | |
1327 | case IP_FREEBIND: | |
4d52cfbe | 1328 | if (optlen < 1) |
132adf54 SH |
1329 | goto e_inval; |
1330 | inet->freebind = !!val; | |
1331 | break; | |
1332 | ||
1333 | case IP_IPSEC_POLICY: | |
1334 | case IP_XFRM_POLICY: | |
1335 | err = -EPERM; | |
52e804c6 | 1336 | if (!ns_capable(sock_net(sk)->user_ns, CAP_NET_ADMIN)) |
1da177e4 | 1337 | break; |
89654c5f | 1338 | err = xfrm_user_policy(sk, optname, optval, optlen); |
132adf54 | 1339 | break; |
1da177e4 | 1340 | |
f5715aea | 1341 | case IP_TRANSPARENT: |
52e804c6 EB |
1342 | if (!!val && !ns_capable(sock_net(sk)->user_ns, CAP_NET_RAW) && |
1343 | !ns_capable(sock_net(sk)->user_ns, CAP_NET_ADMIN)) { | |
f5715aea KK |
1344 | err = -EPERM; |
1345 | break; | |
1346 | } | |
1347 | if (optlen < 1) | |
1348 | goto e_inval; | |
1349 | inet->transparent = !!val; | |
1350 | break; | |
1351 | ||
d218d111 SH |
1352 | case IP_MINTTL: |
1353 | if (optlen < 1) | |
1354 | goto e_inval; | |
1355 | if (val < 0 || val > 255) | |
1356 | goto e_inval; | |
020e71a3 ED |
1357 | |
1358 | if (val) | |
1359 | static_branch_enable(&ip4_min_ttl); | |
1360 | ||
14834c4f ED |
1361 | /* tcp_v4_err() and tcp_v4_rcv() might read min_ttl |
1362 | * while we are changint it. | |
1363 | */ | |
1364 | WRITE_ONCE(inet->min_ttl, val); | |
d218d111 SH |
1365 | break; |
1366 | ||
132adf54 SH |
1367 | default: |
1368 | err = -ENOPROTOOPT; | |
1369 | break; | |
1da177e4 LT |
1370 | } |
1371 | release_sock(sk); | |
baf606d9 MRL |
1372 | if (needs_rtnl) |
1373 | rtnl_unlock(); | |
1da177e4 LT |
1374 | return err; |
1375 | ||
1376 | e_inval: | |
1377 | release_sock(sk); | |
baf606d9 MRL |
1378 | if (needs_rtnl) |
1379 | rtnl_unlock(); | |
1da177e4 LT |
1380 | return -EINVAL; |
1381 | } | |
1382 | ||
f84af32c | 1383 | /** |
829ae9d6 | 1384 | * ipv4_pktinfo_prepare - transfer some info from rtable to skb |
f84af32c ED |
1385 | * @sk: socket |
1386 | * @skb: buffer | |
1387 | * | |
35ebf65e DM |
1388 | * To support IP_CMSG_PKTINFO option, we store rt_iif and specific |
1389 | * destination in skb->cb[] before dst drop. | |
8e3bff96 | 1390 | * This way, receiver doesn't make cache line misses to read rtable. |
f84af32c | 1391 | */ |
fbf8866d | 1392 | void ipv4_pktinfo_prepare(const struct sock *sk, struct sk_buff *skb) |
f84af32c | 1393 | { |
d826eb14 | 1394 | struct in_pktinfo *pktinfo = PKTINFO_SKB_CB(skb); |
4b261c75 HFS |
1395 | bool prepare = (inet_sk(sk)->cmsg_flags & IP_CMSG_PKTINFO) || |
1396 | ipv6_sk_rxinfo(sk); | |
d826eb14 | 1397 | |
4b261c75 | 1398 | if (prepare && skb_rtable(skb)) { |
0b922b7a DA |
1399 | /* skb->cb is overloaded: prior to this point it is IP{6}CB |
1400 | * which has interface index (iif) as the first member of the | |
1401 | * underlying inet{6}_skb_parm struct. This code then overlays | |
1402 | * PKTINFO_SKB_CB and in_pktinfo also has iif as the first | |
f0c16ba8 WZ |
1403 | * element so the iif is picked up from the prior IPCB. If iif |
1404 | * is the loopback interface, then return the sending interface | |
1405 | * (e.g., process binds socket to eth0 for Tx which is | |
1406 | * redirected to loopback in the rtable/dst). | |
0b922b7a | 1407 | */ |
cbea8f02 DA |
1408 | struct rtable *rt = skb_rtable(skb); |
1409 | bool l3slave = ipv4_l3mdev_skb(IPCB(skb)->flags); | |
1410 | ||
1411 | if (pktinfo->ipi_ifindex == LOOPBACK_IFINDEX) | |
f0c16ba8 | 1412 | pktinfo->ipi_ifindex = inet_iif(skb); |
cbea8f02 DA |
1413 | else if (l3slave && rt && rt->rt_iif) |
1414 | pktinfo->ipi_ifindex = rt->rt_iif; | |
f0c16ba8 | 1415 | |
35ebf65e | 1416 | pktinfo->ipi_spec_dst.s_addr = fib_compute_spec_dst(skb); |
d826eb14 ED |
1417 | } else { |
1418 | pktinfo->ipi_ifindex = 0; | |
1419 | pktinfo->ipi_spec_dst.s_addr = 0; | |
1420 | } | |
61a1030b | 1421 | skb_dst_drop(skb); |
f84af32c | 1422 | } |
f84af32c | 1423 | |
a7b75c5a CH |
1424 | int ip_setsockopt(struct sock *sk, int level, int optname, sockptr_t optval, |
1425 | unsigned int optlen) | |
3fdadf7d DM |
1426 | { |
1427 | int err; | |
1428 | ||
1429 | if (level != SOL_IP) | |
1430 | return -ENOPROTOOPT; | |
1431 | ||
a7b75c5a | 1432 | err = do_ip_setsockopt(sk, level, optname, optval, optlen); |
97adadda | 1433 | #if IS_ENABLED(CONFIG_BPFILTER_UMH) |
d2ba09c1 AS |
1434 | if (optname >= BPFILTER_IPT_SO_SET_REPLACE && |
1435 | optname < BPFILTER_IPT_SET_MAX) | |
a7b75c5a | 1436 | err = bpfilter_ip_set_sockopt(sk, optname, optval, optlen); |
d2ba09c1 | 1437 | #endif |
3fdadf7d DM |
1438 | #ifdef CONFIG_NETFILTER |
1439 | /* we need to exclude all possible ENOPROTOOPTs except default case */ | |
1440 | if (err == -ENOPROTOOPT && optname != IP_HDRINCL && | |
6a9fb947 PE |
1441 | optname != IP_IPSEC_POLICY && |
1442 | optname != IP_XFRM_POLICY && | |
3f34cfae | 1443 | !ip_mroute_opt(optname)) |
a7b75c5a | 1444 | err = nf_setsockopt(sk, PF_INET, optname, optval, optlen); |
3fdadf7d DM |
1445 | #endif |
1446 | return err; | |
1447 | } | |
4d52cfbe | 1448 | EXPORT_SYMBOL(ip_setsockopt); |
3fdadf7d | 1449 | |
1da177e4 | 1450 | /* |
4d52cfbe ED |
1451 | * Get the options. Note for future reference. The GET of IP options gets |
1452 | * the _received_ ones. The set sets the _sent_ ones. | |
1da177e4 LT |
1453 | */ |
1454 | ||
/*
 * Report whether do_ip_getsockopt() must hold the RTNL for @optname.
 * Only the two source-filter queries, IP_MSFILTER and MCAST_MSFILTER, do.
 */
static bool getsockopt_needs_rtnl(int optname)
{
	return optname == IP_MSFILTER || optname == MCAST_MSFILTER;
}
1464 | ||
49e74c24 CH |
1465 | static int ip_get_mcast_msfilter(struct sock *sk, void __user *optval, |
1466 | int __user *optlen, int len) | |
1467 | { | |
db243b79 | 1468 | const int size0 = offsetof(struct group_filter, gf_slist_flex); |
49e74c24 CH |
1469 | struct group_filter __user *p = optval; |
1470 | struct group_filter gsf; | |
1471 | int num; | |
1472 | int err; | |
1473 | ||
1474 | if (len < size0) | |
1475 | return -EINVAL; | |
1476 | if (copy_from_user(&gsf, p, size0)) | |
1477 | return -EFAULT; | |
1478 | ||
1479 | num = gsf.gf_numsrc; | |
db243b79 | 1480 | err = ip_mc_gsfget(sk, &gsf, p->gf_slist_flex); |
49e74c24 CH |
1481 | if (err) |
1482 | return err; | |
1483 | if (gsf.gf_numsrc < num) | |
1484 | num = gsf.gf_numsrc; | |
1485 | if (put_user(GROUP_FILTER_SIZE(num), optlen) || | |
1486 | copy_to_user(p, &gsf, size0)) | |
1487 | return -EFAULT; | |
1488 | return 0; | |
1489 | } | |
1490 | ||
49e74c24 | 1491 | static int compat_ip_get_mcast_msfilter(struct sock *sk, void __user *optval, |
b6238c04 | 1492 | int __user *optlen, int len) |
49e74c24 | 1493 | { |
db243b79 | 1494 | const int size0 = offsetof(struct compat_group_filter, gf_slist_flex); |
49e74c24 CH |
1495 | struct compat_group_filter __user *p = optval; |
1496 | struct compat_group_filter gf32; | |
1497 | struct group_filter gf; | |
49e74c24 | 1498 | int num; |
b6238c04 | 1499 | int err; |
49e74c24 | 1500 | |
49e74c24 CH |
1501 | if (len < size0) |
1502 | return -EINVAL; | |
49e74c24 CH |
1503 | if (copy_from_user(&gf32, p, size0)) |
1504 | return -EFAULT; | |
1505 | ||
1506 | gf.gf_interface = gf32.gf_interface; | |
1507 | gf.gf_fmode = gf32.gf_fmode; | |
1508 | num = gf.gf_numsrc = gf32.gf_numsrc; | |
1509 | gf.gf_group = gf32.gf_group; | |
1510 | ||
db243b79 | 1511 | err = ip_mc_gsfget(sk, &gf, p->gf_slist_flex); |
49e74c24 CH |
1512 | if (err) |
1513 | return err; | |
1514 | if (gf.gf_numsrc < num) | |
1515 | num = gf.gf_numsrc; | |
1516 | len = GROUP_FILTER_SIZE(num) - (sizeof(gf) - sizeof(gf32)); | |
1517 | if (put_user(len, optlen) || | |
1518 | put_user(gf.gf_fmode, &p->gf_fmode) || | |
1519 | put_user(gf.gf_numsrc, &p->gf_numsrc)) | |
1520 | return -EFAULT; | |
1521 | return 0; | |
1522 | } | |
49e74c24 | 1523 | |
3fdadf7d | 1524 | static int do_ip_getsockopt(struct sock *sk, int level, int optname, |
b6238c04 | 1525 | char __user *optval, int __user *optlen) |
1da177e4 LT |
1526 | { |
1527 | struct inet_sock *inet = inet_sk(sk); | |
87e9f031 WC |
1528 | bool needs_rtnl = getsockopt_needs_rtnl(optname); |
1529 | int val, err = 0; | |
1da177e4 | 1530 | int len; |
e905a9ed | 1531 | |
132adf54 | 1532 | if (level != SOL_IP) |
1da177e4 LT |
1533 | return -EOPNOTSUPP; |
1534 | ||
6a9fb947 | 1535 | if (ip_mroute_opt(optname)) |
09cb105e | 1536 | return ip_mroute_getsockopt(sk, optname, optval, optlen); |
1da177e4 | 1537 | |
09cb105e | 1538 | if (get_user(len, optlen)) |
1da177e4 | 1539 | return -EFAULT; |
132adf54 | 1540 | if (len < 0) |
1da177e4 | 1541 | return -EINVAL; |
e905a9ed | 1542 | |
87e9f031 WC |
1543 | if (needs_rtnl) |
1544 | rtnl_lock(); | |
1da177e4 LT |
1545 | lock_sock(sk); |
1546 | ||
132adf54 SH |
1547 | switch (optname) { |
1548 | case IP_OPTIONS: | |
1549 | { | |
1550 | unsigned char optbuf[sizeof(struct ip_options)+40]; | |
f6d8bd05 ED |
1551 | struct ip_options *opt = (struct ip_options *)optbuf; |
1552 | struct ip_options_rcu *inet_opt; | |
1553 | ||
1554 | inet_opt = rcu_dereference_protected(inet->inet_opt, | |
1e1d04e6 | 1555 | lockdep_sock_is_held(sk)); |
132adf54 | 1556 | opt->optlen = 0; |
f6d8bd05 ED |
1557 | if (inet_opt) |
1558 | memcpy(optbuf, &inet_opt->opt, | |
1559 | sizeof(struct ip_options) + | |
1560 | inet_opt->opt.optlen); | |
132adf54 SH |
1561 | release_sock(sk); |
1562 | ||
1563 | if (opt->optlen == 0) | |
1564 | return put_user(0, optlen); | |
1565 | ||
1566 | ip_options_undo(opt); | |
1567 | ||
1568 | len = min_t(unsigned int, len, opt->optlen); | |
1569 | if (put_user(len, optlen)) | |
1570 | return -EFAULT; | |
1571 | if (copy_to_user(optval, opt->__data, len)) | |
1572 | return -EFAULT; | |
1573 | return 0; | |
1574 | } | |
1575 | case IP_PKTINFO: | |
1576 | val = (inet->cmsg_flags & IP_CMSG_PKTINFO) != 0; | |
1577 | break; | |
1578 | case IP_RECVTTL: | |
1579 | val = (inet->cmsg_flags & IP_CMSG_TTL) != 0; | |
1580 | break; | |
1581 | case IP_RECVTOS: | |
1582 | val = (inet->cmsg_flags & IP_CMSG_TOS) != 0; | |
1583 | break; | |
1584 | case IP_RECVOPTS: | |
1585 | val = (inet->cmsg_flags & IP_CMSG_RECVOPTS) != 0; | |
1586 | break; | |
1587 | case IP_RETOPTS: | |
1588 | val = (inet->cmsg_flags & IP_CMSG_RETOPTS) != 0; | |
1589 | break; | |
1590 | case IP_PASSSEC: | |
1591 | val = (inet->cmsg_flags & IP_CMSG_PASSSEC) != 0; | |
1592 | break; | |
e8b2dfe9 BS |
1593 | case IP_RECVORIGDSTADDR: |
1594 | val = (inet->cmsg_flags & IP_CMSG_ORIGDSTADDR) != 0; | |
1595 | break; | |
ad6f939a TH |
1596 | case IP_CHECKSUM: |
1597 | val = (inet->cmsg_flags & IP_CMSG_CHECKSUM) != 0; | |
1598 | break; | |
70ecc248 WB |
1599 | case IP_RECVFRAGSIZE: |
1600 | val = (inet->cmsg_flags & IP_CMSG_RECVFRAGSIZE) != 0; | |
1601 | break; | |
132adf54 SH |
1602 | case IP_TOS: |
1603 | val = inet->tos; | |
1604 | break; | |
1605 | case IP_TTL: | |
fa50d974 NB |
1606 | { |
1607 | struct net *net = sock_net(sk); | |
132adf54 | 1608 | val = (inet->uc_ttl == -1 ? |
8281b7ec | 1609 | READ_ONCE(net->ipv4.sysctl_ip_default_ttl) : |
132adf54 SH |
1610 | inet->uc_ttl); |
1611 | break; | |
fa50d974 | 1612 | } |
132adf54 SH |
1613 | case IP_HDRINCL: |
1614 | val = inet->hdrincl; | |
1615 | break; | |
a89b4763 MK |
1616 | case IP_NODEFRAG: |
1617 | val = inet->nodefrag; | |
1618 | break; | |
90c337da ED |
1619 | case IP_BIND_ADDRESS_NO_PORT: |
1620 | val = inet->bind_address_no_port; | |
1621 | break; | |
132adf54 SH |
1622 | case IP_MTU_DISCOVER: |
1623 | val = inet->pmtudisc; | |
1624 | break; | |
1625 | case IP_MTU: | |
1626 | { | |
1627 | struct dst_entry *dst; | |
1628 | val = 0; | |
1629 | dst = sk_dst_get(sk); | |
1630 | if (dst) { | |
1631 | val = dst_mtu(dst); | |
1632 | dst_release(dst); | |
1da177e4 | 1633 | } |
132adf54 | 1634 | if (!val) { |
1da177e4 | 1635 | release_sock(sk); |
132adf54 | 1636 | return -ENOTCONN; |
1da177e4 | 1637 | } |
132adf54 SH |
1638 | break; |
1639 | } | |
1640 | case IP_RECVERR: | |
1641 | val = inet->recverr; | |
1642 | break; | |
eba75c58 WB |
1643 | case IP_RECVERR_RFC4884: |
1644 | val = inet->recverr_rfc4884; | |
1645 | break; | |
132adf54 SH |
1646 | case IP_MULTICAST_TTL: |
1647 | val = inet->mc_ttl; | |
1648 | break; | |
1649 | case IP_MULTICAST_LOOP: | |
1650 | val = inet->mc_loop; | |
1651 | break; | |
76e21053 EH |
1652 | case IP_UNICAST_IF: |
1653 | val = (__force int)htonl((__u32) inet->uc_index); | |
1654 | break; | |
132adf54 SH |
1655 | case IP_MULTICAST_IF: |
1656 | { | |
1657 | struct in_addr addr; | |
1658 | len = min_t(unsigned int, len, sizeof(struct in_addr)); | |
1659 | addr.s_addr = inet->mc_addr; | |
1660 | release_sock(sk); | |
1da177e4 | 1661 | |
132adf54 SH |
1662 | if (put_user(len, optlen)) |
1663 | return -EFAULT; | |
1664 | if (copy_to_user(optval, &addr, len)) | |
1665 | return -EFAULT; | |
1666 | return 0; | |
1667 | } | |
1668 | case IP_MSFILTER: | |
1669 | { | |
1670 | struct ip_msfilter msf; | |
132adf54 | 1671 | |
4167a960 | 1672 | if (len < IP_MSFILTER_SIZE(0)) { |
87e9f031 WC |
1673 | err = -EINVAL; |
1674 | goto out; | |
1da177e4 | 1675 | } |
4167a960 | 1676 | if (copy_from_user(&msf, optval, IP_MSFILTER_SIZE(0))) { |
87e9f031 WC |
1677 | err = -EFAULT; |
1678 | goto out; | |
1da177e4 | 1679 | } |
132adf54 SH |
1680 | err = ip_mc_msfget(sk, &msf, |
1681 | (struct ip_msfilter __user *)optval, optlen); | |
87e9f031 | 1682 | goto out; |
132adf54 SH |
1683 | } |
1684 | case MCAST_MSFILTER: | |
b6238c04 CH |
1685 | if (in_compat_syscall()) |
1686 | err = compat_ip_get_mcast_msfilter(sk, optval, optlen, | |
1687 | len); | |
1688 | else | |
1689 | err = ip_get_mcast_msfilter(sk, optval, optlen, len); | |
87e9f031 | 1690 | goto out; |
f771bef9 NS |
1691 | case IP_MULTICAST_ALL: |
1692 | val = inet->mc_all; | |
1693 | break; | |
132adf54 SH |
1694 | case IP_PKTOPTIONS: |
1695 | { | |
1696 | struct msghdr msg; | |
1da177e4 | 1697 | |
132adf54 | 1698 | release_sock(sk); |
1da177e4 | 1699 | |
132adf54 SH |
1700 | if (sk->sk_type != SOCK_STREAM) |
1701 | return -ENOPROTOOPT; | |
1da177e4 | 1702 | |
1f466e1f CH |
1703 | msg.msg_control_is_user = true; |
1704 | msg.msg_control_user = optval; | |
132adf54 | 1705 | msg.msg_controllen = len; |
b6238c04 | 1706 | msg.msg_flags = in_compat_syscall() ? MSG_CMSG_COMPAT : 0; |
1da177e4 | 1707 | |
132adf54 SH |
1708 | if (inet->cmsg_flags & IP_CMSG_PKTINFO) { |
1709 | struct in_pktinfo info; | |
1710 | ||
c720c7e8 ED |
1711 | info.ipi_addr.s_addr = inet->inet_rcv_saddr; |
1712 | info.ipi_spec_dst.s_addr = inet->inet_rcv_saddr; | |
132adf54 SH |
1713 | info.ipi_ifindex = inet->mc_index; |
1714 | put_cmsg(&msg, SOL_IP, IP_PKTINFO, sizeof(info), &info); | |
1da177e4 | 1715 | } |
132adf54 SH |
1716 | if (inet->cmsg_flags & IP_CMSG_TTL) { |
1717 | int hlim = inet->mc_ttl; | |
1718 | put_cmsg(&msg, SOL_IP, IP_TTL, sizeof(hlim), &hlim); | |
1719 | } | |
4c507d28 JB |
1720 | if (inet->cmsg_flags & IP_CMSG_TOS) { |
1721 | int tos = inet->rcv_tos; | |
1722 | put_cmsg(&msg, SOL_IP, IP_TOS, sizeof(tos), &tos); | |
1723 | } | |
132adf54 SH |
1724 | len -= msg.msg_controllen; |
1725 | return put_user(len, optlen); | |
1726 | } | |
1727 | case IP_FREEBIND: | |
1728 | val = inet->freebind; | |
1729 | break; | |
f5715aea KK |
1730 | case IP_TRANSPARENT: |
1731 | val = inet->transparent; | |
1732 | break; | |
d218d111 SH |
1733 | case IP_MINTTL: |
1734 | val = inet->min_ttl; | |
1735 | break; | |
132adf54 SH |
1736 | default: |
1737 | release_sock(sk); | |
1738 | return -ENOPROTOOPT; | |
1da177e4 LT |
1739 | } |
1740 | release_sock(sk); | |
e905a9ed | 1741 | |
4d52cfbe | 1742 | if (len < sizeof(int) && len > 0 && val >= 0 && val <= 255) { |
1da177e4 LT |
1743 | unsigned char ucval = (unsigned char)val; |
1744 | len = 1; | |
132adf54 | 1745 | if (put_user(len, optlen)) |
1da177e4 | 1746 | return -EFAULT; |
09cb105e | 1747 | if (copy_to_user(optval, &ucval, 1)) |
1da177e4 LT |
1748 | return -EFAULT; |
1749 | } else { | |
1750 | len = min_t(unsigned int, sizeof(int), len); | |
132adf54 | 1751 | if (put_user(len, optlen)) |
1da177e4 | 1752 | return -EFAULT; |
09cb105e | 1753 | if (copy_to_user(optval, &val, len)) |
1da177e4 LT |
1754 | return -EFAULT; |
1755 | } | |
1756 | return 0; | |
87e9f031 WC |
1757 | |
1758 | out: | |
1759 | release_sock(sk); | |
1760 | if (needs_rtnl) | |
1761 | rtnl_unlock(); | |
1762 | return err; | |
1da177e4 LT |
1763 | } |
1764 | ||
3fdadf7d | 1765 | int ip_getsockopt(struct sock *sk, int level, |
132adf54 | 1766 | int optname, char __user *optval, int __user *optlen) |
3fdadf7d DM |
1767 | { |
1768 | int err; | |
1769 | ||
b6238c04 | 1770 | err = do_ip_getsockopt(sk, level, optname, optval, optlen); |
42908c69 | 1771 | |
97adadda | 1772 | #if IS_ENABLED(CONFIG_BPFILTER_UMH) |
d2ba09c1 AS |
1773 | if (optname >= BPFILTER_IPT_SO_GET_INFO && |
1774 | optname < BPFILTER_IPT_GET_MAX) | |
1775 | err = bpfilter_ip_get_sockopt(sk, optname, optval, optlen); | |
1776 | #endif | |
3fdadf7d DM |
1777 | #ifdef CONFIG_NETFILTER |
1778 | /* we need to exclude all possible ENOPROTOOPTs except default case */ | |
6a9fb947 PE |
1779 | if (err == -ENOPROTOOPT && optname != IP_PKTOPTIONS && |
1780 | !ip_mroute_opt(optname)) { | |
e905a9ed | 1781 | int len; |
3fdadf7d | 1782 | |
543d9cfe | 1783 | if (get_user(len, optlen)) |
3fdadf7d DM |
1784 | return -EFAULT; |
1785 | ||
77d4df41 | 1786 | err = nf_getsockopt(sk, PF_INET, optname, optval, &len); |
3fdadf7d DM |
1787 | if (err >= 0) |
1788 | err = put_user(len, optlen); | |
1789 | return err; | |
1790 | } | |
1791 | #endif | |
1792 | return err; | |
1793 | } | |
b6238c04 | 1794 | EXPORT_SYMBOL(ip_getsockopt); |