10abdde82SPaolo Abeni // SPDX-License-Identifier: GPL-2.0
20abdde82SPaolo Abeni /* Multipath TCP
30abdde82SPaolo Abeni *
40abdde82SPaolo Abeni * Copyright (c) 2021, Red Hat.
50abdde82SPaolo Abeni */
60abdde82SPaolo Abeni
70abdde82SPaolo Abeni #define pr_fmt(fmt) "MPTCP: " fmt
80abdde82SPaolo Abeni
90abdde82SPaolo Abeni #include <linux/kernel.h>
100abdde82SPaolo Abeni #include <linux/module.h>
110abdde82SPaolo Abeni #include <net/sock.h>
120abdde82SPaolo Abeni #include <net/protocol.h>
130abdde82SPaolo Abeni #include <net/tcp.h>
140abdde82SPaolo Abeni #include <net/mptcp.h>
150abdde82SPaolo Abeni #include "protocol.h"
160abdde82SPaolo Abeni
1706f15ceeSFlorian Westphal #define MIN_INFO_OPTLEN_SIZE 16
1849243207SPaolo Abeni #define MIN_FULL_INFO_OPTLEN_SIZE 40
1906f15ceeSFlorian Westphal
__mptcp_tcp_fallback(struct mptcp_sock * msk)200abdde82SPaolo Abeni static struct sock *__mptcp_tcp_fallback(struct mptcp_sock *msk)
210abdde82SPaolo Abeni {
22109cdeb8SGeliang Tang msk_owned_by_me(msk);
230abdde82SPaolo Abeni
240abdde82SPaolo Abeni if (likely(!__mptcp_check_fallback(msk)))
250abdde82SPaolo Abeni return NULL;
260abdde82SPaolo Abeni
270abdde82SPaolo Abeni return msk->first;
280abdde82SPaolo Abeni }
290abdde82SPaolo Abeni
sockopt_seq_reset(const struct sock * sk)30df00b087SFlorian Westphal static u32 sockopt_seq_reset(const struct sock *sk)
31df00b087SFlorian Westphal {
32df00b087SFlorian Westphal sock_owned_by_me(sk);
33df00b087SFlorian Westphal
34df00b087SFlorian Westphal /* Highbits contain state. Allows to distinguish sockopt_seq
35df00b087SFlorian Westphal * of listener and established:
36df00b087SFlorian Westphal * s0 = new_listener()
37df00b087SFlorian Westphal * sockopt(s0) - seq is 1
38df00b087SFlorian Westphal * s1 = accept(s0) - s1 inherits seq 1 if listener sk (s0)
39df00b087SFlorian Westphal * sockopt(s0) - seq increments to 2 on s0
40df00b087SFlorian Westphal * sockopt(s1) // seq increments to 2 on s1 (different option)
41df00b087SFlorian Westphal * new ssk completes join, inherits options from s0 // seq 2
42df00b087SFlorian Westphal * Needs sync from mptcp join logic, but ssk->seq == msk->seq
43df00b087SFlorian Westphal *
44df00b087SFlorian Westphal * Set High order bits to sk_state so ssk->seq == msk->seq test
45df00b087SFlorian Westphal * will fail.
46df00b087SFlorian Westphal */
47df00b087SFlorian Westphal
48df00b087SFlorian Westphal return (u32)sk->sk_state << 24u;
49df00b087SFlorian Westphal }
50df00b087SFlorian Westphal
sockopt_seq_inc(struct mptcp_sock * msk)511b3e7edeSFlorian Westphal static void sockopt_seq_inc(struct mptcp_sock *msk)
521b3e7edeSFlorian Westphal {
531b3e7edeSFlorian Westphal u32 seq = (msk->setsockopt_seq + 1) & 0x00ffffff;
541b3e7edeSFlorian Westphal
551b3e7edeSFlorian Westphal msk->setsockopt_seq = sockopt_seq_reset((struct sock *)msk) + seq;
561b3e7edeSFlorian Westphal }
571b3e7edeSFlorian Westphal
/* Fetch an integer option value from @optval into @val.
 *
 * Returns 0 on success, -EINVAL when @optlen is smaller than an int and
 * -EFAULT when copy_from_sockptr() reports a failure. @msk is not used.
 */
static int mptcp_get_int_option(struct mptcp_sock *msk, sockptr_t optval,
				unsigned int optlen, int *val)
{
	int copy_failed;

	if (optlen < sizeof(int))
		return -EINVAL;

	copy_failed = copy_from_sockptr(val, optval, sizeof(*val));

	return copy_failed ? -EFAULT : 0;
}
691b3e7edeSFlorian Westphal
mptcp_sol_socket_sync_intval(struct mptcp_sock * msk,int optname,int val)701b3e7edeSFlorian Westphal static void mptcp_sol_socket_sync_intval(struct mptcp_sock *msk, int optname, int val)
711b3e7edeSFlorian Westphal {
721b3e7edeSFlorian Westphal struct mptcp_subflow_context *subflow;
731b3e7edeSFlorian Westphal struct sock *sk = (struct sock *)msk;
741b3e7edeSFlorian Westphal
751b3e7edeSFlorian Westphal lock_sock(sk);
761b3e7edeSFlorian Westphal sockopt_seq_inc(msk);
771b3e7edeSFlorian Westphal
781b3e7edeSFlorian Westphal mptcp_for_each_subflow(msk, subflow) {
791b3e7edeSFlorian Westphal struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
801b3e7edeSFlorian Westphal bool slow = lock_sock_fast(ssk);
811b3e7edeSFlorian Westphal
821b3e7edeSFlorian Westphal switch (optname) {
83a03c99b2SFlorian Westphal case SO_DEBUG:
84a03c99b2SFlorian Westphal sock_valbool_flag(ssk, SOCK_DBG, !!val);
85a03c99b2SFlorian Westphal break;
861b3e7edeSFlorian Westphal case SO_KEEPALIVE:
871b3e7edeSFlorian Westphal if (ssk->sk_prot->keepalive)
881b3e7edeSFlorian Westphal ssk->sk_prot->keepalive(ssk, !!val);
891b3e7edeSFlorian Westphal sock_valbool_flag(ssk, SOCK_KEEPOPEN, !!val);
901b3e7edeSFlorian Westphal break;
911b3e7edeSFlorian Westphal case SO_PRIORITY:
9210bbf165SEric Dumazet WRITE_ONCE(ssk->sk_priority, val);
931b3e7edeSFlorian Westphal break;
945d0a6bc8SFlorian Westphal case SO_SNDBUF:
955d0a6bc8SFlorian Westphal case SO_SNDBUFFORCE:
965d0a6bc8SFlorian Westphal ssk->sk_userlocks |= SOCK_SNDBUF_LOCK;
975d0a6bc8SFlorian Westphal WRITE_ONCE(ssk->sk_sndbuf, sk->sk_sndbuf);
988005184fSPaolo Abeni mptcp_subflow_ctx(ssk)->cached_sndbuf = sk->sk_sndbuf;
995d0a6bc8SFlorian Westphal break;
1005d0a6bc8SFlorian Westphal case SO_RCVBUF:
1015d0a6bc8SFlorian Westphal case SO_RCVBUFFORCE:
1025d0a6bc8SFlorian Westphal ssk->sk_userlocks |= SOCK_RCVBUF_LOCK;
1035d0a6bc8SFlorian Westphal WRITE_ONCE(ssk->sk_rcvbuf, sk->sk_rcvbuf);
1045d0a6bc8SFlorian Westphal break;
10536704413SFlorian Westphal case SO_MARK:
10636704413SFlorian Westphal if (READ_ONCE(ssk->sk_mark) != sk->sk_mark) {
1073c5b4d69SEric Dumazet WRITE_ONCE(ssk->sk_mark, sk->sk_mark);
10836704413SFlorian Westphal sk_dst_reset(ssk);
10936704413SFlorian Westphal }
11036704413SFlorian Westphal break;
1116f0d7198SFlorian Westphal case SO_INCOMING_CPU:
1126f0d7198SFlorian Westphal WRITE_ONCE(ssk->sk_incoming_cpu, val);
1136f0d7198SFlorian Westphal break;
1141b3e7edeSFlorian Westphal }
1151b3e7edeSFlorian Westphal
1161b3e7edeSFlorian Westphal subflow->setsockopt_seq = msk->setsockopt_seq;
1171b3e7edeSFlorian Westphal unlock_sock_fast(ssk, slow);
1181b3e7edeSFlorian Westphal }
1191b3e7edeSFlorian Westphal
1201b3e7edeSFlorian Westphal release_sock(sk);
1211b3e7edeSFlorian Westphal }
1221b3e7edeSFlorian Westphal
mptcp_sol_socket_intval(struct mptcp_sock * msk,int optname,int val)1231b3e7edeSFlorian Westphal static int mptcp_sol_socket_intval(struct mptcp_sock *msk, int optname, int val)
1241b3e7edeSFlorian Westphal {
1251b3e7edeSFlorian Westphal sockptr_t optval = KERNEL_SOCKPTR(&val);
1261b3e7edeSFlorian Westphal struct sock *sk = (struct sock *)msk;
1271b3e7edeSFlorian Westphal int ret;
1281b3e7edeSFlorian Westphal
1291b3e7edeSFlorian Westphal ret = sock_setsockopt(sk->sk_socket, SOL_SOCKET, optname,
1301b3e7edeSFlorian Westphal optval, sizeof(val));
1311b3e7edeSFlorian Westphal if (ret)
1321b3e7edeSFlorian Westphal return ret;
1331b3e7edeSFlorian Westphal
1341b3e7edeSFlorian Westphal mptcp_sol_socket_sync_intval(msk, optname, val);
1351b3e7edeSFlorian Westphal return 0;
1361b3e7edeSFlorian Westphal }
1371b3e7edeSFlorian Westphal
mptcp_so_incoming_cpu(struct mptcp_sock * msk,int val)1386f0d7198SFlorian Westphal static void mptcp_so_incoming_cpu(struct mptcp_sock *msk, int val)
1396f0d7198SFlorian Westphal {
1406f0d7198SFlorian Westphal struct sock *sk = (struct sock *)msk;
1416f0d7198SFlorian Westphal
1426f0d7198SFlorian Westphal WRITE_ONCE(sk->sk_incoming_cpu, val);
1436f0d7198SFlorian Westphal
1446f0d7198SFlorian Westphal mptcp_sol_socket_sync_intval(msk, SO_INCOMING_CPU, val);
1456f0d7198SFlorian Westphal }
1466f0d7198SFlorian Westphal
mptcp_setsockopt_sol_socket_tstamp(struct mptcp_sock * msk,int optname,int val)1479061f24bSFlorian Westphal static int mptcp_setsockopt_sol_socket_tstamp(struct mptcp_sock *msk, int optname, int val)
1489061f24bSFlorian Westphal {
1499061f24bSFlorian Westphal sockptr_t optval = KERNEL_SOCKPTR(&val);
1509061f24bSFlorian Westphal struct mptcp_subflow_context *subflow;
1519061f24bSFlorian Westphal struct sock *sk = (struct sock *)msk;
1529061f24bSFlorian Westphal int ret;
1539061f24bSFlorian Westphal
1549061f24bSFlorian Westphal ret = sock_setsockopt(sk->sk_socket, SOL_SOCKET, optname,
1559061f24bSFlorian Westphal optval, sizeof(val));
1569061f24bSFlorian Westphal if (ret)
1579061f24bSFlorian Westphal return ret;
1589061f24bSFlorian Westphal
1599061f24bSFlorian Westphal lock_sock(sk);
1609061f24bSFlorian Westphal mptcp_for_each_subflow(msk, subflow) {
1619061f24bSFlorian Westphal struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
1629061f24bSFlorian Westphal bool slow = lock_sock_fast(ssk);
1639061f24bSFlorian Westphal
1649061f24bSFlorian Westphal sock_set_timestamp(sk, optname, !!val);
1659061f24bSFlorian Westphal unlock_sock_fast(ssk, slow);
1669061f24bSFlorian Westphal }
1679061f24bSFlorian Westphal
1689061f24bSFlorian Westphal release_sock(sk);
1699061f24bSFlorian Westphal return 0;
1709061f24bSFlorian Westphal }
1719061f24bSFlorian Westphal
/* Dispatch the SOL_SOCKET options that carry a plain integer value.
 *
 * The value is read from @optval first; any failure there is returned as
 * is. Option names not handled here yield -ENOPROTOOPT.
 */
static int mptcp_setsockopt_sol_socket_int(struct mptcp_sock *msk, int optname,
					   sockptr_t optval,
					   unsigned int optlen)
{
	int val;
	int err;

	err = mptcp_get_int_option(msk, optval, optlen, &val);
	if (err)
		return err;

	switch (optname) {
	case SO_INCOMING_CPU:
		mptcp_so_incoming_cpu(msk, val);
		return 0;
	case SO_TIMESTAMP_OLD:
	case SO_TIMESTAMP_NEW:
	case SO_TIMESTAMPNS_OLD:
	case SO_TIMESTAMPNS_NEW:
		return mptcp_setsockopt_sol_socket_tstamp(msk, optname, val);
	case SO_KEEPALIVE:
	case SO_DEBUG:
	case SO_MARK:
	case SO_PRIORITY:
	case SO_SNDBUF:
	case SO_SNDBUFFORCE:
	case SO_RCVBUF:
	case SO_RCVBUFFORCE:
		return mptcp_sol_socket_intval(msk, optname, val);
	default:
		return -ENOPROTOOPT;
	}
}
2041b3e7edeSFlorian Westphal
/* Handle SO_TIMESTAMPING_{OLD,NEW}.
 *
 * @optval may hold either a full struct so_timestamping or a bare int; in
 * the latter case the int is used as the flags member and the remaining
 * members are zeroed. Any other @optlen is rejected with -EINVAL, a failed
 * copy with -EFAULT.
 *
 * The request is applied to the msk socket via sock_setsockopt(); on
 * failure that error is returned. On success it is then applied to every
 * subflow socket, each under its own fast lock with the msk socket lock
 * held. The per-subflow return value of sock_set_timestamping() is not
 * checked.
 */
static int mptcp_setsockopt_sol_socket_timestamping(struct mptcp_sock *msk,
						    int optname,
						    sockptr_t optval,
						    unsigned int optlen)
{
	struct mptcp_subflow_context *subflow;
	struct sock *sk = (struct sock *)msk;
	struct so_timestamping timestamping;
	int ret;

	if (optlen == sizeof(timestamping)) {
		if (copy_from_sockptr(&timestamping, optval,
				      sizeof(timestamping)))
			return -EFAULT;
	} else if (optlen == sizeof(int)) {
		memset(&timestamping, 0, sizeof(timestamping));

		if (copy_from_sockptr(&timestamping.flags, optval, sizeof(int)))
			return -EFAULT;
	} else {
		return -EINVAL;
	}

	ret = sock_setsockopt(sk->sk_socket, SOL_SOCKET, optname,
			      KERNEL_SOCKPTR(&timestamping),
			      sizeof(timestamping));
	if (ret)
		return ret;

	lock_sock(sk);

	mptcp_for_each_subflow(msk, subflow) {
		struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
		bool slow = lock_sock_fast(ssk);

		/* Target the subflow whose lock is held: the msk itself has
		 * already been configured by sock_setsockopt() above.
		 */
		sock_set_timestamping(ssk, optname, timestamping);
		unlock_sock_fast(ssk, slow);
	}

	release_sock(sk);

	return 0;
}
2486c9a0a0fSYangbo Lu
/* Handle SO_LINGER.
 *
 * The struct linger is copied from @optval (-EINVAL if @optlen is too
 * small, -EFAULT on copy failure) and applied to the msk socket via
 * sock_setsockopt(). On success the msk setsockopt sequence is bumped and
 * every subflow gets its SOCK_LINGER flag updated; when lingering is
 * enabled the subflow also takes the msk's sk_lingertime.
 */
static int mptcp_setsockopt_sol_socket_linger(struct mptcp_sock *msk, sockptr_t optval,
					      unsigned int optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct mptcp_subflow_context *subflow;
	struct linger ling;
	int err;

	if (optlen < sizeof(ling))
		return -EINVAL;

	if (copy_from_sockptr(&ling, optval, sizeof(ling)))
		return -EFAULT;

	err = sock_setsockopt(sk->sk_socket, SOL_SOCKET, SO_LINGER,
			      KERNEL_SOCKPTR(&ling), sizeof(ling));
	if (err)
		return err;

	lock_sock(sk);
	sockopt_seq_inc(msk);

	mptcp_for_each_subflow(msk, subflow) {
		struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
		bool slow = lock_sock_fast(ssk);

		if (ling.l_onoff) {
			/* the linger time comes from the msk-level socket */
			ssk->sk_lingertime = sk->sk_lingertime;
			sock_set_flag(ssk, SOCK_LINGER);
		} else {
			sock_reset_flag(ssk, SOCK_LINGER);
		}

		subflow->setsockopt_seq = msk->setsockopt_seq;
		unlock_sock_fast(ssk, slow);
	}

	release_sock(sk);
	return 0;
}
289268b1238SFlorian Westphal
/* Entry point for SOL_SOCKET level options on an MPTCP socket.
 *
 * Options fall into five groups:
 *  - bind/reuse options: set on the socket returned by __mptcp_nmpc_sk()
 *    and, on success, mirrored back into the msk socket;
 *  - integer, timestamping and linger options: delegated to the dedicated
 *    helpers;
 *  - options only relevant for the msk: passed to sock_setsockopt();
 *  - options accepted but ignored: return 0 without any action;
 *  - everything else: -EOPNOTSUPP.
 */
static int mptcp_setsockopt_sol_socket(struct mptcp_sock *msk, int optname,
				       sockptr_t optval, unsigned int optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct sock *ssk;
	int ret;

	switch (optname) {
	case SO_REUSEPORT:
	case SO_REUSEADDR:
	case SO_BINDTODEVICE:
	case SO_BINDTOIFINDEX:
		lock_sock(sk);
		ssk = __mptcp_nmpc_sk(msk);
		if (IS_ERR(ssk)) {
			ret = PTR_ERR(ssk);
		} else {
			ret = sk_setsockopt(ssk, SOL_SOCKET, optname, optval,
					    optlen);
			if (!ret) {
				/* mirror the accepted value into the msk */
				switch (optname) {
				case SO_REUSEPORT:
					sk->sk_reuseport = ssk->sk_reuseport;
					break;
				case SO_REUSEADDR:
					sk->sk_reuse = ssk->sk_reuse;
					break;
				case SO_BINDTODEVICE:
				case SO_BINDTOIFINDEX:
					sk->sk_bound_dev_if = ssk->sk_bound_dev_if;
					break;
				}
			}
		}
		release_sock(sk);
		return ret;

	case SO_KEEPALIVE:
	case SO_PRIORITY:
	case SO_SNDBUF:
	case SO_SNDBUFFORCE:
	case SO_RCVBUF:
	case SO_RCVBUFFORCE:
	case SO_MARK:
	case SO_INCOMING_CPU:
	case SO_DEBUG:
	case SO_TIMESTAMP_OLD:
	case SO_TIMESTAMP_NEW:
	case SO_TIMESTAMPNS_OLD:
	case SO_TIMESTAMPNS_NEW:
		return mptcp_setsockopt_sol_socket_int(msk, optname, optval,
						       optlen);

	case SO_TIMESTAMPING_OLD:
	case SO_TIMESTAMPING_NEW:
		return mptcp_setsockopt_sol_socket_timestamping(msk, optname,
								optval, optlen);

	case SO_LINGER:
		return mptcp_setsockopt_sol_socket_linger(msk, optval, optlen);

	case SO_RCVLOWAT:
	case SO_RCVTIMEO_OLD:
	case SO_RCVTIMEO_NEW:
	case SO_SNDTIMEO_OLD:
	case SO_SNDTIMEO_NEW:
	case SO_BUSY_POLL:
	case SO_PREFER_BUSY_POLL:
	case SO_BUSY_POLL_BUDGET:
		/* No need to copy: only relevant for msk */
		return sock_setsockopt(sk->sk_socket, SOL_SOCKET, optname,
				       optval, optlen);

	case SO_NO_CHECK:
	case SO_DONTROUTE:
	case SO_BROADCAST:
	case SO_BSDCOMPAT:
	case SO_PASSCRED:
	case SO_PASSPIDFD:
	case SO_PASSSEC:
	case SO_RXQ_OVFL:
	case SO_WIFI_STATUS:
	case SO_NOFCS:
	case SO_SELECT_ERR_QUEUE:
		/* accepted, but nothing is done for these */
		return 0;
	}

	/* SO_OOBINLINE is not supported, let's avoid the related mess.
	 * SO_ATTACH_FILTER, SO_ATTACH_BPF, SO_ATTACH_REUSEPORT_CBPF,
	 * SO_DETACH_REUSEPORT_BPF, SO_DETACH_FILTER, SO_LOCK_FILTER:
	 * we must be careful with subflows.
	 *
	 * SO_ATTACH_REUSEPORT_EBPF is not supported, as it checks
	 * explicitly the sk_protocol field.
	 *
	 * SO_PEEK_OFF is unsupported, as it is for plain TCP.
	 * SO_MAX_PACING_RATE is unsupported, we must be careful with subflows.
	 * SO_CNX_ADVICE is currently unsupported, could possibly be relevant,
	 * but likely needs careful design.
	 *
	 * SO_ZEROCOPY is currently unsupported, TODO in sndmsg.
	 * SO_TXTIME is currently unsupported.
	 */

	return -EOPNOTSUPP;
}
3860abdde82SPaolo Abeni
/* Handle the SOL_IPV6 options IPV6_V6ONLY, IPV6_TRANSPARENT and
 * IPV6_FREEBIND; any other option name yields -EOPNOTSUPP.
 *
 * With the msk socket lock held, the option is set via tcp_setsockopt() on
 * the socket returned by __mptcp_nmpc_sk(). On success the msk setsockopt
 * sequence is bumped and the resulting setting is mirrored from that
 * socket into the msk socket.
 *
 * Returns 0 on success, the PTR_ERR() of a failed __mptcp_nmpc_sk() or the
 * error reported by tcp_setsockopt().
 */
static int mptcp_setsockopt_v6(struct mptcp_sock *msk, int optname,
			       sockptr_t optval, unsigned int optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct sock *ssk;
	int ret;

	if (optname != IPV6_V6ONLY &&
	    optname != IPV6_TRANSPARENT &&
	    optname != IPV6_FREEBIND)
		return -EOPNOTSUPP;

	lock_sock(sk);

	ssk = __mptcp_nmpc_sk(msk);
	if (IS_ERR(ssk)) {
		ret = PTR_ERR(ssk);
		goto unlock;
	}

	ret = tcp_setsockopt(ssk, SOL_IPV6, optname, optval, optlen);
	if (ret != 0)
		goto unlock;

	sockopt_seq_inc(msk);

	/* copy back what the subflow ended up with */
	if (optname == IPV6_V6ONLY)
		sk->sk_ipv6only = ssk->sk_ipv6only;
	else if (optname == IPV6_TRANSPARENT)
		inet_assign_bit(TRANSPARENT, sk,
				inet_test_bit(TRANSPARENT, ssk));
	else
		inet_assign_bit(FREEBIND, sk,
				inet_test_bit(FREEBIND, ssk));

unlock:
	release_sock(sk);
	return ret;
}
4330abdde82SPaolo Abeni
mptcp_supported_sockopt(int level,int optname)434d9e4c129SPaolo Abeni static bool mptcp_supported_sockopt(int level, int optname)
435d9e4c129SPaolo Abeni {
436d9e4c129SPaolo Abeni if (level == SOL_IP) {
437d9e4c129SPaolo Abeni switch (optname) {
438d9e4c129SPaolo Abeni /* should work fine */
439d9e4c129SPaolo Abeni case IP_FREEBIND:
440d9e4c129SPaolo Abeni case IP_TRANSPARENT:
441c85636a2SMaxim Galaganov case IP_BIND_ADDRESS_NO_PORT:
442c85636a2SMaxim Galaganov case IP_LOCAL_PORT_RANGE:
443d9e4c129SPaolo Abeni
444d9e4c129SPaolo Abeni /* the following are control cmsg related */
445d9e4c129SPaolo Abeni case IP_PKTINFO:
446d9e4c129SPaolo Abeni case IP_RECVTTL:
447d9e4c129SPaolo Abeni case IP_RECVTOS:
448d9e4c129SPaolo Abeni case IP_RECVOPTS:
449d9e4c129SPaolo Abeni case IP_RETOPTS:
450d9e4c129SPaolo Abeni case IP_PASSSEC:
451d9e4c129SPaolo Abeni case IP_RECVORIGDSTADDR:
452d9e4c129SPaolo Abeni case IP_CHECKSUM:
453d9e4c129SPaolo Abeni case IP_RECVFRAGSIZE:
454d9e4c129SPaolo Abeni
455d9e4c129SPaolo Abeni /* common stuff that need some love */
456d9e4c129SPaolo Abeni case IP_TOS:
457d9e4c129SPaolo Abeni case IP_TTL:
458d9e4c129SPaolo Abeni case IP_MTU_DISCOVER:
459d9e4c129SPaolo Abeni case IP_RECVERR:
460d9e4c129SPaolo Abeni
461d9e4c129SPaolo Abeni /* possibly less common may deserve some love */
462d9e4c129SPaolo Abeni case IP_MINTTL:
463d9e4c129SPaolo Abeni
464d9e4c129SPaolo Abeni /* the following is apparently a no-op for plain TCP */
465d9e4c129SPaolo Abeni case IP_RECVERR_RFC4884:
466d9e4c129SPaolo Abeni return true;
467d9e4c129SPaolo Abeni }
468d9e4c129SPaolo Abeni
469d9e4c129SPaolo Abeni /* IP_OPTIONS is not supported, needs subflow care */
470d9e4c129SPaolo Abeni /* IP_HDRINCL, IP_NODEFRAG are not supported, RAW specific */
471d9e4c129SPaolo Abeni /* IP_MULTICAST_TTL, IP_MULTICAST_LOOP, IP_UNICAST_IF,
472d9e4c129SPaolo Abeni * IP_ADD_MEMBERSHIP, IP_ADD_SOURCE_MEMBERSHIP, IP_DROP_MEMBERSHIP,
473d9e4c129SPaolo Abeni * IP_DROP_SOURCE_MEMBERSHIP, IP_BLOCK_SOURCE, IP_UNBLOCK_SOURCE,
474d9e4c129SPaolo Abeni * MCAST_JOIN_GROUP, MCAST_LEAVE_GROUP MCAST_JOIN_SOURCE_GROUP,
475d9e4c129SPaolo Abeni * MCAST_LEAVE_SOURCE_GROUP, MCAST_BLOCK_SOURCE, MCAST_UNBLOCK_SOURCE,
476d9e4c129SPaolo Abeni * MCAST_MSFILTER, IP_MULTICAST_ALL are not supported, better not deal
477d9e4c129SPaolo Abeni * with mcast stuff
478d9e4c129SPaolo Abeni */
479d9e4c129SPaolo Abeni /* IP_IPSEC_POLICY, IP_XFRM_POLICY are nut supported, unrelated here */
480d9e4c129SPaolo Abeni return false;
481d9e4c129SPaolo Abeni }
482d9e4c129SPaolo Abeni if (level == SOL_IPV6) {
483d9e4c129SPaolo Abeni switch (optname) {
484d9e4c129SPaolo Abeni case IPV6_V6ONLY:
485d9e4c129SPaolo Abeni
486d9e4c129SPaolo Abeni /* the following are control cmsg related */
487d9e4c129SPaolo Abeni case IPV6_RECVPKTINFO:
488d9e4c129SPaolo Abeni case IPV6_2292PKTINFO:
489d9e4c129SPaolo Abeni case IPV6_RECVHOPLIMIT:
490d9e4c129SPaolo Abeni case IPV6_2292HOPLIMIT:
491d9e4c129SPaolo Abeni case IPV6_RECVRTHDR:
492d9e4c129SPaolo Abeni case IPV6_2292RTHDR:
493d9e4c129SPaolo Abeni case IPV6_RECVHOPOPTS:
494d9e4c129SPaolo Abeni case IPV6_2292HOPOPTS:
495d9e4c129SPaolo Abeni case IPV6_RECVDSTOPTS:
496d9e4c129SPaolo Abeni case IPV6_2292DSTOPTS:
497d9e4c129SPaolo Abeni case IPV6_RECVTCLASS:
498d9e4c129SPaolo Abeni case IPV6_FLOWINFO:
499d9e4c129SPaolo Abeni case IPV6_RECVPATHMTU:
500d9e4c129SPaolo Abeni case IPV6_RECVORIGDSTADDR:
501d9e4c129SPaolo Abeni case IPV6_RECVFRAGSIZE:
502d9e4c129SPaolo Abeni
503d9e4c129SPaolo Abeni /* the following ones need some love but are quite common */
504d9e4c129SPaolo Abeni case IPV6_TCLASS:
505d9e4c129SPaolo Abeni case IPV6_TRANSPARENT:
506d9e4c129SPaolo Abeni case IPV6_FREEBIND:
507d9e4c129SPaolo Abeni case IPV6_PKTINFO:
508d9e4c129SPaolo Abeni case IPV6_2292PKTOPTIONS:
509d9e4c129SPaolo Abeni case IPV6_UNICAST_HOPS:
510d9e4c129SPaolo Abeni case IPV6_MTU_DISCOVER:
511d9e4c129SPaolo Abeni case IPV6_MTU:
512d9e4c129SPaolo Abeni case IPV6_RECVERR:
513d9e4c129SPaolo Abeni case IPV6_FLOWINFO_SEND:
514d9e4c129SPaolo Abeni case IPV6_FLOWLABEL_MGR:
515d9e4c129SPaolo Abeni case IPV6_MINHOPCOUNT:
516d9e4c129SPaolo Abeni case IPV6_DONTFRAG:
517d9e4c129SPaolo Abeni case IPV6_AUTOFLOWLABEL:
518d9e4c129SPaolo Abeni
519d9e4c129SPaolo Abeni /* the following one is a no-op for plain TCP */
520d9e4c129SPaolo Abeni case IPV6_RECVERR_RFC4884:
521d9e4c129SPaolo Abeni return true;
522d9e4c129SPaolo Abeni }
523d9e4c129SPaolo Abeni
524d9e4c129SPaolo Abeni /* IPV6_HOPOPTS, IPV6_RTHDRDSTOPTS, IPV6_RTHDR, IPV6_DSTOPTS are
525d9e4c129SPaolo Abeni * not supported
526d9e4c129SPaolo Abeni */
527d9e4c129SPaolo Abeni /* IPV6_MULTICAST_HOPS, IPV6_MULTICAST_LOOP, IPV6_UNICAST_IF,
528d9e4c129SPaolo Abeni * IPV6_MULTICAST_IF, IPV6_ADDRFORM,
529d9e4c129SPaolo Abeni * IPV6_ADD_MEMBERSHIP, IPV6_DROP_MEMBERSHIP, IPV6_JOIN_ANYCAST,
530d9e4c129SPaolo Abeni * IPV6_LEAVE_ANYCAST, IPV6_MULTICAST_ALL, MCAST_JOIN_GROUP, MCAST_LEAVE_GROUP,
531d9e4c129SPaolo Abeni * MCAST_JOIN_SOURCE_GROUP, MCAST_LEAVE_SOURCE_GROUP,
532d9e4c129SPaolo Abeni * MCAST_BLOCK_SOURCE, MCAST_UNBLOCK_SOURCE, MCAST_MSFILTER
533d9e4c129SPaolo Abeni * are not supported better not deal with mcast
534d9e4c129SPaolo Abeni */
535d9e4c129SPaolo Abeni /* IPV6_ROUTER_ALERT, IPV6_ROUTER_ALERT_ISOLATE are not supported, since are evil */
536d9e4c129SPaolo Abeni
537d9e4c129SPaolo Abeni /* IPV6_IPSEC_POLICY, IPV6_XFRM_POLICY are not supported */
538d9e4c129SPaolo Abeni /* IPV6_ADDR_PREFERENCES is not supported, we must be careful with subflows */
539d9e4c129SPaolo Abeni return false;
540d9e4c129SPaolo Abeni }
541d9e4c129SPaolo Abeni if (level == SOL_TCP) {
542d9e4c129SPaolo Abeni switch (optname) {
543d9e4c129SPaolo Abeni /* the following are no-op or should work just fine */
544d9e4c129SPaolo Abeni case TCP_THIN_DUPACK:
545d9e4c129SPaolo Abeni case TCP_DEFER_ACCEPT:
546d9e4c129SPaolo Abeni
547d9e4c129SPaolo Abeni /* the following need some love */
548d9e4c129SPaolo Abeni case TCP_MAXSEG:
549d9e4c129SPaolo Abeni case TCP_NODELAY:
550d9e4c129SPaolo Abeni case TCP_THIN_LINEAR_TIMEOUTS:
551d9e4c129SPaolo Abeni case TCP_CONGESTION:
552d9e4c129SPaolo Abeni case TCP_CORK:
553d9e4c129SPaolo Abeni case TCP_KEEPIDLE:
554d9e4c129SPaolo Abeni case TCP_KEEPINTVL:
555d9e4c129SPaolo Abeni case TCP_KEEPCNT:
556d9e4c129SPaolo Abeni case TCP_SYNCNT:
557d9e4c129SPaolo Abeni case TCP_SAVE_SYN:
558d9e4c129SPaolo Abeni case TCP_LINGER2:
559d9e4c129SPaolo Abeni case TCP_WINDOW_CLAMP:
560d9e4c129SPaolo Abeni case TCP_QUICKACK:
561d9e4c129SPaolo Abeni case TCP_USER_TIMEOUT:
562d9e4c129SPaolo Abeni case TCP_TIMESTAMP:
563d9e4c129SPaolo Abeni case TCP_NOTSENT_LOWAT:
564d9e4c129SPaolo Abeni case TCP_TX_DELAY:
5652c9e7765SFlorian Westphal case TCP_INQ:
5664ffb0a02SDmytro Shytyi case TCP_FASTOPEN:
56754635bd0SBenjamin Hesmans case TCP_FASTOPEN_CONNECT:
568cb99816cSMatthieu Baerts case TCP_FASTOPEN_KEY:
569e64d4debSMatthieu Baerts case TCP_FASTOPEN_NO_COOKIE:
570d9e4c129SPaolo Abeni return true;
571d9e4c129SPaolo Abeni }
572d9e4c129SPaolo Abeni
573d9e4c129SPaolo Abeni /* TCP_MD5SIG, TCP_MD5SIG_EXT are not supported, MD5 is not compatible with MPTCP */
574d9e4c129SPaolo Abeni
575d9e4c129SPaolo Abeni /* TCP_REPAIR, TCP_REPAIR_QUEUE, TCP_QUEUE_SEQ, TCP_REPAIR_OPTIONS,
576d9e4c129SPaolo Abeni * TCP_REPAIR_WINDOW are not supported, better avoid this mess
577d9e4c129SPaolo Abeni */
578d9e4c129SPaolo Abeni }
579d9e4c129SPaolo Abeni return false;
580d9e4c129SPaolo Abeni }
581d9e4c129SPaolo Abeni
/* Handle TCP_CONGESTION.
 *
 * The algorithm name is copied from @optval (at most TCP_CA_NAME_MAX - 1
 * bytes) and NUL-terminated. With the msk socket lock held, the msk
 * setsockopt sequence is bumped and tcp_set_congestion_control() is called
 * on every subflow under that subflow's socket lock; all subflows are
 * visited even after a failure. The name is stored in msk->ca_name only if
 * no subflow reported an error.
 *
 * Returns 0 on success, -EINVAL for an empty @optlen, -EFAULT when the
 * name cannot be copied, or the first negative error from a subflow.
 */
static int mptcp_setsockopt_sol_tcp_congestion(struct mptcp_sock *msk, sockptr_t optval,
					       unsigned int optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct mptcp_subflow_context *subflow;
	char name[TCP_CA_NAME_MAX];
	bool cap_net_admin;
	int first_err = 0;
	int copied;

	if (optlen < 1)
		return -EINVAL;

	copied = strncpy_from_sockptr(name, optval,
				      min_t(long, TCP_CA_NAME_MAX - 1, optlen));
	if (copied < 0)
		return -EFAULT;

	name[copied] = 0;

	cap_net_admin = ns_capable(sock_net(sk)->user_ns, CAP_NET_ADMIN);

	lock_sock(sk);
	sockopt_seq_inc(msk);

	mptcp_for_each_subflow(msk, subflow) {
		struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
		int err;

		lock_sock(ssk);
		err = tcp_set_congestion_control(ssk, name, true, cap_net_admin);
		/* remember only the first failure */
		if (first_err == 0 && err < 0)
			first_err = err;
		subflow->setsockopt_seq = msk->setsockopt_seq;
		release_sock(ssk);
	}

	if (!first_err)
		strscpy(msk->ca_name, name, sizeof(msk->ca_name));

	release_sock(sk);
	return first_err;
}
624aa1fbd94SFlorian Westphal
__mptcp_setsockopt_set_val(struct mptcp_sock * msk,int max,int (* set_val)(struct sock *,int),int * msk_val,int val)625bd11dc4fSMatthieu Baerts (NGI0) static int __mptcp_setsockopt_set_val(struct mptcp_sock *msk, int max,
626bd11dc4fSMatthieu Baerts (NGI0) int (*set_val)(struct sock *, int),
627bd11dc4fSMatthieu Baerts (NGI0) int *msk_val, int val)
628bd11dc4fSMatthieu Baerts (NGI0) {
629bd11dc4fSMatthieu Baerts (NGI0) struct mptcp_subflow_context *subflow;
630bd11dc4fSMatthieu Baerts (NGI0) int err = 0;
631bd11dc4fSMatthieu Baerts (NGI0)
632bd11dc4fSMatthieu Baerts (NGI0) mptcp_for_each_subflow(msk, subflow) {
633bd11dc4fSMatthieu Baerts (NGI0) struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
634bd11dc4fSMatthieu Baerts (NGI0) int ret;
635bd11dc4fSMatthieu Baerts (NGI0)
636bd11dc4fSMatthieu Baerts (NGI0) lock_sock(ssk);
637bd11dc4fSMatthieu Baerts (NGI0) ret = set_val(ssk, val);
638bd11dc4fSMatthieu Baerts (NGI0) err = err ? : ret;
639bd11dc4fSMatthieu Baerts (NGI0) release_sock(ssk);
640bd11dc4fSMatthieu Baerts (NGI0) }
641bd11dc4fSMatthieu Baerts (NGI0)
642bd11dc4fSMatthieu Baerts (NGI0) if (!err) {
643bd11dc4fSMatthieu Baerts (NGI0) *msk_val = val;
644bd11dc4fSMatthieu Baerts (NGI0) sockopt_seq_inc(msk);
645bd11dc4fSMatthieu Baerts (NGI0) }
646bd11dc4fSMatthieu Baerts (NGI0)
647bd11dc4fSMatthieu Baerts (NGI0) return err;
648bd11dc4fSMatthieu Baerts (NGI0) }
649bd11dc4fSMatthieu Baerts (NGI0)
__mptcp_setsockopt_sol_tcp_cork(struct mptcp_sock * msk,int val)6507f71a337SPaolo Abeni static int __mptcp_setsockopt_sol_tcp_cork(struct mptcp_sock *msk, int val)
6514f6e14bdSMaxim Galaganov {
6524f6e14bdSMaxim Galaganov struct mptcp_subflow_context *subflow;
6534f6e14bdSMaxim Galaganov struct sock *sk = (struct sock *)msk;
6544f6e14bdSMaxim Galaganov
6554f6e14bdSMaxim Galaganov sockopt_seq_inc(msk);
6564f6e14bdSMaxim Galaganov msk->cork = !!val;
6574f6e14bdSMaxim Galaganov mptcp_for_each_subflow(msk, subflow) {
6584f6e14bdSMaxim Galaganov struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
6594f6e14bdSMaxim Galaganov
6604f6e14bdSMaxim Galaganov lock_sock(ssk);
6614f6e14bdSMaxim Galaganov __tcp_sock_set_cork(ssk, !!val);
6624f6e14bdSMaxim Galaganov release_sock(ssk);
6634f6e14bdSMaxim Galaganov }
6644f6e14bdSMaxim Galaganov if (!val)
6654f6e14bdSMaxim Galaganov mptcp_check_and_set_pending(sk);
6664f6e14bdSMaxim Galaganov
6674f6e14bdSMaxim Galaganov return 0;
6684f6e14bdSMaxim Galaganov }
6694f6e14bdSMaxim Galaganov
__mptcp_setsockopt_sol_tcp_nodelay(struct mptcp_sock * msk,int val)6707f71a337SPaolo Abeni static int __mptcp_setsockopt_sol_tcp_nodelay(struct mptcp_sock *msk, int val)
6714f6e14bdSMaxim Galaganov {
6724f6e14bdSMaxim Galaganov struct mptcp_subflow_context *subflow;
6734f6e14bdSMaxim Galaganov struct sock *sk = (struct sock *)msk;
6744f6e14bdSMaxim Galaganov
6754f6e14bdSMaxim Galaganov sockopt_seq_inc(msk);
6764f6e14bdSMaxim Galaganov msk->nodelay = !!val;
6774f6e14bdSMaxim Galaganov mptcp_for_each_subflow(msk, subflow) {
6784f6e14bdSMaxim Galaganov struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
6794f6e14bdSMaxim Galaganov
6804f6e14bdSMaxim Galaganov lock_sock(ssk);
6814f6e14bdSMaxim Galaganov __tcp_sock_set_nodelay(ssk, !!val);
6824f6e14bdSMaxim Galaganov release_sock(ssk);
6834f6e14bdSMaxim Galaganov }
6844f6e14bdSMaxim Galaganov if (val)
6854f6e14bdSMaxim Galaganov mptcp_check_and_set_pending(sk);
6864f6e14bdSMaxim Galaganov return 0;
6874f6e14bdSMaxim Galaganov }
6884f6e14bdSMaxim Galaganov
/* Set a SOL_IP option on the MPTCP socket via ip_setsockopt(), then mirror
 * the resulting state onto the socket returned by __mptcp_nmpc_sk().
 *
 * Returns 0 on success, the ip_setsockopt() error, the error encoded in the
 * __mptcp_nmpc_sk() result, or -EOPNOTSUPP for an option this helper does
 * not know how to mirror.
 */
static int mptcp_setsockopt_sol_ip_set(struct mptcp_sock *msk, int optname,
				       sockptr_t optval, unsigned int optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct sock *first;
	int ret;

	ret = ip_setsockopt(sk, SOL_IP, optname, optval, optlen);
	if (ret)
		return ret;

	lock_sock(sk);

	first = __mptcp_nmpc_sk(msk);
	if (IS_ERR(first)) {
		ret = PTR_ERR(first);
		goto unlock;
	}

	/* copy the value just stored on the msk over to the subflow */
	switch (optname) {
	case IP_FREEBIND:
		inet_assign_bit(FREEBIND, first, inet_test_bit(FREEBIND, sk));
		break;
	case IP_TRANSPARENT:
		inet_assign_bit(TRANSPARENT, first,
				inet_test_bit(TRANSPARENT, sk));
		break;
	case IP_BIND_ADDRESS_NO_PORT:
		inet_assign_bit(BIND_ADDRESS_NO_PORT, first,
				inet_test_bit(BIND_ADDRESS_NO_PORT, sk));
		break;
	case IP_LOCAL_PORT_RANGE:
		WRITE_ONCE(inet_sk(first)->local_port_range,
			   READ_ONCE(inet_sk(sk)->local_port_range));
		break;
	default:
		/* callers are expected to filter the option beforehand */
		release_sock(sk);
		WARN_ON_ONCE(1);
		return -EOPNOTSUPP;
	}

	sockopt_seq_inc(msk);

unlock:
	release_sock(sk);
	return ret;
}
734c9406a23SFlorian Westphal
/* IP_TOS handler: let ip_setsockopt() update the MPTCP socket, then copy the
 * resulting TOS value to every subflow.
 *
 * Returns 0 on success or the error reported by ip_setsockopt().
 */
static int mptcp_setsockopt_v4_set_tos(struct mptcp_sock *msk, int optname,
				       sockptr_t optval, unsigned int optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct mptcp_subflow_context *sf;
	int ret, tos;

	ret = ip_setsockopt(sk, SOL_IP, optname, optval, optlen);
	if (ret)
		return ret;

	lock_sock(sk);
	sockopt_seq_inc(msk);

	/* read back what ip_setsockopt() actually stored on the msk */
	tos = READ_ONCE(inet_sk(sk)->tos);

	mptcp_for_each_subflow(msk, sf) {
		struct sock *ssk = mptcp_subflow_tcp_sock(sf);
		bool slow = lock_sock_fast(ssk);

		__ip_sock_set_tos(ssk, tos);
		unlock_sock_fast(ssk, slow);
	}

	release_sock(sk);

	return 0;
}
762ffcacff8SPoorva Sonparote
/* Dispatch a SOL_IP setsockopt() to the matching MPTCP helper.
 * Options without a helper yield -EOPNOTSUPP.
 */
static int mptcp_setsockopt_v4(struct mptcp_sock *msk, int optname,
			       sockptr_t optval, unsigned int optlen)
{
	switch (optname) {
	case IP_TOS:
		return mptcp_setsockopt_v4_set_tos(msk, optname, optval, optlen);
	case IP_FREEBIND:
	case IP_TRANSPARENT:
	case IP_BIND_ADDRESS_NO_PORT:
	case IP_LOCAL_PORT_RANGE:
		return mptcp_setsockopt_sol_ip_set(msk, optname, optval, optlen);
	default:
		return -EOPNOTSUPP;
	}
}
778ffcacff8SPoorva Sonparote
/* Forward a setsockopt() to the socket returned by __mptcp_nmpc_sk() only.
 *
 * Returns the tcp_setsockopt() result, or the error encoded in the
 * __mptcp_nmpc_sk() return value.
 */
static int mptcp_setsockopt_first_sf_only(struct mptcp_sock *msk, int level, int optname,
					  sockptr_t optval, unsigned int optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct sock *first;
	int err;

	/* Limit to first subflow, before the connection establishment */
	lock_sock(sk);

	first = __mptcp_nmpc_sk(msk);
	if (IS_ERR(first))
		err = PTR_ERR(first);
	else
		err = tcp_setsockopt(first, level, optname, optval, optlen);

	release_sock(sk);
	return err;
}
80054635bd0SBenjamin Hesmans
/* Handle SOL_TCP options on an MPTCP socket.
 *
 * A first group of options is rejected or delegated without parsing the
 * user value here; the remaining ones are read as an int and applied with
 * the MPTCP socket locked. Unknown options yield -ENOPROTOOPT.
 */
static int mptcp_setsockopt_sol_tcp(struct mptcp_sock *msk, int optname,
				    sockptr_t optval, unsigned int optlen)
{
	struct sock *sk = (void *)msk;
	int val, err;

	switch (optname) {
	case TCP_ULP:
		return -EOPNOTSUPP;
	case TCP_CONGESTION:
		return mptcp_setsockopt_sol_tcp_congestion(msk, optval, optlen);
	case TCP_DEFER_ACCEPT:
		/* See tcp.c: TCP_DEFER_ACCEPT does not fail */
		mptcp_setsockopt_first_sf_only(msk, SOL_TCP, optname, optval, optlen);
		return 0;
	case TCP_FASTOPEN:
	case TCP_FASTOPEN_CONNECT:
	case TCP_FASTOPEN_KEY:
	case TCP_FASTOPEN_NO_COOKIE:
		return mptcp_setsockopt_first_sf_only(msk, SOL_TCP, optname,
						      optval, optlen);
	}

	/* everything below takes a plain integer argument */
	err = mptcp_get_int_option(msk, optval, optlen, &val);
	if (err)
		return err;

	lock_sock(sk);

	switch (optname) {
	case TCP_NODELAY:
		err = __mptcp_setsockopt_sol_tcp_nodelay(msk, val);
		break;
	case TCP_CORK:
		err = __mptcp_setsockopt_sol_tcp_cork(msk, val);
		break;
	case TCP_INQ:
		/* boolean option: only 0 and 1 are accepted */
		if (val < 0 || val > 1)
			err = -EINVAL;
		else
			msk->recvmsg_inq = !!val;
		break;
	case TCP_NOTSENT_LOWAT:
		WRITE_ONCE(msk->notsent_lowat, val);
		mptcp_write_space(sk);
		break;
	case TCP_KEEPIDLE:
		err = __mptcp_setsockopt_set_val(msk, MAX_TCP_KEEPIDLE,
						 &tcp_sock_set_keepidle_locked,
						 &msk->keepalive_idle, val);
		break;
	case TCP_KEEPINTVL:
		err = __mptcp_setsockopt_set_val(msk, MAX_TCP_KEEPINTVL,
						 &tcp_sock_set_keepintvl,
						 &msk->keepalive_intvl, val);
		break;
	case TCP_KEEPCNT:
		err = __mptcp_setsockopt_set_val(msk, MAX_TCP_KEEPCNT,
						 &tcp_sock_set_keepcnt,
						 &msk->keepalive_cnt, val);
		break;
	default:
		err = -ENOPROTOOPT;
	}

	release_sock(sk);
	return err;
}
869aa1fbd94SFlorian Westphal
/* setsockopt() entry point for MPTCP sockets.
 *
 * SOL_SOCKET options go to the dedicated handler. Any other option must pass
 * mptcp_supported_sockopt(), else -ENOPROTOOPT is returned. When the
 * connection has fallen back to TCP the request is handed to the remaining
 * subflow; otherwise it is dispatched on @level, with -EOPNOTSUPP for levels
 * that have no MPTCP handler.
 */
int mptcp_setsockopt(struct sock *sk, int level, int optname,
		     sockptr_t optval, unsigned int optlen)
{
	struct mptcp_sock *msk = mptcp_sk(sk);
	struct sock *ssk;

	/* printk-style messages must be newline terminated, otherwise the
	 * record may be held back or merged with a following message
	 */
	pr_debug("msk=%p\n", msk);

	if (level == SOL_SOCKET)
		return mptcp_setsockopt_sol_socket(msk, optname, optval, optlen);

	if (!mptcp_supported_sockopt(level, optname))
		return -ENOPROTOOPT;

	/* @@ the meaning of setsockopt() when the socket is connected and
	 * there are multiple subflows is not yet defined. It is up to the
	 * MPTCP-level socket to configure the subflows until the subflow
	 * is in TCP fallback, when TCP socket options are passed through
	 * to the one remaining subflow.
	 */
	lock_sock(sk);
	ssk = __mptcp_tcp_fallback(msk);
	release_sock(sk);
	if (ssk)
		return tcp_setsockopt(ssk, level, optname, optval, optlen);

	if (level == SOL_IP)
		return mptcp_setsockopt_v4(msk, optname, optval, optlen);

	if (level == SOL_IPV6)
		return mptcp_setsockopt_v6(msk, optname, optval, optlen);

	if (level == SOL_TCP)
		return mptcp_setsockopt_sol_tcp(msk, optname, optval, optlen);

	return -EOPNOTSUPP;
}
907aa1fbd94SFlorian Westphal
/* Answer a getsockopt() from a single subflow: msk->first when it is set,
 * otherwise the socket returned by __mptcp_nmpc_sk().
 *
 * Returns the tcp_getsockopt() result, or the error encoded in the
 * __mptcp_nmpc_sk() return value.
 */
static int mptcp_getsockopt_first_sf_only(struct mptcp_sock *msk, int level, int optname,
					  char __user *optval, int __user *optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct sock *target;
	int err;

	lock_sock(sk);

	target = msk->first;
	if (!target)
		target = __mptcp_nmpc_sk(msk);

	if (IS_ERR(target))
		err = PTR_ERR(target);
	else
		err = tcp_getsockopt(target, level, optname, optval, optlen);

	release_sock(sk);
	return err;
}
934aa1fbd94SFlorian Westphal
mptcp_diag_fill_info(struct mptcp_sock * msk,struct mptcp_info * info)93561bc6e82SFlorian Westphal void mptcp_diag_fill_info(struct mptcp_sock *msk, struct mptcp_info *info)
93661bc6e82SFlorian Westphal {
93738967f42SPaolo Abeni struct sock *sk = (struct sock *)msk;
93861bc6e82SFlorian Westphal u32 flags = 0;
93938967f42SPaolo Abeni bool slow;
94018d82cdeSGeliang Tang u32 now;
94161bc6e82SFlorian Westphal
94255c42fa7SFlorian Westphal memset(info, 0, sizeof(*info));
94355c42fa7SFlorian Westphal
94461bc6e82SFlorian Westphal info->mptcpi_subflows = READ_ONCE(msk->pm.subflows);
94561bc6e82SFlorian Westphal info->mptcpi_add_addr_signal = READ_ONCE(msk->pm.add_addr_signaled);
94661bc6e82SFlorian Westphal info->mptcpi_add_addr_accepted = READ_ONCE(msk->pm.add_addr_accepted);
94761bc6e82SFlorian Westphal info->mptcpi_local_addr_used = READ_ONCE(msk->pm.local_addr_used);
948e925a032SMatthieu Baerts
94938967f42SPaolo Abeni if (inet_sk_state_load(sk) == TCP_LISTEN)
95038967f42SPaolo Abeni return;
95138967f42SPaolo Abeni
952e925a032SMatthieu Baerts /* The following limits only make sense for the in-kernel PM */
953e925a032SMatthieu Baerts if (mptcp_pm_is_kernel(msk)) {
954e925a032SMatthieu Baerts info->mptcpi_subflows_max =
955e925a032SMatthieu Baerts mptcp_pm_get_subflows_max(msk);
956e925a032SMatthieu Baerts info->mptcpi_add_addr_signal_max =
957e925a032SMatthieu Baerts mptcp_pm_get_add_addr_signal_max(msk);
958e925a032SMatthieu Baerts info->mptcpi_add_addr_accepted_max =
959e925a032SMatthieu Baerts mptcp_pm_get_add_addr_accept_max(msk);
960e925a032SMatthieu Baerts info->mptcpi_local_addr_max =
961e925a032SMatthieu Baerts mptcp_pm_get_local_addr_max(msk);
962e925a032SMatthieu Baerts }
963e925a032SMatthieu Baerts
96483d580ddSGeliang Tang if (__mptcp_check_fallback(msk))
96561bc6e82SFlorian Westphal flags |= MPTCP_INFO_FLAG_FALLBACK;
96661bc6e82SFlorian Westphal if (READ_ONCE(msk->can_ack))
96761bc6e82SFlorian Westphal flags |= MPTCP_INFO_FLAG_REMOTE_KEY_RECEIVED;
96861bc6e82SFlorian Westphal info->mptcpi_flags = flags;
96938967f42SPaolo Abeni
97038967f42SPaolo Abeni slow = lock_sock_fast(sk);
97128e5c138SPaolo Abeni info->mptcpi_csum_enabled = READ_ONCE(msk->csum_enabled);
97238967f42SPaolo Abeni info->mptcpi_token = msk->token;
97338967f42SPaolo Abeni info->mptcpi_write_seq = msk->write_seq;
97438967f42SPaolo Abeni info->mptcpi_retransmits = inet_csk(sk)->icsk_retransmits;
97538967f42SPaolo Abeni info->mptcpi_bytes_sent = msk->bytes_sent;
97638967f42SPaolo Abeni info->mptcpi_bytes_received = msk->bytes_received;
97738967f42SPaolo Abeni info->mptcpi_bytes_retrans = msk->bytes_retrans;
9786ebf6f90SGeliang Tang info->mptcpi_subflows_total = info->mptcpi_subflows +
9796ebf6f90SGeliang Tang __mptcp_has_initial_subflow(msk);
98018d82cdeSGeliang Tang now = tcp_jiffies32;
98118d82cdeSGeliang Tang info->mptcpi_last_data_sent = jiffies_to_msecs(now - msk->last_data_sent);
98218d82cdeSGeliang Tang info->mptcpi_last_data_recv = jiffies_to_msecs(now - msk->last_data_recv);
98338967f42SPaolo Abeni unlock_sock_fast(sk, slow);
98418d82cdeSGeliang Tang
98518d82cdeSGeliang Tang mptcp_data_lock(sk);
98618d82cdeSGeliang Tang info->mptcpi_last_ack_recv = jiffies_to_msecs(now - msk->last_ack_recv);
98718d82cdeSGeliang Tang info->mptcpi_snd_una = msk->snd_una;
98818d82cdeSGeliang Tang info->mptcpi_rcv_nxt = msk->ack_seq;
98918d82cdeSGeliang Tang info->mptcpi_bytes_acked = msk->bytes_acked;
99018d82cdeSGeliang Tang mptcp_data_unlock(sk);
99161bc6e82SFlorian Westphal }
99261bc6e82SFlorian Westphal EXPORT_SYMBOL_GPL(mptcp_diag_fill_info);
99361bc6e82SFlorian Westphal
/* MPTCP_INFO getsockopt() handler.
 *
 * Copies at most sizeof(struct mptcp_info) bytes of the current info
 * snapshot to @optval and writes the number of bytes copied to @optlen.
 *
 * Returns 0 on success (including the zero-length probe), -EINVAL for a
 * negative user length, -EFAULT when user memory cannot be accessed.
 */
static int mptcp_getsockopt_info(struct mptcp_sock *msk, char __user *optval, int __user *optlen)
{
	struct mptcp_info m_info;
	int len;

	if (get_user(len, optlen))
		return -EFAULT;

	/* A negative length would be turned into a huge unsigned value by
	 * the min_t() below and silently treated as "big enough"; reject it
	 * as the other getsockopt helpers in this file do.
	 */
	if (len < 0)
		return -EINVAL;

	/* When used only to check if a fallback to TCP happened. */
	if (len == 0)
		return 0;

	len = min_t(unsigned int, len, sizeof(struct mptcp_info));

	mptcp_diag_fill_info(msk, &m_info);

	if (put_user(len, optlen))
		return -EFAULT;

	if (copy_to_user(optval, &m_info, len))
		return -EFAULT;

	return 0;
}
101855c42fa7SFlorian Westphal
/* Write the subflow-data header back to user space and report the total
 * number of bytes produced through @optlen.
 *
 * @copied is the amount of per-subflow payload already written after the
 * header; when it is zero only the (possibly truncated) header length is
 * reported. Returns 0 on success, -EFAULT on a user-access failure.
 */
static int mptcp_put_subflow_data(struct mptcp_subflow_data *sfd,
				  char __user *optval,
				  u32 copied,
				  int __user *optlen)
{
	/* never copy more than the header the kernel knows about */
	u32 hdr_len = min_t(u32, sfd->size_subflow_data, sizeof(*sfd));
	u32 total = copied ? copied + sfd->size_subflow_data : hdr_len;

	if (put_user(total, optlen))
		return -EFAULT;

	if (copy_to_user(optval, sfd, hdr_len))
		return -EFAULT;

	return 0;
}
103906f15ceeSFlorian Westphal
/* Read and validate the subflow-data header supplied by user space.
 *
 * Returns the number of bytes available after the header (>= 0) on success,
 * -EFAULT on a user-access failure, or -EINVAL when the buffer is too small
 * or the header content is not acceptable.
 */
static int mptcp_get_subflow_data(struct mptcp_subflow_data *sfd,
				  char __user *optval,
				  int __user *optlen)
{
	int optsz, hdr_len;

	/* if mptcp_subflow_data size is changed, need to adjust
	 * this function to deal with programs using old version.
	 */
	BUILD_BUG_ON(sizeof(*sfd) != MIN_INFO_OPTLEN_SIZE);

	if (get_user(optsz, optlen))
		return -EFAULT;

	if (optsz < MIN_INFO_OPTLEN_SIZE)
		return -EINVAL;

	memset(sfd, 0, sizeof(*sfd));

	hdr_len = min_t(unsigned int, optsz, sizeof(*sfd));
	if (copy_from_user(sfd, optval, hdr_len))
		return -EFAULT;

	/* size_subflow_data is u32, but len is signed */
	if (sfd->size_subflow_data > INT_MAX || sfd->size_user > INT_MAX)
		return -EINVAL;

	/* the advertised header must fit inside the user buffer */
	if (sfd->size_subflow_data < MIN_INFO_OPTLEN_SIZE ||
	    sfd->size_subflow_data > optsz)
		return -EINVAL;

	/* output-only fields have to be zero on input */
	if (sfd->num_subflows || sfd->size_kernel)
		return -EINVAL;

	return optsz - sfd->size_subflow_data;
}
107706f15ceeSFlorian Westphal
/* Dump one struct tcp_info per subflow after the user-supplied
 * subflow-data header.
 *
 * Every subflow is counted, but an entry is copied only while the remaining
 * user space can hold it. Returns 0 on success, a negative error from
 * header validation, or -EFAULT on a user-access failure.
 */
static int mptcp_getsockopt_tcpinfo(struct mptcp_sock *msk, char __user *optval,
				    int __user *optlen)
{
	unsigned int nr_subflows = 0, written = 0;
	struct sock *sk = (struct sock *)msk;
	struct mptcp_subflow_context *sf;
	struct mptcp_subflow_data sfd;
	char __user *dst;
	int room;

	room = mptcp_get_subflow_data(&sfd, optval, optlen);
	if (room < 0)
		return room;

	sfd.size_kernel = sizeof(struct tcp_info);
	sfd.size_user = min_t(unsigned int, sfd.size_user,
			      sizeof(struct tcp_info));

	/* entries start right after the header */
	dst = optval + sfd.size_subflow_data;

	lock_sock(sk);

	mptcp_for_each_subflow(msk, sf) {
		struct sock *ssk = mptcp_subflow_tcp_sock(sf);
		struct tcp_info info;

		++nr_subflows;

		/* out of room: keep counting, stop copying */
		if (!room || room < sfd.size_user)
			continue;

		tcp_get_info(ssk, &info);

		if (copy_to_user(dst, &info, sfd.size_user)) {
			release_sock(sk);
			return -EFAULT;
		}

		dst += sfd.size_user;
		written += sfd.size_user;
		room -= sfd.size_user;
	}

	release_sock(sk);

	sfd.num_subflows = nr_subflows;

	return mptcp_put_subflow_data(&sfd, optval, written, optlen) ? -EFAULT : 0;
}
113006f15ceeSFlorian Westphal
mptcp_get_sub_addrs(const struct sock * sk,struct mptcp_subflow_addrs * a)1131c11c5906SFlorian Westphal static void mptcp_get_sub_addrs(const struct sock *sk, struct mptcp_subflow_addrs *a)
1132c11c5906SFlorian Westphal {
1133abc17a11SEric Dumazet const struct inet_sock *inet = inet_sk(sk);
1134c11c5906SFlorian Westphal
1135c11c5906SFlorian Westphal memset(a, 0, sizeof(*a));
1136c11c5906SFlorian Westphal
1137c11c5906SFlorian Westphal if (sk->sk_family == AF_INET) {
1138c11c5906SFlorian Westphal a->sin_local.sin_family = AF_INET;
1139c11c5906SFlorian Westphal a->sin_local.sin_port = inet->inet_sport;
1140c11c5906SFlorian Westphal a->sin_local.sin_addr.s_addr = inet->inet_rcv_saddr;
1141c11c5906SFlorian Westphal
1142c11c5906SFlorian Westphal if (!a->sin_local.sin_addr.s_addr)
1143c11c5906SFlorian Westphal a->sin_local.sin_addr.s_addr = inet->inet_saddr;
1144c11c5906SFlorian Westphal
1145c11c5906SFlorian Westphal a->sin_remote.sin_family = AF_INET;
1146c11c5906SFlorian Westphal a->sin_remote.sin_port = inet->inet_dport;
1147c11c5906SFlorian Westphal a->sin_remote.sin_addr.s_addr = inet->inet_daddr;
1148c11c5906SFlorian Westphal #if IS_ENABLED(CONFIG_IPV6)
1149c11c5906SFlorian Westphal } else if (sk->sk_family == AF_INET6) {
1150c11c5906SFlorian Westphal const struct ipv6_pinfo *np = inet6_sk(sk);
1151c11c5906SFlorian Westphal
115229211e7dSTim Gardner if (WARN_ON_ONCE(!np))
115329211e7dSTim Gardner return;
115429211e7dSTim Gardner
1155c11c5906SFlorian Westphal a->sin6_local.sin6_family = AF_INET6;
1156c11c5906SFlorian Westphal a->sin6_local.sin6_port = inet->inet_sport;
1157c11c5906SFlorian Westphal
1158c11c5906SFlorian Westphal if (ipv6_addr_any(&sk->sk_v6_rcv_saddr))
1159c11c5906SFlorian Westphal a->sin6_local.sin6_addr = np->saddr;
1160c11c5906SFlorian Westphal else
1161c11c5906SFlorian Westphal a->sin6_local.sin6_addr = sk->sk_v6_rcv_saddr;
1162c11c5906SFlorian Westphal
1163c11c5906SFlorian Westphal a->sin6_remote.sin6_family = AF_INET6;
1164c11c5906SFlorian Westphal a->sin6_remote.sin6_port = inet->inet_dport;
1165c11c5906SFlorian Westphal a->sin6_remote.sin6_addr = sk->sk_v6_daddr;
1166c11c5906SFlorian Westphal #endif
1167c11c5906SFlorian Westphal }
1168c11c5906SFlorian Westphal }
1169c11c5906SFlorian Westphal
/* Dump one struct mptcp_subflow_addrs per subflow after the user-supplied
 * subflow-data header.
 *
 * Every subflow is counted, but an entry is copied only while the remaining
 * user space can hold it. Returns 0 on success, a negative error from
 * header validation, or -EFAULT on a user-access failure.
 */
static int mptcp_getsockopt_subflow_addrs(struct mptcp_sock *msk, char __user *optval,
					  int __user *optlen)
{
	unsigned int nr_subflows = 0, written = 0;
	struct sock *sk = (struct sock *)msk;
	struct mptcp_subflow_context *sf;
	struct mptcp_subflow_data sfd;
	char __user *dst;
	int room;

	room = mptcp_get_subflow_data(&sfd, optval, optlen);
	if (room < 0)
		return room;

	sfd.size_kernel = sizeof(struct mptcp_subflow_addrs);
	sfd.size_user = min_t(unsigned int, sfd.size_user,
			      sizeof(struct mptcp_subflow_addrs));

	/* entries start right after the header */
	dst = optval + sfd.size_subflow_data;

	lock_sock(sk);

	mptcp_for_each_subflow(msk, sf) {
		struct sock *ssk = mptcp_subflow_tcp_sock(sf);
		struct mptcp_subflow_addrs addrs;

		++nr_subflows;

		/* out of room: keep counting, stop copying */
		if (!room || room < sfd.size_user)
			continue;

		mptcp_get_sub_addrs(ssk, &addrs);

		if (copy_to_user(dst, &addrs, sfd.size_user)) {
			release_sock(sk);
			return -EFAULT;
		}

		dst += sfd.size_user;
		written += sfd.size_user;
		room -= sfd.size_user;
	}

	release_sock(sk);

	sfd.num_subflows = nr_subflows;

	return mptcp_put_subflow_data(&sfd, optval, written, optlen) ? -EFAULT : 0;
}
1222c11c5906SFlorian Westphal
/* Fetch and validate the fixed-size header of an MPTCP_FULL_INFO request.
 *
 * Reads the option length from @optlen, zeroes @mfi and copies the first
 * MIN_FULL_INFO_OPTLEN_SIZE bytes of @optval into it.
 *
 * Returns the number of user-provided bytes that follow the header, -EFAULT
 * if user memory cannot be accessed, or -EINVAL if the buffer is shorter
 * than the header or the header content is rejected.
 */
static int mptcp_get_full_info(struct mptcp_full_info *mfi,
			       char __user *optval,
			       int __user *optlen)
{
	int user_len;

	/* the header ends exactly where the mptcp_info member begins */
	BUILD_BUG_ON(offsetof(struct mptcp_full_info, mptcp_info) !=
		     MIN_FULL_INFO_OPTLEN_SIZE);

	if (get_user(user_len, optlen))
		return -EFAULT;
	if (user_len < MIN_FULL_INFO_OPTLEN_SIZE)
		return -EINVAL;

	memset(mfi, 0, sizeof(*mfi));
	if (copy_from_user(mfi, optval, MIN_FULL_INFO_OPTLEN_SIZE))
		return -EFAULT;

	/* fields reported back by the kernel must be zero on input, and the
	 * user-declared element sizes must fit in a signed int
	 */
	if (mfi->size_tcpinfo_kernel || mfi->size_sfinfo_kernel ||
	    mfi->num_subflows ||
	    mfi->size_sfinfo_user > INT_MAX ||
	    mfi->size_tcpinfo_user > INT_MAX)
		return -EINVAL;

	return user_len - MIN_FULL_INFO_OPTLEN_SIZE;
}
125349243207SPaolo Abeni
/* Write the MPTCP_FULL_INFO result back to user space.
 *
 * @copylen is the number of bytes to copy past the fixed header; the header
 * size (MIN_FULL_INFO_OPTLEN_SIZE) is added here. The resulting total is
 * stored in @optlen first, then that many bytes of @mfi are copied to
 * @optval.
 *
 * Returns 0 on success or -EFAULT if either user-space write fails.
 */
static int mptcp_put_full_info(struct mptcp_full_info *mfi,
			       char __user *optval,
			       u32 copylen,
			       int __user *optlen)
{
	u32 total = copylen + MIN_FULL_INFO_OPTLEN_SIZE;

	if (put_user(total, optlen) ||
	    copy_to_user(optval, mfi, total))
		return -EFAULT;

	return 0;
}
126749243207SPaolo Abeni
/* getsockopt(SOL_MPTCP, MPTCP_FULL_INFO) handler.
 *
 * Validates the user header, optionally fills the embedded mptcp_info, then
 * walks the subflows under the msk socket lock and writes one
 * mptcp_subflow_info and one tcp_info entry per subflow to the user arrays
 * referenced by the header, up to size_arrays_user entries. All subflows are
 * counted, including those that do not fit.
 *
 * Returns 0 on success, -EFAULT on any user-space access failure, or the
 * error reported by mptcp_get_full_info().
 */
static int mptcp_getsockopt_full_info(struct mptcp_sock *msk, char __user *optval,
				      int __user *optlen)
{
	struct sock *sk = (struct sock *)msk;
	struct mptcp_subflow_context *subflow;
	void __user *sf_dst, *tcp_dst;
	unsigned int nr_subflows = 0;
	unsigned int info_bytes = 0;
	struct mptcp_full_info mfi;
	int err = -EFAULT;
	int avail;

	avail = mptcp_get_full_info(&mfi, optval, optlen);
	if (avail < 0)
		return avail;

	/* skip the mptcp info entirely when user space left no room past
	 * the header
	 */
	if (avail > 0) {
		mptcp_diag_fill_info(msk, &mfi.mptcp_info);
		info_bytes = min_t(unsigned int, avail, sizeof(struct mptcp_info));
	}

	/* report the kernel element sizes and clamp the user ones to them */
	mfi.size_sfinfo_kernel = sizeof(struct mptcp_subflow_info);
	mfi.size_sfinfo_user = min_t(unsigned int, mfi.size_sfinfo_user,
				     sizeof(struct mptcp_subflow_info));
	mfi.size_tcpinfo_kernel = sizeof(struct tcp_info);
	mfi.size_tcpinfo_user = min_t(unsigned int, mfi.size_tcpinfo_user,
				      sizeof(struct tcp_info));

	sf_dst = u64_to_user_ptr(mfi.subflow_info);
	tcp_dst = u64_to_user_ptr(mfi.tcp_info);

	lock_sock(sk);
	mptcp_for_each_subflow(msk, subflow) {
		struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
		struct mptcp_subflow_info sfinfo;
		unsigned int idx = nr_subflows++;
		struct tcp_info tcp_info;

		/* keep counting, but stop writing once the arrays are full */
		if (idx >= mfi.size_arrays_user)
			continue;

		/* fetch the addresses only when the user element is wide
		 * enough to reach them
		 */
		memset(&sfinfo, 0, sizeof(sfinfo));
		sfinfo.id = subflow->subflow_id;
		if (mfi.size_sfinfo_user >
		    offsetof(struct mptcp_subflow_info, addrs))
			mptcp_get_sub_addrs(ssk, &sfinfo.addrs);
		if (copy_to_user(sf_dst, &sfinfo, mfi.size_sfinfo_user))
			goto unlock;

		if (mfi.size_tcpinfo_user) {
			tcp_get_info(ssk, &tcp_info);
			if (copy_to_user(tcp_dst, &tcp_info,
					 mfi.size_tcpinfo_user))
				goto unlock;
		}

		sf_dst += mfi.size_sfinfo_user;
		tcp_dst += mfi.size_tcpinfo_user;
	}
	err = 0;

unlock:
	release_sock(sk);
	if (err)
		return err;

	mfi.num_subflows = nr_subflows;
	if (mptcp_put_full_info(&mfi, optval, info_bytes, optlen))
		return -EFAULT;

	return 0;
}
134149243207SPaolo Abeni
/* Return an integer option value to user space.
 *
 * When the user buffer is shorter than an int but not empty, and @val fits
 * in one unsigned byte, a single byte is returned. Otherwise at most
 * sizeof(int) bytes of @val are copied. The number of bytes written is
 * stored back in @optlen.
 *
 * Returns 0 on success, -EINVAL for a negative length, -EFAULT on user
 * memory access failure.
 */
static int mptcp_put_int_option(struct mptcp_sock *msk, char __user *optval,
				int __user *optlen, int val)
{
	const void *src = &val;
	unsigned char byte;
	int len;

	if (get_user(len, optlen))
		return -EFAULT;
	if (len < 0)
		return -EINVAL;

	if (len > 0 && len < sizeof(int) && val >= 0 && val <= 255) {
		/* short buffer, small value: hand back one byte */
		byte = (unsigned char)val;
		src = &byte;
		len = 1;
	} else {
		len = min_t(unsigned int, len, sizeof(int));
	}

	if (put_user(len, optlen))
		return -EFAULT;
	if (copy_to_user(optval, src, len))
		return -EFAULT;

	return 0;
}
13702c9e7765SFlorian Westphal
/* getsockopt() handler for SOL_TCP options on an MPTCP socket.
 *
 * A first group of options is delegated to mptcp_getsockopt_first_sf_only();
 * the remaining supported ones are answered from values stored on the msk,
 * with the keepalive options falling back to the per-netns sysctl when the
 * msk value is zero. Unsupported options yield -EOPNOTSUPP.
 */
static int mptcp_getsockopt_sol_tcp(struct mptcp_sock *msk, int optname,
				    char __user *optval, int __user *optlen)
{
	struct sock *sk = (struct sock *)msk;
	int val;

	switch (optname) {
	case TCP_ULP:
	case TCP_CONGESTION:
	case TCP_INFO:
	case TCP_CC_INFO:
	case TCP_DEFER_ACCEPT:
	case TCP_FASTOPEN:
	case TCP_FASTOPEN_CONNECT:
	case TCP_FASTOPEN_KEY:
	case TCP_FASTOPEN_NO_COOKIE:
		return mptcp_getsockopt_first_sf_only(msk, SOL_TCP, optname,
						      optval, optlen);
	case TCP_INQ:
		val = msk->recvmsg_inq;
		break;
	case TCP_CORK:
		val = msk->cork;
		break;
	case TCP_NODELAY:
		val = msk->nodelay;
		break;
	case TCP_KEEPIDLE:
		/* sysctl value is divided by HZ before being reported */
		val = msk->keepalive_idle ? :
		      READ_ONCE(sock_net(sk)->ipv4.sysctl_tcp_keepalive_time) / HZ;
		break;
	case TCP_KEEPINTVL:
		val = msk->keepalive_intvl ? :
		      READ_ONCE(sock_net(sk)->ipv4.sysctl_tcp_keepalive_intvl) / HZ;
		break;
	case TCP_KEEPCNT:
		val = msk->keepalive_cnt ? :
		      READ_ONCE(sock_net(sk)->ipv4.sysctl_tcp_keepalive_probes);
		break;
	case TCP_NOTSENT_LOWAT:
		val = msk->notsent_lowat;
		break;
	case TCP_IS_MPTCP:
		val = 1;
		break;
	default:
		return -EOPNOTSUPP;
	}

	return mptcp_put_int_option(msk, optval, optlen, val);
}
14130abdde82SPaolo Abeni
/* getsockopt() handler for SOL_IP options on an MPTCP socket.
 *
 * The supported options are read from the msk's own inet socket state and
 * returned through mptcp_put_int_option(); anything else is -EOPNOTSUPP.
 */
static int mptcp_getsockopt_v4(struct mptcp_sock *msk, int optname,
			       char __user *optval, int __user *optlen)
{
	struct sock *sk = (struct sock *)msk;
	int val;

	switch (optname) {
	case IP_TOS:
		val = READ_ONCE(inet_sk(sk)->tos);
		break;
	case IP_BIND_ADDRESS_NO_PORT:
		val = inet_test_bit(BIND_ADDRESS_NO_PORT, sk);
		break;
	case IP_LOCAL_PORT_RANGE:
		val = READ_ONCE(inet_sk(sk)->local_port_range);
		break;
	default:
		return -EOPNOTSUPP;
	}

	return mptcp_put_int_option(msk, optval, optlen, val);
}
14323b1e21ebSFlorian Westphal
/* getsockopt() handler for SOL_MPTCP: dispatch each supported option name to
 * its dedicated helper; unknown options yield -EOPNOTSUPP.
 */
static int mptcp_getsockopt_sol_mptcp(struct mptcp_sock *msk, int optname,
				      char __user *optval, int __user *optlen)
{
	int ret;

	switch (optname) {
	case MPTCP_INFO:
		ret = mptcp_getsockopt_info(msk, optval, optlen);
		break;
	case MPTCP_FULL_INFO:
		ret = mptcp_getsockopt_full_info(msk, optval, optlen);
		break;
	case MPTCP_TCPINFO:
		ret = mptcp_getsockopt_tcpinfo(msk, optval, optlen);
		break;
	case MPTCP_SUBFLOW_ADDRS:
		ret = mptcp_getsockopt_subflow_addrs(msk, optval, optlen);
		break;
	default:
		ret = -EOPNOTSUPP;
		break;
	}

	return ret;
}
144955c42fa7SFlorian Westphal
/* getsockopt() entry point for MPTCP sockets.
 *
 * @sk:      the MPTCP-level socket
 * @level:   option level (SOL_IP, SOL_TCP or SOL_MPTCP are handled here)
 * @optname: option name within @level
 * @optval:  user buffer receiving the option value
 * @option:  user pointer holding the buffer length on input and the
 *           returned length on output
 *
 * Returns 0 on success or a negative errno; -EOPNOTSUPP for levels or
 * options not handled at the MPTCP level.
 */
int mptcp_getsockopt(struct sock *sk, int level, int optname,
		     char __user *optval, int __user *option)
{
	struct mptcp_sock *msk = mptcp_sk(sk);
	struct sock *ssk;

	/* terminate the record: no pr_cont() follows this message */
	pr_debug("msk=%p\n", msk);

	/* When the connection has fallen back to plain TCP, socket options
	 * are passed through to the one remaining subflow. Otherwise the
	 * option is answered at the MPTCP level below.
	 */
	lock_sock(sk);
	ssk = __mptcp_tcp_fallback(msk);
	release_sock(sk);
	if (ssk)
		return tcp_getsockopt(ssk, level, optname, optval, option);

	if (level == SOL_IP)
		return mptcp_getsockopt_v4(msk, optname, optval, option);
	if (level == SOL_TCP)
		return mptcp_getsockopt_sol_tcp(msk, optname, optval, option);
	if (level == SOL_MPTCP)
		return mptcp_getsockopt_sol_mptcp(msk, optname, optval, option);
	return -EOPNOTSUPP;
}
14780abdde82SPaolo Abeni
sync_socket_options(struct mptcp_sock * msk,struct sock * ssk)14791b3e7edeSFlorian Westphal static void sync_socket_options(struct mptcp_sock *msk, struct sock *ssk)
14801b3e7edeSFlorian Westphal {
14815d0a6bc8SFlorian Westphal static const unsigned int tx_rx_locks = SOCK_RCVBUF_LOCK | SOCK_SNDBUF_LOCK;
14821b3e7edeSFlorian Westphal struct sock *sk = (struct sock *)msk;
14831b3e7edeSFlorian Westphal
14841b3e7edeSFlorian Westphal if (ssk->sk_prot->keepalive) {
14851b3e7edeSFlorian Westphal if (sock_flag(sk, SOCK_KEEPOPEN))
14861b3e7edeSFlorian Westphal ssk->sk_prot->keepalive(ssk, 1);
14871b3e7edeSFlorian Westphal else
14881b3e7edeSFlorian Westphal ssk->sk_prot->keepalive(ssk, 0);
14891b3e7edeSFlorian Westphal }
14901b3e7edeSFlorian Westphal
14911b3e7edeSFlorian Westphal ssk->sk_priority = sk->sk_priority;
14925d0a6bc8SFlorian Westphal ssk->sk_bound_dev_if = sk->sk_bound_dev_if;
14935d0a6bc8SFlorian Westphal ssk->sk_incoming_cpu = sk->sk_incoming_cpu;
14947e9740e0SMatthieu Baerts ssk->sk_ipv6only = sk->sk_ipv6only;
1495878d951cSEric Dumazet __ip_sock_set_tos(ssk, inet_sk(sk)->tos);
14965d0a6bc8SFlorian Westphal
14975d0a6bc8SFlorian Westphal if (sk->sk_userlocks & tx_rx_locks) {
14985d0a6bc8SFlorian Westphal ssk->sk_userlocks |= sk->sk_userlocks & tx_rx_locks;
14998005184fSPaolo Abeni if (sk->sk_userlocks & SOCK_SNDBUF_LOCK) {
15005d0a6bc8SFlorian Westphal WRITE_ONCE(ssk->sk_sndbuf, sk->sk_sndbuf);
15018005184fSPaolo Abeni mptcp_subflow_ctx(ssk)->cached_sndbuf = sk->sk_sndbuf;
15028005184fSPaolo Abeni }
15035d0a6bc8SFlorian Westphal if (sk->sk_userlocks & SOCK_RCVBUF_LOCK)
15045d0a6bc8SFlorian Westphal WRITE_ONCE(ssk->sk_rcvbuf, sk->sk_rcvbuf);
15055d0a6bc8SFlorian Westphal }
15065d0a6bc8SFlorian Westphal
15075d0a6bc8SFlorian Westphal if (sock_flag(sk, SOCK_LINGER)) {
15085d0a6bc8SFlorian Westphal ssk->sk_lingertime = sk->sk_lingertime;
15095d0a6bc8SFlorian Westphal sock_set_flag(ssk, SOCK_LINGER);
15105d0a6bc8SFlorian Westphal } else {
15115d0a6bc8SFlorian Westphal sock_reset_flag(ssk, SOCK_LINGER);
15125d0a6bc8SFlorian Westphal }
15135d0a6bc8SFlorian Westphal
15145d0a6bc8SFlorian Westphal if (sk->sk_mark != ssk->sk_mark) {
15155d0a6bc8SFlorian Westphal ssk->sk_mark = sk->sk_mark;
15165d0a6bc8SFlorian Westphal sk_dst_reset(ssk);
15175d0a6bc8SFlorian Westphal }
15185d0a6bc8SFlorian Westphal
15195d0a6bc8SFlorian Westphal sock_valbool_flag(ssk, SOCK_DBG, sock_flag(sk, SOCK_DBG));
15205d0a6bc8SFlorian Westphal
15215d0a6bc8SFlorian Westphal if (inet_csk(sk)->icsk_ca_ops != inet_csk(ssk)->icsk_ca_ops)
152220b5759fSPaolo Abeni tcp_set_congestion_control(ssk, msk->ca_name, false, true);
15234f6e14bdSMaxim Galaganov __tcp_sock_set_cork(ssk, !!msk->cork);
15244f6e14bdSMaxim Galaganov __tcp_sock_set_nodelay(ssk, !!msk->nodelay);
1525bd11dc4fSMatthieu Baerts (NGI0) tcp_sock_set_keepidle_locked(ssk, msk->keepalive_idle);
1526bd11dc4fSMatthieu Baerts (NGI0) tcp_sock_set_keepintvl(ssk, msk->keepalive_intvl);
1527bd11dc4fSMatthieu Baerts (NGI0) tcp_sock_set_keepcnt(ssk, msk->keepalive_cnt);
1528c9406a23SFlorian Westphal
15294bd0623fSEric Dumazet inet_assign_bit(TRANSPARENT, ssk, inet_test_bit(TRANSPARENT, sk));
15303f7e7532SEric Dumazet inet_assign_bit(FREEBIND, ssk, inet_test_bit(FREEBIND, sk));
1531c85636a2SMaxim Galaganov inet_assign_bit(BIND_ADDRESS_NO_PORT, ssk, inet_test_bit(BIND_ADDRESS_NO_PORT, sk));
1532c85636a2SMaxim Galaganov WRITE_ONCE(inet_sk(ssk)->local_port_range, READ_ONCE(inet_sk(sk)->local_port_range));
15331b3e7edeSFlorian Westphal }
15341b3e7edeSFlorian Westphal
mptcp_sockopt_sync_locked(struct mptcp_sock * msk,struct sock * ssk)15353e501490SPaolo Abeni void mptcp_sockopt_sync_locked(struct mptcp_sock *msk, struct sock *ssk)
153678962489SFlorian Westphal {
15373e501490SPaolo Abeni struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(ssk);
153878962489SFlorian Westphal
15393e501490SPaolo Abeni msk_owned_by_me(msk);
154078962489SFlorian Westphal
15415684ab1aSPaolo Abeni ssk->sk_rcvlowat = 0;
15425684ab1aSPaolo Abeni
15439fdc7793SPaolo Abeni /* subflows must ignore any latency-related settings: will not affect
15449fdc7793SPaolo Abeni * the user-space - only the msk is relevant - but will foul the
15459fdc7793SPaolo Abeni * mptcp scheduler
15469fdc7793SPaolo Abeni */
15479fdc7793SPaolo Abeni tcp_sk(ssk)->notsent_lowat = UINT_MAX;
15489fdc7793SPaolo Abeni
15493e501490SPaolo Abeni if (READ_ONCE(subflow->setsockopt_seq) != msk->setsockopt_seq) {
15503e501490SPaolo Abeni sync_socket_options(msk, ssk);
155178962489SFlorian Westphal
15523e501490SPaolo Abeni subflow->setsockopt_seq = msk->setsockopt_seq;
1553df00b087SFlorian Westphal }
155478962489SFlorian Westphal }
15555684ab1aSPaolo Abeni
15565684ab1aSPaolo Abeni /* unfortunately this is different enough from the tcp version so
15575684ab1aSPaolo Abeni * that we can't factor it out
15585684ab1aSPaolo Abeni */
mptcp_set_rcvlowat(struct sock * sk,int val)15595684ab1aSPaolo Abeni int mptcp_set_rcvlowat(struct sock *sk, int val)
15605684ab1aSPaolo Abeni {
15615684ab1aSPaolo Abeni struct mptcp_subflow_context *subflow;
15625684ab1aSPaolo Abeni int space, cap;
15635684ab1aSPaolo Abeni
1564fcf4692fSPaolo Abeni /* bpf can land here with a wrong sk type */
1565fcf4692fSPaolo Abeni if (sk->sk_protocol == IPPROTO_TCP)
1566fcf4692fSPaolo Abeni return -EINVAL;
1567fcf4692fSPaolo Abeni
15685684ab1aSPaolo Abeni if (sk->sk_userlocks & SOCK_RCVBUF_LOCK)
15695684ab1aSPaolo Abeni cap = sk->sk_rcvbuf >> 1;
15705684ab1aSPaolo Abeni else
15715684ab1aSPaolo Abeni cap = READ_ONCE(sock_net(sk)->ipv4.sysctl_tcp_rmem[2]) >> 1;
15725684ab1aSPaolo Abeni val = min(val, cap);
15735684ab1aSPaolo Abeni WRITE_ONCE(sk->sk_rcvlowat, val ? : 1);
15745684ab1aSPaolo Abeni
15755684ab1aSPaolo Abeni /* Check if we need to signal EPOLLIN right now */
15765684ab1aSPaolo Abeni if (mptcp_epollin_ready(sk))
15775684ab1aSPaolo Abeni sk->sk_data_ready(sk);
15785684ab1aSPaolo Abeni
15795684ab1aSPaolo Abeni if (sk->sk_userlocks & SOCK_RCVBUF_LOCK)
15805684ab1aSPaolo Abeni return 0;
15815684ab1aSPaolo Abeni
15825684ab1aSPaolo Abeni space = __tcp_space_from_win(mptcp_sk(sk)->scaling_ratio, val);
15835684ab1aSPaolo Abeni if (space <= sk->sk_rcvbuf)
15845684ab1aSPaolo Abeni return 0;
15855684ab1aSPaolo Abeni
15865684ab1aSPaolo Abeni /* propagate the rcvbuf changes to all the subflows */
15875684ab1aSPaolo Abeni WRITE_ONCE(sk->sk_rcvbuf, space);
15885684ab1aSPaolo Abeni mptcp_for_each_subflow(mptcp_sk(sk), subflow) {
15895684ab1aSPaolo Abeni struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
15905684ab1aSPaolo Abeni bool slow;
15915684ab1aSPaolo Abeni
15925684ab1aSPaolo Abeni slow = lock_sock_fast(ssk);
15935684ab1aSPaolo Abeni WRITE_ONCE(ssk->sk_rcvbuf, space);
1594f410cbeaSEric Dumazet WRITE_ONCE(tcp_sk(ssk)->window_clamp, val);
15955684ab1aSPaolo Abeni unlock_sock_fast(ssk, slow);
15965684ab1aSPaolo Abeni }
15975684ab1aSPaolo Abeni return 0;
15985684ab1aSPaolo Abeni }
1599