Skip to content

Commit 1f62f58

Browse files
committed
Merge branch 'mptcp-cleanups-ephemeral-port-sockopts'
Matthieu Baerts says: ==================== mptcp: cleanup and support more ephemeral ports sockopts Patch 1 is a cleanup one: mptcp_is_tcpsk() helper was modifying sock_ops in some cases which is unexpected with that name. Patch 2 to 4 add support for two socket options: IP_LOCAL_PORT_RANGE and IP_BIND_ADDRESS_NO_PORT. The first one is a preparation patch, the second one adds the support while the last one modifies an existing selftest to validate the new features. ==================== Signed-off-by: Matthieu Baerts <[email protected]> Signed-off-by: David S. Miller <[email protected]>
2 parents 7961ef1 + 122db5e commit 1f62f58

File tree

3 files changed

+79
-68
lines changed

3 files changed

+79
-68
lines changed

net/mptcp/protocol.c

Lines changed: 44 additions & 64 deletions
Original file line numberDiff line numberDiff line change
@@ -55,28 +55,14 @@ static u64 mptcp_wnd_end(const struct mptcp_sock *msk)
5555
return READ_ONCE(msk->wnd_end);
5656
}
5757

58-
static bool mptcp_is_tcpsk(struct sock *sk)
58+
static const struct proto_ops *mptcp_fallback_tcp_ops(const struct sock *sk)
5959
{
60-
struct socket *sock = sk->sk_socket;
61-
62-
if (unlikely(sk->sk_prot == &tcp_prot)) {
63-
/* we are being invoked after mptcp_accept() has
64-
* accepted a non-mp-capable flow: sk is a tcp_sk,
65-
* not an mptcp one.
66-
*
67-
* Hand the socket over to tcp so all further socket ops
68-
* bypass mptcp.
69-
*/
70-
WRITE_ONCE(sock->ops, &inet_stream_ops);
71-
return true;
7260
#if IS_ENABLED(CONFIG_MPTCP_IPV6)
73-
} else if (unlikely(sk->sk_prot == &tcpv6_prot)) {
74-
WRITE_ONCE(sock->ops, &inet6_stream_ops);
75-
return true;
61+
if (sk->sk_prot == &tcpv6_prot)
62+
return &inet6_stream_ops;
7663
#endif
77-
}
78-
79-
return false;
64+
WARN_ON_ONCE(sk->sk_prot != &tcp_prot);
65+
return &inet_stream_ops;
8066
}
8167

8268
static int __mptcp_socket_create(struct mptcp_sock *msk)
@@ -3258,44 +3244,6 @@ void mptcp_rcv_space_init(struct mptcp_sock *msk, const struct sock *ssk)
32583244
WRITE_ONCE(msk->wnd_end, msk->snd_nxt + tcp_sk(ssk)->snd_wnd);
32593245
}
32603246

3261-
static struct sock *mptcp_accept(struct sock *ssk, int flags, int *err,
3262-
bool kern)
3263-
{
3264-
struct sock *newsk;
3265-
3266-
pr_debug("ssk=%p, listener=%p", ssk, mptcp_subflow_ctx(ssk));
3267-
newsk = inet_csk_accept(ssk, flags, err, kern);
3268-
if (!newsk)
3269-
return NULL;
3270-
3271-
pr_debug("newsk=%p, subflow is mptcp=%d", newsk, sk_is_mptcp(newsk));
3272-
if (sk_is_mptcp(newsk)) {
3273-
struct mptcp_subflow_context *subflow;
3274-
struct sock *new_mptcp_sock;
3275-
3276-
subflow = mptcp_subflow_ctx(newsk);
3277-
new_mptcp_sock = subflow->conn;
3278-
3279-
/* is_mptcp should be false if subflow->conn is missing, see
3280-
* subflow_syn_recv_sock()
3281-
*/
3282-
if (WARN_ON_ONCE(!new_mptcp_sock)) {
3283-
tcp_sk(newsk)->is_mptcp = 0;
3284-
goto out;
3285-
}
3286-
3287-
newsk = new_mptcp_sock;
3288-
MPTCP_INC_STATS(sock_net(ssk), MPTCP_MIB_MPCAPABLEPASSIVEACK);
3289-
} else {
3290-
MPTCP_INC_STATS(sock_net(ssk),
3291-
MPTCP_MIB_MPCAPABLEPASSIVEFALLBACK);
3292-
}
3293-
3294-
out:
3295-
newsk->sk_kern_sock = kern;
3296-
return newsk;
3297-
}
3298-
32993247
void mptcp_destroy_common(struct mptcp_sock *msk, unsigned int flags)
33003248
{
33013249
struct mptcp_subflow_context *subflow, *tmp;
@@ -3739,7 +3687,6 @@ static struct proto mptcp_prot = {
37393687
.connect = mptcp_connect,
37403688
.disconnect = mptcp_disconnect,
37413689
.close = mptcp_close,
3742-
.accept = mptcp_accept,
37433690
.setsockopt = mptcp_setsockopt,
37443691
.getsockopt = mptcp_getsockopt,
37453692
.shutdown = mptcp_shutdown,
@@ -3849,18 +3796,36 @@ static int mptcp_stream_accept(struct socket *sock, struct socket *newsock,
38493796
if (!ssk)
38503797
return -EINVAL;
38513798

3852-
newsk = mptcp_accept(ssk, flags, &err, kern);
3799+
pr_debug("ssk=%p, listener=%p", ssk, mptcp_subflow_ctx(ssk));
3800+
newsk = inet_csk_accept(ssk, flags, &err, kern);
38533801
if (!newsk)
38543802
return err;
38553803

3856-
lock_sock(newsk);
3857-
3858-
__inet_accept(sock, newsock, newsk);
3859-
if (!mptcp_is_tcpsk(newsock->sk)) {
3860-
struct mptcp_sock *msk = mptcp_sk(newsk);
3804+
pr_debug("newsk=%p, subflow is mptcp=%d", newsk, sk_is_mptcp(newsk));
3805+
if (sk_is_mptcp(newsk)) {
38613806
struct mptcp_subflow_context *subflow;
3807+
struct sock *new_mptcp_sock;
3808+
3809+
subflow = mptcp_subflow_ctx(newsk);
3810+
new_mptcp_sock = subflow->conn;
3811+
3812+
/* is_mptcp should be false if subflow->conn is missing, see
3813+
* subflow_syn_recv_sock()
3814+
*/
3815+
if (WARN_ON_ONCE(!new_mptcp_sock)) {
3816+
tcp_sk(newsk)->is_mptcp = 0;
3817+
goto tcpfallback;
3818+
}
3819+
3820+
newsk = new_mptcp_sock;
3821+
MPTCP_INC_STATS(sock_net(ssk), MPTCP_MIB_MPCAPABLEPASSIVEACK);
3822+
3823+
newsk->sk_kern_sock = kern;
3824+
lock_sock(newsk);
3825+
__inet_accept(sock, newsock, newsk);
38623826

38633827
set_bit(SOCK_CUSTOM_SOCKOPT, &newsock->flags);
3828+
msk = mptcp_sk(newsk);
38643829
msk->in_accept_queue = 0;
38653830

38663831
/* set ssk->sk_socket of accept()ed flows to mptcp socket.
@@ -3882,6 +3847,21 @@ static int mptcp_stream_accept(struct socket *sock, struct socket *newsock,
38823847
if (unlikely(list_is_singular(&msk->conn_list)))
38833848
inet_sk_state_store(newsk, TCP_CLOSE);
38843849
}
3850+
} else {
3851+
MPTCP_INC_STATS(sock_net(ssk),
3852+
MPTCP_MIB_MPCAPABLEPASSIVEFALLBACK);
3853+
tcpfallback:
3854+
newsk->sk_kern_sock = kern;
3855+
lock_sock(newsk);
3856+
__inet_accept(sock, newsock, newsk);
3857+
/* we are being invoked after accepting a non-mp-capable
3858+
* flow: sk is a tcp_sk, not an mptcp one.
3859+
*
3860+
* Hand the socket over to tcp so all further socket ops
3861+
* bypass mptcp.
3862+
*/
3863+
WRITE_ONCE(newsock->sk->sk_socket->ops,
3864+
mptcp_fallback_tcp_ops(newsock->sk));
38853865
}
38863866
release_sock(newsk);
38873867

net/mptcp/sockopt.c

Lines changed: 23 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -440,6 +440,8 @@ static bool mptcp_supported_sockopt(int level, int optname)
440440
/* should work fine */
441441
case IP_FREEBIND:
442442
case IP_TRANSPARENT:
443+
case IP_BIND_ADDRESS_NO_PORT:
444+
case IP_LOCAL_PORT_RANGE:
443445

444446
/* the following are control cmsg related */
445447
case IP_PKTINFO:
@@ -455,7 +457,6 @@ static bool mptcp_supported_sockopt(int level, int optname)
455457
/* common stuff that need some love */
456458
case IP_TOS:
457459
case IP_TTL:
458-
case IP_BIND_ADDRESS_NO_PORT:
459460
case IP_MTU_DISCOVER:
460461
case IP_RECVERR:
461462

@@ -683,8 +684,8 @@ static int mptcp_setsockopt_sol_tcp_nodelay(struct mptcp_sock *msk, sockptr_t op
683684
return 0;
684685
}
685686

686-
static int mptcp_setsockopt_sol_ip_set_transparent(struct mptcp_sock *msk, int optname,
687-
sockptr_t optval, unsigned int optlen)
687+
static int mptcp_setsockopt_sol_ip_set(struct mptcp_sock *msk, int optname,
688+
sockptr_t optval, unsigned int optlen)
688689
{
689690
struct sock *sk = (struct sock *)msk;
690691
struct sock *ssk;
@@ -710,6 +711,14 @@ static int mptcp_setsockopt_sol_ip_set_transparent(struct mptcp_sock *msk, int o
710711
inet_assign_bit(TRANSPARENT, ssk,
711712
inet_test_bit(TRANSPARENT, sk));
712713
break;
714+
case IP_BIND_ADDRESS_NO_PORT:
715+
inet_assign_bit(BIND_ADDRESS_NO_PORT, ssk,
716+
inet_test_bit(BIND_ADDRESS_NO_PORT, sk));
717+
break;
718+
case IP_LOCAL_PORT_RANGE:
719+
WRITE_ONCE(inet_sk(ssk)->local_port_range,
720+
READ_ONCE(inet_sk(sk)->local_port_range));
721+
break;
713722
default:
714723
release_sock(sk);
715724
WARN_ON_ONCE(1);
@@ -755,7 +764,9 @@ static int mptcp_setsockopt_v4(struct mptcp_sock *msk, int optname,
755764
switch (optname) {
756765
case IP_FREEBIND:
757766
case IP_TRANSPARENT:
758-
return mptcp_setsockopt_sol_ip_set_transparent(msk, optname, optval, optlen);
767+
case IP_BIND_ADDRESS_NO_PORT:
768+
case IP_LOCAL_PORT_RANGE:
769+
return mptcp_setsockopt_sol_ip_set(msk, optname, optval, optlen);
759770
case IP_TOS:
760771
return mptcp_setsockopt_v4_set_tos(msk, optname, optval, optlen);
761772
}
@@ -1350,6 +1361,12 @@ static int mptcp_getsockopt_v4(struct mptcp_sock *msk, int optname,
13501361
switch (optname) {
13511362
case IP_TOS:
13521363
return mptcp_put_int_option(msk, optval, optlen, READ_ONCE(inet_sk(sk)->tos));
1364+
case IP_BIND_ADDRESS_NO_PORT:
1365+
return mptcp_put_int_option(msk, optval, optlen,
1366+
inet_test_bit(BIND_ADDRESS_NO_PORT, sk));
1367+
case IP_LOCAL_PORT_RANGE:
1368+
return mptcp_put_int_option(msk, optval, optlen,
1369+
READ_ONCE(inet_sk(sk)->local_port_range));
13531370
}
13541371

13551372
return -EOPNOTSUPP;
@@ -1450,6 +1467,8 @@ static void sync_socket_options(struct mptcp_sock *msk, struct sock *ssk)
14501467

14511468
inet_assign_bit(TRANSPARENT, ssk, inet_test_bit(TRANSPARENT, sk));
14521469
inet_assign_bit(FREEBIND, ssk, inet_test_bit(FREEBIND, sk));
1470+
inet_assign_bit(BIND_ADDRESS_NO_PORT, ssk, inet_test_bit(BIND_ADDRESS_NO_PORT, sk));
1471+
WRITE_ONCE(inet_sk(ssk)->local_port_range, READ_ONCE(inet_sk(sk)->local_port_range));
14531472
}
14541473

14551474
void mptcp_sockopt_sync_locked(struct mptcp_sock *msk, struct sock *ssk)

tools/testing/selftests/net/ip_local_port_range.c

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -146,6 +146,12 @@ FIXTURE_VARIANT_ADD(ip_local_port_range, ip4_stcp) {
146146
.so_protocol = IPPROTO_SCTP,
147147
};
148148

149+
FIXTURE_VARIANT_ADD(ip_local_port_range, ip4_mptcp) {
150+
.so_domain = AF_INET,
151+
.so_type = SOCK_STREAM,
152+
.so_protocol = IPPROTO_MPTCP,
153+
};
154+
149155
FIXTURE_VARIANT_ADD(ip_local_port_range, ip6_tcp) {
150156
.so_domain = AF_INET6,
151157
.so_type = SOCK_STREAM,
@@ -164,6 +170,12 @@ FIXTURE_VARIANT_ADD(ip_local_port_range, ip6_stcp) {
164170
.so_protocol = IPPROTO_SCTP,
165171
};
166172

173+
FIXTURE_VARIANT_ADD(ip_local_port_range, ip6_mptcp) {
174+
.so_domain = AF_INET6,
175+
.so_type = SOCK_STREAM,
176+
.so_protocol = IPPROTO_MPTCP,
177+
};
178+
167179
TEST_F(ip_local_port_range, invalid_option_value)
168180
{
169181
__u16 val16;

0 commit comments

Comments
 (0)