Skip to content

Commit cdd760d

Browse files
matttbeFlorian Bezannier
authored and
Florian Bezannier
committed
mptcp: fix full TCP keep-alive support
commit bd11dc4 upstream. SO_KEEPALIVE support has been added a while ago, as part of a series "adding SOL_SOCKET" support. To have a full control of this keep-alive feature, it is important to also support TCP_KEEP* socket options at the SOL_TCP level. Supporting them on the setsockopt() part is easy, it is just a matter of remembering each value in the MPTCP sock structure, and calling tcp_sock_set_keep*() helpers on each subflow. If the value is not modified (0), calling these helpers will not do anything. For the getsockopt() part, the corresponding value from the MPTCP sock structure or the default one is simply returned. All of this is very similar to other TCP_* socket options supported by MPTCP. It looks important for kernels supporting SO_KEEPALIVE, to also support TCP_KEEP* options as well: some apps seem to (wrongly) consider that if the former is supported, the latter ones will be supported as well. But also, not having this simple and isolated change is preventing MPTCP support in some apps, and libraries like GoLang [1]. This is why this patch is seen as a fix. Closes: multipath-tcp/mptcp_net-next#383 Fixes: 1b3e7ed ("mptcp: setsockopt: handle SO_KEEPALIVE and SO_PRIORITY") Link: golang/go#56539 [1] Acked-by: Paolo Abeni <[email protected]> Signed-off-by: Matthieu Baerts (NGI0) <[email protected]> Signed-off-by: Mat Martineau <[email protected]> Link: https://lore.kernel.org/r/[email protected] Signed-off-by: Jakub Kicinski <[email protected]> [ Conflicts in the same context, because commit 29b5e5e ("mptcp: implement TCP_NOTSENT_LOWAT support") (new feature), commit 013e317 ("mptcp: fix rcv space initialization") (not backported because of the various conflicts, and because the race fixed by this commit "does not produce ill effects in practice"), and commit 4f6e14b ("mptcp: support TCP_CORK and TCP_NODELAY") are not in this version. The adaptations done by 7f71a33 ("mptcp: cleanup SOL_TCP handling") have been adapted to this case here. Also, TCP_KEEPINTVL and TCP_KEEPCNT value had to be set without lock, the same way it was done on TCP side prior commit 6fd70a6 ("tcp: set TCP_KEEPINTVL locklessly") and commit 8448508 ("tcp: set TCP_KEEPCNT locklessly"). ] Signed-off-by: Matthieu Baerts (NGI0) <[email protected]> Signed-off-by: Greg Kroah-Hartman <[email protected]>
1 parent bf1c2c8 commit cdd760d

File tree

2 files changed

+118
-0
lines changed

2 files changed

+118
-0
lines changed

net/mptcp/protocol.h

+3
Original file line numberDiff line numberDiff line change
@@ -250,6 +250,9 @@ struct mptcp_sock {
250250
bool use_64bit_ack; /* Set when we received a 64-bit DSN */
251251
bool csum_enabled;
252252
spinlock_t join_list_lock;
253+
int keepalive_cnt;
254+
int keepalive_idle;
255+
int keepalive_intvl;
253256
struct work_struct work;
254257
struct sk_buff *ooo_last_skb;
255258
struct rb_root out_of_order_queue;

net/mptcp/sockopt.c

+115
Original file line numberDiff line numberDiff line change
@@ -593,6 +593,60 @@ static int mptcp_setsockopt_sol_tcp_congestion(struct mptcp_sock *msk, sockptr_t
593593
return ret;
594594
}
595595

596+
static int __tcp_sock_set_keepintvl(struct sock *sk, int val)
597+
{
598+
if (val < 1 || val > MAX_TCP_KEEPINTVL)
599+
return -EINVAL;
600+
601+
WRITE_ONCE(tcp_sk(sk)->keepalive_intvl, val * HZ);
602+
603+
return 0;
604+
}
605+
606+
static int __tcp_sock_set_keepcnt(struct sock *sk, int val)
607+
{
608+
if (val < 1 || val > MAX_TCP_KEEPCNT)
609+
return -EINVAL;
610+
611+
/* Paired with READ_ONCE() in keepalive_probes() */
612+
WRITE_ONCE(tcp_sk(sk)->keepalive_probes, val);
613+
614+
return 0;
615+
}
616+
617+
static int mptcp_setsockopt_set_val(struct mptcp_sock *msk, int max,
618+
int (*set_val)(struct sock *, int),
619+
int *msk_val, sockptr_t optval,
620+
unsigned int optlen)
621+
{
622+
struct mptcp_subflow_context *subflow;
623+
struct sock *sk = (struct sock *)msk;
624+
int val, err;
625+
626+
err = mptcp_get_int_option(msk, optval, optlen, &val);
627+
if (err)
628+
return err;
629+
630+
lock_sock(sk);
631+
mptcp_for_each_subflow(msk, subflow) {
632+
struct sock *ssk = mptcp_subflow_tcp_sock(subflow);
633+
int ret;
634+
635+
lock_sock(ssk);
636+
ret = set_val(ssk, val);
637+
err = err ? : ret;
638+
release_sock(ssk);
639+
}
640+
641+
if (!err) {
642+
*msk_val = val;
643+
sockopt_seq_inc(msk);
644+
}
645+
release_sock(sk);
646+
647+
return err;
648+
}
649+
596650
static int mptcp_setsockopt_sol_tcp(struct mptcp_sock *msk, int optname,
597651
sockptr_t optval, unsigned int optlen)
598652
{
@@ -601,6 +655,21 @@ static int mptcp_setsockopt_sol_tcp(struct mptcp_sock *msk, int optname,
601655
return -EOPNOTSUPP;
602656
case TCP_CONGESTION:
603657
return mptcp_setsockopt_sol_tcp_congestion(msk, optval, optlen);
658+
case TCP_KEEPIDLE:
659+
return mptcp_setsockopt_set_val(msk, MAX_TCP_KEEPIDLE,
660+
&tcp_sock_set_keepidle_locked,
661+
&msk->keepalive_idle,
662+
optval, optlen);
663+
case TCP_KEEPINTVL:
664+
return mptcp_setsockopt_set_val(msk, MAX_TCP_KEEPINTVL,
665+
&__tcp_sock_set_keepintvl,
666+
&msk->keepalive_intvl,
667+
optval, optlen);
668+
case TCP_KEEPCNT:
669+
return mptcp_setsockopt_set_val(msk, MAX_TCP_KEEPCNT,
670+
&__tcp_sock_set_keepcnt,
671+
&msk->keepalive_cnt,
672+
optval, optlen);
604673
}
605674

606675
return -EOPNOTSUPP;
@@ -667,16 +736,59 @@ static int mptcp_getsockopt_first_sf_only(struct mptcp_sock *msk, int level, int
667736
return ret;
668737
}
669738

739+
static int mptcp_put_int_option(struct mptcp_sock *msk, char __user *optval,
740+
int __user *optlen, int val)
741+
{
742+
int len;
743+
744+
if (get_user(len, optlen))
745+
return -EFAULT;
746+
if (len < 0)
747+
return -EINVAL;
748+
749+
if (len < sizeof(int) && len > 0 && val >= 0 && val <= 255) {
750+
unsigned char ucval = (unsigned char)val;
751+
752+
len = 1;
753+
if (put_user(len, optlen))
754+
return -EFAULT;
755+
if (copy_to_user(optval, &ucval, 1))
756+
return -EFAULT;
757+
} else {
758+
len = min_t(unsigned int, len, sizeof(int));
759+
if (put_user(len, optlen))
760+
return -EFAULT;
761+
if (copy_to_user(optval, &val, len))
762+
return -EFAULT;
763+
}
764+
765+
return 0;
766+
}
767+
670768
static int mptcp_getsockopt_sol_tcp(struct mptcp_sock *msk, int optname,
671769
char __user *optval, int __user *optlen)
672770
{
771+
struct sock *sk = (void *)msk;
772+
673773
switch (optname) {
674774
case TCP_ULP:
675775
case TCP_CONGESTION:
676776
case TCP_INFO:
677777
case TCP_CC_INFO:
678778
return mptcp_getsockopt_first_sf_only(msk, SOL_TCP, optname,
679779
optval, optlen);
780+
case TCP_KEEPIDLE:
781+
return mptcp_put_int_option(msk, optval, optlen,
782+
msk->keepalive_idle ? :
783+
READ_ONCE(sock_net(sk)->ipv4.sysctl_tcp_keepalive_time) / HZ);
784+
case TCP_KEEPINTVL:
785+
return mptcp_put_int_option(msk, optval, optlen,
786+
msk->keepalive_intvl ? :
787+
READ_ONCE(sock_net(sk)->ipv4.sysctl_tcp_keepalive_intvl) / HZ);
788+
case TCP_KEEPCNT:
789+
return mptcp_put_int_option(msk, optval, optlen,
790+
msk->keepalive_cnt ? :
791+
READ_ONCE(sock_net(sk)->ipv4.sysctl_tcp_keepalive_probes));
680792
}
681793
return -EOPNOTSUPP;
682794
}
@@ -746,6 +858,9 @@ static void sync_socket_options(struct mptcp_sock *msk, struct sock *ssk)
746858

747859
if (inet_csk(sk)->icsk_ca_ops != inet_csk(ssk)->icsk_ca_ops)
748860
tcp_set_congestion_control(ssk, msk->ca_name, false, true);
861+
tcp_sock_set_keepidle_locked(ssk, msk->keepalive_idle);
862+
__tcp_sock_set_keepintvl(ssk, msk->keepalive_intvl);
863+
__tcp_sock_set_keepcnt(ssk, msk->keepalive_cnt);
749864
}
750865

751866
static void __mptcp_sockopt_sync(struct mptcp_sock *msk, struct sock *ssk)

0 commit comments

Comments
 (0)