Commit e2223995 authored by Paolo Abeni, committed by Jakub Kicinski

mptcp: use tcp_build_frag()

mptcp_push_pending() is called even on orphaned
msks (and orphaned subflows) if there is outstanding
data at close() time.

To cope with the above, MPTCP needs to explicitly handle
allocation failures on xmit. The newly introduced
tcp_build_frag() allows that, so just plug it in.

We can additionally drop a couple of sanity checks,
which are duplicated in the TCP code.
Signed-off-by: Paolo Abeni <pabeni@redhat.com>
Signed-off-by: Jakub Kicinski <kuba@kernel.org>
parent b796d04b
...@@ -992,17 +992,13 @@ static int mptcp_sendmsg_frag(struct sock *sk, struct sock *ssk, ...@@ -992,17 +992,13 @@ static int mptcp_sendmsg_frag(struct sock *sk, struct sock *ssk,
psize = min_t(size_t, dfrag->data_len, avail_size); psize = min_t(size_t, dfrag->data_len, avail_size);
} }
/* tell the TCP stack to delay the push so that we can safely tail = tcp_build_frag(ssk, psize, msg->msg_flags, page, offset, &psize);
* access the skb after the sendpages call if (!tail) {
*/ tcp_remove_empty_skb(sk, tcp_write_queue_tail(ssk));
ret = do_tcp_sendpages(ssk, page, offset, psize, return -ENOMEM;
msg->msg_flags | MSG_SENDPAGE_NOTLAST | MSG_DONTWAIT);
if (ret <= 0) {
if (!retransmission)
iov_iter_revert(&msg->msg_iter, psize);
return ret;
} }
ret = psize;
frag_truesize += ret; frag_truesize += ret;
if (!retransmission) { if (!retransmission) {
if (unlikely(ret < psize)) if (unlikely(ret < psize))
...@@ -1026,20 +1022,15 @@ static int mptcp_sendmsg_frag(struct sock *sk, struct sock *ssk, ...@@ -1026,20 +1022,15 @@ static int mptcp_sendmsg_frag(struct sock *sk, struct sock *ssk,
sk->sk_forward_alloc -= frag_truesize; sk->sk_forward_alloc -= frag_truesize;
} }
/* if the tail skb extension is still the cached one, collapsing /* if the tail skb is still the cached one, collapsing really happened.
* really happened. Note: we can't check for 'same skb' as the sk_buff
* hdr on tail can be transmitted, freed and re-allocated by the
* do_tcp_sendpages() call
*/ */
tail = tcp_write_queue_tail(ssk); if (skb == tail) {
if (mpext && tail && mpext == skb_ext_find(tail, SKB_EXT_MPTCP)) {
WARN_ON_ONCE(!can_collapse); WARN_ON_ONCE(!can_collapse);
mpext->data_len += ret; mpext->data_len += ret;
goto out; goto out;
} }
skb = tcp_write_queue_tail(ssk); mpext = __skb_ext_set(tail, SKB_EXT_MPTCP, msk->cached_ext);
mpext = __skb_ext_set(skb, SKB_EXT_MPTCP, msk->cached_ext);
msk->cached_ext = NULL; msk->cached_ext = NULL;
memset(mpext, 0, sizeof(*mpext)); memset(mpext, 0, sizeof(*mpext));
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment