Commit 7716682c authored by Eric Dumazet, committed by David S. Miller

tcp/dccp: fix another race at listener dismantle

Ilya reported the following lockdep splat:

kernel: =========================
kernel: [ BUG: held lock freed! ]
kernel: 4.5.0-rc1-ceph-00026-g5e0a311 #1 Not tainted
kernel: -------------------------
kernel: swapper/5/0 is freeing memory
ffff880035c9d200-ffff880035c9dbff, with a lock still held there!
kernel: (&(&queue->rskq_lock)->rlock){+.-...}, at:
[<ffffffff816f6a88>] inet_csk_reqsk_queue_add+0x28/0xa0
kernel: 4 locks held by swapper/5/0:
kernel: #0:  (rcu_read_lock){......}, at: [<ffffffff8169ef6b>]
netif_receive_skb_internal+0x4b/0x1f0
kernel: #1:  (rcu_read_lock){......}, at: [<ffffffff816e977f>]
ip_local_deliver_finish+0x3f/0x380
kernel: #2:  (slock-AF_INET){+.-...}, at: [<ffffffff81685ffb>]
sk_clone_lock+0x19b/0x440
kernel: #3:  (&(&queue->rskq_lock)->rlock){+.-...}, at:
[<ffffffff816f6a88>] inet_csk_reqsk_queue_add+0x28/0xa0

To properly fix this issue, inet_csk_reqsk_queue_add() needs
to tell its callers whether the child has been queued
into the accept queue.

We also need to make sure the listener is still there before
calling sk->sk_data_ready(), by holding a reference on it,
since the reference carried by the child can disappear as
soon as the child is put on the accept queue.
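
For clarity, the fixed receive path boils down to the following
pattern (a condensed sketch of the tcp_v4_rcv() hunk below with
explanatory comments added; the DCCP and IPv6 paths are structurally
identical):

	sk = req->rsk_listener;
	if (unlikely(sk->sk_state != TCP_LISTEN)) {
		/* Listener is being dismantled: drop the request
		 * and retry the socket lookup.
		 */
		inet_csk_reqsk_queue_drop_and_put(sk, req);
		goto lookup;
	}
	/* Pin the listener before tcp_check_req() can queue the child:
	 * once the child sits on the accept queue, the reference it
	 * carried may be gone while we still dereference sk.
	 */
	sock_hold(sk);
	nsk = tcp_check_req(sk, skb, req, false);
	if (!nsk) {
		reqsk_put(req);
		goto discard_and_relse;	/* drops the listener reference */
	}
	if (nsk == sk) {
		/* No child was created; keep our hold and fall through. */
		reqsk_put(req);
	} else if (tcp_child_process(sk, nsk, skb)) {
		tcp_v4_send_reset(nsk, skb);
		goto discard_and_relse;
	} else {
		sock_put(sk);		/* done with the listener */
		return 0;
	}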
Reported-by: Ilya Dryomov <idryomov@gmail.com>
Fixes: ebb516af ("tcp/dccp: fix race at listener dismantle phase")
Signed-off-by: Eric Dumazet <edumazet@google.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
parent deed49df
--- a/include/net/inet_connection_sock.h
+++ b/include/net/inet_connection_sock.h
@@ -270,8 +270,9 @@ struct dst_entry *inet_csk_route_child_sock(const struct sock *sk,
 struct dst_entry *inet_csk_route_child_sock(const struct sock *sk,
 					    struct sock *newsk,
 					    const struct request_sock *req);
-void inet_csk_reqsk_queue_add(struct sock *sk, struct request_sock *req,
-			      struct sock *child);
+struct sock *inet_csk_reqsk_queue_add(struct sock *sk,
+				      struct request_sock *req,
+				      struct sock *child);
 void inet_csk_reqsk_queue_hash_add(struct sock *sk, struct request_sock *req,
 				   unsigned long timeout);
 struct sock *inet_csk_complete_hashdance(struct sock *sk, struct sock *child,
--- a/net/dccp/ipv4.c
+++ b/net/dccp/ipv4.c
@@ -824,26 +824,26 @@ static int dccp_v4_rcv(struct sk_buff *skb)
 
 	if (sk->sk_state == DCCP_NEW_SYN_RECV) {
 		struct request_sock *req = inet_reqsk(sk);
-		struct sock *nsk = NULL;
+		struct sock *nsk;
 
 		sk = req->rsk_listener;
-		if (likely(sk->sk_state == DCCP_LISTEN)) {
-			nsk = dccp_check_req(sk, skb, req);
-		} else {
+		if (unlikely(sk->sk_state != DCCP_LISTEN)) {
 			inet_csk_reqsk_queue_drop_and_put(sk, req);
 			goto lookup;
 		}
+		sock_hold(sk);
+		nsk = dccp_check_req(sk, skb, req);
 		if (!nsk) {
 			reqsk_put(req);
-			goto discard_it;
+			goto discard_and_relse;
 		}
 		if (nsk == sk) {
-			sock_hold(sk);
 			reqsk_put(req);
 		} else if (dccp_child_process(sk, nsk, skb)) {
 			dccp_v4_ctl_send_reset(sk, skb);
-			goto discard_it;
+			goto discard_and_relse;
 		} else {
+			sock_put(sk);
 			return 0;
 		}
 	}
--- a/net/dccp/ipv6.c
+++ b/net/dccp/ipv6.c
@@ -691,26 +691,26 @@ static int dccp_v6_rcv(struct sk_buff *skb)
 
 	if (sk->sk_state == DCCP_NEW_SYN_RECV) {
 		struct request_sock *req = inet_reqsk(sk);
-		struct sock *nsk = NULL;
+		struct sock *nsk;
 
 		sk = req->rsk_listener;
-		if (likely(sk->sk_state == DCCP_LISTEN)) {
-			nsk = dccp_check_req(sk, skb, req);
-		} else {
+		if (unlikely(sk->sk_state != DCCP_LISTEN)) {
 			inet_csk_reqsk_queue_drop_and_put(sk, req);
 			goto lookup;
 		}
+		sock_hold(sk);
+		nsk = dccp_check_req(sk, skb, req);
 		if (!nsk) {
 			reqsk_put(req);
-			goto discard_it;
+			goto discard_and_relse;
 		}
 		if (nsk == sk) {
-			sock_hold(sk);
 			reqsk_put(req);
 		} else if (dccp_child_process(sk, nsk, skb)) {
 			dccp_v6_ctl_send_reset(sk, skb);
-			goto discard_it;
+			goto discard_and_relse;
 		} else {
+			sock_put(sk);
 			return 0;
 		}
 	}
--- a/net/ipv4/inet_connection_sock.c
+++ b/net/ipv4/inet_connection_sock.c
@@ -789,14 +789,16 @@ static void inet_child_forget(struct sock *sk, struct request_sock *req,
 	reqsk_put(req);
 }
 
-void inet_csk_reqsk_queue_add(struct sock *sk, struct request_sock *req,
-			      struct sock *child)
+struct sock *inet_csk_reqsk_queue_add(struct sock *sk,
+				      struct request_sock *req,
+				      struct sock *child)
 {
 	struct request_sock_queue *queue = &inet_csk(sk)->icsk_accept_queue;
 
 	spin_lock(&queue->rskq_lock);
 	if (unlikely(sk->sk_state != TCP_LISTEN)) {
 		inet_child_forget(sk, req, child);
+		child = NULL;
 	} else {
 		req->sk = child;
 		req->dl_next = NULL;
@@ -808,6 +810,7 @@ void inet_csk_reqsk_queue_add(struct sock *sk, struct request_sock *req,
 		sk_acceptq_added(sk);
 	}
 	spin_unlock(&queue->rskq_lock);
+	return child;
 }
 EXPORT_SYMBOL(inet_csk_reqsk_queue_add);
@@ -817,11 +820,8 @@ struct sock *inet_csk_complete_hashdance(struct sock *sk, struct sock *child,
 	if (own_req) {
 		inet_csk_reqsk_queue_drop(sk, req);
 		reqsk_queue_removed(&inet_csk(sk)->icsk_accept_queue, req);
-		inet_csk_reqsk_queue_add(sk, req, child);
-		/* Warning: caller must not call reqsk_put(req);
-		 * child stole last reference on it.
-		 */
-		return child;
+		if (inet_csk_reqsk_queue_add(sk, req, child))
+			return child;
 	}
 	/* Too bad, another child took ownership of the request, undo. */
 	bh_unlock_sock(child);
--- a/net/ipv4/tcp_ipv4.c
+++ b/net/ipv4/tcp_ipv4.c
@@ -1597,30 +1597,30 @@ int tcp_v4_rcv(struct sk_buff *skb)
 
 	if (sk->sk_state == TCP_NEW_SYN_RECV) {
 		struct request_sock *req = inet_reqsk(sk);
-		struct sock *nsk = NULL;
+		struct sock *nsk;
 
 		sk = req->rsk_listener;
 		if (unlikely(tcp_v4_inbound_md5_hash(sk, skb))) {
 			reqsk_put(req);
 			goto discard_it;
 		}
-		if (likely(sk->sk_state == TCP_LISTEN)) {
-			nsk = tcp_check_req(sk, skb, req, false);
-		} else {
+		if (unlikely(sk->sk_state != TCP_LISTEN)) {
 			inet_csk_reqsk_queue_drop_and_put(sk, req);
 			goto lookup;
 		}
+		sock_hold(sk);
+		nsk = tcp_check_req(sk, skb, req, false);
 		if (!nsk) {
 			reqsk_put(req);
-			goto discard_it;
+			goto discard_and_relse;
 		}
 		if (nsk == sk) {
-			sock_hold(sk);
 			reqsk_put(req);
 		} else if (tcp_child_process(sk, nsk, skb)) {
 			tcp_v4_send_reset(nsk, skb);
-			goto discard_it;
+			goto discard_and_relse;
 		} else {
+			sock_put(sk);
 			return 0;
 		}
 	}
--- a/net/ipv6/tcp_ipv6.c
+++ b/net/ipv6/tcp_ipv6.c
@@ -1387,7 +1387,7 @@ static int tcp_v6_rcv(struct sk_buff *skb)
 
 	if (sk->sk_state == TCP_NEW_SYN_RECV) {
 		struct request_sock *req = inet_reqsk(sk);
-		struct sock *nsk = NULL;
+		struct sock *nsk;
 
 		sk = req->rsk_listener;
 		tcp_v6_fill_cb(skb, hdr, th);
@@ -1395,24 +1395,24 @@ static int tcp_v6_rcv(struct sk_buff *skb)
 			reqsk_put(req);
 			goto discard_it;
 		}
-		if (likely(sk->sk_state == TCP_LISTEN)) {
-			nsk = tcp_check_req(sk, skb, req, false);
-		} else {
+		if (unlikely(sk->sk_state != TCP_LISTEN)) {
 			inet_csk_reqsk_queue_drop_and_put(sk, req);
 			goto lookup;
 		}
+		sock_hold(sk);
+		nsk = tcp_check_req(sk, skb, req, false);
 		if (!nsk) {
 			reqsk_put(req);
-			goto discard_it;
+			goto discard_and_relse;
 		}
 		if (nsk == sk) {
-			sock_hold(sk);
 			reqsk_put(req);
 			tcp_v6_restore_cb(skb);
 		} else if (tcp_child_process(sk, nsk, skb)) {
 			tcp_v6_send_reset(nsk, skb);
-			goto discard_it;
+			goto discard_and_relse;
 		} else {
+			sock_put(sk);
 			return 0;
 		}
 	}