Commit f10f13cb authored by Herbert Xu, committed by Zefan Li

net: Clone skb before setting peeked flag

commit 738ac1eb upstream.

Shared skbs must not be modified and this is crucial for broadcast
and/or multicast paths where we use it as an optimisation to avoid
unnecessary cloning.

The function skb_recv_datagram breaks this rule by setting peeked
without cloning the skb first.  This causes funky races which lead
to double-frees.

This patch fixes this by cloning the skb and replacing the skb
in the list when setting skb->peeked.

Fixes: a59322be ("[UDP]: Only increment counter on first peek/recv")
Reported-by: Konstantin Khlebnikov <khlebnikov@yandex-team.ru>
Signed-off-by: Herbert Xu <herbert@gondor.apana.org.au>
Signed-off-by: David S. Miller <davem@davemloft.net>
[lizf: Backported to 3.4: adjust context]
Signed-off-by: Zefan Li <lizefan@huawei.com>
parent 8c12b3ba
...@@ -127,6 +127,35 @@ static int wait_for_packet(struct sock *sk, int *err, long *timeo_p) ...@@ -127,6 +127,35 @@ static int wait_for_packet(struct sock *sk, int *err, long *timeo_p)
goto out; goto out;
} }
/*
 * skb_set_peeked - flag a queued skb as peeked without touching a shared skb
 * @skb: buffer currently linked into a queue
 *
 * If @skb is already flagged, nothing is done.  If @skb is shared, a clone
 * is allocated, linked into the list in place of @skb, and the clone is the
 * buffer that gets flagged; otherwise @skb itself is flagged.
 *
 * Returns 0 on success (including the already-peeked case) or -ENOMEM when
 * the clone cannot be allocated.
 *
 * NOTE(review): @skb is passed by value, so when a clone is substituted the
 * caller's pointer still refers to the original buffer, which is no longer
 * on the list.  Confirm that every caller copes with that.
 */
static int skb_set_peeked(struct sk_buff *skb)
{
	struct sk_buff *clone;

	if (skb->peeked)
		return 0;

	if (skb_shared(skb)) {
		/*
		 * A shared buffer must not be written to: substitute a
		 * clone.  GFP_ATOMIC because the visible caller invokes
		 * this with the queue spinlock held.
		 */
		clone = skb_clone(skb, GFP_ATOMIC);
		if (!clone)
			return -ENOMEM;

		/* Repoint both neighbours at the clone, then link it in. */
		skb->prev->next = clone;
		skb->next->prev = clone;
		clone->prev = skb->prev;
		clone->next = skb->next;

		/* The original has left the list; release it. */
		consume_skb(skb);
		skb = clone;
	}

	skb->peeked = 1;
	return 0;
}
/** /**
* __skb_recv_datagram - Receive a datagram skbuff * __skb_recv_datagram - Receive a datagram skbuff
* @sk: socket * @sk: socket
...@@ -161,7 +190,9 @@ static int wait_for_packet(struct sock *sk, int *err, long *timeo_p) ...@@ -161,7 +190,9 @@ static int wait_for_packet(struct sock *sk, int *err, long *timeo_p)
struct sk_buff *__skb_recv_datagram(struct sock *sk, unsigned flags, struct sk_buff *__skb_recv_datagram(struct sock *sk, unsigned flags,
int *peeked, int *off, int *err) int *peeked, int *off, int *err)
{ {
struct sk_buff_head *queue = &sk->sk_receive_queue;
struct sk_buff *skb; struct sk_buff *skb;
unsigned long cpu_flags;
long timeo; long timeo;
/* /*
* Caller is allowed not to check sk->sk_err before skb_recv_datagram() * Caller is allowed not to check sk->sk_err before skb_recv_datagram()
...@@ -180,8 +211,6 @@ struct sk_buff *__skb_recv_datagram(struct sock *sk, unsigned flags, ...@@ -180,8 +211,6 @@ struct sk_buff *__skb_recv_datagram(struct sock *sk, unsigned flags,
* Look at current nfs client by the way... * Look at current nfs client by the way...
* However, this function was correct in any case. 8) * However, this function was correct in any case. 8)
*/ */
unsigned long cpu_flags;
struct sk_buff_head *queue = &sk->sk_receive_queue;
spin_lock_irqsave(&queue->lock, cpu_flags); spin_lock_irqsave(&queue->lock, cpu_flags);
skb_queue_walk(queue, skb) { skb_queue_walk(queue, skb) {
...@@ -191,7 +220,11 @@ struct sk_buff *__skb_recv_datagram(struct sock *sk, unsigned flags, ...@@ -191,7 +220,11 @@ struct sk_buff *__skb_recv_datagram(struct sock *sk, unsigned flags,
*off -= skb->len; *off -= skb->len;
continue; continue;
} }
skb->peeked = 1;
error = skb_set_peeked(skb);
if (error)
goto unlock_err;
atomic_inc(&skb->users); atomic_inc(&skb->users);
} else } else
__skb_unlink(skb, queue); __skb_unlink(skb, queue);
...@@ -210,6 +243,8 @@ struct sk_buff *__skb_recv_datagram(struct sock *sk, unsigned flags, ...@@ -210,6 +243,8 @@ struct sk_buff *__skb_recv_datagram(struct sock *sk, unsigned flags,
return NULL; return NULL;
unlock_err:
spin_unlock_irqrestore(&queue->lock, cpu_flags);
no_packet: no_packet:
*err = error; *err = error;
return NULL; return NULL;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment