On Tue, May 27, 2008 at 07:47:10PM +0400, Evgeniy Polyakov (johnpol@2ka.mipt.ru) wrote:And actually this will lead to data corruption, since different process can enter and change socket values under us. Without temporal lock drop we can deadlock (first process locked socket and then waiting for i_mutex, while another one grabbed i_mutex and waiting for socket lock in sendfile()). Please try attached patch on top of vanilla tree. It does not use skb after socket was dropped, but instead search it again when socket is locked, so if socket is alive, it will find it and clean otherwise it will exit. diff --git a/net/core/skbuff.c b/net/core/skbuff.c index 6087013..d285817 100644 --- a/net/core/skbuff.c +++ b/net/core/skbuff.c @@ -1349,6 +1349,7 @@ done: if (spd.nr_pages) { int ret; + struct sock *sk = __skb->sk; /* * Drop the socket lock, otherwise we have reverse @@ -1359,9 +1360,9 @@ done: * we call into ->sendpage() with the i_mutex lock held * and networking will grab the socket lock. */ - release_sock(__skb->sk); + release_sock(sk); ret = splice_to_pipe(pipe, &spd); - lock_sock(__skb->sk); + lock_sock(sk); return ret; } diff --git a/net/ipv4/tcp.c b/net/ipv4/tcp.c index 39b629a..217dc59 100644 --- a/net/ipv4/tcp.c +++ b/net/ipv4/tcp.c @@ -1200,15 +1200,17 @@ int tcp_read_sock(struct sock *sk, read_descriptor_t *desc, struct tcp_sock *tp = tcp_sk(sk); u32 seq = tp->copied_seq; u32 offset; - int copied = 0; + int copied = 0, fin; + size_t used, len, skb_len; if (sk->sk_state == TCP_LISTEN) return -ENOTCONN; while ((skb = tcp_recv_skb(sk, seq, &offset)) != NULL) { + used = 0; if (offset < skb->len) { - size_t used, len; - len = skb->len - offset; + skb_len = skb->len; + len = skb_len - offset; /* Stop reading if we hit a patch of urgent data */ if (tp->urg_data) { u32 urg_offset = tp->urg_seq - seq; @@ -1217,6 +1219,7 @@ int tcp_read_sock(struct sock *sk, read_descriptor_t *desc, if (!len) break; } + used = recv_actor(desc, skb, offset, len); if (used < 0) { if (!copied) @@ -1227,15 +1230,22 @@ int tcp_read_sock(struct sock *sk, read_descriptor_t *desc, copied += used; offset += used; } - if (offset != skb->len) + if (offset != skb_len) break; } - if (tcp_hdr(skb)->fin) { - sk_eat_skb(sk, skb, 0); - ++seq; + skb = tcp_recv_skb(sk, seq-used, &offset); + if (!skb) { + if (!copied) + copied = -EINVAL; break; } + fin = tcp_hdr(skb)->fin; sk_eat_skb(sk, skb, 0); + + if (fin) { + ++seq; + break; + } if (!desc->count) break; } -- Evgeniy Polyakov -- To unsubscribe from this list: send the line "unsubscribe netdev" in the body of a message to majordomo@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html
| Greg Kroah-Hartman | [PATCH 001/196] Chinese: Add the known_regression URI to the HOWTO |
| Linus Torvalds | Re: Dual-Licensing Linux Kernel with GPL V2 and GPL V3 |
| Andrew Morton | 2.6.25-mm1 |
| Vladislav Bolkhovitin | Re: Integration of SCST in the mainstream Linux kernel |
git: | |
| David Miller | [GIT]: Networking |
| David Miller | Re: [PATCH] pkt_sched: Destroy gen estimators under rtnl_lock(). |
| Gerrit Renker | [PATCH 0/37] dccp: Feature negotiation - last call for comments |
| Natalie Protasevich | [BUG] New Kernel Bugs |
