2005-04-17 06:20:36 +08:00
|
|
|
/*
|
|
|
|
* SUCS NET3:
|
|
|
|
*
|
|
|
|
* Generic stream handling routines. These are generic for most
|
|
|
|
* protocols. Even IP. Tonight 8-).
|
|
|
|
* This is used because TCP, LLC (others too) layer all have mostly
|
|
|
|
* identical sendmsg() and recvmsg() code.
|
|
|
|
* So we (will) share it here.
|
|
|
|
*
|
|
|
|
* Authors: Arnaldo Carvalho de Melo <acme@conectiva.com.br>
|
|
|
|
* (from old tcp.c code)
|
|
|
|
* Alan Cox <alan@redhat.com> (Borrowed comments 8-))
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/module.h>
|
|
|
|
#include <linux/net.h>
|
|
|
|
#include <linux/signal.h>
|
|
|
|
#include <linux/tcp.h>
|
|
|
|
#include <linux/wait.h>
|
|
|
|
#include <net/sock.h>
|
|
|
|
|
|
|
|
/**
|
|
|
|
* sk_stream_write_space - stream socket write_space callback.
|
2005-05-01 23:59:25 +08:00
|
|
|
* @sk: socket
|
2005-04-17 06:20:36 +08:00
|
|
|
*
|
|
|
|
* FIXME: write proper description
|
|
|
|
*/
|
|
|
|
void sk_stream_write_space(struct sock *sk)
|
|
|
|
{
|
|
|
|
struct socket *sock = sk->sk_socket;
|
|
|
|
|
|
|
|
if (sk_stream_wspace(sk) >= sk_stream_min_wspace(sk) && sock) {
|
|
|
|
clear_bit(SOCK_NOSPACE, &sock->flags);
|
|
|
|
|
|
|
|
if (sk->sk_sleep && waitqueue_active(sk->sk_sleep))
|
|
|
|
wake_up_interruptible(sk->sk_sleep);
|
|
|
|
if (sock->fasync_list && !(sk->sk_shutdown & SEND_SHUTDOWN))
|
|
|
|
sock_wake_async(sock, 2, POLL_OUT);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(sk_stream_write_space);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* sk_stream_wait_connect - Wait for a socket to get into the connected state
|
2005-05-01 23:59:25 +08:00
|
|
|
* @sk: sock to wait on
|
|
|
|
* @timeo_p: for how long to wait
|
2005-04-17 06:20:36 +08:00
|
|
|
*
|
|
|
|
* Must be called with the socket locked.
|
|
|
|
*/
|
|
|
|
int sk_stream_wait_connect(struct sock *sk, long *timeo_p)
|
|
|
|
{
|
|
|
|
struct task_struct *tsk = current;
|
|
|
|
DEFINE_WAIT(wait);
|
2005-11-04 06:56:56 +08:00
|
|
|
int done;
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2005-11-04 06:56:56 +08:00
|
|
|
do {
|
2005-12-14 15:22:19 +08:00
|
|
|
int err = sock_error(sk);
|
|
|
|
if (err)
|
|
|
|
return err;
|
2005-04-17 06:20:36 +08:00
|
|
|
if ((1 << sk->sk_state) & ~(TCPF_SYN_SENT | TCPF_SYN_RECV))
|
|
|
|
return -EPIPE;
|
|
|
|
if (!*timeo_p)
|
|
|
|
return -EAGAIN;
|
|
|
|
if (signal_pending(tsk))
|
|
|
|
return sock_intr_errno(*timeo_p);
|
|
|
|
|
|
|
|
prepare_to_wait(sk->sk_sleep, &wait, TASK_INTERRUPTIBLE);
|
|
|
|
sk->sk_write_pending++;
|
2005-11-04 06:56:56 +08:00
|
|
|
done = sk_wait_event(sk, timeo_p,
|
2005-12-14 15:22:19 +08:00
|
|
|
!sk->sk_err &&
|
2007-02-09 22:24:36 +08:00
|
|
|
!((1 << sk->sk_state) &
|
2005-11-04 06:56:56 +08:00
|
|
|
~(TCPF_ESTABLISHED | TCPF_CLOSE_WAIT)));
|
2005-04-17 06:20:36 +08:00
|
|
|
finish_wait(sk->sk_sleep, &wait);
|
|
|
|
sk->sk_write_pending--;
|
2005-11-04 06:56:56 +08:00
|
|
|
} while (!done);
|
2005-04-17 06:20:36 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(sk_stream_wait_connect);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* sk_stream_closing - Return 1 if we still have things to send in our buffers.
|
2005-05-01 23:59:25 +08:00
|
|
|
* @sk: socket to verify
|
2005-04-17 06:20:36 +08:00
|
|
|
*/
|
|
|
|
static inline int sk_stream_closing(struct sock *sk)
|
|
|
|
{
|
|
|
|
return (1 << sk->sk_state) &
|
|
|
|
(TCPF_FIN_WAIT1 | TCPF_CLOSING | TCPF_LAST_ACK);
|
|
|
|
}
|
|
|
|
|
|
|
|
void sk_stream_wait_close(struct sock *sk, long timeout)
|
|
|
|
{
|
|
|
|
if (timeout) {
|
|
|
|
DEFINE_WAIT(wait);
|
|
|
|
|
|
|
|
do {
|
|
|
|
prepare_to_wait(sk->sk_sleep, &wait,
|
|
|
|
TASK_INTERRUPTIBLE);
|
|
|
|
if (sk_wait_event(sk, &timeout, !sk_stream_closing(sk)))
|
|
|
|
break;
|
|
|
|
} while (!signal_pending(current) && timeout);
|
|
|
|
|
|
|
|
finish_wait(sk->sk_sleep, &wait);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(sk_stream_wait_close);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* sk_stream_wait_memory - Wait for more memory for a socket
|
2005-05-01 23:59:25 +08:00
|
|
|
* @sk: socket to wait for memory
|
|
|
|
* @timeo_p: for how long
|
2005-04-17 06:20:36 +08:00
|
|
|
*/
|
|
|
|
int sk_stream_wait_memory(struct sock *sk, long *timeo_p)
|
|
|
|
{
|
|
|
|
int err = 0;
|
|
|
|
long vm_wait = 0;
|
|
|
|
long current_timeo = *timeo_p;
|
|
|
|
DEFINE_WAIT(wait);
|
|
|
|
|
|
|
|
if (sk_stream_memory_free(sk))
|
|
|
|
current_timeo = vm_wait = (net_random() % (HZ / 5)) + 2;
|
|
|
|
|
|
|
|
while (1) {
|
|
|
|
set_bit(SOCK_ASYNC_NOSPACE, &sk->sk_socket->flags);
|
|
|
|
|
|
|
|
prepare_to_wait(sk->sk_sleep, &wait, TASK_INTERRUPTIBLE);
|
|
|
|
|
|
|
|
if (sk->sk_err || (sk->sk_shutdown & SEND_SHUTDOWN))
|
|
|
|
goto do_error;
|
|
|
|
if (!*timeo_p)
|
|
|
|
goto do_nonblock;
|
|
|
|
if (signal_pending(current))
|
|
|
|
goto do_interrupted;
|
|
|
|
clear_bit(SOCK_ASYNC_NOSPACE, &sk->sk_socket->flags);
|
|
|
|
if (sk_stream_memory_free(sk) && !vm_wait)
|
|
|
|
break;
|
|
|
|
|
|
|
|
set_bit(SOCK_NOSPACE, &sk->sk_socket->flags);
|
|
|
|
sk->sk_write_pending++;
|
2007-02-09 22:24:36 +08:00
|
|
|
sk_wait_event(sk, ¤t_timeo, !sk->sk_err &&
|
2005-12-14 15:22:19 +08:00
|
|
|
!(sk->sk_shutdown & SEND_SHUTDOWN) &&
|
|
|
|
sk_stream_memory_free(sk) &&
|
2005-04-17 06:20:36 +08:00
|
|
|
vm_wait);
|
|
|
|
sk->sk_write_pending--;
|
|
|
|
|
|
|
|
if (vm_wait) {
|
|
|
|
vm_wait -= current_timeo;
|
|
|
|
current_timeo = *timeo_p;
|
|
|
|
if (current_timeo != MAX_SCHEDULE_TIMEOUT &&
|
|
|
|
(current_timeo -= vm_wait) < 0)
|
|
|
|
current_timeo = 0;
|
|
|
|
vm_wait = 0;
|
|
|
|
}
|
|
|
|
*timeo_p = current_timeo;
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
finish_wait(sk->sk_sleep, &wait);
|
|
|
|
return err;
|
|
|
|
|
|
|
|
do_error:
|
|
|
|
err = -EPIPE;
|
|
|
|
goto out;
|
|
|
|
do_nonblock:
|
|
|
|
err = -EAGAIN;
|
|
|
|
goto out;
|
|
|
|
do_interrupted:
|
|
|
|
err = sock_intr_errno(*timeo_p);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(sk_stream_wait_memory);
|
|
|
|
|
|
|
|
void sk_stream_rfree(struct sk_buff *skb)
|
|
|
|
{
|
|
|
|
struct sock *sk = skb->sk;
|
|
|
|
|
2006-04-20 15:10:50 +08:00
|
|
|
skb_truesize_check(skb);
|
2005-04-17 06:20:36 +08:00
|
|
|
atomic_sub(skb->truesize, &sk->sk_rmem_alloc);
|
|
|
|
sk->sk_forward_alloc += skb->truesize;
|
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(sk_stream_rfree);
|
|
|
|
|
|
|
|
int sk_stream_error(struct sock *sk, int flags, int err)
|
|
|
|
{
|
|
|
|
if (err == -EPIPE)
|
|
|
|
err = sock_error(sk) ? : -EPIPE;
|
|
|
|
if (err == -EPIPE && !(flags & MSG_NOSIGNAL))
|
|
|
|
send_sig(SIGPIPE, current, 0);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(sk_stream_error);
|
|
|
|
|
|
|
|
void __sk_stream_mem_reclaim(struct sock *sk)
|
|
|
|
{
|
2006-07-13 08:58:53 +08:00
|
|
|
atomic_sub(sk->sk_forward_alloc / SK_STREAM_MEM_QUANTUM,
|
|
|
|
sk->sk_prot->memory_allocated);
|
|
|
|
sk->sk_forward_alloc &= SK_STREAM_MEM_QUANTUM - 1;
|
|
|
|
if (*sk->sk_prot->memory_pressure &&
|
|
|
|
(atomic_read(sk->sk_prot->memory_allocated) <
|
|
|
|
sk->sk_prot->sysctl_mem[0]))
|
|
|
|
*sk->sk_prot->memory_pressure = 0;
|
2005-04-17 06:20:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(__sk_stream_mem_reclaim);
|
|
|
|
|
|
|
|
int sk_stream_mem_schedule(struct sock *sk, int size, int kind)
|
|
|
|
{
|
|
|
|
int amt = sk_stream_pages(size);
|
|
|
|
|
|
|
|
sk->sk_forward_alloc += amt * SK_STREAM_MEM_QUANTUM;
|
|
|
|
atomic_add(amt, sk->sk_prot->memory_allocated);
|
|
|
|
|
|
|
|
/* Under limit. */
|
|
|
|
if (atomic_read(sk->sk_prot->memory_allocated) < sk->sk_prot->sysctl_mem[0]) {
|
|
|
|
if (*sk->sk_prot->memory_pressure)
|
|
|
|
*sk->sk_prot->memory_pressure = 0;
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Over hard limit. */
|
|
|
|
if (atomic_read(sk->sk_prot->memory_allocated) > sk->sk_prot->sysctl_mem[2]) {
|
|
|
|
sk->sk_prot->enter_memory_pressure();
|
|
|
|
goto suppress_allocation;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Under pressure. */
|
|
|
|
if (atomic_read(sk->sk_prot->memory_allocated) > sk->sk_prot->sysctl_mem[1])
|
|
|
|
sk->sk_prot->enter_memory_pressure();
|
|
|
|
|
|
|
|
if (kind) {
|
|
|
|
if (atomic_read(&sk->sk_rmem_alloc) < sk->sk_prot->sysctl_rmem[0])
|
|
|
|
return 1;
|
|
|
|
} else if (sk->sk_wmem_queued < sk->sk_prot->sysctl_wmem[0])
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
if (!*sk->sk_prot->memory_pressure ||
|
|
|
|
sk->sk_prot->sysctl_mem[2] > atomic_read(sk->sk_prot->sockets_allocated) *
|
|
|
|
sk_stream_pages(sk->sk_wmem_queued +
|
|
|
|
atomic_read(&sk->sk_rmem_alloc) +
|
|
|
|
sk->sk_forward_alloc))
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
suppress_allocation:
|
|
|
|
|
|
|
|
if (!kind) {
|
|
|
|
sk_stream_moderate_sndbuf(sk);
|
|
|
|
|
|
|
|
/* Fail only if socket is _under_ its sndbuf.
|
|
|
|
* In this case we cannot block, so that we have to fail.
|
|
|
|
*/
|
|
|
|
if (sk->sk_wmem_queued + size >= sk->sk_sndbuf)
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Alas. Undo changes. */
|
|
|
|
sk->sk_forward_alloc -= amt * SK_STREAM_MEM_QUANTUM;
|
|
|
|
atomic_sub(amt, sk->sk_prot->memory_allocated);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(sk_stream_mem_schedule);
|
|
|
|
|
|
|
|
void sk_stream_kill_queues(struct sock *sk)
|
|
|
|
{
|
|
|
|
/* First the read buffer. */
|
|
|
|
__skb_queue_purge(&sk->sk_receive_queue);
|
|
|
|
|
|
|
|
/* Next, the error queue. */
|
|
|
|
__skb_queue_purge(&sk->sk_error_queue);
|
|
|
|
|
|
|
|
/* Next, the write queue. */
|
|
|
|
BUG_TRAP(skb_queue_empty(&sk->sk_write_queue));
|
|
|
|
|
|
|
|
/* Account for returned memory. */
|
|
|
|
sk_stream_mem_reclaim(sk);
|
|
|
|
|
|
|
|
BUG_TRAP(!sk->sk_wmem_queued);
|
|
|
|
BUG_TRAP(!sk->sk_forward_alloc);
|
|
|
|
|
|
|
|
/* It is _impossible_ for the backlog to contain anything
|
|
|
|
* when we get here. All user references to this socket
|
|
|
|
* have gone away, only the net layer knows can touch it.
|
|
|
|
*/
|
|
|
|
}
|
|
|
|
|
|
|
|
EXPORT_SYMBOL(sk_stream_kill_queues);
|