blob: 5586879bb9b3815f8e021a8907d03ce04059bb50 [file] [log] [blame]
/*
 *     SUCS NET3:
 *
 *     Generic stream handling routines. These are generic for most
 *     protocols. Even IP. Tonight 8-).
 *     This is used because the TCP and LLC layers (and others too) all
 *     have mostly identical sendmsg() and recvmsg() code.
 *     So we (will) share it here.
 *
 *     Authors:        Arnaldo Carvalho de Melo <acme@conectiva.com.br>
 *                     (from old tcp.c code)
 *                     Alan Cox <alan@redhat.com> (Borrowed comments 8-))
 */
14
15#include <linux/module.h>
16#include <linux/net.h>
17#include <linux/signal.h>
18#include <linux/tcp.h>
19#include <linux/wait.h>
20#include <net/sock.h>
21
22/**
23 * sk_stream_write_space - stream socket write_space callback.
Pavel Pisa4dc3b162005-05-01 08:59:25 -070024 * @sk: socket
Linus Torvalds1da177e2005-04-16 15:20:36 -070025 *
26 * FIXME: write proper description
27 */
28void sk_stream_write_space(struct sock *sk)
29{
30 struct socket *sock = sk->sk_socket;
31
32 if (sk_stream_wspace(sk) >= sk_stream_min_wspace(sk) && sock) {
33 clear_bit(SOCK_NOSPACE, &sock->flags);
34
35 if (sk->sk_sleep && waitqueue_active(sk->sk_sleep))
36 wake_up_interruptible(sk->sk_sleep);
37 if (sock->fasync_list && !(sk->sk_shutdown & SEND_SHUTDOWN))
Pavel Emelyanov8d8ad9d2007-11-26 20:10:50 +080038 sock_wake_async(sock, SOCK_WAKE_SPACE, POLL_OUT);
Linus Torvalds1da177e2005-04-16 15:20:36 -070039 }
40}
41
42EXPORT_SYMBOL(sk_stream_write_space);
43
44/**
45 * sk_stream_wait_connect - Wait for a socket to get into the connected state
Pavel Pisa4dc3b162005-05-01 08:59:25 -070046 * @sk: sock to wait on
47 * @timeo_p: for how long to wait
Linus Torvalds1da177e2005-04-16 15:20:36 -070048 *
49 * Must be called with the socket locked.
50 */
51int sk_stream_wait_connect(struct sock *sk, long *timeo_p)
52{
53 struct task_struct *tsk = current;
54 DEFINE_WAIT(wait);
Herbert Xu6151b312005-11-04 09:56:56 +110055 int done;
Linus Torvalds1da177e2005-04-16 15:20:36 -070056
Herbert Xu6151b312005-11-04 09:56:56 +110057 do {
Benjamin LaHaisec1cbe4b2005-12-13 23:22:19 -080058 int err = sock_error(sk);
59 if (err)
60 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -070061 if ((1 << sk->sk_state) & ~(TCPF_SYN_SENT | TCPF_SYN_RECV))
62 return -EPIPE;
63 if (!*timeo_p)
64 return -EAGAIN;
65 if (signal_pending(tsk))
66 return sock_intr_errno(*timeo_p);
67
68 prepare_to_wait(sk->sk_sleep, &wait, TASK_INTERRUPTIBLE);
69 sk->sk_write_pending++;
Herbert Xu6151b312005-11-04 09:56:56 +110070 done = sk_wait_event(sk, timeo_p,
Benjamin LaHaisec1cbe4b2005-12-13 23:22:19 -080071 !sk->sk_err &&
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +090072 !((1 << sk->sk_state) &
Herbert Xu6151b312005-11-04 09:56:56 +110073 ~(TCPF_ESTABLISHED | TCPF_CLOSE_WAIT)));
Linus Torvalds1da177e2005-04-16 15:20:36 -070074 finish_wait(sk->sk_sleep, &wait);
75 sk->sk_write_pending--;
Herbert Xu6151b312005-11-04 09:56:56 +110076 } while (!done);
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 return 0;
78}
79
80EXPORT_SYMBOL(sk_stream_wait_connect);
81
82/**
83 * sk_stream_closing - Return 1 if we still have things to send in our buffers.
Pavel Pisa4dc3b162005-05-01 08:59:25 -070084 * @sk: socket to verify
Linus Torvalds1da177e2005-04-16 15:20:36 -070085 */
86static inline int sk_stream_closing(struct sock *sk)
87{
88 return (1 << sk->sk_state) &
89 (TCPF_FIN_WAIT1 | TCPF_CLOSING | TCPF_LAST_ACK);
90}
91
92void sk_stream_wait_close(struct sock *sk, long timeout)
93{
94 if (timeout) {
95 DEFINE_WAIT(wait);
96
97 do {
98 prepare_to_wait(sk->sk_sleep, &wait,
99 TASK_INTERRUPTIBLE);
100 if (sk_wait_event(sk, &timeout, !sk_stream_closing(sk)))
101 break;
102 } while (!signal_pending(current) && timeout);
103
104 finish_wait(sk->sk_sleep, &wait);
105 }
106}
107
108EXPORT_SYMBOL(sk_stream_wait_close);
109
110/**
111 * sk_stream_wait_memory - Wait for more memory for a socket
Pavel Pisa4dc3b162005-05-01 08:59:25 -0700112 * @sk: socket to wait for memory
113 * @timeo_p: for how long
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 */
115int sk_stream_wait_memory(struct sock *sk, long *timeo_p)
116{
117 int err = 0;
118 long vm_wait = 0;
119 long current_timeo = *timeo_p;
120 DEFINE_WAIT(wait);
121
122 if (sk_stream_memory_free(sk))
123 current_timeo = vm_wait = (net_random() % (HZ / 5)) + 2;
124
125 while (1) {
126 set_bit(SOCK_ASYNC_NOSPACE, &sk->sk_socket->flags);
127
128 prepare_to_wait(sk->sk_sleep, &wait, TASK_INTERRUPTIBLE);
129
130 if (sk->sk_err || (sk->sk_shutdown & SEND_SHUTDOWN))
131 goto do_error;
132 if (!*timeo_p)
133 goto do_nonblock;
134 if (signal_pending(current))
135 goto do_interrupted;
136 clear_bit(SOCK_ASYNC_NOSPACE, &sk->sk_socket->flags);
137 if (sk_stream_memory_free(sk) && !vm_wait)
138 break;
139
140 set_bit(SOCK_NOSPACE, &sk->sk_socket->flags);
141 sk->sk_write_pending++;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900142 sk_wait_event(sk, &current_timeo, !sk->sk_err &&
Benjamin LaHaisec1cbe4b2005-12-13 23:22:19 -0800143 !(sk->sk_shutdown & SEND_SHUTDOWN) &&
144 sk_stream_memory_free(sk) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145 vm_wait);
146 sk->sk_write_pending--;
147
148 if (vm_wait) {
149 vm_wait -= current_timeo;
150 current_timeo = *timeo_p;
151 if (current_timeo != MAX_SCHEDULE_TIMEOUT &&
152 (current_timeo -= vm_wait) < 0)
153 current_timeo = 0;
154 vm_wait = 0;
155 }
156 *timeo_p = current_timeo;
157 }
158out:
159 finish_wait(sk->sk_sleep, &wait);
160 return err;
161
162do_error:
163 err = -EPIPE;
164 goto out;
165do_nonblock:
166 err = -EAGAIN;
167 goto out;
168do_interrupted:
169 err = sock_intr_errno(*timeo_p);
170 goto out;
171}
172
173EXPORT_SYMBOL(sk_stream_wait_memory);
174
175void sk_stream_rfree(struct sk_buff *skb)
176{
177 struct sock *sk = skb->sk;
178
David S. Millerdc6de332006-04-20 00:10:50 -0700179 skb_truesize_check(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 atomic_sub(skb->truesize, &sk->sk_rmem_alloc);
181 sk->sk_forward_alloc += skb->truesize;
182}
183
184EXPORT_SYMBOL(sk_stream_rfree);
185
186int sk_stream_error(struct sock *sk, int flags, int err)
187{
188 if (err == -EPIPE)
189 err = sock_error(sk) ? : -EPIPE;
190 if (err == -EPIPE && !(flags & MSG_NOSIGNAL))
191 send_sig(SIGPIPE, current, 0);
192 return err;
193}
194
195EXPORT_SYMBOL(sk_stream_error);
196
197void __sk_stream_mem_reclaim(struct sock *sk)
198{
Ian McDonalda6f157a2006-07-12 17:58:53 -0700199 atomic_sub(sk->sk_forward_alloc / SK_STREAM_MEM_QUANTUM,
200 sk->sk_prot->memory_allocated);
201 sk->sk_forward_alloc &= SK_STREAM_MEM_QUANTUM - 1;
202 if (*sk->sk_prot->memory_pressure &&
203 (atomic_read(sk->sk_prot->memory_allocated) <
204 sk->sk_prot->sysctl_mem[0]))
205 *sk->sk_prot->memory_pressure = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206}
207
208EXPORT_SYMBOL(__sk_stream_mem_reclaim);
209
210int sk_stream_mem_schedule(struct sock *sk, int size, int kind)
211{
212 int amt = sk_stream_pages(size);
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800213 struct proto *prot = sk->sk_prot;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214
215 sk->sk_forward_alloc += amt * SK_STREAM_MEM_QUANTUM;
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800216 atomic_add(amt, prot->memory_allocated);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217
218 /* Under limit. */
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800219 if (atomic_read(prot->memory_allocated) < prot->sysctl_mem[0]) {
220 if (*prot->memory_pressure)
221 *prot->memory_pressure = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222 return 1;
223 }
224
225 /* Over hard limit. */
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800226 if (atomic_read(prot->memory_allocated) > prot->sysctl_mem[2]) {
227 prot->enter_memory_pressure();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228 goto suppress_allocation;
229 }
230
231 /* Under pressure. */
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800232 if (atomic_read(prot->memory_allocated) > prot->sysctl_mem[1])
233 prot->enter_memory_pressure();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234
235 if (kind) {
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800236 if (atomic_read(&sk->sk_rmem_alloc) < prot->sysctl_rmem[0])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700237 return 1;
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800238 } else if (sk->sk_wmem_queued < prot->sysctl_wmem[0])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239 return 1;
240
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800241 if (!*prot->memory_pressure ||
242 prot->sysctl_mem[2] > atomic_read(prot->sockets_allocated) *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700243 sk_stream_pages(sk->sk_wmem_queued +
244 atomic_read(&sk->sk_rmem_alloc) +
245 sk->sk_forward_alloc))
246 return 1;
247
248suppress_allocation:
249
250 if (!kind) {
251 sk_stream_moderate_sndbuf(sk);
252
253 /* Fail only if socket is _under_ its sndbuf.
254 * In this case we cannot block, so that we have to fail.
255 */
256 if (sk->sk_wmem_queued + size >= sk->sk_sndbuf)
257 return 1;
258 }
259
260 /* Alas. Undo changes. */
261 sk->sk_forward_alloc -= amt * SK_STREAM_MEM_QUANTUM;
Pavel Emelyanov9859a792007-11-19 23:20:59 -0800262 atomic_sub(amt, prot->memory_allocated);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263 return 0;
264}
265
266EXPORT_SYMBOL(sk_stream_mem_schedule);
267
268void sk_stream_kill_queues(struct sock *sk)
269{
270 /* First the read buffer. */
271 __skb_queue_purge(&sk->sk_receive_queue);
272
273 /* Next, the error queue. */
274 __skb_queue_purge(&sk->sk_error_queue);
275
276 /* Next, the write queue. */
277 BUG_TRAP(skb_queue_empty(&sk->sk_write_queue));
278
279 /* Account for returned memory. */
280 sk_stream_mem_reclaim(sk);
281
282 BUG_TRAP(!sk->sk_wmem_queued);
283 BUG_TRAP(!sk->sk_forward_alloc);
284
285 /* It is _impossible_ for the backlog to contain anything
286 * when we get here. All user references to this socket
287 * have gone away, only the net layer knows can touch it.
288 */
289}
290
291EXPORT_SYMBOL(sk_stream_kill_queues);