blob: fd4f8243cc35fed0442fb4b4c85b7049ee88c64f [file] [log] [blame]
Thomas Gleixner47505b82019-05-23 11:14:41 +02001// SPDX-License-Identifier: GPL-2.0-or-later
Vlad Yasevich60c778b2008-01-11 09:57:09 -05002/* SCTP kernel implementation
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 * (C) Copyright IBM Corp. 2003, 2004
4 *
Vlad Yasevich60c778b2008-01-11 09:57:09 -05005 * This file is part of the SCTP kernel implementation
Linus Torvalds1da177e2005-04-16 15:20:36 -07006 *
 * This file contains the code relating to the chunk abstraction.
Linus Torvalds1da177e2005-04-16 15:20:36 -07008 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07009 * Please send any bug reports or fixes you make to the
10 * email address(es):
Daniel Borkmann91705c62013-07-23 14:51:47 +020011 * lksctp developers <linux-sctp@vger.kernel.org>
Linus Torvalds1da177e2005-04-16 15:20:36 -070012 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070013 * Written or modified by:
14 * Jon Grimm <jgrimm@us.ibm.com>
15 * Sridhar Samudrala <sri@us.ibm.com>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016 */
17
Joe Perches145ce502010-08-24 13:21:08 +000018#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/types.h>
21#include <linux/kernel.h>
22#include <linux/net.h>
23#include <linux/inet.h>
24#include <linux/skbuff.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090025#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026#include <net/sock.h>
27#include <net/sctp/sctp.h>
28#include <net/sctp/sm.h>
29
/* This file is mostly in anticipation of future work, but is initially
 * populated with fragment tracking for an outbound message.
 */
33
34/* Initialize datamsg from memory. */
35static void sctp_datamsg_init(struct sctp_datamsg *msg)
36{
Reshetova, Elenac0acdfb2017-07-04 15:53:25 +030037 refcount_set(&msg->refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -070038 msg->send_failed = 0;
39 msg->send_error = 0;
Vlad Yasevich0e3aef82010-04-30 22:41:10 -040040 msg->can_delay = 1;
Xin Longe5f61292017-11-25 21:18:35 +080041 msg->abandoned = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070042 msg->expires_at = 0;
43 INIT_LIST_HEAD(&msg->chunks);
44}
45
46/* Allocate and initialize datamsg. */
Daniel Borkmanndda91922013-06-17 11:40:05 +020047static struct sctp_datamsg *sctp_datamsg_new(gfp_t gfp)
Linus Torvalds1da177e2005-04-16 15:20:36 -070048{
49 struct sctp_datamsg *msg;
50 msg = kmalloc(sizeof(struct sctp_datamsg), gfp);
Li Zefane8c38752008-04-10 01:57:24 -070051 if (msg) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070052 sctp_datamsg_init(msg);
Li Zefane8c38752008-04-10 01:57:24 -070053 SCTP_DBG_OBJCNT_INC(datamsg);
54 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070055 return msg;
56}
57
Xin Longb61c6542016-09-14 02:04:20 +080058void sctp_datamsg_free(struct sctp_datamsg *msg)
59{
60 struct sctp_chunk *chunk;
61
62 /* This doesn't have to be a _safe vairant because
63 * sctp_chunk_free() only drops the refs.
64 */
65 list_for_each_entry(chunk, &msg->chunks, frag_list)
66 sctp_chunk_free(chunk);
67
68 sctp_datamsg_put(msg);
69}
70
Linus Torvalds1da177e2005-04-16 15:20:36 -070071/* Final destructruction of datamsg memory. */
72static void sctp_datamsg_destroy(struct sctp_datamsg *msg)
73{
Xin Longa1e3a052018-11-18 16:08:52 +080074 struct sctp_association *asoc = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -070075 struct list_head *pos, *temp;
76 struct sctp_chunk *chunk;
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 struct sctp_ulpevent *ev;
Xin Longb6e6b5f2019-10-08 19:27:36 +080078 int error, sent;
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
80 /* Release all references. */
81 list_for_each_safe(pos, temp, &msg->chunks) {
82 list_del_init(pos);
83 chunk = list_entry(pos, struct sctp_chunk, frag_list);
Linus Torvalds1da177e2005-04-16 15:20:36 -070084
Xin Longb6e6b5f2019-10-08 19:27:36 +080085 if (!msg->send_failed) {
86 sctp_chunk_put(chunk);
87 continue;
Linus Torvalds1da177e2005-04-16 15:20:36 -070088 }
89
Xin Longb6e6b5f2019-10-08 19:27:36 +080090 asoc = chunk->asoc;
91 error = msg->send_error ?: asoc->outqueue.error;
92 sent = chunk->has_tsn ? SCTP_DATA_SENT : SCTP_DATA_UNSENT;
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
Xin Longb6e6b5f2019-10-08 19:27:36 +080094 if (sctp_ulpevent_type_enabled(asoc->subscribe,
95 SCTP_SEND_FAILED)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070096 ev = sctp_ulpevent_make_send_failed(asoc, chunk, sent,
97 error, GFP_ATOMIC);
98 if (ev)
Xin Long9162e0e2017-12-08 21:04:05 +080099 asoc->stream.si->enqueue_event(&asoc->ulpq, ev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100 }
101
Xin Longb6e6b5f2019-10-08 19:27:36 +0800102 if (sctp_ulpevent_type_enabled(asoc->subscribe,
103 SCTP_SEND_FAILED_EVENT)) {
104 ev = sctp_ulpevent_make_send_failed_event(asoc, chunk,
105 sent, error,
106 GFP_ATOMIC);
107 if (ev)
108 asoc->stream.si->enqueue_event(&asoc->ulpq, ev);
109 }
110
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111 sctp_chunk_put(chunk);
112 }
113
114 SCTP_DBG_OBJCNT_DEC(datamsg);
115 kfree(msg);
116}
117
118/* Hold a reference. */
119static void sctp_datamsg_hold(struct sctp_datamsg *msg)
120{
Reshetova, Elenac0acdfb2017-07-04 15:53:25 +0300121 refcount_inc(&msg->refcnt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700122}
123
124/* Release a reference. */
125void sctp_datamsg_put(struct sctp_datamsg *msg)
126{
Reshetova, Elenac0acdfb2017-07-04 15:53:25 +0300127 if (refcount_dec_and_test(&msg->refcnt))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128 sctp_datamsg_destroy(msg);
129}
130
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131/* Assign a chunk to this datamsg. */
132static void sctp_datamsg_assign(struct sctp_datamsg *msg, struct sctp_chunk *chunk)
133{
134 sctp_datamsg_hold(msg);
135 chunk->msg = msg;
136}
137
138
139/* A data chunk can have a maximum payload of (2^16 - 20). Break
140 * down any such message into smaller chunks. Opportunistically, fragment
141 * the chunks down to the current MTU constraints. We may get refragmented
142 * later if the PMTU changes, but it is _much better_ to fragment immediately
143 * with a reasonable guess than always doing our fragmentation on the
144 * soft-interrupt.
145 */
146struct sctp_datamsg *sctp_datamsg_from_user(struct sctp_association *asoc,
147 struct sctp_sndrcvinfo *sinfo,
Al Viroe0eb0932014-11-15 01:11:23 -0500148 struct iov_iter *from)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700149{
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200150 size_t len, first_len, max_data, remaining;
151 size_t msg_len = iov_iter_count(from);
Xin Long1b1e0bc2018-03-14 19:05:30 +0800152 struct sctp_shared_key *shkey = NULL;
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200153 struct list_head *pos, *temp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154 struct sctp_chunk *chunk;
155 struct sctp_datamsg *msg;
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200156 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157
158 msg = sctp_datamsg_new(GFP_KERNEL);
159 if (!msg)
Tommi Rantala6e51fe72012-11-22 03:23:16 +0000160 return ERR_PTR(-ENOMEM);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161
162 /* Note: Calculate this outside of the loop, so that all fragments
163 * have the same expiration.
164 */
Xin Long8ae808e2016-10-08 11:40:16 +0800165 if (asoc->peer.prsctp_capable && sinfo->sinfo_timetolive &&
166 (SCTP_PR_TTL_ENABLED(sinfo->sinfo_flags) ||
167 !SCTP_PR_POLICY(sinfo->sinfo_flags)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168 msg->expires_at = jiffies +
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200169 msecs_to_jiffies(sinfo->sinfo_timetolive);
Xin Long06054832016-09-29 02:37:27 +0800170
Vlad Yasevich3e62abf2009-09-04 18:20:56 -0400171 /* This is the biggest possible DATA chunk that can fit into
172 * the packet
173 */
Marcelo Ricardo Leitner2f5e3c92018-04-26 16:58:55 -0300174 max_data = asoc->frag_point;
Jakub Audykowiczafd0a802018-12-04 20:27:41 +0100175 if (unlikely(!max_data)) {
176 max_data = sctp_min_frag_point(sctp_sk(asoc->base.sk),
177 sctp_datachk_len(&asoc->stream));
Matthias Maennichac510502019-02-28 11:36:52 +0000178 pr_warn_ratelimited("%s: asoc:%p frag_point is zero, forcing max_data to default minimum (%zu)",
Jakub Audykowiczafd0a802018-12-04 20:27:41 +0100179 __func__, asoc, max_data);
180 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181
Randy Dunlap99325642020-08-22 16:15:58 -0700182 /* If the peer requested that we authenticate DATA chunks
wangweidong2bccbad2013-10-26 16:06:30 +0800183 * we need to account for bundling of the AUTH chunks along with
Vlad Yasevich4cd57c82007-09-16 19:32:45 -0700184 * DATA.
185 */
186 if (sctp_auth_send_cid(SCTP_CID_DATA, asoc)) {
187 struct sctp_hmac *hmac_desc = sctp_auth_asoc_get_hmac(asoc);
188
189 if (hmac_desc)
Xin Longbb96dec2017-08-03 15:42:22 +0800190 max_data -= SCTP_PAD4(sizeof(struct sctp_auth_chunk) +
Marcelo Ricardo Leitnere2f036a2016-09-21 08:45:55 -0300191 hmac_desc->hmac_len);
Xin Long1b1e0bc2018-03-14 19:05:30 +0800192
Xin Long3ff547c2018-03-14 19:05:31 +0800193 if (sinfo->sinfo_tsn &&
194 sinfo->sinfo_ssn != asoc->active_key_id) {
195 shkey = sctp_auth_get_shkey(asoc, sinfo->sinfo_ssn);
196 if (!shkey) {
197 err = -EINVAL;
198 goto errout;
199 }
200 } else {
201 shkey = asoc->shkey;
202 }
Vlad Yasevich4cd57c82007-09-16 19:32:45 -0700203 }
204
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200205 /* Set first_len and then account for possible bundles on first frag */
206 first_len = max_data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207
Vlad Yasevich5d7ff262009-08-07 13:23:28 -0400208 /* Check to see if we have a pending SACK and try to let it be bundled
209 * with this message. Do this if we don't have any data queued already.
210 * To check that, look at out_qlen and retransmit list.
211 * NOTE: we will not reduce to account for SACK, if the message would
212 * not have been fragmented.
213 */
214 if (timer_pending(&asoc->timers[SCTP_EVENT_TIMEOUT_SACK]) &&
215 asoc->outqueue.out_qlen == 0 &&
216 list_empty(&asoc->outqueue.retransmit) &&
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200217 msg_len > max_data)
Xin Longd4d6c612017-07-23 09:34:33 +0800218 first_len -= SCTP_PAD4(sizeof(struct sctp_sack_chunk));
Vlad Yasevich5d7ff262009-08-07 13:23:28 -0400219
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 /* Encourage Cookie-ECHO bundling. */
Vlad Yasevich5d7ff262009-08-07 13:23:28 -0400221 if (asoc->state < SCTP_STATE_COOKIE_ECHOED)
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200222 first_len -= SCTP_ARBITRARY_COOKIE_ECHO_LEN;
Vlad Yasevich3e62abf2009-09-04 18:20:56 -0400223
224 /* Account for a different sized first fragment */
225 if (msg_len >= first_len) {
Vlad Yasevich0e3aef82010-04-30 22:41:10 -0400226 msg->can_delay = 0;
Marcelo Ricardo Leitnerfedb1bd32018-06-20 12:47:52 -0300227 if (msg_len > first_len)
Xin Long4e7696d2019-12-09 13:45:18 +0800228 SCTP_INC_STATS(asoc->base.net,
Marcelo Ricardo Leitnerfedb1bd32018-06-20 12:47:52 -0300229 SCTP_MIB_FRAGUSRMSGS);
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200230 } else {
231 /* Which may be the only one... */
232 first_len = msg_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233 }
234
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200235 /* Create chunks for all DATA chunks. */
236 for (remaining = msg_len; remaining; remaining -= len) {
237 u8 frag = SCTP_DATA_MIDDLE_FRAG;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200239 if (remaining == msg_len) {
240 /* First frag, which may also be the last */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241 frag |= SCTP_DATA_FIRST_FRAG;
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200242 len = first_len;
243 } else {
244 /* Middle frags */
245 len = max_data;
246 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200248 if (len >= remaining) {
249 /* Last frag, which may also be the first */
250 len = remaining;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251 frag |= SCTP_DATA_LAST_FRAG;
252
Wei Yongjunb93d6472009-11-23 15:53:56 -0500253 /* The application requests to set the I-bit of the
254 * last DATA chunk of a user message when providing
255 * the user message to the SCTP implementation.
256 */
257 if ((sinfo->sinfo_flags & SCTP_EOF) ||
258 (sinfo->sinfo_flags & SCTP_SACK_IMMEDIATELY))
259 frag |= SCTP_DATA_SACK_IMM;
260 }
261
Xin Long0c3f6f62017-12-08 21:04:01 +0800262 chunk = asoc->stream.si->make_datafrag(asoc, sinfo, len, frag,
263 GFP_KERNEL);
Tommi Rantala6e51fe72012-11-22 03:23:16 +0000264 if (!chunk) {
265 err = -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 goto errout;
Tommi Rantala6e51fe72012-11-22 03:23:16 +0000267 }
268
Al Viroe0eb0932014-11-15 01:11:23 -0500269 err = sctp_user_addto_chunk(chunk, len, from);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700270 if (err < 0)
Tommi Rantalabe364c82012-11-27 04:01:46 +0000271 goto errout_chunk_free;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272
Xin Long1b1e0bc2018-03-14 19:05:30 +0800273 chunk->shkey = shkey;
274
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275 /* Put the chunk->skb back into the form expected by send. */
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200276 __skb_pull(chunk->skb, (__u8 *)chunk->chunk_hdr -
277 chunk->skb->data);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278
279 sctp_datamsg_assign(msg, chunk);
280 list_add_tail(&chunk->frag_list, &msg->chunks);
281 }
282
283 return msg;
284
Tommi Rantalabe364c82012-11-27 04:01:46 +0000285errout_chunk_free:
286 sctp_chunk_free(chunk);
287
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288errout:
289 list_for_each_safe(pos, temp, &msg->chunks) {
290 list_del_init(pos);
291 chunk = list_entry(pos, struct sctp_chunk, frag_list);
292 sctp_chunk_free(chunk);
293 }
Florian Westphal80445cf2008-03-23 22:47:08 -0700294 sctp_datamsg_put(msg);
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200295
Tommi Rantala6e51fe72012-11-22 03:23:16 +0000296 return ERR_PTR(err);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297}
298
299/* Check whether this message has expired. */
300int sctp_chunk_abandoned(struct sctp_chunk *chunk)
301{
Xin Long8ae808e2016-10-08 11:40:16 +0800302 if (!chunk->asoc->peer.prsctp_capable)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303 return 0;
304
Xin Longe5f61292017-11-25 21:18:35 +0800305 if (chunk->msg->abandoned)
306 return 1;
307
Xin Long779edd72017-11-25 21:18:36 +0800308 if (!chunk->has_tsn &&
309 !(chunk->chunk_hdr->flags & SCTP_DATA_FIRST_FRAG))
310 return 0;
311
Xin Longa6c2f792016-07-09 19:47:43 +0800312 if (SCTP_PR_TTL_ENABLED(chunk->sinfo.sinfo_flags) &&
Xin Long06054832016-09-29 02:37:27 +0800313 time_after(jiffies, chunk->msg->expires_at)) {
Xin Longd229d482017-04-01 17:07:46 +0800314 struct sctp_stream_out *streamout =
Konstantin Khorenko05364ca2018-08-10 20:11:42 +0300315 SCTP_SO(&chunk->asoc->stream,
316 chunk->sinfo.sinfo_stream);
Xin Longd229d482017-04-01 17:07:46 +0800317
318 if (chunk->sent_count) {
Xin Longa6c2f792016-07-09 19:47:43 +0800319 chunk->asoc->abandoned_sent[SCTP_PR_INDEX(TTL)]++;
Marcelo Ricardo Leitnerf952be72017-10-03 19:20:11 -0300320 streamout->ext->abandoned_sent[SCTP_PR_INDEX(TTL)]++;
Xin Longd229d482017-04-01 17:07:46 +0800321 } else {
Xin Longa6c2f792016-07-09 19:47:43 +0800322 chunk->asoc->abandoned_unsent[SCTP_PR_INDEX(TTL)]++;
Marcelo Ricardo Leitnerf952be72017-10-03 19:20:11 -0300323 streamout->ext->abandoned_unsent[SCTP_PR_INDEX(TTL)]++;
Xin Longd229d482017-04-01 17:07:46 +0800324 }
Xin Longe5f61292017-11-25 21:18:35 +0800325 chunk->msg->abandoned = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700326 return 1;
Xin Long01aadb32016-07-09 19:47:44 +0800327 } else if (SCTP_PR_RTX_ENABLED(chunk->sinfo.sinfo_flags) &&
Xin Long06054832016-09-29 02:37:27 +0800328 chunk->sent_count > chunk->sinfo.sinfo_timetolive) {
Xin Longd229d482017-04-01 17:07:46 +0800329 struct sctp_stream_out *streamout =
Konstantin Khorenko05364ca2018-08-10 20:11:42 +0300330 SCTP_SO(&chunk->asoc->stream,
331 chunk->sinfo.sinfo_stream);
Xin Longd229d482017-04-01 17:07:46 +0800332
Xin Long01aadb32016-07-09 19:47:44 +0800333 chunk->asoc->abandoned_sent[SCTP_PR_INDEX(RTX)]++;
Marcelo Ricardo Leitnerf952be72017-10-03 19:20:11 -0300334 streamout->ext->abandoned_sent[SCTP_PR_INDEX(RTX)]++;
Xin Longe5f61292017-11-25 21:18:35 +0800335 chunk->msg->abandoned = 1;
Xin Long01aadb32016-07-09 19:47:44 +0800336 return 1;
Xin Long8ae808e2016-10-08 11:40:16 +0800337 } else if (!SCTP_PR_POLICY(chunk->sinfo.sinfo_flags) &&
338 chunk->msg->expires_at &&
339 time_after(jiffies, chunk->msg->expires_at)) {
Xin Longe5f61292017-11-25 21:18:35 +0800340 chunk->msg->abandoned = 1;
Xin Long8ae808e2016-10-08 11:40:16 +0800341 return 1;
Xin Longa6c2f792016-07-09 19:47:43 +0800342 }
Xin Long8dbdf1f2016-07-09 19:47:45 +0800343 /* PRIO policy is processed by sendmsg, not here */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
345 return 0;
346}
347
348/* This chunk (and consequently entire message) has failed in its sending. */
349void sctp_chunk_fail(struct sctp_chunk *chunk, int error)
350{
351 chunk->msg->send_failed = 1;
352 chunk->msg->send_error = error;
353}