blob: 81466f6442e89fe2c0a9ff44d30645627812e54c [file] [log] [blame]
Vlad Yasevich60c778b2008-01-11 09:57:09 -05001/* SCTP kernel implementation
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * (C) Copyright IBM Corp. 2003, 2004
3 *
Vlad Yasevich60c778b2008-01-11 09:57:09 -05004 * This file is part of the SCTP kernel implementation
Linus Torvalds1da177e2005-04-16 15:20:36 -07005 *
Michael Opdenacker59c51592007-05-09 08:57:56 +02006 * This file contains the code relating the chunk abstraction.
Linus Torvalds1da177e2005-04-16 15:20:36 -07007 *
Vlad Yasevich60c778b2008-01-11 09:57:09 -05008 * This SCTP implementation is free software;
Linus Torvalds1da177e2005-04-16 15:20:36 -07009 * you can redistribute it and/or modify it under the terms of
10 * the GNU General Public License as published by
11 * the Free Software Foundation; either version 2, or (at your option)
12 * any later version.
13 *
Vlad Yasevich60c778b2008-01-11 09:57:09 -050014 * This SCTP implementation is distributed in the hope that it
Linus Torvalds1da177e2005-04-16 15:20:36 -070015 * will be useful, but WITHOUT ANY WARRANTY; without even the implied
16 * ************************
17 * warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
18 * See the GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
Jeff Kirsher4b2f13a2013-12-06 06:28:48 -080021 * along with GNU CC; see the file COPYING. If not, see
22 * <http://www.gnu.org/licenses/>.
Linus Torvalds1da177e2005-04-16 15:20:36 -070023 *
24 * Please send any bug reports or fixes you make to the
25 * email address(es):
Daniel Borkmann91705c62013-07-23 14:51:47 +020026 * lksctp developers <linux-sctp@vger.kernel.org>
Linus Torvalds1da177e2005-04-16 15:20:36 -070027 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070028 * Written or modified by:
29 * Jon Grimm <jgrimm@us.ibm.com>
30 * Sridhar Samudrala <sri@us.ibm.com>
Linus Torvalds1da177e2005-04-16 15:20:36 -070031 */
32
Joe Perches145ce502010-08-24 13:21:08 +000033#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
34
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/types.h>
36#include <linux/kernel.h>
37#include <linux/net.h>
38#include <linux/inet.h>
39#include <linux/skbuff.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090040#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041#include <net/sock.h>
42#include <net/sctp/sctp.h>
43#include <net/sctp/sm.h>
44
/* This file is mostly in anticipation of future work, but is initially
 * populated with fragment tracking for an outbound message.
 */
48
49/* Initialize datamsg from memory. */
50static void sctp_datamsg_init(struct sctp_datamsg *msg)
51{
52 atomic_set(&msg->refcnt, 1);
53 msg->send_failed = 0;
54 msg->send_error = 0;
Vlad Yasevich0e3aef82010-04-30 22:41:10 -040055 msg->can_delay = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -070056 msg->expires_at = 0;
57 INIT_LIST_HEAD(&msg->chunks);
58}
59
60/* Allocate and initialize datamsg. */
Daniel Borkmanndda91922013-06-17 11:40:05 +020061static struct sctp_datamsg *sctp_datamsg_new(gfp_t gfp)
Linus Torvalds1da177e2005-04-16 15:20:36 -070062{
63 struct sctp_datamsg *msg;
64 msg = kmalloc(sizeof(struct sctp_datamsg), gfp);
Li Zefane8c38752008-04-10 01:57:24 -070065 if (msg) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070066 sctp_datamsg_init(msg);
Li Zefane8c38752008-04-10 01:57:24 -070067 SCTP_DBG_OBJCNT_INC(datamsg);
68 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070069 return msg;
70}
71
Xin Longb61c6542016-09-14 02:04:20 +080072void sctp_datamsg_free(struct sctp_datamsg *msg)
73{
74 struct sctp_chunk *chunk;
75
76 /* This doesn't have to be a _safe vairant because
77 * sctp_chunk_free() only drops the refs.
78 */
79 list_for_each_entry(chunk, &msg->chunks, frag_list)
80 sctp_chunk_free(chunk);
81
82 sctp_datamsg_put(msg);
83}
84
Linus Torvalds1da177e2005-04-16 15:20:36 -070085/* Final destructruction of datamsg memory. */
86static void sctp_datamsg_destroy(struct sctp_datamsg *msg)
87{
88 struct list_head *pos, *temp;
89 struct sctp_chunk *chunk;
90 struct sctp_sock *sp;
91 struct sctp_ulpevent *ev;
92 struct sctp_association *asoc = NULL;
93 int error = 0, notify;
94
95 /* If we failed, we may need to notify. */
96 notify = msg->send_failed ? -1 : 0;
97
98 /* Release all references. */
99 list_for_each_safe(pos, temp, &msg->chunks) {
100 list_del_init(pos);
101 chunk = list_entry(pos, struct sctp_chunk, frag_list);
102 /* Check whether we _really_ need to notify. */
103 if (notify < 0) {
104 asoc = chunk->asoc;
105 if (msg->send_error)
106 error = msg->send_error;
107 else
108 error = asoc->outqueue.error;
109
110 sp = sctp_sk(asoc->base.sk);
111 notify = sctp_ulpevent_type_enabled(SCTP_SEND_FAILED,
112 &sp->subscribe);
113 }
114
115 /* Generate a SEND FAILED event only if enabled. */
116 if (notify > 0) {
117 int sent;
118 if (chunk->has_tsn)
119 sent = SCTP_DATA_SENT;
120 else
121 sent = SCTP_DATA_UNSENT;
122
123 ev = sctp_ulpevent_make_send_failed(asoc, chunk, sent,
124 error, GFP_ATOMIC);
125 if (ev)
126 sctp_ulpq_tail_event(&asoc->ulpq, ev);
127 }
128
129 sctp_chunk_put(chunk);
130 }
131
132 SCTP_DBG_OBJCNT_DEC(datamsg);
133 kfree(msg);
134}
135
136/* Hold a reference. */
137static void sctp_datamsg_hold(struct sctp_datamsg *msg)
138{
139 atomic_inc(&msg->refcnt);
140}
141
142/* Release a reference. */
143void sctp_datamsg_put(struct sctp_datamsg *msg)
144{
145 if (atomic_dec_and_test(&msg->refcnt))
146 sctp_datamsg_destroy(msg);
147}
148
Linus Torvalds1da177e2005-04-16 15:20:36 -0700149/* Assign a chunk to this datamsg. */
150static void sctp_datamsg_assign(struct sctp_datamsg *msg, struct sctp_chunk *chunk)
151{
152 sctp_datamsg_hold(msg);
153 chunk->msg = msg;
154}
155
156
157/* A data chunk can have a maximum payload of (2^16 - 20). Break
158 * down any such message into smaller chunks. Opportunistically, fragment
159 * the chunks down to the current MTU constraints. We may get refragmented
160 * later if the PMTU changes, but it is _much better_ to fragment immediately
161 * with a reasonable guess than always doing our fragmentation on the
162 * soft-interrupt.
163 */
164struct sctp_datamsg *sctp_datamsg_from_user(struct sctp_association *asoc,
165 struct sctp_sndrcvinfo *sinfo,
Al Viroe0eb0932014-11-15 01:11:23 -0500166 struct iov_iter *from)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167{
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200168 size_t len, first_len, max_data, remaining;
169 size_t msg_len = iov_iter_count(from);
170 struct list_head *pos, *temp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171 struct sctp_chunk *chunk;
172 struct sctp_datamsg *msg;
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200173 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174
175 msg = sctp_datamsg_new(GFP_KERNEL);
176 if (!msg)
Tommi Rantala6e51fe72012-11-22 03:23:16 +0000177 return ERR_PTR(-ENOMEM);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178
179 /* Note: Calculate this outside of the loop, so that all fragments
180 * have the same expiration.
181 */
Xin Long8ae808e2016-10-08 11:40:16 +0800182 if (asoc->peer.prsctp_capable && sinfo->sinfo_timetolive &&
183 (SCTP_PR_TTL_ENABLED(sinfo->sinfo_flags) ||
184 !SCTP_PR_POLICY(sinfo->sinfo_flags)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700185 msg->expires_at = jiffies +
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200186 msecs_to_jiffies(sinfo->sinfo_timetolive);
Xin Long06054832016-09-29 02:37:27 +0800187
Vlad Yasevich3e62abf2009-09-04 18:20:56 -0400188 /* This is the biggest possible DATA chunk that can fit into
189 * the packet
190 */
Marcelo Ricardo Leitner4a225ce2016-09-21 08:45:56 -0300191 max_data = asoc->pathmtu -
192 sctp_sk(asoc->base.sk)->pf->af->net_header_len -
193 sizeof(struct sctphdr) - sizeof(struct sctp_data_chunk);
194 max_data = SCTP_TRUNC4(max_data);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195
Vlad Yasevich4cd57c82007-09-16 19:32:45 -0700196 /* If the the peer requested that we authenticate DATA chunks
wangweidong2bccbad2013-10-26 16:06:30 +0800197 * we need to account for bundling of the AUTH chunks along with
Vlad Yasevich4cd57c82007-09-16 19:32:45 -0700198 * DATA.
199 */
200 if (sctp_auth_send_cid(SCTP_CID_DATA, asoc)) {
201 struct sctp_hmac *hmac_desc = sctp_auth_asoc_get_hmac(asoc);
202
203 if (hmac_desc)
Marcelo Ricardo Leitnere2f036a2016-09-21 08:45:55 -0300204 max_data -= SCTP_PAD4(sizeof(sctp_auth_chunk_t) +
205 hmac_desc->hmac_len);
Vlad Yasevich4cd57c82007-09-16 19:32:45 -0700206 }
207
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200208 /* Check what's our max considering the above */
209 max_data = min_t(size_t, max_data, asoc->frag_point);
Vlad Yasevich3e62abf2009-09-04 18:20:56 -0400210
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200211 /* Set first_len and then account for possible bundles on first frag */
212 first_len = max_data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213
Vlad Yasevich5d7ff262009-08-07 13:23:28 -0400214 /* Check to see if we have a pending SACK and try to let it be bundled
215 * with this message. Do this if we don't have any data queued already.
216 * To check that, look at out_qlen and retransmit list.
217 * NOTE: we will not reduce to account for SACK, if the message would
218 * not have been fragmented.
219 */
220 if (timer_pending(&asoc->timers[SCTP_EVENT_TIMEOUT_SACK]) &&
221 asoc->outqueue.out_qlen == 0 &&
222 list_empty(&asoc->outqueue.retransmit) &&
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200223 msg_len > max_data)
224 first_len -= SCTP_PAD4(sizeof(sctp_sack_chunk_t));
Vlad Yasevich5d7ff262009-08-07 13:23:28 -0400225
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226 /* Encourage Cookie-ECHO bundling. */
Vlad Yasevich5d7ff262009-08-07 13:23:28 -0400227 if (asoc->state < SCTP_STATE_COOKIE_ECHOED)
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200228 first_len -= SCTP_ARBITRARY_COOKIE_ECHO_LEN;
Vlad Yasevich3e62abf2009-09-04 18:20:56 -0400229
230 /* Account for a different sized first fragment */
231 if (msg_len >= first_len) {
Vlad Yasevich0e3aef82010-04-30 22:41:10 -0400232 msg->can_delay = 0;
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200233 SCTP_INC_STATS(sock_net(asoc->base.sk), SCTP_MIB_FRAGUSRMSGS);
234 } else {
235 /* Which may be the only one... */
236 first_len = msg_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700237 }
238
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200239 /* Create chunks for all DATA chunks. */
240 for (remaining = msg_len; remaining; remaining -= len) {
241 u8 frag = SCTP_DATA_MIDDLE_FRAG;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200243 if (remaining == msg_len) {
244 /* First frag, which may also be the last */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 frag |= SCTP_DATA_FIRST_FRAG;
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200246 len = first_len;
247 } else {
248 /* Middle frags */
249 len = max_data;
250 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200252 if (len >= remaining) {
253 /* Last frag, which may also be the first */
254 len = remaining;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 frag |= SCTP_DATA_LAST_FRAG;
256
Wei Yongjunb93d6472009-11-23 15:53:56 -0500257 /* The application requests to set the I-bit of the
258 * last DATA chunk of a user message when providing
259 * the user message to the SCTP implementation.
260 */
261 if ((sinfo->sinfo_flags & SCTP_EOF) ||
262 (sinfo->sinfo_flags & SCTP_SACK_IMMEDIATELY))
263 frag |= SCTP_DATA_SACK_IMM;
264 }
265
Marcelo Ricardo Leitnercea87682016-03-10 18:33:07 -0300266 chunk = sctp_make_datafrag_empty(asoc, sinfo, len, frag,
267 0, GFP_KERNEL);
Tommi Rantala6e51fe72012-11-22 03:23:16 +0000268 if (!chunk) {
269 err = -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700270 goto errout;
Tommi Rantala6e51fe72012-11-22 03:23:16 +0000271 }
272
Al Viroe0eb0932014-11-15 01:11:23 -0500273 err = sctp_user_addto_chunk(chunk, len, from);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274 if (err < 0)
Tommi Rantalabe364c82012-11-27 04:01:46 +0000275 goto errout_chunk_free;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277 /* Put the chunk->skb back into the form expected by send. */
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200278 __skb_pull(chunk->skb, (__u8 *)chunk->chunk_hdr -
279 chunk->skb->data);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280
281 sctp_datamsg_assign(msg, chunk);
282 list_add_tail(&chunk->frag_list, &msg->chunks);
283 }
284
285 return msg;
286
Tommi Rantalabe364c82012-11-27 04:01:46 +0000287errout_chunk_free:
288 sctp_chunk_free(chunk);
289
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290errout:
291 list_for_each_safe(pos, temp, &msg->chunks) {
292 list_del_init(pos);
293 chunk = list_entry(pos, struct sctp_chunk, frag_list);
294 sctp_chunk_free(chunk);
295 }
Florian Westphal80445cf2008-03-23 22:47:08 -0700296 sctp_datamsg_put(msg);
Marcelo Ricardo Leitnerbfd2e4b2016-12-29 15:53:28 -0200297
Tommi Rantala6e51fe72012-11-22 03:23:16 +0000298 return ERR_PTR(err);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299}
300
301/* Check whether this message has expired. */
302int sctp_chunk_abandoned(struct sctp_chunk *chunk)
303{
Xin Long8ae808e2016-10-08 11:40:16 +0800304 if (!chunk->asoc->peer.prsctp_capable)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700305 return 0;
306
Xin Longa6c2f792016-07-09 19:47:43 +0800307 if (SCTP_PR_TTL_ENABLED(chunk->sinfo.sinfo_flags) &&
Xin Long06054832016-09-29 02:37:27 +0800308 time_after(jiffies, chunk->msg->expires_at)) {
Xin Longd229d482017-04-01 17:07:46 +0800309 struct sctp_stream_out *streamout =
Xin Longcee360a2017-05-31 16:36:31 +0800310 &chunk->asoc->stream.out[chunk->sinfo.sinfo_stream];
Xin Longd229d482017-04-01 17:07:46 +0800311
312 if (chunk->sent_count) {
Xin Longa6c2f792016-07-09 19:47:43 +0800313 chunk->asoc->abandoned_sent[SCTP_PR_INDEX(TTL)]++;
Xin Longd229d482017-04-01 17:07:46 +0800314 streamout->abandoned_sent[SCTP_PR_INDEX(TTL)]++;
315 } else {
Xin Longa6c2f792016-07-09 19:47:43 +0800316 chunk->asoc->abandoned_unsent[SCTP_PR_INDEX(TTL)]++;
Xin Longd229d482017-04-01 17:07:46 +0800317 streamout->abandoned_unsent[SCTP_PR_INDEX(TTL)]++;
318 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700319 return 1;
Xin Long01aadb32016-07-09 19:47:44 +0800320 } else if (SCTP_PR_RTX_ENABLED(chunk->sinfo.sinfo_flags) &&
Xin Long06054832016-09-29 02:37:27 +0800321 chunk->sent_count > chunk->sinfo.sinfo_timetolive) {
Xin Longd229d482017-04-01 17:07:46 +0800322 struct sctp_stream_out *streamout =
Xin Longcee360a2017-05-31 16:36:31 +0800323 &chunk->asoc->stream.out[chunk->sinfo.sinfo_stream];
Xin Longd229d482017-04-01 17:07:46 +0800324
Xin Long01aadb32016-07-09 19:47:44 +0800325 chunk->asoc->abandoned_sent[SCTP_PR_INDEX(RTX)]++;
Xin Longd229d482017-04-01 17:07:46 +0800326 streamout->abandoned_sent[SCTP_PR_INDEX(RTX)]++;
Xin Long01aadb32016-07-09 19:47:44 +0800327 return 1;
Xin Long8ae808e2016-10-08 11:40:16 +0800328 } else if (!SCTP_PR_POLICY(chunk->sinfo.sinfo_flags) &&
329 chunk->msg->expires_at &&
330 time_after(jiffies, chunk->msg->expires_at)) {
331 return 1;
Xin Longa6c2f792016-07-09 19:47:43 +0800332 }
Xin Long8dbdf1f2016-07-09 19:47:45 +0800333 /* PRIO policy is processed by sendmsg, not here */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334
335 return 0;
336}
337
338/* This chunk (and consequently entire message) has failed in its sending. */
339void sctp_chunk_fail(struct sctp_chunk *chunk, int error)
340{
341 chunk->msg->send_failed = 1;
342 chunk->msg->send_error = error;
343}