/* SPDX-License-Identifier: GPL-2.0 */
/* Multipath TCP
 *
 * Copyright (c) 2017 - 2019, Intel Corporation.
 */

#ifndef __MPTCP_PROTOCOL_H
#define __MPTCP_PROTOCOL_H

#include <linux/random.h>
#include <net/tcp.h>
#include <net/inet_connection_sock.h>

/* MPTCP protocol version supported here.
 * NOTE(review): presumably version 1 as specified by RFC 8684 -- confirm.
 */
#define MPTCP_SUPPORTED_VERSION	1

/* MPTCP option bits
 *
 * Each value is a distinct single bit, so they can be OR-ed into one mask.
 * NOTE(review): names suggest one bit per MP_CAPABLE handshake packet
 * (SYN, SYN/ACK, ACK) -- confirm against the users of these bits.
 */
#define OPTION_MPTCP_MPC_SYN	BIT(0)
#define OPTION_MPTCP_MPC_SYNACK	BIT(1)
#define OPTION_MPTCP_MPC_ACK	BIT(2)

/* MPTCP option subtypes
 *
 * Consecutive values 0..7.
 * NOTE(review): these look like the on-the-wire subtype numbers from
 * RFC 8684 -- confirm before renumbering anything.
 */
#define MPTCPOPT_MP_CAPABLE	0
#define MPTCPOPT_MP_JOIN	1
#define MPTCPOPT_DSS		2
#define MPTCPOPT_ADD_ADDR	3
#define MPTCPOPT_RM_ADDR	4
#define MPTCPOPT_MP_PRIO	5
#define MPTCPOPT_MP_FAIL	6
#define MPTCPOPT_MP_FASTCLOSE	7

/* MPTCP suboption lengths
 *
 * NOTE(review): presumably byte counts of the corresponding option (or
 * option component) on the wire -- confirm against RFC 8684.
 */
#define TCPOLEN_MPTCP_MPC_SYN		4
#define TCPOLEN_MPTCP_MPC_SYNACK	12
#define TCPOLEN_MPTCP_MPC_ACK		20
#define TCPOLEN_MPTCP_MPC_ACK_DATA	22
#define TCPOLEN_MPTCP_DSS_BASE		4
#define TCPOLEN_MPTCP_DSS_ACK32		4
#define TCPOLEN_MPTCP_DSS_ACK64		8
#define TCPOLEN_MPTCP_DSS_MAP32		10
#define TCPOLEN_MPTCP_DSS_MAP64		14
#define TCPOLEN_MPTCP_DSS_CHECKSUM	2

/* MPTCP MP_CAPABLE flags
 *
 * MPTCP_VERSION_MASK selects the low four bits. MPTCP_CAP_FLAG_MASK selects
 * the low six bits, so it covers MPTCP_CAP_HMAC_SHA256 (bit 0) but not
 * MPTCP_CAP_EXTENSIBILITY (bit 6) or MPTCP_CAP_CHECKSUM_REQD (bit 7).
 */
#define MPTCP_VERSION_MASK	(0x0F)
#define MPTCP_CAP_CHECKSUM_REQD	BIT(7)
#define MPTCP_CAP_EXTENSIBILITY	BIT(6)
#define MPTCP_CAP_HMAC_SHA256	BIT(0)
#define MPTCP_CAP_FLAG_MASK	(0x3F)

/* MPTCP DSS flags
 *
 * Five single-bit flags occupying bits 0..4; MPTCP_DSS_FLAG_MASK (0x1F)
 * covers exactly those five bits.
 */
#define MPTCP_DSS_DATA_FIN	BIT(4)
#define MPTCP_DSS_DSN64		BIT(3)
#define MPTCP_DSS_HAS_MAP	BIT(2)
#define MPTCP_DSS_ACK64		BIT(1)
#define MPTCP_DSS_HAS_ACK	BIT(0)
#define MPTCP_DSS_FLAG_MASK	(0x1F)

/* MPTCP socket flags
 *
 * NOTE(review): presumably stored in mptcp_sock::flags -- confirm against
 * the users of these bits.
 */
#define MPTCP_DATA_READY	BIT(0)
#define MPTCP_SEND_SPACE	BIT(1)

Mat Martineauf870fa02020-01-21 16:56:15 -080062/* MPTCP connection sock */
63struct mptcp_sock {
64 /* inet_connection_sock must be the first member */
65 struct inet_connection_sock sk;
Peter Krystadcec37a62020-01-21 16:56:18 -080066 u64 local_key;
67 u64 remote_key;
Mat Martineau6d0060f2020-01-21 16:56:23 -080068 u64 write_seq;
69 u64 ack_seq;
Peter Krystad79c09492020-01-21 16:56:20 -080070 u32 token;
Mat Martineau648ef4b2020-01-21 16:56:24 -080071 unsigned long flags;
Christoph Paaschd22f4982020-01-21 16:56:32 -080072 bool can_ack;
Peter Krystadcec37a62020-01-21 16:56:18 -080073 struct list_head conn_list;
Mat Martineau6d0060f2020-01-21 16:56:23 -080074 struct skb_ext *cached_ext; /* for the next sendmsg */
Mat Martineauf870fa02020-01-21 16:56:15 -080075 struct socket *subflow; /* outgoing connect/listener/!mp_capable */
Paolo Abeni8ab183d2020-01-21 16:56:33 -080076 struct sock *first;
Mat Martineauf870fa02020-01-21 16:56:15 -080077};
78
/* Walk @__msk->conn_list with list_for_each_entry(), using @__subflow as the
 * cursor. Entries are linked through their 'node' member.
 */
#define mptcp_for_each_subflow(__msk, __subflow)			\
	list_for_each_entry(__subflow, &((__msk)->conn_list), node)

/* Reinterpret @sk as a struct mptcp_sock.
 *
 * This is an unchecked pointer cast that also drops the const qualifier:
 * the caller is responsible for passing a sock that really is the leading
 * member of a struct mptcp_sock.
 */
static inline struct mptcp_sock *mptcp_sk(const struct sock *sk)
{
	return (struct mptcp_sock *)sk;
}

Peter Krystadcec37a62020-01-21 16:56:18 -080087struct mptcp_subflow_request_sock {
88 struct tcp_request_sock sk;
Christoph Paaschd22f4982020-01-21 16:56:32 -080089 u16 mp_capable : 1,
Peter Krystadcec37a62020-01-21 16:56:18 -080090 mp_join : 1,
Christoph Paaschd22f4982020-01-21 16:56:32 -080091 backup : 1,
92 remote_key_valid : 1;
Peter Krystadcec37a62020-01-21 16:56:18 -080093 u64 local_key;
94 u64 remote_key;
Peter Krystad79c09492020-01-21 16:56:20 -080095 u64 idsn;
96 u32 token;
Mat Martineau648ef4b2020-01-21 16:56:24 -080097 u32 ssn_offset;
Peter Krystadcec37a62020-01-21 16:56:18 -080098};
99
/* Reinterpret @rsk as a struct mptcp_subflow_request_sock.
 *
 * Unchecked cast that also drops const; the caller must pass a request sock
 * that is actually embedded at the start of a mptcp_subflow_request_sock.
 */
static inline struct mptcp_subflow_request_sock *
mptcp_subflow_rsk(const struct request_sock *rsk)
{
	return (struct mptcp_subflow_request_sock *)rsk;
}

Peter Krystad2303f992020-01-21 16:56:17 -0800106/* MPTCP subflow context */
107struct mptcp_subflow_context {
Peter Krystadcec37a62020-01-21 16:56:18 -0800108 struct list_head node;/* conn_list of subflows */
109 u64 local_key;
110 u64 remote_key;
Peter Krystad79c09492020-01-21 16:56:20 -0800111 u64 idsn;
Mat Martineau648ef4b2020-01-21 16:56:24 -0800112 u64 map_seq;
Christoph Paaschcc7972e2020-01-21 16:56:31 -0800113 u32 snd_isn;
Peter Krystad79c09492020-01-21 16:56:20 -0800114 u32 token;
Mat Martineau6d0060f2020-01-21 16:56:23 -0800115 u32 rel_write_seq;
Mat Martineau648ef4b2020-01-21 16:56:24 -0800116 u32 map_subflow_seq;
117 u32 ssn_offset;
118 u32 map_data_len;
Peter Krystadcec37a62020-01-21 16:56:18 -0800119 u32 request_mptcp : 1, /* send MP_CAPABLE */
120 mp_capable : 1, /* remote is MPTCP capable */
121 fourth_ack : 1, /* send initial DSS */
Mat Martineau648ef4b2020-01-21 16:56:24 -0800122 conn_finished : 1,
123 map_valid : 1,
Christoph Paaschd22f4982020-01-21 16:56:32 -0800124 mpc_map : 1,
Mat Martineau648ef4b2020-01-21 16:56:24 -0800125 data_avail : 1,
Christoph Paaschd22f4982020-01-21 16:56:32 -0800126 rx_eof : 1,
127 can_ack : 1; /* only after processing the remote a key */
Mat Martineau648ef4b2020-01-21 16:56:24 -0800128
Peter Krystad2303f992020-01-21 16:56:17 -0800129 struct sock *tcp_sock; /* tcp sk backpointer */
130 struct sock *conn; /* parent mptcp_sock */
Peter Krystadcec37a62020-01-21 16:56:18 -0800131 const struct inet_connection_sock_af_ops *icsk_af_ops;
Mat Martineau648ef4b2020-01-21 16:56:24 -0800132 void (*tcp_data_ready)(struct sock *sk);
133 void (*tcp_state_change)(struct sock *sk);
134 void (*tcp_write_space)(struct sock *sk);
135
Peter Krystad2303f992020-01-21 16:56:17 -0800136 struct rcu_head rcu;
137};
138
139static inline struct mptcp_subflow_context *
140mptcp_subflow_ctx(const struct sock *sk)
141{
142 struct inet_connection_sock *icsk = inet_csk(sk);
143
144 /* Use RCU on icsk_ulp_data only for sock diag code */
145 return (__force struct mptcp_subflow_context *)icsk->icsk_ulp_data;
146}
147
148static inline struct sock *
149mptcp_subflow_tcp_sock(const struct mptcp_subflow_context *subflow)
150{
151 return subflow->tcp_sock;
152}
153
Mat Martineau648ef4b2020-01-21 16:56:24 -0800154static inline u64
155mptcp_subflow_get_map_offset(const struct mptcp_subflow_context *subflow)
156{
157 return tcp_sk(mptcp_subflow_tcp_sock(subflow))->copied_seq -
158 subflow->ssn_offset -
159 subflow->map_subflow_seq;
160}
161
162static inline u64
163mptcp_subflow_get_mapped_dsn(const struct mptcp_subflow_context *subflow)
164{
165 return subflow->map_seq + mptcp_subflow_get_map_offset(subflow);
166}
167
168int mptcp_is_enabled(struct net *net);
169bool mptcp_subflow_data_available(struct sock *sk);
Peter Krystad2303f992020-01-21 16:56:17 -0800170void mptcp_subflow_init(void);
171int mptcp_subflow_create_socket(struct sock *sk, struct socket **new_sock);
172
Mat Martineau648ef4b2020-01-21 16:56:24 -0800173static inline void mptcp_subflow_tcp_fallback(struct sock *sk,
174 struct mptcp_subflow_context *ctx)
175{
176 sk->sk_data_ready = ctx->tcp_data_ready;
177 sk->sk_state_change = ctx->tcp_state_change;
178 sk->sk_write_space = ctx->tcp_write_space;
179
180 inet_csk(sk)->icsk_af_ops = ctx->icsk_af_ops;
181}
182
Peter Krystadcec37a62020-01-21 16:56:18 -0800183extern const struct inet_connection_sock_af_ops ipv4_specific;
184#if IS_ENABLED(CONFIG_MPTCP_IPV6)
185extern const struct inet_connection_sock_af_ops ipv6_specific;
186#endif
187
Mat Martineau648ef4b2020-01-21 16:56:24 -0800188void mptcp_proto_init(void);
Matthieu Baerts784325e2020-01-21 16:56:28 -0800189#if IS_ENABLED(CONFIG_MPTCP_IPV6)
190int mptcp_proto_v6_init(void);
191#endif
Mat Martineau648ef4b2020-01-21 16:56:24 -0800192
193struct mptcp_read_arg {
194 struct msghdr *msg;
195};
196
197int mptcp_read_actor(read_descriptor_t *desc, struct sk_buff *skb,
198 unsigned int offset, size_t len);
199
/* Defined outside this header. @skb is const; @opt_rx is not, so it is
 * presumably where results are written -- confirm against the definition.
 */
void mptcp_get_options(const struct sk_buff *skb,
		       struct tcp_options_received *opt_rx);

void mptcp_finish_connect(struct sock *sk);

Peter Krystad79c09492020-01-21 16:56:20 -0800205int mptcp_token_new_request(struct request_sock *req);
206void mptcp_token_destroy_request(u32 token);
207int mptcp_token_new_connect(struct sock *sk);
208int mptcp_token_new_accept(u32 token);
209void mptcp_token_update_accept(struct sock *sk, struct sock *conn);
210void mptcp_token_destroy(u32 token);
211
212void mptcp_crypto_key_sha(u64 key, u32 *token, u64 *idsn);
213static inline void mptcp_crypto_key_gen_sha(u64 *key, u32 *token, u64 *idsn)
214{
215 /* we might consider a faster version that computes the key as a
216 * hash of some information available in the MPTCP socket. Use
217 * random data at the moment, as it's probably the safest option
218 * in case multiple sockets are opened in different namespaces at
219 * the same time.
220 */
221 get_random_bytes(key, sizeof(u64));
222 mptcp_crypto_key_sha(*key, token, idsn);
223}
224
225void mptcp_crypto_hmac_sha(u64 key1, u64 key2, u32 nonce1, u32 nonce2,
Paolo Abeni65492c52020-01-21 16:56:30 -0800226 void *hash_out);
Peter Krystad79c09492020-01-21 16:56:20 -0800227
Mat Martineau6d0060f2020-01-21 16:56:23 -0800228static inline struct mptcp_ext *mptcp_get_ext(struct sk_buff *skb)
229{
230 return (struct mptcp_ext *)skb_ext_find(skb, SKB_EXT_MPTCP);
231}
232
/* Wrap-around aware "seq1 comes before seq2" for 64-bit sequence numbers.
 *
 * The unsigned difference is reinterpreted as signed, so the result is true
 * when seq1 is behind seq2 by less than 2^63, including across a wrap of
 * the 64-bit counter. Equal values are not "before" each other.
 */
static inline bool before64(__u64 seq1, __u64 seq2)
{
	return (__s64)(seq1 - seq2) < 0;
}

/* after64(a, b) is true exactly when before64(b, a) is. */
#define after64(seq2, seq1)	before64(seq1, seq2)

#endif /* __MPTCP_PROTOCOL_H */