/* SPDX-License-Identifier: GPL-2.0 */
/* Multipath TCP
 *
 * Copyright (c) 2017 - 2019, Intel Corporation.
 */

#ifndef __MPTCP_PROTOCOL_H
#define __MPTCP_PROTOCOL_H

#include <linux/random.h>
#include <net/tcp.h>
#include <net/inet_connection_sock.h>

/* MPTCP version number supported by this code */
#define MPTCP_SUPPORTED_VERSION	1

/* MPTCP option bits: three distinct single-bit flags (bits 0..2), so
 * they can be OR-ed together in one bitmask.
 */
#define OPTION_MPTCP_MPC_SYN	BIT(0)
#define OPTION_MPTCP_MPC_SYNACK	BIT(1)
#define OPTION_MPTCP_MPC_ACK	BIT(2)

/* MPTCP option subtypes (consecutive values 0..7) */
#define MPTCPOPT_MP_CAPABLE	0
#define MPTCPOPT_MP_JOIN	1
#define MPTCPOPT_DSS		2
#define MPTCPOPT_ADD_ADDR	3
#define MPTCPOPT_RM_ADDR	4
#define MPTCPOPT_MP_PRIO	5
#define MPTCPOPT_MP_FAIL	6
#define MPTCPOPT_MP_FASTCLOSE	7

/* MPTCP suboption lengths.
 * NOTE(review): presumably byte counts of the on-wire option parts;
 * confirm against the option parsing/writing code.
 */
#define TCPOLEN_MPTCP_MPC_SYN		4
#define TCPOLEN_MPTCP_MPC_SYNACK	12
#define TCPOLEN_MPTCP_MPC_ACK		20
#define TCPOLEN_MPTCP_MPC_ACK_DATA	22
#define TCPOLEN_MPTCP_DSS_BASE		4
#define TCPOLEN_MPTCP_DSS_ACK32		4
#define TCPOLEN_MPTCP_DSS_ACK64		8
#define TCPOLEN_MPTCP_DSS_MAP32		10
#define TCPOLEN_MPTCP_DSS_MAP64		14
#define TCPOLEN_MPTCP_DSS_CHECKSUM	2

/* MPTCP MP_CAPABLE flags */
#define MPTCP_VERSION_MASK	(0x0F)
#define MPTCP_CAP_CHECKSUM_REQD	BIT(7)
#define MPTCP_CAP_EXTENSIBILITY	BIT(6)
#define MPTCP_CAP_HMAC_SHA256	BIT(0)
/* NOTE(review): 0x3F covers bits 0..5 only, so it does not include
 * MPTCP_CAP_CHECKSUM_REQD (bit 7) or MPTCP_CAP_EXTENSIBILITY (bit 6);
 * confirm this is intended by the users of the mask.
 */
#define MPTCP_CAP_FLAG_MASK	(0x3F)

/* MPTCP DSS flags: five single-bit flags in bits 0..4 */
#define MPTCP_DSS_DATA_FIN	BIT(4)
#define MPTCP_DSS_DSN64		BIT(3)
#define MPTCP_DSS_HAS_MAP	BIT(2)
#define MPTCP_DSS_ACK64		BIT(1)
#define MPTCP_DSS_HAS_ACK	BIT(0)
/* 0x1F == bits 0..4, i.e. exactly the five flags above */
#define MPTCP_DSS_FLAG_MASK	(0x1F)

/* MPTCP socket flags (single-bit values).
 * NOTE(review): presumably stored in mptcp_sock::flags; confirm
 * against the users of these macros.
 */
#define MPTCP_DATA_READY	BIT(0)
#define MPTCP_SEND_SPACE	BIT(1)

Mat Martineauf870fa02020-01-21 16:56:15 -080062/* MPTCP connection sock */
63struct mptcp_sock {
64 /* inet_connection_sock must be the first member */
65 struct inet_connection_sock sk;
Peter Krystadcec37a62020-01-21 16:56:18 -080066 u64 local_key;
67 u64 remote_key;
Mat Martineau6d0060f2020-01-21 16:56:23 -080068 u64 write_seq;
69 u64 ack_seq;
Peter Krystad79c09492020-01-21 16:56:20 -080070 u32 token;
Mat Martineau648ef4b2020-01-21 16:56:24 -080071 unsigned long flags;
Christoph Paaschd22f4982020-01-21 16:56:32 -080072 bool can_ack;
Peter Krystadcec37a62020-01-21 16:56:18 -080073 struct list_head conn_list;
Mat Martineau6d0060f2020-01-21 16:56:23 -080074 struct skb_ext *cached_ext; /* for the next sendmsg */
Mat Martineauf870fa02020-01-21 16:56:15 -080075 struct socket *subflow; /* outgoing connect/listener/!mp_capable */
76};
77
/* Iterate over every entry linked on (__msk)->conn_list, using
 * __subflow as the cursor; entries are chained through their 'node'
 * member.
 */
#define mptcp_for_each_subflow(__msk, __subflow)			\
	list_for_each_entry(__subflow, &((__msk)->conn_list), node)

/* Convert a generic sock pointer to the MPTCP connection sock.
 *
 * This is a plain pointer cast: nothing is checked, and the const
 * qualifier of @sk is dropped. The caller must pass a sock that really
 * is the start of a struct mptcp_sock.
 */
static inline struct mptcp_sock *mptcp_sk(const struct sock *sk)
{
	return (struct mptcp_sock *)sk;
}

Peter Krystadcec37a62020-01-21 16:56:18 -080086struct mptcp_subflow_request_sock {
87 struct tcp_request_sock sk;
Christoph Paaschd22f4982020-01-21 16:56:32 -080088 u16 mp_capable : 1,
Peter Krystadcec37a62020-01-21 16:56:18 -080089 mp_join : 1,
Christoph Paaschd22f4982020-01-21 16:56:32 -080090 backup : 1,
91 remote_key_valid : 1;
Peter Krystadcec37a62020-01-21 16:56:18 -080092 u64 local_key;
93 u64 remote_key;
Peter Krystad79c09492020-01-21 16:56:20 -080094 u64 idsn;
95 u32 token;
Mat Martineau648ef4b2020-01-21 16:56:24 -080096 u32 ssn_offset;
Peter Krystadcec37a62020-01-21 16:56:18 -080097};
98
/* Convert a generic request_sock pointer to the MPTCP subflow request
 * sock. Plain pointer cast with no checking; the const qualifier of
 * @rsk is dropped.
 */
static inline struct mptcp_subflow_request_sock *
mptcp_subflow_rsk(const struct request_sock *rsk)
{
	return (struct mptcp_subflow_request_sock *)rsk;
}

Peter Krystad2303f992020-01-21 16:56:17 -0800105/* MPTCP subflow context */
106struct mptcp_subflow_context {
Peter Krystadcec37a62020-01-21 16:56:18 -0800107 struct list_head node;/* conn_list of subflows */
108 u64 local_key;
109 u64 remote_key;
Peter Krystad79c09492020-01-21 16:56:20 -0800110 u64 idsn;
Mat Martineau648ef4b2020-01-21 16:56:24 -0800111 u64 map_seq;
Christoph Paaschcc7972e2020-01-21 16:56:31 -0800112 u32 snd_isn;
Peter Krystad79c09492020-01-21 16:56:20 -0800113 u32 token;
Mat Martineau6d0060f2020-01-21 16:56:23 -0800114 u32 rel_write_seq;
Mat Martineau648ef4b2020-01-21 16:56:24 -0800115 u32 map_subflow_seq;
116 u32 ssn_offset;
117 u32 map_data_len;
Peter Krystadcec37a62020-01-21 16:56:18 -0800118 u32 request_mptcp : 1, /* send MP_CAPABLE */
119 mp_capable : 1, /* remote is MPTCP capable */
120 fourth_ack : 1, /* send initial DSS */
Mat Martineau648ef4b2020-01-21 16:56:24 -0800121 conn_finished : 1,
122 map_valid : 1,
Christoph Paaschd22f4982020-01-21 16:56:32 -0800123 mpc_map : 1,
Mat Martineau648ef4b2020-01-21 16:56:24 -0800124 data_avail : 1,
Christoph Paaschd22f4982020-01-21 16:56:32 -0800125 rx_eof : 1,
126 can_ack : 1; /* only after processing the remote a key */
Mat Martineau648ef4b2020-01-21 16:56:24 -0800127
Peter Krystad2303f992020-01-21 16:56:17 -0800128 struct sock *tcp_sock; /* tcp sk backpointer */
129 struct sock *conn; /* parent mptcp_sock */
Peter Krystadcec37a62020-01-21 16:56:18 -0800130 const struct inet_connection_sock_af_ops *icsk_af_ops;
Mat Martineau648ef4b2020-01-21 16:56:24 -0800131 void (*tcp_data_ready)(struct sock *sk);
132 void (*tcp_state_change)(struct sock *sk);
133 void (*tcp_write_space)(struct sock *sk);
134
Peter Krystad2303f992020-01-21 16:56:17 -0800135 struct rcu_head rcu;
136};
137
138static inline struct mptcp_subflow_context *
139mptcp_subflow_ctx(const struct sock *sk)
140{
141 struct inet_connection_sock *icsk = inet_csk(sk);
142
143 /* Use RCU on icsk_ulp_data only for sock diag code */
144 return (__force struct mptcp_subflow_context *)icsk->icsk_ulp_data;
145}
146
147static inline struct sock *
148mptcp_subflow_tcp_sock(const struct mptcp_subflow_context *subflow)
149{
150 return subflow->tcp_sock;
151}
152
Mat Martineau648ef4b2020-01-21 16:56:24 -0800153static inline u64
154mptcp_subflow_get_map_offset(const struct mptcp_subflow_context *subflow)
155{
156 return tcp_sk(mptcp_subflow_tcp_sock(subflow))->copied_seq -
157 subflow->ssn_offset -
158 subflow->map_subflow_seq;
159}
160
161static inline u64
162mptcp_subflow_get_mapped_dsn(const struct mptcp_subflow_context *subflow)
163{
164 return subflow->map_seq + mptcp_subflow_get_map_offset(subflow);
165}
166
167int mptcp_is_enabled(struct net *net);
168bool mptcp_subflow_data_available(struct sock *sk);
Peter Krystad2303f992020-01-21 16:56:17 -0800169void mptcp_subflow_init(void);
170int mptcp_subflow_create_socket(struct sock *sk, struct socket **new_sock);
171
Mat Martineau648ef4b2020-01-21 16:56:24 -0800172static inline void mptcp_subflow_tcp_fallback(struct sock *sk,
173 struct mptcp_subflow_context *ctx)
174{
175 sk->sk_data_ready = ctx->tcp_data_ready;
176 sk->sk_state_change = ctx->tcp_state_change;
177 sk->sk_write_space = ctx->tcp_write_space;
178
179 inet_csk(sk)->icsk_af_ops = ctx->icsk_af_ops;
180}
181
Peter Krystadcec37a62020-01-21 16:56:18 -0800182extern const struct inet_connection_sock_af_ops ipv4_specific;
183#if IS_ENABLED(CONFIG_MPTCP_IPV6)
184extern const struct inet_connection_sock_af_ops ipv6_specific;
185#endif
186
Mat Martineau648ef4b2020-01-21 16:56:24 -0800187void mptcp_proto_init(void);
Matthieu Baerts784325e2020-01-21 16:56:28 -0800188#if IS_ENABLED(CONFIG_MPTCP_IPV6)
189int mptcp_proto_v6_init(void);
190#endif
Mat Martineau648ef4b2020-01-21 16:56:24 -0800191
192struct mptcp_read_arg {
193 struct msghdr *msg;
194};
195
196int mptcp_read_actor(read_descriptor_t *desc, struct sk_buff *skb,
197 unsigned int offset, size_t len);
198
void mptcp_get_options(const struct sk_buff *skb,
		       struct tcp_options_received *opt_rx);

void mptcp_finish_connect(struct sock *sk);

Peter Krystad79c09492020-01-21 16:56:20 -0800204int mptcp_token_new_request(struct request_sock *req);
205void mptcp_token_destroy_request(u32 token);
206int mptcp_token_new_connect(struct sock *sk);
207int mptcp_token_new_accept(u32 token);
208void mptcp_token_update_accept(struct sock *sk, struct sock *conn);
209void mptcp_token_destroy(u32 token);
210
211void mptcp_crypto_key_sha(u64 key, u32 *token, u64 *idsn);
212static inline void mptcp_crypto_key_gen_sha(u64 *key, u32 *token, u64 *idsn)
213{
214 /* we might consider a faster version that computes the key as a
215 * hash of some information available in the MPTCP socket. Use
216 * random data at the moment, as it's probably the safest option
217 * in case multiple sockets are opened in different namespaces at
218 * the same time.
219 */
220 get_random_bytes(key, sizeof(u64));
221 mptcp_crypto_key_sha(*key, token, idsn);
222}
223
224void mptcp_crypto_hmac_sha(u64 key1, u64 key2, u32 nonce1, u32 nonce2,
Paolo Abeni65492c52020-01-21 16:56:30 -0800225 void *hash_out);
Peter Krystad79c09492020-01-21 16:56:20 -0800226
Mat Martineau6d0060f2020-01-21 16:56:23 -0800227static inline struct mptcp_ext *mptcp_get_ext(struct sk_buff *skb)
228{
229 return (struct mptcp_ext *)skb_ext_find(skb, SKB_EXT_MPTCP);
230}
231
/* Wrap-safe comparison of 64-bit sequence numbers.
 *
 * Returns true when @seq1 precedes @seq2: the unsigned difference
 * seq1 - seq2 is reinterpreted as signed, so the result stays correct
 * across a 2^64 wrap as long as the two values are less than 2^63
 * apart. Equal values are not "before" each other.
 */
static inline bool before64(__u64 seq1, __u64 seq2)
{
	return (__s64)(seq1 - seq2) < 0;
}

/* after64(a, b) is true when a follows b, i.e. before64(b, a) */
#define after64(seq2, seq1)	before64(seq1, seq2)

#endif /* __MPTCP_PROTOCOL_H */