blob: 0e95572e56b41eb24ffd8e016cbf771fd174f725 [file] [log] [blame]
Per Lidenb97bf3f2006-01-02 19:04:38 +01001/*
2 * net/tipc/net.c: TIPC network routing code
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +09003 *
Jon Paul Maloy5a379072014-06-25 20:41:36 -05004 * Copyright (c) 1995-2006, 2014, Ericsson AB
Allan Stephens9df3b7e2011-02-24 13:20:20 -05005 * Copyright (c) 2005, 2010-2011, Wind River Systems
Per Lidenb97bf3f2006-01-02 19:04:38 +01006 * All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions are met:
10 *
Per Liden9ea1fd32006-01-11 13:30:43 +010011 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. Neither the names of the copyright holders nor the names of its
17 * contributors may be used to endorse or promote products derived from
18 * this software without specific prior written permission.
19 *
20 * Alternatively, this software may be distributed under the terms of the
21 * GNU General Public License ("GPL") version 2 as published by the Free
22 * Software Foundation.
Per Lidenb97bf3f2006-01-02 19:04:38 +010023 *
24 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
25 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
28 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
29 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
30 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
31 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
32 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
33 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
34 * POSSIBILITY OF SUCH DAMAGE.
35 */
36
37#include "core.h"
Per Lidenb97bf3f2006-01-02 19:04:38 +010038#include "net.h"
Per Lidenb97bf3f2006-01-02 19:04:38 +010039#include "name_distr.h"
40#include "subscr.h"
Jon Paul Maloy9816f062014-05-14 05:39:15 -040041#include "socket.h"
Allan Stephens672d99e2011-02-25 18:42:52 -050042#include "node.h"
Jon Paul Maloya6bf70f2015-05-14 10:46:13 -040043#include "bcast.h"
Xin Longbe07f052021-05-18 10:09:08 +080044#include "link.h"
Richard Alpe49cc66e2016-03-04 17:04:42 +010045#include "netlink.h"
Hoang Le46cb01e2019-11-12 07:40:04 +070046#include "monitor.h"
Richard Alpefd3cf2a2014-11-20 10:29:18 +010047
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +090048/*
Per Lidenb97bf3f2006-01-02 19:04:38 +010049 * The TIPC locking policy is designed to ensure a very fine locking
50 * granularity, permitting complete parallel access to individual
Ying Xue7216cd92014-04-21 10:55:48 +080051 * port and node/link instances. The code consists of four major
Per Lidenb97bf3f2006-01-02 19:04:38 +010052 * locking domains, each protected with their own disjunct set of locks.
53 *
Ying Xue7216cd92014-04-21 10:55:48 +080054 * 1: The bearer level.
55 * RTNL lock is used to serialize the process of configuring bearer
56 * on update side, and RCU lock is applied on read side to make
57 * bearer instance valid on both paths of message transmission and
58 * reception.
Per Lidenb97bf3f2006-01-02 19:04:38 +010059 *
Ying Xue7216cd92014-04-21 10:55:48 +080060 * 2: The node and link level.
61 * All node instances are saved into two lists, tipc_node_list and
62 * node_htable. The two lists are protected by node_list_lock on write side,
63 * and they are guarded with RCU lock on read side. In particular, a node
64 * instance is destroyed only when the TIPC module is removed, at which
65 * point we can be sure that no user is still accessing the node.
66 * Therefore, except when iterating the two lists under RCU
67 * protection, there is no need to hold the RCU lock when accessing a
68 * node instance in other places.
Per Lidenb97bf3f2006-01-02 19:04:38 +010069 *
Ying Xue7216cd92014-04-21 10:55:48 +080070 * In addition, all members in node structure including link instances
71 * are protected by node spin lock.
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +090072 *
Ying Xue7216cd92014-04-21 10:55:48 +080073 * 3: The transport level of the protocol.
74 * This consists of the structures port, (and its user level
75 * representations, such as user_port and tipc_sock), reference and
76 * tipc_user (port.c, reg.c, socket.c).
Per Lidenb97bf3f2006-01-02 19:04:38 +010077 *
Ying Xue7216cd92014-04-21 10:55:48 +080078 * This layer has four different locks:
Per Lidenb97bf3f2006-01-02 19:04:38 +010079 * - The tipc_port spin_lock. This is protecting each port instance
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +090080 * from parallel data access and removal. Since we can not place
81 * this lock in the port itself, it has been placed in the
Per Lidenb97bf3f2006-01-02 19:04:38 +010082 * corresponding reference table entry, which has the same life
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +090083 * cycle as the module. This entry is difficult to access from
84 * outside the TIPC core, however, so a pointer to the lock has
85 * been added in the port instance, -to be used for unlocking
Per Lidenb97bf3f2006-01-02 19:04:38 +010086 * only.
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +090087 * - A read/write lock to protect the reference table itself (ref.c).
88 * (Nobody is using read-only access to this, so it can just as
Per Lidenb97bf3f2006-01-02 19:04:38 +010089 * well be changed to a spin_lock)
90 * - A spin lock to protect the registry of kernel/driver users (reg.c)
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +090091 * - A global spin_lock (tipc_port_lock), whose only task is to ensure
Per Lidenb97bf3f2006-01-02 19:04:38 +010092 * consistency where more than one port is involved in an operation,
Zheng Yongjuna79ace42021-04-07 09:59:45 +080093 * i.e., when a port is part of a linked list of ports.
Per Lidenb97bf3f2006-01-02 19:04:38 +010094 * There are two such lists; 'port_list', which is used for management,
95 * and 'wait_list', which is used to queue ports during congestion.
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +090096 *
Ying Xue7216cd92014-04-21 10:55:48 +080097 * 4: The name table (name_table.c, name_distr.c, subscription.c)
YOSHIFUJI Hideakic4307282007-02-09 23:25:21 +090098 * - There is one big read/write-lock (tipc_nametbl_lock) protecting the
99 * overall name table structure. Nothing must be added/removed to
Per Lidenb97bf3f2006-01-02 19:04:38 +0100100 * this structure without holding write access to it.
101 * - There is one local spin_lock per sub_sequence, which can be seen
Per Liden4323add2006-01-18 00:38:21 +0100102 * as a sub-domain to the tipc_nametbl_lock domain. It is used only
Per Lidenb97bf3f2006-01-02 19:04:38 +0100103 * for translation operations, and is needed because a translation
104 * steps the root of the 'publication' linked list between each lookup.
Per Liden4323add2006-01-18 00:38:21 +0100105 * This is always used within the scope of a tipc_nametbl_lock(read).
Per Lidenb97bf3f2006-01-02 19:04:38 +0100106 * - A local spin_lock protecting the queue of subscriber events.
107*/
Per Lidenb97bf3f2006-01-02 19:04:38 +0100108
Jon Maloyadba75b2018-11-16 16:55:04 -0500109static void tipc_net_finalize(struct net *net, u32 addr);
110
Jon Maloyd50ccc22018-03-22 20:42:50 +0100111int tipc_net_init(struct net *net, u8 *node_id, u32 addr)
Per Lidenb97bf3f2006-01-02 19:04:38 +0100112{
Jon Maloyd50ccc22018-03-22 20:42:50 +0100113 if (tipc_own_id(net)) {
114 pr_info("Cannot configure node identity twice\n");
115 return -1;
116 }
117 pr_info("Started in network mode\n");
Per Lidenb97bf3f2006-01-02 19:04:38 +0100118
Jon Maloy25b0b9c2018-03-22 20:42:51 +0100119 if (node_id)
Jon Maloyd50ccc22018-03-22 20:42:50 +0100120 tipc_set_node_id(net, node_id);
Jon Maloyd50ccc22018-03-22 20:42:50 +0100121 if (addr)
122 tipc_net_finalize(net, addr);
123 return 0;
124}
Herbert Xu40f9f432017-02-11 19:26:46 +0800125
Jon Maloyadba75b2018-11-16 16:55:04 -0500126static void tipc_net_finalize(struct net *net, u32 addr)
Jon Maloyd50ccc22018-03-22 20:42:50 +0100127{
Jon Maloy9faa89d2018-07-06 20:10:06 +0200128 struct tipc_net *tn = tipc_net(net);
Jon Maloy50a34992021-03-16 22:06:11 -0400129 struct tipc_socket_addr sk = {0, addr};
130 struct tipc_uaddr ua;
131
132 tipc_uaddr(&ua, TIPC_SERVICE_RANGE, TIPC_CLUSTER_SCOPE,
133 TIPC_NODE_STATE, addr, addr);
Jon Maloy9faa89d2018-07-06 20:10:06 +0200134
Jon Maloyadba75b2018-11-16 16:55:04 -0500135 if (cmpxchg(&tn->node_addr, 0, addr))
136 return;
137 tipc_set_node_addr(net, addr);
138 tipc_named_reinit(net);
139 tipc_sk_reinit(net);
Hoang Le46cb01e2019-11-12 07:40:04 +0700140 tipc_mon_reinit_self(net);
Jon Maloy50a34992021-03-16 22:06:11 -0400141 tipc_nametbl_publish(net, &ua, &sk, addr);
Jon Maloyadba75b2018-11-16 16:55:04 -0500142}
143
Hoang Huu Led966ddc2020-09-07 13:17:25 +0700144void tipc_net_finalize_work(struct work_struct *work)
Jon Maloyadba75b2018-11-16 16:55:04 -0500145{
Xin Longbe07f052021-05-18 10:09:08 +0800146 struct tipc_net *tn = container_of(work, struct tipc_net, work);
Jon Maloyadba75b2018-11-16 16:55:04 -0500147
Xin Longbe07f052021-05-18 10:09:08 +0800148 tipc_net_finalize(tipc_link_net(tn->bcl), tn->trial_addr);
Per Lidenb97bf3f2006-01-02 19:04:38 +0100149}
150
/**
 * tipc_net_stop - leave network mode for a namespace
 * @net: network namespace to shut down
 *
 * Does nothing when no node identity has been configured. Otherwise stops
 * bearers and then nodes while holding the RTNL lock, and logs the change.
 */
void tipc_net_stop(struct net *net)
{
	if (tipc_own_id(net)) {
		/* Bearer and node teardown are serialized under RTNL */
		rtnl_lock();
		tipc_bearer_stop(net);
		tipc_node_stop(net);
		rtnl_unlock();

		pr_info("Left network mode\n");
	}
}
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100163
Ying Xuec93d3ba2015-01-09 15:27:04 +0800164static int __tipc_nl_add_net(struct net *net, struct tipc_nl_msg *msg)
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100165{
Ying Xuec93d3ba2015-01-09 15:27:04 +0800166 struct tipc_net *tn = net_generic(net, tipc_net_id);
Jon Maloyd50ccc22018-03-22 20:42:50 +0100167 u64 *w0 = (u64 *)&tn->node_id[0];
168 u64 *w1 = (u64 *)&tn->node_id[8];
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100169 struct nlattr *attrs;
Jon Maloyd50ccc22018-03-22 20:42:50 +0100170 void *hdr;
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100171
Richard Alpebfb3e5d2015-02-09 09:50:03 +0100172 hdr = genlmsg_put(msg->skb, msg->portid, msg->seq, &tipc_genl_family,
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100173 NLM_F_MULTI, TIPC_NL_NET_GET);
174 if (!hdr)
175 return -EMSGSIZE;
176
Michal Kubecekae0be8d2019-04-26 11:13:06 +0200177 attrs = nla_nest_start_noflag(msg->skb, TIPC_NLA_NET);
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100178 if (!attrs)
179 goto msg_full;
180
Ying Xuec93d3ba2015-01-09 15:27:04 +0800181 if (nla_put_u32(msg->skb, TIPC_NLA_NET_ID, tn->net_id))
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100182 goto attr_msg_full;
Jon Maloyd50ccc22018-03-22 20:42:50 +0100183 if (nla_put_u64_64bit(msg->skb, TIPC_NLA_NET_NODEID, *w0, 0))
184 goto attr_msg_full;
185 if (nla_put_u64_64bit(msg->skb, TIPC_NLA_NET_NODEID_W1, *w1, 0))
186 goto attr_msg_full;
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100187 nla_nest_end(msg->skb, attrs);
188 genlmsg_end(msg->skb, hdr);
189
190 return 0;
191
192attr_msg_full:
193 nla_nest_cancel(msg->skb, attrs);
194msg_full:
195 genlmsg_cancel(msg->skb, hdr);
196
197 return -EMSGSIZE;
198}
199
200int tipc_nl_net_dump(struct sk_buff *skb, struct netlink_callback *cb)
201{
Ying Xuec93d3ba2015-01-09 15:27:04 +0800202 struct net *net = sock_net(skb->sk);
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100203 int err;
204 int done = cb->args[0];
205 struct tipc_nl_msg msg;
206
207 if (done)
208 return 0;
209
210 msg.skb = skb;
211 msg.portid = NETLINK_CB(cb->skb).portid;
212 msg.seq = cb->nlh->nlmsg_seq;
213
Ying Xuec93d3ba2015-01-09 15:27:04 +0800214 err = __tipc_nl_add_net(net, &msg);
Richard Alpefd3cf2a2014-11-20 10:29:18 +0100215 if (err)
216 goto out;
217
218 done = 1;
219out:
220 cb->args[0] = done;
221
222 return skb->len;
223}
Richard Alpe27c21412014-11-20 10:29:19 +0100224
Ying Xue5631f652018-02-14 13:38:03 +0800225int __tipc_nl_net_set(struct sk_buff *skb, struct genl_info *info)
Richard Alpe27c21412014-11-20 10:29:19 +0100226{
Richard Alpe27c21412014-11-20 10:29:19 +0100227 struct nlattr *attrs[TIPC_NLA_NET_MAX + 1];
Jon Maloy23fd3ea2018-03-22 20:42:49 +0100228 struct net *net = sock_net(skb->sk);
229 struct tipc_net *tn = tipc_net(net);
Ying Xuec93d3ba2015-01-09 15:27:04 +0800230 int err;
Richard Alpe27c21412014-11-20 10:29:19 +0100231
232 if (!info->attrs[TIPC_NLA_NET])
233 return -EINVAL;
234
Johannes Berg8cb08172019-04-26 14:07:28 +0200235 err = nla_parse_nested_deprecated(attrs, TIPC_NLA_NET_MAX,
236 info->attrs[TIPC_NLA_NET],
237 tipc_nl_net_policy, info->extack);
Jon Maloyd50ccc22018-03-22 20:42:50 +0100238
Richard Alpe27c21412014-11-20 10:29:19 +0100239 if (err)
240 return err;
241
Jon Maloy23fd3ea2018-03-22 20:42:49 +0100242 /* Can't change net id once TIPC has joined a network */
243 if (tipc_own_addr(net))
244 return -EPERM;
245
Richard Alpe27c21412014-11-20 10:29:19 +0100246 if (attrs[TIPC_NLA_NET_ID]) {
247 u32 val;
248
Richard Alpe27c21412014-11-20 10:29:19 +0100249 val = nla_get_u32(attrs[TIPC_NLA_NET_ID]);
250 if (val < 1 || val > 9999)
251 return -EINVAL;
252
Ying Xuec93d3ba2015-01-09 15:27:04 +0800253 tn->net_id = val;
Richard Alpe27c21412014-11-20 10:29:19 +0100254 }
255
256 if (attrs[TIPC_NLA_NET_ADDR]) {
257 u32 addr;
258
Richard Alpe27c21412014-11-20 10:29:19 +0100259 addr = nla_get_u32(attrs[TIPC_NLA_NET_ADDR]);
Jon Maloy20263642018-03-22 20:42:47 +0100260 if (!addr)
Richard Alpe27c21412014-11-20 10:29:19 +0100261 return -EINVAL;
Jon Maloyb89afb12018-03-22 20:42:48 +0100262 tn->legacy_addr_format = true;
Jon Maloyd50ccc22018-03-22 20:42:50 +0100263 tipc_net_init(net, NULL, addr);
Richard Alpe27c21412014-11-20 10:29:19 +0100264 }
265
Jon Maloyd50ccc22018-03-22 20:42:50 +0100266 if (attrs[TIPC_NLA_NET_NODEID]) {
267 u8 node_id[NODE_ID_LEN];
268 u64 *w0 = (u64 *)&node_id[0];
269 u64 *w1 = (u64 *)&node_id[8];
270
Eric Dumazetc6404122018-04-16 08:29:43 -0700271 if (!attrs[TIPC_NLA_NET_NODEID_W1])
272 return -EINVAL;
Jon Maloyd50ccc22018-03-22 20:42:50 +0100273 *w0 = nla_get_u64(attrs[TIPC_NLA_NET_NODEID]);
274 *w1 = nla_get_u64(attrs[TIPC_NLA_NET_NODEID_W1]);
275 tipc_net_init(net, node_id, 0);
276 }
Richard Alpe27c21412014-11-20 10:29:19 +0100277 return 0;
278}
Ying Xue5631f652018-02-14 13:38:03 +0800279
/**
 * tipc_nl_net_set - netlink handler that updates the network settings
 * @skb: request skb
 * @info: generic netlink info for the request
 *
 * Thin wrapper that runs __tipc_nl_net_set() with the RTNL lock held.
 *
 * Return: whatever __tipc_nl_net_set() returns.
 */
int tipc_nl_net_set(struct sk_buff *skb, struct genl_info *info)
{
	int ret;

	rtnl_lock();
	ret = __tipc_nl_net_set(skb, info);
	rtnl_unlock();

	return ret;
}
John Rutherforde1b5e592019-12-19 16:03:57 +1100290
291static int __tipc_nl_addr_legacy_get(struct net *net, struct tipc_nl_msg *msg)
292{
293 struct tipc_net *tn = tipc_net(net);
294 struct nlattr *attrs;
295 void *hdr;
296
297 hdr = genlmsg_put(msg->skb, msg->portid, msg->seq, &tipc_genl_family,
298 0, TIPC_NL_ADDR_LEGACY_GET);
299 if (!hdr)
300 return -EMSGSIZE;
301
302 attrs = nla_nest_start(msg->skb, TIPC_NLA_NET);
303 if (!attrs)
304 goto msg_full;
305
306 if (tn->legacy_addr_format)
307 if (nla_put_flag(msg->skb, TIPC_NLA_NET_ADDR_LEGACY))
308 goto attr_msg_full;
309
310 nla_nest_end(msg->skb, attrs);
311 genlmsg_end(msg->skb, hdr);
312
313 return 0;
314
315attr_msg_full:
316 nla_nest_cancel(msg->skb, attrs);
317msg_full:
318 genlmsg_cancel(msg->skb, hdr);
319
320 return -EMSGSIZE;
321}
322
323int tipc_nl_net_addr_legacy_get(struct sk_buff *skb, struct genl_info *info)
324{
325 struct net *net = sock_net(skb->sk);
326 struct tipc_nl_msg msg;
327 struct sk_buff *rep;
328 int err;
329
330 rep = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
331 if (!rep)
332 return -ENOMEM;
333
334 msg.skb = rep;
335 msg.portid = info->snd_portid;
336 msg.seq = info->snd_seq;
337
338 err = __tipc_nl_addr_legacy_get(net, &msg);
339 if (err) {
340 nlmsg_free(msg.skb);
341 return err;
342 }
343
344 return genlmsg_reply(msg.skb, info);
345}