blob: e9449376b58e4293b7735362912e1ea1191a8815 [file] [log] [blame]
/*
 *	NET3	IP device support routines.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 *	Derived from the IP parts of dev.c 1.0.19
 *		Authors:	Ross Biro
 *				Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
 *				Mark Evans, <evansmp@uhura.aston.ac.uk>
 *
 *	Additional Authors:
 *		Alan Cox, <gw4pts@gw4pts.ampr.org>
 *		Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 *	Changes:
 *		Alexey Kuznetsov:	pa_* fields are replaced with ifaddr
 *					lists.
 *		Cyrus Durgin:		updated for kmod
 *		Matthias Andree:	in devinet_ioctl, compare label and
 *					address (4.4BSD alias style support),
 *					fall back to comparing just the label
 *					if no match found.
 */
27
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29#include <asm/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/bitops.h>
Randy Dunlap4fc268d2006-01-11 12:17:47 -080031#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/module.h>
33#include <linux/types.h>
34#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/string.h>
36#include <linux/mm.h>
37#include <linux/socket.h>
38#include <linux/sockios.h>
39#include <linux/in.h>
40#include <linux/errno.h>
41#include <linux/interrupt.h>
Thomas Graf18237302006-08-04 23:04:54 -070042#include <linux/if_addr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#include <linux/if_ether.h>
44#include <linux/inet.h>
45#include <linux/netdevice.h>
46#include <linux/etherdevice.h>
47#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070048#include <linux/init.h>
49#include <linux/notifier.h>
50#include <linux/inetdevice.h>
51#include <linux/igmp.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090052#include <linux/slab.h>
David S. Millerfd23c3b2011-02-18 12:42:28 -080053#include <linux/hash.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070054#ifdef CONFIG_SYSCTL
55#include <linux/sysctl.h>
56#endif
57#include <linux/kmod.h>
Nicolas Dichteledc9e742012-10-25 22:28:52 +000058#include <linux/netconf.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070059
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020060#include <net/arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070061#include <net/ip.h>
62#include <net/route.h>
63#include <net/ip_fib.h>
Thomas Graf63f34442007-03-22 11:55:17 -070064#include <net/rtnetlink.h>
Pavel Emelyanov752d14d2007-12-16 13:31:47 -080065#include <net/net_namespace.h>
Jiri Pirko5c766d62013-01-24 09:41:41 +000066#include <net/addrconf.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
David S. Miller406b6f92011-03-22 21:56:23 -070068#include "fib_lookup.h"
69
Adrian Bunk0027ba82008-01-31 17:17:31 -080070static struct ipv4_devconf ipv4_devconf = {
Herbert Xu42f811b2007-06-04 23:34:44 -070071 .data = {
Eric W. Biederman02291682010-02-14 03:25:51 +000072 [IPV4_DEVCONF_ACCEPT_REDIRECTS - 1] = 1,
73 [IPV4_DEVCONF_SEND_REDIRECTS - 1] = 1,
74 [IPV4_DEVCONF_SECURE_REDIRECTS - 1] = 1,
75 [IPV4_DEVCONF_SHARED_MEDIA - 1] = 1,
William Manley26900482013-08-06 19:03:15 +010076 [IPV4_DEVCONF_IGMPV2_UNSOLICITED_REPORT_INTERVAL - 1] = 10000 /*ms*/,
77 [IPV4_DEVCONF_IGMPV3_UNSOLICITED_REPORT_INTERVAL - 1] = 1000 /*ms*/,
Herbert Xu42f811b2007-06-04 23:34:44 -070078 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070079};
80
81static struct ipv4_devconf ipv4_devconf_dflt = {
Herbert Xu42f811b2007-06-04 23:34:44 -070082 .data = {
Eric W. Biederman02291682010-02-14 03:25:51 +000083 [IPV4_DEVCONF_ACCEPT_REDIRECTS - 1] = 1,
84 [IPV4_DEVCONF_SEND_REDIRECTS - 1] = 1,
85 [IPV4_DEVCONF_SECURE_REDIRECTS - 1] = 1,
86 [IPV4_DEVCONF_SHARED_MEDIA - 1] = 1,
87 [IPV4_DEVCONF_ACCEPT_SOURCE_ROUTE - 1] = 1,
William Manley26900482013-08-06 19:03:15 +010088 [IPV4_DEVCONF_IGMPV2_UNSOLICITED_REPORT_INTERVAL - 1] = 10000 /*ms*/,
89 [IPV4_DEVCONF_IGMPV3_UNSOLICITED_REPORT_INTERVAL - 1] = 1000 /*ms*/,
Herbert Xu42f811b2007-06-04 23:34:44 -070090 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070091};
92
/*
 * Access devconf attribute @attr in the default devconf block that @net
 * points to (net->ipv4.devconf_dflt).
 *
 * @net is parenthesized so that passing an expression (e.g. a conditional
 * or a cast) still dereferences the intended pointer.
 */
#define IPV4_DEVCONF_DFLT(net, attr) \
	IPV4_DEVCONF((*(net)->ipv4.devconf_dflt), attr)
Herbert Xu42f811b2007-06-04 23:34:44 -070095
Patrick McHardyef7c79e2007-06-05 12:38:30 -070096static const struct nla_policy ifa_ipv4_policy[IFA_MAX+1] = {
Thomas Graf5c753972006-08-04 23:03:53 -070097 [IFA_LOCAL] = { .type = NLA_U32 },
98 [IFA_ADDRESS] = { .type = NLA_U32 },
99 [IFA_BROADCAST] = { .type = NLA_U32 },
Thomas Graf5176f912006-08-26 20:13:18 -0700100 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 },
Jiri Pirko5c766d62013-01-24 09:41:41 +0000101 [IFA_CACHEINFO] = { .len = sizeof(struct ifa_cacheinfo) },
Jiri Pirkoad6c8132013-12-08 12:16:10 +0100102 [IFA_FLAGS] = { .type = NLA_U32 },
Thomas Graf5c753972006-08-04 23:03:53 -0700103};
104
Eric Dumazet40384992012-08-03 21:06:50 +0000105#define IN4_ADDR_HSIZE_SHIFT 8
106#define IN4_ADDR_HSIZE (1U << IN4_ADDR_HSIZE_SHIFT)
107
David S. Millerfd23c3b2011-02-18 12:42:28 -0800108static struct hlist_head inet_addr_lst[IN4_ADDR_HSIZE];
David S. Millerfd23c3b2011-02-18 12:42:28 -0800109
Eric Dumazet40384992012-08-03 21:06:50 +0000110static u32 inet_addr_hash(struct net *net, __be32 addr)
David S. Millerfd23c3b2011-02-18 12:42:28 -0800111{
Eric Dumazet40384992012-08-03 21:06:50 +0000112 u32 val = (__force u32) addr ^ net_hash_mix(net);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800113
Eric Dumazet40384992012-08-03 21:06:50 +0000114 return hash_32(val, IN4_ADDR_HSIZE_SHIFT);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800115}
116
117static void inet_hash_insert(struct net *net, struct in_ifaddr *ifa)
118{
Eric Dumazet40384992012-08-03 21:06:50 +0000119 u32 hash = inet_addr_hash(net, ifa->ifa_local);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800120
WANG Cong32a4be42014-05-06 11:15:56 -0700121 ASSERT_RTNL();
David S. Millerfd23c3b2011-02-18 12:42:28 -0800122 hlist_add_head_rcu(&ifa->hash, &inet_addr_lst[hash]);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800123}
124
125static void inet_hash_remove(struct in_ifaddr *ifa)
126{
WANG Cong32a4be42014-05-06 11:15:56 -0700127 ASSERT_RTNL();
David S. Millerfd23c3b2011-02-18 12:42:28 -0800128 hlist_del_init_rcu(&ifa->hash);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800129}
130
David S. Miller9435eb12011-02-18 12:43:09 -0800131/**
132 * __ip_dev_find - find the first device with a given source address.
133 * @net: the net namespace
134 * @addr: the source address
135 * @devref: if true, take a reference on the found device
136 *
137 * If a caller uses devref=false, it should be protected by RCU, or RTNL
138 */
139struct net_device *__ip_dev_find(struct net *net, __be32 addr, bool devref)
140{
Eric Dumazet40384992012-08-03 21:06:50 +0000141 u32 hash = inet_addr_hash(net, addr);
David S. Miller9435eb12011-02-18 12:43:09 -0800142 struct net_device *result = NULL;
143 struct in_ifaddr *ifa;
David S. Miller9435eb12011-02-18 12:43:09 -0800144
145 rcu_read_lock();
Sasha Levinb67bfe02013-02-27 17:06:00 -0800146 hlist_for_each_entry_rcu(ifa, &inet_addr_lst[hash], hash) {
David S. Millere0660082011-03-03 11:24:19 -0800147 if (ifa->ifa_local == addr) {
Eric Dumazet40384992012-08-03 21:06:50 +0000148 struct net_device *dev = ifa->ifa_dev->dev;
149
150 if (!net_eq(dev_net(dev), net))
151 continue;
David S. Miller9435eb12011-02-18 12:43:09 -0800152 result = dev;
153 break;
154 }
155 }
David S. Miller406b6f92011-03-22 21:56:23 -0700156 if (!result) {
157 struct flowi4 fl4 = { .daddr = addr };
158 struct fib_result res = { 0 };
159 struct fib_table *local;
160
161 /* Fallback to FIB local table so that communication
162 * over loopback subnets work.
163 */
164 local = fib_get_table(net, RT_TABLE_LOCAL);
165 if (local &&
166 !fib_table_lookup(local, &fl4, &res, FIB_LOOKUP_NOREF) &&
167 res.type == RTN_LOCAL)
168 result = FIB_RES_DEV(res);
169 }
David S. Miller9435eb12011-02-18 12:43:09 -0800170 if (result && devref)
171 dev_hold(result);
172 rcu_read_unlock();
173 return result;
174}
175EXPORT_SYMBOL(__ip_dev_find);
176
Thomas Grafd6062cb2006-08-15 00:33:59 -0700177static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178
Alan Sterne041c682006-03-27 01:16:30 -0800179static BLOCKING_NOTIFIER_HEAD(inetaddr_chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
181 int destroy);
182#ifdef CONFIG_SYSCTL
Pavel Emelyanov66f27a52007-12-02 00:55:54 +1100183static void devinet_sysctl_register(struct in_device *idev);
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800184static void devinet_sysctl_unregister(struct in_device *idev);
185#else
Eric Dumazet40384992012-08-03 21:06:50 +0000186static void devinet_sysctl_register(struct in_device *idev)
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800187{
188}
Eric Dumazet40384992012-08-03 21:06:50 +0000189static void devinet_sysctl_unregister(struct in_device *idev)
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800190{
191}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192#endif
193
194/* Locks all the inet devices. */
195
196static struct in_ifaddr *inet_alloc_ifa(void)
197{
Alexey Dobriyan93adcc82008-10-28 13:25:09 -0700198 return kzalloc(sizeof(struct in_ifaddr), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199}
200
201static void inet_rcu_free_ifa(struct rcu_head *head)
202{
203 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head);
204 if (ifa->ifa_dev)
205 in_dev_put(ifa->ifa_dev);
206 kfree(ifa);
207}
208
Eric Dumazet40384992012-08-03 21:06:50 +0000209static void inet_free_ifa(struct in_ifaddr *ifa)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210{
211 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa);
212}
213
214void in_dev_finish_destroy(struct in_device *idev)
215{
216 struct net_device *dev = idev->dev;
217
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700218 WARN_ON(idev->ifa_list);
219 WARN_ON(idev->mc_list);
Eric Dumazete9897072013-06-07 08:48:57 -0700220 kfree(rcu_dereference_protected(idev->mc_hash, 1));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221#ifdef NET_REFCNT_DEBUG
Joe Perches91df42b2012-05-15 14:11:54 +0000222 pr_debug("%s: %p=%s\n", __func__, idev, dev ? dev->name : "NIL");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223#endif
224 dev_put(dev);
225 if (!idev->dead)
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800226 pr_err("Freeing alive in_device %p\n", idev);
227 else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228 kfree(idev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229}
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800230EXPORT_SYMBOL(in_dev_finish_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231
Herbert Xu71e27da2007-06-04 23:36:06 -0700232static struct in_device *inetdev_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233{
234 struct in_device *in_dev;
235
236 ASSERT_RTNL();
237
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700238 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239 if (!in_dev)
240 goto out;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900241 memcpy(&in_dev->cnf, dev_net(dev)->ipv4.devconf_dflt,
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -0800242 sizeof(in_dev->cnf));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700243 in_dev->cnf.sysctl = NULL;
244 in_dev->dev = dev;
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800245 in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl);
246 if (!in_dev->arp_parms)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247 goto out_kfree;
Ben Hutchings0187bdf2008-06-19 16:15:47 -0700248 if (IPV4_DEVCONF(in_dev->cnf, FORWARDING))
249 dev_disable_lro(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250 /* Reference in_dev->dev */
251 dev_hold(dev);
David L Stevens30c4cf52007-01-04 12:31:14 -0800252 /* Account for reference dev->ip_ptr (below) */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253 in_dev_hold(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254
Pavel Emelyanov66f27a52007-12-02 00:55:54 +1100255 devinet_sysctl_register(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256 ip_mc_init_dev(in_dev);
257 if (dev->flags & IFF_UP)
258 ip_mc_up(in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800259
David L Stevens30c4cf52007-01-04 12:31:14 -0800260 /* we can receive as soon as ip_ptr is set -- do this last */
Eric Dumazetcf778b02012-01-12 04:41:32 +0000261 rcu_assign_pointer(dev->ip_ptr, in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800262out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263 return in_dev;
264out_kfree:
265 kfree(in_dev);
266 in_dev = NULL;
267 goto out;
268}
269
270static void in_dev_rcu_put(struct rcu_head *head)
271{
272 struct in_device *idev = container_of(head, struct in_device, rcu_head);
273 in_dev_put(idev);
274}
275
276static void inetdev_destroy(struct in_device *in_dev)
277{
278 struct in_ifaddr *ifa;
279 struct net_device *dev;
280
281 ASSERT_RTNL();
282
283 dev = in_dev->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700284
285 in_dev->dead = 1;
286
287 ip_mc_destroy_dev(in_dev);
288
289 while ((ifa = in_dev->ifa_list) != NULL) {
290 inet_del_ifa(in_dev, &in_dev->ifa_list, 0);
291 inet_free_ifa(ifa);
292 }
293
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +0000294 RCU_INIT_POINTER(dev->ip_ptr, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800296 devinet_sysctl_unregister(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 neigh_parms_release(&arp_tbl, in_dev->arp_parms);
298 arp_ifdown(dev);
299
300 call_rcu(&in_dev->rcu_head, in_dev_rcu_put);
301}
302
Al Viroff428d72006-09-26 22:13:35 -0700303int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700304{
305 rcu_read_lock();
306 for_primary_ifa(in_dev) {
307 if (inet_ifa_match(a, ifa)) {
308 if (!b || inet_ifa_match(b, ifa)) {
309 rcu_read_unlock();
310 return 1;
311 }
312 }
313 } endfor_ifa(in_dev);
314 rcu_read_unlock();
315 return 0;
316}
317
Thomas Grafd6062cb2006-08-15 00:33:59 -0700318static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
Eric W. Biederman15e47302012-09-07 20:12:54 +0000319 int destroy, struct nlmsghdr *nlh, u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320{
Harald Welte8f937c62005-05-29 20:23:46 -0700321 struct in_ifaddr *promote = NULL;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800322 struct in_ifaddr *ifa, *ifa1 = *ifap;
323 struct in_ifaddr *last_prim = in_dev->ifa_list;
324 struct in_ifaddr *prev_prom = NULL;
325 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700326
327 ASSERT_RTNL();
328
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900329 /* 1. Deleting primary ifaddr forces deletion all secondaries
Harald Welte8f937c62005-05-29 20:23:46 -0700330 * unless alias promotion is set
331 **/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332
333 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334 struct in_ifaddr **ifap1 = &ifa1->ifa_next;
335
336 while ((ifa = *ifap1) != NULL) {
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900337 if (!(ifa->ifa_flags & IFA_F_SECONDARY) &&
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800338 ifa1->ifa_scope <= ifa->ifa_scope)
339 last_prim = ifa;
340
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 if (!(ifa->ifa_flags & IFA_F_SECONDARY) ||
342 ifa1->ifa_mask != ifa->ifa_mask ||
343 !inet_ifa_match(ifa1->ifa_address, ifa)) {
344 ifap1 = &ifa->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800345 prev_prom = ifa;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346 continue;
347 }
348
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800349 if (!do_promote) {
David S. Millerfd23c3b2011-02-18 12:42:28 -0800350 inet_hash_remove(ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700351 *ifap1 = ifa->ifa_next;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352
Eric W. Biederman15e47302012-09-07 20:12:54 +0000353 rtmsg_ifa(RTM_DELADDR, ifa, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800354 blocking_notifier_call_chain(&inetaddr_chain,
355 NETDEV_DOWN, ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700356 inet_free_ifa(ifa);
357 } else {
358 promote = ifa;
359 break;
360 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361 }
362 }
363
Julian Anastasov2d230e22011-03-19 12:13:52 +0000364 /* On promotion all secondaries from subnet are changing
365 * the primary IP, we must remove all their routes silently
366 * and later to add them back with new prefsrc. Do this
367 * while all addresses are on the device list.
368 */
369 for (ifa = promote; ifa; ifa = ifa->ifa_next) {
370 if (ifa1->ifa_mask == ifa->ifa_mask &&
371 inet_ifa_match(ifa1->ifa_address, ifa))
372 fib_del_ifaddr(ifa, ifa1);
373 }
374
Linus Torvalds1da177e2005-04-16 15:20:36 -0700375 /* 2. Unlink it */
376
377 *ifap = ifa1->ifa_next;
David S. Millerfd23c3b2011-02-18 12:42:28 -0800378 inet_hash_remove(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379
380 /* 3. Announce address deletion */
381
382 /* Send message first, then call notifier.
383 At first sight, FIB update triggered by notifier
384 will refer to already deleted ifaddr, that could confuse
385 netlink listeners. It is not true: look, gated sees
386 that route deleted and if it still thinks that ifaddr
387 is valid, it will try to restore deleted routes... Grr.
388 So that, this order is correct.
389 */
Eric W. Biederman15e47302012-09-07 20:12:54 +0000390 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800391 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1);
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800392
393 if (promote) {
Julian Anastasov04024b92011-03-19 12:13:54 +0000394 struct in_ifaddr *next_sec = promote->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800395
396 if (prev_prom) {
397 prev_prom->ifa_next = promote->ifa_next;
398 promote->ifa_next = last_prim->ifa_next;
399 last_prim->ifa_next = promote;
400 }
401
402 promote->ifa_flags &= ~IFA_F_SECONDARY;
Eric W. Biederman15e47302012-09-07 20:12:54 +0000403 rtmsg_ifa(RTM_NEWADDR, promote, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800404 blocking_notifier_call_chain(&inetaddr_chain,
405 NETDEV_UP, promote);
Julian Anastasov04024b92011-03-19 12:13:54 +0000406 for (ifa = next_sec; ifa; ifa = ifa->ifa_next) {
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800407 if (ifa1->ifa_mask != ifa->ifa_mask ||
408 !inet_ifa_match(ifa1->ifa_address, ifa))
409 continue;
410 fib_add_ifaddr(ifa);
411 }
412
413 }
Herbert Xu63630972007-06-07 18:35:38 -0700414 if (destroy)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415 inet_free_ifa(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700416}
417
Thomas Grafd6062cb2006-08-15 00:33:59 -0700418static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
419 int destroy)
420{
421 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0);
422}
423
/* Delayed work item whose handler, check_lifetime(), is defined below. */
static void check_lifetime(struct work_struct *work);
static DECLARE_DELAYED_WORK(check_lifetime_work, check_lifetime);
427
Thomas Grafd6062cb2006-08-15 00:33:59 -0700428static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh,
Eric W. Biederman15e47302012-09-07 20:12:54 +0000429 u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700430{
431 struct in_device *in_dev = ifa->ifa_dev;
432 struct in_ifaddr *ifa1, **ifap, **last_primary;
433
434 ASSERT_RTNL();
435
436 if (!ifa->ifa_local) {
437 inet_free_ifa(ifa);
438 return 0;
439 }
440
441 ifa->ifa_flags &= ~IFA_F_SECONDARY;
442 last_primary = &in_dev->ifa_list;
443
444 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
445 ifap = &ifa1->ifa_next) {
446 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) &&
447 ifa->ifa_scope <= ifa1->ifa_scope)
448 last_primary = &ifa1->ifa_next;
449 if (ifa1->ifa_mask == ifa->ifa_mask &&
450 inet_ifa_match(ifa1->ifa_address, ifa)) {
451 if (ifa1->ifa_local == ifa->ifa_local) {
452 inet_free_ifa(ifa);
453 return -EEXIST;
454 }
455 if (ifa1->ifa_scope != ifa->ifa_scope) {
456 inet_free_ifa(ifa);
457 return -EINVAL;
458 }
459 ifa->ifa_flags |= IFA_F_SECONDARY;
460 }
461 }
462
463 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) {
Aruna-Hewapathirane63862b52014-01-11 07:15:59 -0500464 prandom_seed((__force u32) ifa->ifa_local);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700465 ifap = last_primary;
466 }
467
468 ifa->ifa_next = *ifap;
469 *ifap = ifa;
470
David S. Millerfd23c3b2011-02-18 12:42:28 -0800471 inet_hash_insert(dev_net(in_dev->dev), ifa);
472
Jiri Pirko5c766d62013-01-24 09:41:41 +0000473 cancel_delayed_work(&check_lifetime_work);
viresh kumar906e0732014-01-22 12:23:32 +0530474 queue_delayed_work(system_power_efficient_wq, &check_lifetime_work, 0);
Jiri Pirko5c766d62013-01-24 09:41:41 +0000475
Linus Torvalds1da177e2005-04-16 15:20:36 -0700476 /* Send message first, then call notifier.
477 Notifier will trigger FIB update, so that
478 listeners of netlink will know about new ifaddr */
Eric W. Biederman15e47302012-09-07 20:12:54 +0000479 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800480 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481
482 return 0;
483}
484
Thomas Grafd6062cb2006-08-15 00:33:59 -0700485static int inet_insert_ifa(struct in_ifaddr *ifa)
486{
487 return __inet_insert_ifa(ifa, NULL, 0);
488}
489
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa)
491{
Herbert Xue5ed6392005-10-03 14:35:55 -0700492 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700493
494 ASSERT_RTNL();
495
496 if (!in_dev) {
Herbert Xu71e27da2007-06-04 23:36:06 -0700497 inet_free_ifa(ifa);
498 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499 }
Herbert Xu71e27da2007-06-04 23:36:06 -0700500 ipv4_devconf_setall(in_dev);
Jiri Pirko1d4c8c22013-12-07 19:26:56 +0100501 neigh_parms_data_state_setall(in_dev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700502 if (ifa->ifa_dev != in_dev) {
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700503 WARN_ON(ifa->ifa_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700504 in_dev_hold(in_dev);
505 ifa->ifa_dev = in_dev;
506 }
Joe Perchesf97c1e02007-12-16 13:45:43 -0800507 if (ipv4_is_loopback(ifa->ifa_local))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508 ifa->ifa_scope = RT_SCOPE_HOST;
509 return inet_insert_ifa(ifa);
510}
511
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000512/* Caller must hold RCU or RTNL :
513 * We dont take a reference on found in_device
514 */
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800515struct in_device *inetdev_by_index(struct net *net, int ifindex)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700516{
517 struct net_device *dev;
518 struct in_device *in_dev = NULL;
Eric Dumazetc148fc22009-11-01 19:23:04 +0000519
520 rcu_read_lock();
521 dev = dev_get_by_index_rcu(net, ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700522 if (dev)
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000523 in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Eric Dumazetc148fc22009-11-01 19:23:04 +0000524 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700525 return in_dev;
526}
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800527EXPORT_SYMBOL(inetdev_by_index);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700528
529/* Called only from RTNL semaphored context. No locks. */
530
Al Viro60cad5d2006-09-26 22:17:09 -0700531struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix,
532 __be32 mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700533{
534 ASSERT_RTNL();
535
536 for_primary_ifa(in_dev) {
537 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa))
538 return ifa;
539 } endfor_ifa(in_dev);
540 return NULL;
541}
542
Thomas Graf661d2962013-03-21 07:45:29 +0000543static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700544{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900545 struct net *net = sock_net(skb->sk);
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700546 struct nlattr *tb[IFA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700547 struct in_device *in_dev;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700548 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700549 struct in_ifaddr *ifa, **ifap;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700550 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700551
552 ASSERT_RTNL();
553
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700554 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
555 if (err < 0)
556 goto errout;
557
558 ifm = nlmsg_data(nlh);
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800559 in_dev = inetdev_by_index(net, ifm->ifa_index);
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700560 if (in_dev == NULL) {
561 err = -ENODEV;
562 goto errout;
563 }
564
Linus Torvalds1da177e2005-04-16 15:20:36 -0700565 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
566 ifap = &ifa->ifa_next) {
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700567 if (tb[IFA_LOCAL] &&
Al Viroa7a628c2006-09-26 22:16:43 -0700568 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL]))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700569 continue;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700570
571 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label))
572 continue;
573
574 if (tb[IFA_ADDRESS] &&
575 (ifm->ifa_prefixlen != ifa->ifa_prefixlen ||
Al Viroa7a628c2006-09-26 22:16:43 -0700576 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa)))
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700577 continue;
578
Eric W. Biederman15e47302012-09-07 20:12:54 +0000579 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).portid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580 return 0;
581 }
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700582
583 err = -EADDRNOTAVAIL;
584errout:
585 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586}
587
Jiri Pirko5c766d62013-01-24 09:41:41 +0000588#define INFINITY_LIFE_TIME 0xFFFFFFFF
589
590static void check_lifetime(struct work_struct *work)
591{
592 unsigned long now, next, next_sec, next_sched;
593 struct in_ifaddr *ifa;
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000594 struct hlist_node *n;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000595 int i;
596
597 now = jiffies;
598 next = round_jiffies_up(now + ADDR_CHECK_FREQUENCY);
599
Jiri Pirko5c766d62013-01-24 09:41:41 +0000600 for (i = 0; i < IN4_ADDR_HSIZE; i++) {
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000601 bool change_needed = false;
602
603 rcu_read_lock();
Sasha Levinb67bfe02013-02-27 17:06:00 -0800604 hlist_for_each_entry_rcu(ifa, &inet_addr_lst[i], hash) {
Jiri Pirko5c766d62013-01-24 09:41:41 +0000605 unsigned long age;
606
607 if (ifa->ifa_flags & IFA_F_PERMANENT)
608 continue;
609
610 /* We try to batch several events at once. */
611 age = (now - ifa->ifa_tstamp +
612 ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
613
614 if (ifa->ifa_valid_lft != INFINITY_LIFE_TIME &&
615 age >= ifa->ifa_valid_lft) {
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000616 change_needed = true;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000617 } else if (ifa->ifa_preferred_lft ==
618 INFINITY_LIFE_TIME) {
619 continue;
620 } else if (age >= ifa->ifa_preferred_lft) {
621 if (time_before(ifa->ifa_tstamp +
622 ifa->ifa_valid_lft * HZ, next))
623 next = ifa->ifa_tstamp +
624 ifa->ifa_valid_lft * HZ;
625
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000626 if (!(ifa->ifa_flags & IFA_F_DEPRECATED))
627 change_needed = true;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000628 } else if (time_before(ifa->ifa_tstamp +
629 ifa->ifa_preferred_lft * HZ,
630 next)) {
631 next = ifa->ifa_tstamp +
632 ifa->ifa_preferred_lft * HZ;
633 }
634 }
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000635 rcu_read_unlock();
636 if (!change_needed)
637 continue;
638 rtnl_lock();
639 hlist_for_each_entry_safe(ifa, n, &inet_addr_lst[i], hash) {
640 unsigned long age;
641
642 if (ifa->ifa_flags & IFA_F_PERMANENT)
643 continue;
644
645 /* We try to batch several events at once. */
646 age = (now - ifa->ifa_tstamp +
647 ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
648
649 if (ifa->ifa_valid_lft != INFINITY_LIFE_TIME &&
650 age >= ifa->ifa_valid_lft) {
651 struct in_ifaddr **ifap;
652
653 for (ifap = &ifa->ifa_dev->ifa_list;
654 *ifap != NULL; ifap = &(*ifap)->ifa_next) {
655 if (*ifap == ifa) {
656 inet_del_ifa(ifa->ifa_dev,
657 ifap, 1);
658 break;
659 }
660 }
661 } else if (ifa->ifa_preferred_lft !=
662 INFINITY_LIFE_TIME &&
663 age >= ifa->ifa_preferred_lft &&
664 !(ifa->ifa_flags & IFA_F_DEPRECATED)) {
665 ifa->ifa_flags |= IFA_F_DEPRECATED;
666 rtmsg_ifa(RTM_NEWADDR, ifa, NULL, 0);
667 }
668 }
669 rtnl_unlock();
Jiri Pirko5c766d62013-01-24 09:41:41 +0000670 }
Jiri Pirko5c766d62013-01-24 09:41:41 +0000671
672 next_sec = round_jiffies_up(next);
673 next_sched = next;
674
675 /* If rounded timeout is accurate enough, accept it. */
676 if (time_before(next_sec, next + ADDRCONF_TIMER_FUZZ))
677 next_sched = next_sec;
678
679 now = jiffies;
680 /* And minimum interval is ADDRCONF_TIMER_FUZZ_MAX. */
681 if (time_before(next_sched, now + ADDRCONF_TIMER_FUZZ_MAX))
682 next_sched = now + ADDRCONF_TIMER_FUZZ_MAX;
683
viresh kumar906e0732014-01-22 12:23:32 +0530684 queue_delayed_work(system_power_efficient_wq, &check_lifetime_work,
685 next_sched - now);
Jiri Pirko5c766d62013-01-24 09:41:41 +0000686}
687
688static void set_ifa_lifetime(struct in_ifaddr *ifa, __u32 valid_lft,
689 __u32 prefered_lft)
690{
691 unsigned long timeout;
692
693 ifa->ifa_flags &= ~(IFA_F_PERMANENT | IFA_F_DEPRECATED);
694
695 timeout = addrconf_timeout_fixup(valid_lft, HZ);
696 if (addrconf_finite_timeout(timeout))
697 ifa->ifa_valid_lft = timeout;
698 else
699 ifa->ifa_flags |= IFA_F_PERMANENT;
700
701 timeout = addrconf_timeout_fixup(prefered_lft, HZ);
702 if (addrconf_finite_timeout(timeout)) {
703 if (timeout == 0)
704 ifa->ifa_flags |= IFA_F_DEPRECATED;
705 ifa->ifa_preferred_lft = timeout;
706 }
707 ifa->ifa_tstamp = jiffies;
708 if (!ifa->ifa_cstamp)
709 ifa->ifa_cstamp = ifa->ifa_tstamp;
710}
711
712static struct in_ifaddr *rtm_to_ifaddr(struct net *net, struct nlmsghdr *nlh,
713 __u32 *pvalid_lft, __u32 *pprefered_lft)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700714{
Thomas Graf5c753972006-08-04 23:03:53 -0700715 struct nlattr *tb[IFA_MAX+1];
716 struct in_ifaddr *ifa;
717 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 struct net_device *dev;
719 struct in_device *in_dev;
Denis V. Lunev7b218572008-01-31 18:47:00 -0800720 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700721
Thomas Graf5c753972006-08-04 23:03:53 -0700722 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
723 if (err < 0)
724 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700725
Thomas Graf5c753972006-08-04 23:03:53 -0700726 ifm = nlmsg_data(nlh);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800727 err = -EINVAL;
728 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700729 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700730
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -0800731 dev = __dev_get_by_index(net, ifm->ifa_index);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800732 err = -ENODEV;
733 if (dev == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700734 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735
Thomas Graf5c753972006-08-04 23:03:53 -0700736 in_dev = __in_dev_get_rtnl(dev);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800737 err = -ENOBUFS;
738 if (in_dev == NULL)
Herbert Xu71e27da2007-06-04 23:36:06 -0700739 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700740
Thomas Graf5c753972006-08-04 23:03:53 -0700741 ifa = inet_alloc_ifa();
Denis V. Lunev7b218572008-01-31 18:47:00 -0800742 if (ifa == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700743 /*
744 * A potential indev allocation can be left alive, it stays
745 * assigned to its device and is destroy with it.
746 */
Thomas Graf5c753972006-08-04 23:03:53 -0700747 goto errout;
Thomas Graf5c753972006-08-04 23:03:53 -0700748
Pavel Emelyanova4e65d32007-12-07 23:55:43 -0800749 ipv4_devconf_setall(in_dev);
Jiri Pirko1d4c8c22013-12-07 19:26:56 +0100750 neigh_parms_data_state_setall(in_dev->arp_parms);
Thomas Graf5c753972006-08-04 23:03:53 -0700751 in_dev_hold(in_dev);
752
753 if (tb[IFA_ADDRESS] == NULL)
754 tb[IFA_ADDRESS] = tb[IFA_LOCAL];
755
David S. Millerfd23c3b2011-02-18 12:42:28 -0800756 INIT_HLIST_NODE(&ifa->hash);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700757 ifa->ifa_prefixlen = ifm->ifa_prefixlen;
758 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen);
Jiri Pirkoad6c8132013-12-08 12:16:10 +0100759 ifa->ifa_flags = tb[IFA_FLAGS] ? nla_get_u32(tb[IFA_FLAGS]) :
760 ifm->ifa_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761 ifa->ifa_scope = ifm->ifa_scope;
Thomas Graf5c753972006-08-04 23:03:53 -0700762 ifa->ifa_dev = in_dev;
763
Al Viroa7a628c2006-09-26 22:16:43 -0700764 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]);
765 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]);
Thomas Graf5c753972006-08-04 23:03:53 -0700766
767 if (tb[IFA_BROADCAST])
Al Viroa7a628c2006-09-26 22:16:43 -0700768 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]);
Thomas Graf5c753972006-08-04 23:03:53 -0700769
Thomas Graf5c753972006-08-04 23:03:53 -0700770 if (tb[IFA_LABEL])
771 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772 else
773 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
774
Jiri Pirko5c766d62013-01-24 09:41:41 +0000775 if (tb[IFA_CACHEINFO]) {
776 struct ifa_cacheinfo *ci;
777
778 ci = nla_data(tb[IFA_CACHEINFO]);
779 if (!ci->ifa_valid || ci->ifa_prefered > ci->ifa_valid) {
780 err = -EINVAL;
Daniel Borkmann446266b2013-08-02 11:32:43 +0200781 goto errout_free;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000782 }
783 *pvalid_lft = ci->ifa_valid;
784 *pprefered_lft = ci->ifa_prefered;
785 }
786
Thomas Graf5c753972006-08-04 23:03:53 -0700787 return ifa;
788
Daniel Borkmann446266b2013-08-02 11:32:43 +0200789errout_free:
790 inet_free_ifa(ifa);
Thomas Graf5c753972006-08-04 23:03:53 -0700791errout:
792 return ERR_PTR(err);
793}
794
Jiri Pirko5c766d62013-01-24 09:41:41 +0000795static struct in_ifaddr *find_matching_ifa(struct in_ifaddr *ifa)
796{
797 struct in_device *in_dev = ifa->ifa_dev;
798 struct in_ifaddr *ifa1, **ifap;
799
800 if (!ifa->ifa_local)
801 return NULL;
802
803 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
804 ifap = &ifa1->ifa_next) {
805 if (ifa1->ifa_mask == ifa->ifa_mask &&
806 inet_ifa_match(ifa1->ifa_address, ifa) &&
807 ifa1->ifa_local == ifa->ifa_local)
808 return ifa1;
809 }
810 return NULL;
811}
812
Thomas Graf661d2962013-03-21 07:45:29 +0000813static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh)
Thomas Graf5c753972006-08-04 23:03:53 -0700814{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900815 struct net *net = sock_net(skb->sk);
Thomas Graf5c753972006-08-04 23:03:53 -0700816 struct in_ifaddr *ifa;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000817 struct in_ifaddr *ifa_existing;
818 __u32 valid_lft = INFINITY_LIFE_TIME;
819 __u32 prefered_lft = INFINITY_LIFE_TIME;
Thomas Graf5c753972006-08-04 23:03:53 -0700820
821 ASSERT_RTNL();
822
Jiri Pirko5c766d62013-01-24 09:41:41 +0000823 ifa = rtm_to_ifaddr(net, nlh, &valid_lft, &prefered_lft);
Thomas Graf5c753972006-08-04 23:03:53 -0700824 if (IS_ERR(ifa))
825 return PTR_ERR(ifa);
826
Jiri Pirko5c766d62013-01-24 09:41:41 +0000827 ifa_existing = find_matching_ifa(ifa);
828 if (!ifa_existing) {
829 /* It would be best to check for !NLM_F_CREATE here but
stephen hemminger614d0562014-05-16 20:46:58 -0700830 * userspace already relies on not having to provide this.
Jiri Pirko5c766d62013-01-24 09:41:41 +0000831 */
832 set_ifa_lifetime(ifa, valid_lft, prefered_lft);
833 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).portid);
834 } else {
835 inet_free_ifa(ifa);
836
837 if (nlh->nlmsg_flags & NLM_F_EXCL ||
838 !(nlh->nlmsg_flags & NLM_F_REPLACE))
839 return -EEXIST;
Jiri Pirko34e2ed32013-04-04 08:33:00 +0000840 ifa = ifa_existing;
841 set_ifa_lifetime(ifa, valid_lft, prefered_lft);
Jiri Pirko05a324b2013-04-04 23:39:38 +0000842 cancel_delayed_work(&check_lifetime_work);
viresh kumar906e0732014-01-22 12:23:32 +0530843 queue_delayed_work(system_power_efficient_wq,
844 &check_lifetime_work, 0);
Jiri Pirko34e2ed32013-04-04 08:33:00 +0000845 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, NETLINK_CB(skb).portid);
846 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Jiri Pirko5c766d62013-01-24 09:41:41 +0000847 }
848 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700849}
850
851/*
852 * Determine a default network mask, based on the IP address.
853 */
854
Eric Dumazet40384992012-08-03 21:06:50 +0000855static int inet_abc_len(__be32 addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700856{
857 int rc = -1; /* Something else, probably a multicast. */
858
Joe Perchesf97c1e02007-12-16 13:45:43 -0800859 if (ipv4_is_zeronet(addr))
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900860 rc = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700861 else {
Al Viro714e85b2006-11-14 20:51:49 -0800862 __u32 haddr = ntohl(addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700863
Al Viro714e85b2006-11-14 20:51:49 -0800864 if (IN_CLASSA(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700865 rc = 8;
Al Viro714e85b2006-11-14 20:51:49 -0800866 else if (IN_CLASSB(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700867 rc = 16;
Al Viro714e85b2006-11-14 20:51:49 -0800868 else if (IN_CLASSC(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700869 rc = 24;
870 }
871
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900872 return rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700873}
874
875
/*
 * Handle the IPv4 interface-address ioctls.
 *
 * @net: namespace used for the device lookup and the capability check
 * @cmd: one of SIOCGIF{ADDR,BRDADDR,DSTADDR,NETMASK} or
 *       SIOCSIF{FLAGS,ADDR,BRDADDR,DSTADDR,NETMASK}; anything else is -EINVAL
 * @arg: user pointer to a struct ifreq; ifr_name may be "dev" or "dev:alias"
 *
 * Returns 0 on success or a negative errno:
 *   -EFAULT         copying the ifreq from/to user space failed
 *   -EPERM          a set operation without CAP_NET_ADMIN in net->user_ns
 *   -EINVAL         unknown cmd, non-AF_INET family on a set operation, or
 *                   an address/mask rejected by inet_abc_len()/bad_mask()
 *   -ENODEV         no device with the (un-aliased) name
 *   -EADDRNOTAVAIL  no matching address, for commands that need one
 *   -ENOBUFS        allocating a new address failed (SIOCSIFADDR)
 * or whatever dev_change_flags()/inet_set_ifa() return.
 */
int devinet_ioctl(struct net *net, unsigned int cmd, void __user *arg)
{
	struct ifreq ifr;
	struct sockaddr_in sin_orig;
	struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr;
	struct in_device *in_dev;
	struct in_ifaddr **ifap = NULL;
	struct in_ifaddr *ifa = NULL;
	struct net_device *dev;
	char *colon;
	int ret = -EFAULT;
	int tryaddrmatch = 0;

	/*
	 *	Fetch the caller's info block into kernel space
	 */

	if (copy_from_user(&ifr, arg, sizeof(struct ifreq)))
		goto out;
	/* Force NUL termination of the user-supplied name */
	ifr.ifr_name[IFNAMSIZ - 1] = 0;

	/* save original address for comparison */
	memcpy(&sin_orig, sin, sizeof(*sin));

	/*
	 * Temporarily cut an alias suffix ("eth0:1" -> "eth0") so that module
	 * loading and the device lookup below use the plain device name.
	 */
	colon = strchr(ifr.ifr_name, ':');
	if (colon)
		*colon = 0;

	dev_load(net, ifr.ifr_name);

	/* First pass: per-command permission and argument checks, no locks held */
	switch (cmd) {
	case SIOCGIFADDR:	/* Get interface address */
	case SIOCGIFBRDADDR:	/* Get the broadcast address */
	case SIOCGIFDSTADDR:	/* Get the destination address */
	case SIOCGIFNETMASK:	/* Get the netmask for the interface */
		/* Note that these ioctls will not sleep,
		   so that we do not impose a lock.
		   One day we will be forced to put shlock here (I mean SMP)
		 */
		/* Only trust the passed-in address for matching if it is AF_INET */
		tryaddrmatch = (sin_orig.sin_family == AF_INET);
		/* Reset the reply slot; the second switch fills in the address */
		memset(sin, 0, sizeof(*sin));
		sin->sin_family = AF_INET;
		break;

	case SIOCSIFFLAGS:
		ret = -EPERM;
		if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
			goto out;
		break;
	case SIOCSIFADDR:	/* Set interface address (and family) */
	case SIOCSIFBRDADDR:	/* Set the broadcast address */
	case SIOCSIFDSTADDR:	/* Set the destination address */
	case SIOCSIFNETMASK:	/* Set the netmask for the interface */
		ret = -EPERM;
		if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
			goto out;
		ret = -EINVAL;
		if (sin->sin_family != AF_INET)
			goto out;
		break;
	default:
		ret = -EINVAL;
		goto out;
	}

	/* Device lookup and all address manipulation below run under rtnl_lock() */
	rtnl_lock();

	ret = -ENODEV;
	dev = __dev_get_by_name(net, ifr.ifr_name);
	if (!dev)
		goto done;

	/* Restore the full "dev:alias" name for the label comparisons below */
	if (colon)
		*colon = ':';

	in_dev = __in_dev_get_rtnl(dev);
	if (in_dev) {
		if (tryaddrmatch) {
			/* Matthias Andree */
			/* compare label and address (4.4BSD style) */
			/* note: we only do this for a limited set of ioctls
			   and only if the original address family was AF_INET.
			   This is checked above. */
			for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
			     ifap = &ifa->ifa_next) {
				if (!strcmp(ifr.ifr_name, ifa->ifa_label) &&
				    sin_orig.sin_addr.s_addr ==
							ifa->ifa_local) {
					break; /* found */
				}
			}
		}
		/* we didn't get a match, maybe the application is
		   4.3BSD-style and passed in junk so we fall back to
		   comparing just the label */
		if (!ifa) {
			for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
			     ifap = &ifa->ifa_next)
				if (!strcmp(ifr.ifr_name, ifa->ifa_label))
					break;
		}
	}

	/*
	 * Every command except SIOCSIFADDR (which may create the address) and
	 * SIOCSIFFLAGS (which may act on the whole device) needs a match.
	 * When a match was found, ifap points at the list link that refers
	 * to ifa, which is what inet_del_ifa() is given below.
	 */
	ret = -EADDRNOTAVAIL;
	if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS)
		goto done;

	/* Second pass: perform the operation */
	switch (cmd) {
	case SIOCGIFADDR:	/* Get interface address */
		sin->sin_addr.s_addr = ifa->ifa_local;
		goto rarok;

	case SIOCGIFBRDADDR:	/* Get the broadcast address */
		sin->sin_addr.s_addr = ifa->ifa_broadcast;
		goto rarok;

	case SIOCGIFDSTADDR:	/* Get the destination address */
		sin->sin_addr.s_addr = ifa->ifa_address;
		goto rarok;

	case SIOCGIFNETMASK:	/* Get the netmask for the interface */
		sin->sin_addr.s_addr = ifa->ifa_mask;
		goto rarok;

	case SIOCSIFFLAGS:
		/*
		 * On an alias name only the IFF_UP bit is looked at: clearing
		 * it deletes that one address.  Without an alias the flags
		 * are applied to the device itself.
		 */
		if (colon) {
			ret = -EADDRNOTAVAIL;
			if (!ifa)
				break;
			ret = 0;
			if (!(ifr.ifr_flags & IFF_UP))
				inet_del_ifa(in_dev, ifap, 1);
			break;
		}
		ret = dev_change_flags(dev, ifr.ifr_flags);
		break;

	case SIOCSIFADDR:	/* Set interface address (and family) */
		/* Reject addresses for which no classful default mask exists */
		ret = -EINVAL;
		if (inet_abc_len(sin->sin_addr.s_addr) < 0)
			break;

		if (!ifa) {
			/* No address under this label yet: create one */
			ret = -ENOBUFS;
			ifa = inet_alloc_ifa();
			if (!ifa)
				break;
			INIT_HLIST_NODE(&ifa->hash);
			if (colon)
				memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ);
			else
				memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
		} else {
			/* Same address already set: nothing to do */
			ret = 0;
			if (ifa->ifa_local == sin->sin_addr.s_addr)
				break;
			/* Unlink the entry so it can be modified and re-added */
			inet_del_ifa(in_dev, ifap, 0);
			ifa->ifa_broadcast = 0;
			ifa->ifa_scope = 0;
		}

		ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr;

		if (!(dev->flags & IFF_POINTOPOINT)) {
			/* Derive the default mask, and broadcast when it makes sense */
			ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address);
			ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen);
			if ((dev->flags & IFF_BROADCAST) &&
			    ifa->ifa_prefixlen < 31)
				ifa->ifa_broadcast = ifa->ifa_address |
						     ~ifa->ifa_mask;
		} else {
			/* Point-to-point devices get a /32 */
			ifa->ifa_prefixlen = 32;
			ifa->ifa_mask = inet_make_mask(32);
		}
		set_ifa_lifetime(ifa, INFINITY_LIFE_TIME, INFINITY_LIFE_TIME);
		ret = inet_set_ifa(dev, ifa);
		break;

	case SIOCSIFBRDADDR:	/* Set the broadcast address */
		ret = 0;
		if (ifa->ifa_broadcast != sin->sin_addr.s_addr) {
			/* Remove, modify, re-insert */
			inet_del_ifa(in_dev, ifap, 0);
			ifa->ifa_broadcast = sin->sin_addr.s_addr;
			inet_insert_ifa(ifa);
		}
		break;

	case SIOCSIFDSTADDR:	/* Set the destination address */
		ret = 0;
		if (ifa->ifa_address == sin->sin_addr.s_addr)
			break;
		ret = -EINVAL;
		if (inet_abc_len(sin->sin_addr.s_addr) < 0)
			break;
		ret = 0;
		inet_del_ifa(in_dev, ifap, 0);
		ifa->ifa_address = sin->sin_addr.s_addr;
		inet_insert_ifa(ifa);
		break;

	case SIOCSIFNETMASK: 	/* Set the netmask for the interface */

		/*
		 *	The mask we set must be legal.
		 */
		ret = -EINVAL;
		if (bad_mask(sin->sin_addr.s_addr, 0))
			break;
		ret = 0;
		if (ifa->ifa_mask != sin->sin_addr.s_addr) {
			__be32 old_mask = ifa->ifa_mask;
			inet_del_ifa(in_dev, ifap, 0);
			ifa->ifa_mask = sin->sin_addr.s_addr;
			ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask);

			/* See if current broadcast address matches
			 * with current netmask, then recalculate
			 * the broadcast address. Otherwise it's a
			 * funny address, so don't touch it since
			 * the user seems to know what (s)he's doing...
			 */
			if ((dev->flags & IFF_BROADCAST) &&
			    (ifa->ifa_prefixlen < 31) &&
			    (ifa->ifa_broadcast ==
			     (ifa->ifa_local|~old_mask))) {
				ifa->ifa_broadcast = (ifa->ifa_local |
						      ~sin->sin_addr.s_addr);
			}
			inet_insert_ifa(ifa);
		}
		break;
	}
done:
	rtnl_unlock();
out:
	return ret;
rarok:
	/* "Get" commands: drop the lock, then copy the filled-in ifreq back */
	rtnl_unlock();
	ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0;
	goto out;
}
1117
1118static int inet_gifconf(struct net_device *dev, char __user *buf, int len)
1119{
Herbert Xue5ed6392005-10-03 14:35:55 -07001120 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001121 struct in_ifaddr *ifa;
1122 struct ifreq ifr;
1123 int done = 0;
1124
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001125 if (!in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001126 goto out;
1127
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001128 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001129 if (!buf) {
1130 done += sizeof(ifr);
1131 continue;
1132 }
1133 if (len < (int) sizeof(ifr))
1134 break;
1135 memset(&ifr, 0, sizeof(struct ifreq));
Dan Carpenter4299c8a2013-07-29 22:15:19 +03001136 strcpy(ifr.ifr_name, ifa->ifa_label);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001137
1138 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET;
1139 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr =
1140 ifa->ifa_local;
1141
1142 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) {
1143 done = -EFAULT;
1144 break;
1145 }
1146 buf += sizeof(struct ifreq);
1147 len -= sizeof(struct ifreq);
1148 done += sizeof(struct ifreq);
1149 }
1150out:
1151 return done;
1152}
1153
Al Viroa61ced52006-09-26 21:27:54 -07001154__be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001155{
Al Viroa61ced52006-09-26 21:27:54 -07001156 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001157 struct in_device *in_dev;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001158 struct net *net = dev_net(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001159
1160 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -07001161 in_dev = __in_dev_get_rcu(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001162 if (!in_dev)
1163 goto no_in_dev;
1164
1165 for_primary_ifa(in_dev) {
1166 if (ifa->ifa_scope > scope)
1167 continue;
1168 if (!dst || inet_ifa_match(dst, ifa)) {
1169 addr = ifa->ifa_local;
1170 break;
1171 }
1172 if (!addr)
1173 addr = ifa->ifa_local;
1174 } endfor_ifa(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001175
1176 if (addr)
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001177 goto out_unlock;
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001178no_in_dev:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001179
1180 /* Not loopback addresses on loopback should be preferred
1181 in this case. It is importnat that lo is the first interface
1182 in dev_base list.
1183 */
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001184 for_each_netdev_rcu(net, dev) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001185 in_dev = __in_dev_get_rcu(dev);
1186 if (!in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001187 continue;
1188
1189 for_primary_ifa(in_dev) {
1190 if (ifa->ifa_scope != RT_SCOPE_LINK &&
1191 ifa->ifa_scope <= scope) {
1192 addr = ifa->ifa_local;
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001193 goto out_unlock;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001194 }
1195 } endfor_ifa(in_dev);
1196 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001197out_unlock:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001198 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001199 return addr;
1200}
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001201EXPORT_SYMBOL(inet_select_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001202
/*
 * Per-device worker for inet_confirm_addr().
 *
 * Walks the addresses of @in_dev tracking two things:
 *   addr - a candidate local address: the first entry whose ifa_local equals
 *          @local (or any entry when @local is 0) and whose scope is <= @scope
 *   same - whether some entry passed the inet_ifa_match() tests for both
 *          @local and @dst (a 0 value for either always passes)
 *
 * Returns addr if the walk ended with 'same' set, otherwise 0.
 */
static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst,
				 __be32 local, int scope)
{
	int same = 0;
	__be32 addr = 0;

	for_ifa(in_dev) {
		/* Pick the first acceptable local address, only once */
		if (!addr &&
		    (local == ifa->ifa_local || !local) &&
		    ifa->ifa_scope <= scope) {
			addr = ifa->ifa_local;
			/* A matching entry was already seen earlier: done */
			if (same)
				break;
		}
		if (!same) {
			same = (!local || inet_ifa_match(local, ifa)) &&
				(!dst || inet_ifa_match(dst, ifa));
			if (same && addr) {
				/* Explicit local, or no dst constraint: accept */
				if (local || !dst)
					break;
				/* Is the selected addr into dst subnet? */
				if (inet_ifa_match(addr, ifa))
					break;
				/* No, then can we use new local src? */
				if (ifa->ifa_scope <= scope) {
					addr = ifa->ifa_local;
					break;
				}
				/* search for large dst subnet for addr */
				same = 0;
			}
		}
	} endfor_ifa(in_dev);

	return same ? addr : 0;
}
1239
1240/*
1241 * Confirm that local IP address exists using wildcards:
Nicolas Dichtelb601fa12013-12-10 15:02:40 +01001242 * - net: netns to check, cannot be NULL
1243 * - in_dev: only on this interface, NULL=any interface
Linus Torvalds1da177e2005-04-16 15:20:36 -07001244 * - dst: only in the same subnet as dst, 0=any dst
1245 * - local: address, 0=autoselect the local address
1246 * - scope: maximum allowed scope value for the local address
1247 */
Nicolas Dichtelb601fa12013-12-10 15:02:40 +01001248__be32 inet_confirm_addr(struct net *net, struct in_device *in_dev,
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001249 __be32 dst, __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001250{
Al Viro60cad5d2006-09-26 22:17:09 -07001251 __be32 addr = 0;
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001252 struct net_device *dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001253
Nicolas Dichtelb601fa12013-12-10 15:02:40 +01001254 if (in_dev != NULL)
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001255 return confirm_addr_indev(in_dev, dst, local, scope);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001256
Linus Torvalds1da177e2005-04-16 15:20:36 -07001257 rcu_read_lock();
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001258 for_each_netdev_rcu(net, dev) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001259 in_dev = __in_dev_get_rcu(dev);
1260 if (in_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001261 addr = confirm_addr_indev(in_dev, dst, local, scope);
1262 if (addr)
1263 break;
1264 }
1265 }
1266 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001267
1268 return addr;
1269}
Andy Gospodarekeaddcd72012-03-22 16:14:29 +00001270EXPORT_SYMBOL(inet_confirm_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001271
/*
 *	Device notifier
 */

/*
 * Add @nb to inetaddr_chain, the blocking notifier chain this file invokes
 * with an in_ifaddr as payload (e.g. NETDEV_UP on an address replace).
 * Returns whatever blocking_notifier_chain_register() returns.
 */
int register_inetaddr_notifier(struct notifier_block *nb)
{
	return blocking_notifier_chain_register(&inetaddr_chain, nb);
}
EXPORT_SYMBOL(register_inetaddr_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001281
/*
 * Remove @nb from inetaddr_chain.
 * Returns whatever blocking_notifier_chain_unregister() returns.
 */
int unregister_inetaddr_notifier(struct notifier_block *nb)
{
	return blocking_notifier_chain_unregister(&inetaddr_chain, nb);
}
EXPORT_SYMBOL(unregister_inetaddr_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001288/* Rename ifa_labels for a device name change. Make some effort to preserve
1289 * existing alias numbering and to create unique labels if possible.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001290*/
1291static void inetdev_changename(struct net_device *dev, struct in_device *in_dev)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001292{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293 struct in_ifaddr *ifa;
1294 int named = 0;
1295
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001296 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
1297 char old[IFNAMSIZ], *dot;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001298
1299 memcpy(old, ifa->ifa_label, IFNAMSIZ);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001300 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001301 if (named++ == 0)
Thomas Graf573bf472008-06-10 15:40:04 -07001302 goto skip;
Mark McLoughlin44344b22008-01-04 00:56:25 -08001303 dot = strchr(old, ':');
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001304 if (dot == NULL) {
1305 sprintf(old, ":%d", named);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001306 dot = old;
1307 }
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001308 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001309 strcat(ifa->ifa_label, dot);
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001310 else
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001311 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot);
Thomas Graf573bf472008-06-10 15:40:04 -07001312skip:
1313 rtmsg_ifa(RTM_NEWADDR, ifa, NULL, 0);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001314 }
1315}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001316
/* Tell whether @mtu is large enough (at least 68 bytes) for IPv4 on a device. */
static bool inetdev_valid_mtu(unsigned int mtu)
{
	enum { min_ipv4_mtu = 68 };

	return !(mtu < min_ipv4_mtu);
}
1321
Ian Campbelld11327ad2011-02-11 07:44:16 +00001322static void inetdev_send_gratuitous_arp(struct net_device *dev,
1323 struct in_device *in_dev)
1324
1325{
Zoltan Kissb76d0782011-07-24 13:09:30 +00001326 struct in_ifaddr *ifa;
Ian Campbelld11327ad2011-02-11 07:44:16 +00001327
Zoltan Kissb76d0782011-07-24 13:09:30 +00001328 for (ifa = in_dev->ifa_list; ifa;
1329 ifa = ifa->ifa_next) {
1330 arp_send(ARPOP_REQUEST, ETH_P_ARP,
1331 ifa->ifa_local, dev,
1332 ifa->ifa_local, NULL,
1333 dev->dev_addr, NULL);
1334 }
Ian Campbelld11327ad2011-02-11 07:44:16 +00001335}
1336
/* Called only under RTNL semaphore */

/*
 * Netdevice notifier callback: keeps the IPv4 per-device state (in_device)
 * in step with device lifecycle events.
 *
 * Returns NOTIFY_DONE, except when creating the in_device on
 * NETDEV_REGISTER fails, in which case notifier_from_errno(-ENOMEM) is
 * returned.
 */
static int inetdev_event(struct notifier_block *this, unsigned long event,
			 void *ptr)
{
	struct net_device *dev = netdev_notifier_info_to_dev(ptr);
	struct in_device *in_dev = __in_dev_get_rtnl(dev);

	ASSERT_RTNL();

	/* No IPv4 state yet: only events that may create it are of interest */
	if (!in_dev) {
		if (event == NETDEV_REGISTER) {
			in_dev = inetdev_init(dev);
			if (!in_dev)
				return notifier_from_errno(-ENOMEM);
			if (dev->flags & IFF_LOOPBACK) {
				IN_DEV_CONF_SET(in_dev, NOXFRM, 1);
				IN_DEV_CONF_SET(in_dev, NOPOLICY, 1);
			}
		} else if (event == NETDEV_CHANGEMTU) {
			/* Re-enabling IP */
			/* (a failure of inetdev_init() is not reported here) */
			if (inetdev_valid_mtu(dev->mtu))
				in_dev = inetdev_init(dev);
		}
		goto out;
	}

	switch (event) {
	case NETDEV_REGISTER:
		/* Registering a device that already has an in_device is unexpected */
		pr_debug("%s: bug\n", __func__);
		RCU_INIT_POINTER(dev->ip_ptr, NULL);
		break;
	case NETDEV_UP:
		if (!inetdev_valid_mtu(dev->mtu))
			break;
		if (dev->flags & IFF_LOOPBACK) {
			/*
			 * Give the loopback device its INADDR_LOOPBACK/8
			 * host-scope address; silently skipped if the
			 * allocation fails.
			 */
			struct in_ifaddr *ifa = inet_alloc_ifa();

			if (ifa) {
				INIT_HLIST_NODE(&ifa->hash);
				ifa->ifa_local =
				  ifa->ifa_address = htonl(INADDR_LOOPBACK);
				ifa->ifa_prefixlen = 8;
				ifa->ifa_mask = inet_make_mask(8);
				in_dev_hold(in_dev);
				ifa->ifa_dev = in_dev;
				ifa->ifa_scope = RT_SCOPE_HOST;
				memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
				set_ifa_lifetime(ifa, INFINITY_LIFE_TIME,
						 INFINITY_LIFE_TIME);
				ipv4_devconf_setall(in_dev);
				neigh_parms_data_state_setall(in_dev->arp_parms);
				inet_insert_ifa(ifa);
			}
		}
		ip_mc_up(in_dev);
		/* fall through */
	case NETDEV_CHANGEADDR:
		/* Only announce ourselves when arp_notify is enabled */
		if (!IN_DEV_ARP_NOTIFY(in_dev))
			break;
		/* fall through */
	case NETDEV_NOTIFY_PEERS:
		/* Send gratuitous ARP to notify of link change */
		inetdev_send_gratuitous_arp(dev, in_dev);
		break;
	case NETDEV_DOWN:
		ip_mc_down(in_dev);
		break;
	case NETDEV_PRE_TYPE_CHANGE:
		ip_mc_unmap(in_dev);
		break;
	case NETDEV_POST_TYPE_CHANGE:
		ip_mc_remap(in_dev);
		break;
	case NETDEV_CHANGEMTU:
		if (inetdev_valid_mtu(dev->mtu))
			break;
		/* disable IP when MTU is not enough */
		/* fall through */
	case NETDEV_UNREGISTER:
		inetdev_destroy(in_dev);
		break;
	case NETDEV_CHANGENAME:
		/* Do not notify about label change, this event is
		 * not interesting to applications using netlink.
		 *
		 * NOTE(review): inetdev_changename() does send RTM_NEWADDR
		 * for every address, so "do not notify" presumably refers
		 * to the inetaddr notifier chain only - confirm.
		 */
		inetdev_changename(dev, in_dev);

		/* Re-register so the sysctl entries follow the new device name */
		devinet_sysctl_unregister(in_dev);
		devinet_sysctl_register(in_dev);
		break;
	}
out:
	return NOTIFY_DONE;
}
1431
/*
 * Notifier block that delivers netdevice events to inetdev_event().
 * Its registration is not part of this section of the file.
 */
static struct notifier_block ip_netdev_notifier = {
	.notifier_call = inetdev_event,
};
1435
Eric Dumazet40384992012-08-03 21:06:50 +00001436static size_t inet_nlmsg_size(void)
Thomas Graf339bf982006-11-10 14:10:15 -08001437{
1438 return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
1439 + nla_total_size(4) /* IFA_ADDRESS */
1440 + nla_total_size(4) /* IFA_LOCAL */
1441 + nla_total_size(4) /* IFA_BROADCAST */
Jiri Pirkoad6c8132013-12-08 12:16:10 +01001442 + nla_total_size(IFNAMSIZ) /* IFA_LABEL */
Geert Uytterhoeven63b5f152014-02-05 08:38:25 +01001443 + nla_total_size(4) /* IFA_FLAGS */
1444 + nla_total_size(sizeof(struct ifa_cacheinfo)); /* IFA_CACHEINFO */
Thomas Graf339bf982006-11-10 14:10:15 -08001445}
1446
Jiri Pirko5c766d62013-01-24 09:41:41 +00001447static inline u32 cstamp_delta(unsigned long cstamp)
1448{
1449 return (cstamp - INITIAL_JIFFIES) * 100UL / HZ;
1450}
1451
1452static int put_cacheinfo(struct sk_buff *skb, unsigned long cstamp,
1453 unsigned long tstamp, u32 preferred, u32 valid)
1454{
1455 struct ifa_cacheinfo ci;
1456
1457 ci.cstamp = cstamp_delta(cstamp);
1458 ci.tstamp = cstamp_delta(tstamp);
1459 ci.ifa_prefered = preferred;
1460 ci.ifa_valid = valid;
1461
1462 return nla_put(skb, IFA_CACHEINFO, sizeof(ci), &ci);
1463}
1464
Linus Torvalds1da177e2005-04-16 15:20:36 -07001465static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001466 u32 portid, u32 seq, int event, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001467{
1468 struct ifaddrmsg *ifm;
1469 struct nlmsghdr *nlh;
Jiri Pirko5c766d62013-01-24 09:41:41 +00001470 u32 preferred, valid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001471
Eric W. Biederman15e47302012-09-07 20:12:54 +00001472 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*ifm), flags);
Thomas Graf47f68512006-08-04 23:04:36 -07001473 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001474 return -EMSGSIZE;
Thomas Graf47f68512006-08-04 23:04:36 -07001475
1476 ifm = nlmsg_data(nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001477 ifm->ifa_family = AF_INET;
1478 ifm->ifa_prefixlen = ifa->ifa_prefixlen;
Jiri Pirko5c766d62013-01-24 09:41:41 +00001479 ifm->ifa_flags = ifa->ifa_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001480 ifm->ifa_scope = ifa->ifa_scope;
1481 ifm->ifa_index = ifa->ifa_dev->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001482
Jiri Pirko5c766d62013-01-24 09:41:41 +00001483 if (!(ifm->ifa_flags & IFA_F_PERMANENT)) {
1484 preferred = ifa->ifa_preferred_lft;
1485 valid = ifa->ifa_valid_lft;
1486 if (preferred != INFINITY_LIFE_TIME) {
1487 long tval = (jiffies - ifa->ifa_tstamp) / HZ;
1488
1489 if (preferred > tval)
1490 preferred -= tval;
1491 else
1492 preferred = 0;
1493 if (valid != INFINITY_LIFE_TIME) {
1494 if (valid > tval)
1495 valid -= tval;
1496 else
1497 valid = 0;
1498 }
1499 }
1500 } else {
1501 preferred = INFINITY_LIFE_TIME;
1502 valid = INFINITY_LIFE_TIME;
1503 }
David S. Millerf3756b72012-04-01 20:39:02 -04001504 if ((ifa->ifa_address &&
1505 nla_put_be32(skb, IFA_ADDRESS, ifa->ifa_address)) ||
1506 (ifa->ifa_local &&
1507 nla_put_be32(skb, IFA_LOCAL, ifa->ifa_local)) ||
1508 (ifa->ifa_broadcast &&
1509 nla_put_be32(skb, IFA_BROADCAST, ifa->ifa_broadcast)) ||
1510 (ifa->ifa_label[0] &&
Jiri Pirko5c766d62013-01-24 09:41:41 +00001511 nla_put_string(skb, IFA_LABEL, ifa->ifa_label)) ||
Jiri Pirkoad6c8132013-12-08 12:16:10 +01001512 nla_put_u32(skb, IFA_FLAGS, ifa->ifa_flags) ||
Jiri Pirko5c766d62013-01-24 09:41:41 +00001513 put_cacheinfo(skb, ifa->ifa_cstamp, ifa->ifa_tstamp,
1514 preferred, valid))
David S. Millerf3756b72012-04-01 20:39:02 -04001515 goto nla_put_failure;
Thomas Graf47f68512006-08-04 23:04:36 -07001516
1517 return nlmsg_end(skb, nlh);
1518
1519nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08001520 nlmsg_cancel(skb, nlh);
1521 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001522}
1523
1524static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
1525{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001526 struct net *net = sock_net(skb->sk);
Eric Dumazeteec4df92009-11-12 07:44:25 +00001527 int h, s_h;
1528 int idx, s_idx;
1529 int ip_idx, s_ip_idx;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001530 struct net_device *dev;
1531 struct in_device *in_dev;
1532 struct in_ifaddr *ifa;
Eric Dumazeteec4df92009-11-12 07:44:25 +00001533 struct hlist_head *head;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001534
Eric Dumazeteec4df92009-11-12 07:44:25 +00001535 s_h = cb->args[0];
1536 s_idx = idx = cb->args[1];
1537 s_ip_idx = ip_idx = cb->args[2];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001538
Eric Dumazeteec4df92009-11-12 07:44:25 +00001539 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
1540 idx = 0;
1541 head = &net->dev_index_head[h];
1542 rcu_read_lock();
Nicolas Dichtel04652772013-03-22 06:28:42 +00001543 cb->seq = atomic_read(&net->ipv4.dev_addr_genid) ^
1544 net->dev_base_seq;
Sasha Levinb67bfe02013-02-27 17:06:00 -08001545 hlist_for_each_entry_rcu(dev, head, index_hlist) {
Eric Dumazeteec4df92009-11-12 07:44:25 +00001546 if (idx < s_idx)
1547 goto cont;
Patrick McHardy4b97efd2010-03-26 20:27:49 -07001548 if (h > s_h || idx > s_idx)
Eric Dumazeteec4df92009-11-12 07:44:25 +00001549 s_ip_idx = 0;
1550 in_dev = __in_dev_get_rcu(dev);
1551 if (!in_dev)
1552 goto cont;
1553
1554 for (ifa = in_dev->ifa_list, ip_idx = 0; ifa;
1555 ifa = ifa->ifa_next, ip_idx++) {
1556 if (ip_idx < s_ip_idx)
1557 continue;
1558 if (inet_fill_ifaddr(skb, ifa,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001559 NETLINK_CB(cb->skb).portid,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001560 cb->nlh->nlmsg_seq,
Eric Dumazeteec4df92009-11-12 07:44:25 +00001561 RTM_NEWADDR, NLM_F_MULTI) <= 0) {
1562 rcu_read_unlock();
1563 goto done;
1564 }
Nicolas Dichtel04652772013-03-22 06:28:42 +00001565 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
Eric Dumazeteec4df92009-11-12 07:44:25 +00001566 }
Pavel Emelianov7562f872007-05-03 15:13:45 -07001567cont:
Eric Dumazeteec4df92009-11-12 07:44:25 +00001568 idx++;
1569 }
1570 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001571 }
1572
1573done:
Eric Dumazeteec4df92009-11-12 07:44:25 +00001574 cb->args[0] = h;
1575 cb->args[1] = idx;
1576 cb->args[2] = ip_idx;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001577
1578 return skb->len;
1579}
1580
Jianjun Kong539afed2008-11-03 02:48:48 -08001581static void rtmsg_ifa(int event, struct in_ifaddr *ifa, struct nlmsghdr *nlh,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001582 u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001583{
Thomas Graf47f68512006-08-04 23:04:36 -07001584 struct sk_buff *skb;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001585 u32 seq = nlh ? nlh->nlmsg_seq : 0;
1586 int err = -ENOBUFS;
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -08001587 struct net *net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001588
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001589 net = dev_net(ifa->ifa_dev->dev);
Thomas Graf339bf982006-11-10 14:10:15 -08001590 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL);
Thomas Graf47f68512006-08-04 23:04:36 -07001591 if (skb == NULL)
Thomas Grafd6062cb2006-08-15 00:33:59 -07001592 goto errout;
1593
Eric W. Biederman15e47302012-09-07 20:12:54 +00001594 err = inet_fill_ifaddr(skb, ifa, portid, seq, event, 0);
Patrick McHardy26932562007-01-31 23:16:40 -08001595 if (err < 0) {
1596 /* -EMSGSIZE implies BUG in inet_nlmsg_size() */
1597 WARN_ON(err == -EMSGSIZE);
1598 kfree_skb(skb);
1599 goto errout;
1600 }
Eric W. Biederman15e47302012-09-07 20:12:54 +00001601 rtnl_notify(skb, net, portid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL);
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08001602 return;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001603errout:
1604 if (err < 0)
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -08001605 rtnl_set_sk_err(net, RTNLGRP_IPV4_IFADDR, err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001606}
1607
Thomas Graf9f0f7272010-11-16 04:32:48 +00001608static size_t inet_get_link_af_size(const struct net_device *dev)
1609{
Eric Dumazet1fc19af2011-05-09 20:55:03 -07001610 struct in_device *in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Thomas Graf9f0f7272010-11-16 04:32:48 +00001611
1612 if (!in_dev)
1613 return 0;
1614
1615 return nla_total_size(IPV4_DEVCONF_MAX * 4); /* IFLA_INET_CONF */
1616}
1617
1618static int inet_fill_link_af(struct sk_buff *skb, const struct net_device *dev)
1619{
Eric Dumazet1fc19af2011-05-09 20:55:03 -07001620 struct in_device *in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Thomas Graf9f0f7272010-11-16 04:32:48 +00001621 struct nlattr *nla;
1622 int i;
1623
1624 if (!in_dev)
1625 return -ENODATA;
1626
1627 nla = nla_reserve(skb, IFLA_INET_CONF, IPV4_DEVCONF_MAX * 4);
1628 if (nla == NULL)
1629 return -EMSGSIZE;
1630
1631 for (i = 0; i < IPV4_DEVCONF_MAX; i++)
1632 ((u32 *) nla_data(nla))[i] = in_dev->cnf.data[i];
1633
1634 return 0;
1635}
1636
1637static const struct nla_policy inet_af_policy[IFLA_INET_MAX+1] = {
1638 [IFLA_INET_CONF] = { .type = NLA_NESTED },
1639};
1640
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001641static int inet_validate_link_af(const struct net_device *dev,
1642 const struct nlattr *nla)
Thomas Graf9f0f7272010-11-16 04:32:48 +00001643{
Thomas Graf9f0f7272010-11-16 04:32:48 +00001644 struct nlattr *a, *tb[IFLA_INET_MAX+1];
1645 int err, rem;
1646
Eric Dumazetf7fce742010-12-01 06:03:06 +00001647 if (dev && !__in_dev_get_rtnl(dev))
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001648 return -EAFNOSUPPORT;
Thomas Graf9f0f7272010-11-16 04:32:48 +00001649
1650 err = nla_parse_nested(tb, IFLA_INET_MAX, nla, inet_af_policy);
1651 if (err < 0)
1652 return err;
1653
1654 if (tb[IFLA_INET_CONF]) {
1655 nla_for_each_nested(a, tb[IFLA_INET_CONF], rem) {
1656 int cfgid = nla_type(a);
1657
1658 if (nla_len(a) < 4)
1659 return -EINVAL;
1660
1661 if (cfgid <= 0 || cfgid > IPV4_DEVCONF_MAX)
1662 return -EINVAL;
1663 }
1664 }
1665
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001666 return 0;
1667}
1668
1669static int inet_set_link_af(struct net_device *dev, const struct nlattr *nla)
1670{
Eric Dumazetf7fce742010-12-01 06:03:06 +00001671 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001672 struct nlattr *a, *tb[IFLA_INET_MAX+1];
1673 int rem;
1674
1675 if (!in_dev)
1676 return -EAFNOSUPPORT;
1677
1678 if (nla_parse_nested(tb, IFLA_INET_MAX, nla, NULL) < 0)
1679 BUG();
1680
Thomas Graf9f0f7272010-11-16 04:32:48 +00001681 if (tb[IFLA_INET_CONF]) {
1682 nla_for_each_nested(a, tb[IFLA_INET_CONF], rem)
1683 ipv4_devconf_set(in_dev, nla_type(a), nla_get_u32(a));
1684 }
1685
1686 return 0;
1687}
1688
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001689static int inet_netconf_msgsize_devconf(int type)
1690{
1691 int size = NLMSG_ALIGN(sizeof(struct netconfmsg))
1692 + nla_total_size(4); /* NETCONFA_IFINDEX */
1693
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001694 /* type -1 is used for ALL */
1695 if (type == -1 || type == NETCONFA_FORWARDING)
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001696 size += nla_total_size(4);
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001697 if (type == -1 || type == NETCONFA_RP_FILTER)
1698 size += nla_total_size(4);
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001699 if (type == -1 || type == NETCONFA_MC_FORWARDING)
1700 size += nla_total_size(4);
stephen hemminger09aea5d2013-12-17 22:35:52 -08001701 if (type == -1 || type == NETCONFA_PROXY_NEIGH)
stephen hemmingerf085ff12013-12-12 13:06:50 -08001702 size += nla_total_size(4);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001703
1704 return size;
1705}
1706
1707static int inet_netconf_fill_devconf(struct sk_buff *skb, int ifindex,
1708 struct ipv4_devconf *devconf, u32 portid,
1709 u32 seq, int event, unsigned int flags,
1710 int type)
1711{
1712 struct nlmsghdr *nlh;
1713 struct netconfmsg *ncm;
1714
1715 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct netconfmsg),
1716 flags);
1717 if (nlh == NULL)
1718 return -EMSGSIZE;
1719
1720 ncm = nlmsg_data(nlh);
1721 ncm->ncm_family = AF_INET;
1722
1723 if (nla_put_s32(skb, NETCONFA_IFINDEX, ifindex) < 0)
1724 goto nla_put_failure;
1725
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001726 /* type -1 is used for ALL */
1727 if ((type == -1 || type == NETCONFA_FORWARDING) &&
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001728 nla_put_s32(skb, NETCONFA_FORWARDING,
1729 IPV4_DEVCONF(*devconf, FORWARDING)) < 0)
1730 goto nla_put_failure;
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001731 if ((type == -1 || type == NETCONFA_RP_FILTER) &&
1732 nla_put_s32(skb, NETCONFA_RP_FILTER,
1733 IPV4_DEVCONF(*devconf, RP_FILTER)) < 0)
1734 goto nla_put_failure;
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001735 if ((type == -1 || type == NETCONFA_MC_FORWARDING) &&
1736 nla_put_s32(skb, NETCONFA_MC_FORWARDING,
1737 IPV4_DEVCONF(*devconf, MC_FORWARDING)) < 0)
1738 goto nla_put_failure;
stephen hemminger09aea5d2013-12-17 22:35:52 -08001739 if ((type == -1 || type == NETCONFA_PROXY_NEIGH) &&
1740 nla_put_s32(skb, NETCONFA_PROXY_NEIGH,
stephen hemmingerf085ff12013-12-12 13:06:50 -08001741 IPV4_DEVCONF(*devconf, PROXY_ARP)) < 0)
1742 goto nla_put_failure;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001743
1744 return nlmsg_end(skb, nlh);
1745
1746nla_put_failure:
1747 nlmsg_cancel(skb, nlh);
1748 return -EMSGSIZE;
1749}
1750
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001751void inet_netconf_notify_devconf(struct net *net, int type, int ifindex,
1752 struct ipv4_devconf *devconf)
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001753{
1754 struct sk_buff *skb;
1755 int err = -ENOBUFS;
1756
1757 skb = nlmsg_new(inet_netconf_msgsize_devconf(type), GFP_ATOMIC);
1758 if (skb == NULL)
1759 goto errout;
1760
1761 err = inet_netconf_fill_devconf(skb, ifindex, devconf, 0, 0,
1762 RTM_NEWNETCONF, 0, type);
1763 if (err < 0) {
1764 /* -EMSGSIZE implies BUG in inet_netconf_msgsize_devconf() */
1765 WARN_ON(err == -EMSGSIZE);
1766 kfree_skb(skb);
1767 goto errout;
1768 }
1769 rtnl_notify(skb, net, 0, RTNLGRP_IPV4_NETCONF, NULL, GFP_ATOMIC);
1770 return;
1771errout:
1772 if (err < 0)
1773 rtnl_set_sk_err(net, RTNLGRP_IPV4_NETCONF, err);
1774}
1775
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001776static const struct nla_policy devconf_ipv4_policy[NETCONFA_MAX+1] = {
1777 [NETCONFA_IFINDEX] = { .len = sizeof(int) },
1778 [NETCONFA_FORWARDING] = { .len = sizeof(int) },
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001779 [NETCONFA_RP_FILTER] = { .len = sizeof(int) },
stephen hemminger09aea5d2013-12-17 22:35:52 -08001780 [NETCONFA_PROXY_NEIGH] = { .len = sizeof(int) },
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001781};
1782
1783static int inet_netconf_get_devconf(struct sk_buff *in_skb,
Thomas Graf661d2962013-03-21 07:45:29 +00001784 struct nlmsghdr *nlh)
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001785{
1786 struct net *net = sock_net(in_skb->sk);
1787 struct nlattr *tb[NETCONFA_MAX+1];
1788 struct netconfmsg *ncm;
1789 struct sk_buff *skb;
1790 struct ipv4_devconf *devconf;
1791 struct in_device *in_dev;
1792 struct net_device *dev;
1793 int ifindex;
1794 int err;
1795
1796 err = nlmsg_parse(nlh, sizeof(*ncm), tb, NETCONFA_MAX,
1797 devconf_ipv4_policy);
1798 if (err < 0)
1799 goto errout;
1800
1801 err = EINVAL;
1802 if (!tb[NETCONFA_IFINDEX])
1803 goto errout;
1804
1805 ifindex = nla_get_s32(tb[NETCONFA_IFINDEX]);
1806 switch (ifindex) {
1807 case NETCONFA_IFINDEX_ALL:
1808 devconf = net->ipv4.devconf_all;
1809 break;
1810 case NETCONFA_IFINDEX_DEFAULT:
1811 devconf = net->ipv4.devconf_dflt;
1812 break;
1813 default:
1814 dev = __dev_get_by_index(net, ifindex);
1815 if (dev == NULL)
1816 goto errout;
1817 in_dev = __in_dev_get_rtnl(dev);
1818 if (in_dev == NULL)
1819 goto errout;
1820 devconf = &in_dev->cnf;
1821 break;
1822 }
1823
1824 err = -ENOBUFS;
1825 skb = nlmsg_new(inet_netconf_msgsize_devconf(-1), GFP_ATOMIC);
1826 if (skb == NULL)
1827 goto errout;
1828
1829 err = inet_netconf_fill_devconf(skb, ifindex, devconf,
1830 NETLINK_CB(in_skb).portid,
1831 nlh->nlmsg_seq, RTM_NEWNETCONF, 0,
1832 -1);
1833 if (err < 0) {
1834 /* -EMSGSIZE implies BUG in inet_netconf_msgsize_devconf() */
1835 WARN_ON(err == -EMSGSIZE);
1836 kfree_skb(skb);
1837 goto errout;
1838 }
1839 err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid);
1840errout:
1841 return err;
1842}
1843
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001844static int inet_netconf_dump_devconf(struct sk_buff *skb,
1845 struct netlink_callback *cb)
1846{
1847 struct net *net = sock_net(skb->sk);
1848 int h, s_h;
1849 int idx, s_idx;
1850 struct net_device *dev;
1851 struct in_device *in_dev;
1852 struct hlist_head *head;
1853
1854 s_h = cb->args[0];
1855 s_idx = idx = cb->args[1];
1856
1857 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
1858 idx = 0;
1859 head = &net->dev_index_head[h];
1860 rcu_read_lock();
Nicolas Dichtel04652772013-03-22 06:28:42 +00001861 cb->seq = atomic_read(&net->ipv4.dev_addr_genid) ^
1862 net->dev_base_seq;
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001863 hlist_for_each_entry_rcu(dev, head, index_hlist) {
1864 if (idx < s_idx)
1865 goto cont;
1866 in_dev = __in_dev_get_rcu(dev);
1867 if (!in_dev)
1868 goto cont;
1869
1870 if (inet_netconf_fill_devconf(skb, dev->ifindex,
1871 &in_dev->cnf,
1872 NETLINK_CB(cb->skb).portid,
1873 cb->nlh->nlmsg_seq,
1874 RTM_NEWNETCONF,
1875 NLM_F_MULTI,
1876 -1) <= 0) {
1877 rcu_read_unlock();
1878 goto done;
1879 }
Nicolas Dichtel04652772013-03-22 06:28:42 +00001880 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001881cont:
1882 idx++;
1883 }
1884 rcu_read_unlock();
1885 }
1886 if (h == NETDEV_HASHENTRIES) {
1887 if (inet_netconf_fill_devconf(skb, NETCONFA_IFINDEX_ALL,
1888 net->ipv4.devconf_all,
1889 NETLINK_CB(cb->skb).portid,
1890 cb->nlh->nlmsg_seq,
1891 RTM_NEWNETCONF, NLM_F_MULTI,
1892 -1) <= 0)
1893 goto done;
1894 else
1895 h++;
1896 }
1897 if (h == NETDEV_HASHENTRIES + 1) {
1898 if (inet_netconf_fill_devconf(skb, NETCONFA_IFINDEX_DEFAULT,
1899 net->ipv4.devconf_dflt,
1900 NETLINK_CB(cb->skb).portid,
1901 cb->nlh->nlmsg_seq,
1902 RTM_NEWNETCONF, NLM_F_MULTI,
1903 -1) <= 0)
1904 goto done;
1905 else
1906 h++;
1907 }
1908done:
1909 cb->args[0] = h;
1910 cb->args[1] = idx;
1911
1912 return skb->len;
1913}
1914
Linus Torvalds1da177e2005-04-16 15:20:36 -07001915#ifdef CONFIG_SYSCTL
1916
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001917static void devinet_copy_dflt_conf(struct net *net, int i)
Herbert Xu31be3082007-06-04 23:35:37 -07001918{
1919 struct net_device *dev;
1920
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001921 rcu_read_lock();
1922 for_each_netdev_rcu(net, dev) {
Herbert Xu31be3082007-06-04 23:35:37 -07001923 struct in_device *in_dev;
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001924
Herbert Xu31be3082007-06-04 23:35:37 -07001925 in_dev = __in_dev_get_rcu(dev);
1926 if (in_dev && !test_bit(i, in_dev->cnf.state))
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001927 in_dev->cnf.data[i] = net->ipv4.devconf_dflt->data[i];
Herbert Xu31be3082007-06-04 23:35:37 -07001928 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001929 rcu_read_unlock();
Herbert Xu31be3082007-06-04 23:35:37 -07001930}
1931
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001932/* called with RTNL locked */
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001933static void inet_forward_change(struct net *net)
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001934{
1935 struct net_device *dev;
Pavel Emelyanov586f1212007-12-16 13:32:48 -08001936 int on = IPV4_DEVCONF_ALL(net, FORWARDING);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001937
Pavel Emelyanov586f1212007-12-16 13:32:48 -08001938 IPV4_DEVCONF_ALL(net, ACCEPT_REDIRECTS) = !on;
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001939 IPV4_DEVCONF_DFLT(net, FORWARDING) = on;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001940 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1941 NETCONFA_IFINDEX_ALL,
1942 net->ipv4.devconf_all);
1943 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1944 NETCONFA_IFINDEX_DEFAULT,
1945 net->ipv4.devconf_dflt);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001946
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001947 for_each_netdev(net, dev) {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001948 struct in_device *in_dev;
Ben Hutchings0187bdf2008-06-19 16:15:47 -07001949 if (on)
1950 dev_disable_lro(dev);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001951 rcu_read_lock();
1952 in_dev = __in_dev_get_rcu(dev);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001953 if (in_dev) {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001954 IN_DEV_CONF_SET(in_dev, FORWARDING, on);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001955 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1956 dev->ifindex, &in_dev->cnf);
1957 }
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001958 rcu_read_unlock();
1959 }
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001960}
1961
stephen hemmingerf085ff12013-12-12 13:06:50 -08001962static int devinet_conf_ifindex(struct net *net, struct ipv4_devconf *cnf)
1963{
1964 if (cnf == net->ipv4.devconf_dflt)
1965 return NETCONFA_IFINDEX_DEFAULT;
1966 else if (cnf == net->ipv4.devconf_all)
1967 return NETCONFA_IFINDEX_ALL;
1968 else {
1969 struct in_device *idev
1970 = container_of(cnf, struct in_device, cnf);
1971 return idev->dev->ifindex;
1972 }
1973}
1974
Joe Perchesfe2c6332013-06-11 23:04:25 -07001975static int devinet_conf_proc(struct ctl_table *ctl, int write,
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001976 void __user *buffer,
Herbert Xu31be3082007-06-04 23:35:37 -07001977 size_t *lenp, loff_t *ppos)
1978{
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001979 int old_value = *(int *)ctl->data;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001980 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001981 int new_value = *(int *)ctl->data;
Herbert Xu31be3082007-06-04 23:35:37 -07001982
1983 if (write) {
1984 struct ipv4_devconf *cnf = ctl->extra1;
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001985 struct net *net = ctl->extra2;
Herbert Xu31be3082007-06-04 23:35:37 -07001986 int i = (int *)ctl->data - cnf->data;
stephen hemmingerf085ff12013-12-12 13:06:50 -08001987 int ifindex;
Herbert Xu31be3082007-06-04 23:35:37 -07001988
1989 set_bit(i, cnf->state);
1990
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001991 if (cnf == net->ipv4.devconf_dflt)
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001992 devinet_copy_dflt_conf(net, i);
Thomas Grafd0daebc32012-06-12 00:44:01 +00001993 if (i == IPV4_DEVCONF_ACCEPT_LOCAL - 1 ||
1994 i == IPV4_DEVCONF_ROUTE_LOCALNET - 1)
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001995 if ((new_value == 0) && (old_value != 0))
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00001996 rt_cache_flush(net);
stephen hemmingerf085ff12013-12-12 13:06:50 -08001997
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001998 if (i == IPV4_DEVCONF_RP_FILTER - 1 &&
1999 new_value != old_value) {
stephen hemmingerf085ff12013-12-12 13:06:50 -08002000 ifindex = devinet_conf_ifindex(net, cnf);
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00002001 inet_netconf_notify_devconf(net, NETCONFA_RP_FILTER,
2002 ifindex, cnf);
2003 }
stephen hemmingerf085ff12013-12-12 13:06:50 -08002004 if (i == IPV4_DEVCONF_PROXY_ARP - 1 &&
2005 new_value != old_value) {
2006 ifindex = devinet_conf_ifindex(net, cnf);
stephen hemminger09aea5d2013-12-17 22:35:52 -08002007 inet_netconf_notify_devconf(net, NETCONFA_PROXY_NEIGH,
stephen hemmingerf085ff12013-12-12 13:06:50 -08002008 ifindex, cnf);
2009 }
Herbert Xu31be3082007-06-04 23:35:37 -07002010 }
2011
2012 return ret;
2013}
2014
Joe Perchesfe2c6332013-06-11 23:04:25 -07002015static int devinet_sysctl_forward(struct ctl_table *ctl, int write,
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002016 void __user *buffer,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002017 size_t *lenp, loff_t *ppos)
2018{
2019 int *valp = ctl->data;
2020 int val = *valp;
Eric W. Biederman88af1822010-02-19 13:22:59 +00002021 loff_t pos = *ppos;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002022 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002023
2024 if (write && *valp != val) {
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002025 struct net *net = ctl->extra2;
2026
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002027 if (valp != &IPV4_DEVCONF_DFLT(net, FORWARDING)) {
Eric W. Biederman88af1822010-02-19 13:22:59 +00002028 if (!rtnl_trylock()) {
2029 /* Restore the original values before restarting */
2030 *valp = val;
2031 *ppos = pos;
Eric W. Biederman9b8adb52009-05-13 16:59:21 +00002032 return restart_syscall();
Eric W. Biederman88af1822010-02-19 13:22:59 +00002033 }
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002034 if (valp == &IPV4_DEVCONF_ALL(net, FORWARDING)) {
2035 inet_forward_change(net);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002036 } else {
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002037 struct ipv4_devconf *cnf = ctl->extra1;
2038 struct in_device *idev =
2039 container_of(cnf, struct in_device, cnf);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002040 if (*valp)
2041 dev_disable_lro(idev->dev);
2042 inet_netconf_notify_devconf(net,
2043 NETCONFA_FORWARDING,
2044 idev->dev->ifindex,
2045 cnf);
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002046 }
2047 rtnl_unlock();
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002048 rt_cache_flush(net);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002049 } else
2050 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
2051 NETCONFA_IFINDEX_DEFAULT,
2052 net->ipv4.devconf_dflt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002053 }
2054
2055 return ret;
2056}
2057
Joe Perchesfe2c6332013-06-11 23:04:25 -07002058static int ipv4_doint_and_flush(struct ctl_table *ctl, int write,
David S. Miller323e1262010-12-12 21:55:08 -08002059 void __user *buffer,
2060 size_t *lenp, loff_t *ppos)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002061{
2062 int *valp = ctl->data;
2063 int val = *valp;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002064 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Denis V. Lunev76e6ebf2008-07-05 19:00:44 -07002065 struct net *net = ctl->extra2;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002066
2067 if (write && *valp != val)
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002068 rt_cache_flush(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002069
2070 return ret;
2071}
2072
/*
 * Initializer for one ctl_table entry of the devinet sysctl template.
 *
 * @attr: suffix of the IPV4_DEVCONF_* id; the entry points at slot
 *        IPV4_DEVCONF_<attr> - 1 of ipv4_devconf.data[]
 * @name: procname of the entry
 * @mval: file mode
 * @proc: proc_handler
 */
#define DEVINET_SYSCTL_ENTRY(attr, name, mval, proc) \
	{ \
		.procname	= name, \
		.data		= &ipv4_devconf.data[ \
					IPV4_DEVCONF_ ## attr - 1], \
		.maxlen		= sizeof(int), \
		.mode		= mval, \
		.proc_handler	= proc, \
		.extra1		= &ipv4_devconf, \
	}

/* Mode 0644 entry handled by devinet_conf_proc(). */
#define DEVINET_SYSCTL_RW_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, devinet_conf_proc)

/* Mode 0444 entry handled by devinet_conf_proc(). */
#define DEVINET_SYSCTL_RO_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0444, devinet_conf_proc)

/* Mode 0644 entry with a caller-supplied handler. */
#define DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, proc) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, proc)

/* Mode 0644 entry handled by ipv4_doint_and_flush(). */
#define DEVINET_SYSCTL_FLUSHING_ENTRY(attr, name) \
	DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, ipv4_doint_and_flush)
Herbert Xu42f811b2007-06-04 23:34:44 -07002095
Linus Torvalds1da177e2005-04-16 15:20:36 -07002096static struct devinet_sysctl_table {
2097 struct ctl_table_header *sysctl_header;
Eric W. Biederman02291682010-02-14 03:25:51 +00002098 struct ctl_table devinet_vars[__IPV4_DEVCONF_MAX];
Linus Torvalds1da177e2005-04-16 15:20:36 -07002099} devinet_sysctl = {
2100 .devinet_vars = {
Herbert Xu42f811b2007-06-04 23:34:44 -07002101 DEVINET_SYSCTL_COMPLEX_ENTRY(FORWARDING, "forwarding",
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002102 devinet_sysctl_forward),
Herbert Xu42f811b2007-06-04 23:34:44 -07002103 DEVINET_SYSCTL_RO_ENTRY(MC_FORWARDING, "mc_forwarding"),
2104
2105 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_REDIRECTS, "accept_redirects"),
2106 DEVINET_SYSCTL_RW_ENTRY(SECURE_REDIRECTS, "secure_redirects"),
2107 DEVINET_SYSCTL_RW_ENTRY(SHARED_MEDIA, "shared_media"),
2108 DEVINET_SYSCTL_RW_ENTRY(RP_FILTER, "rp_filter"),
2109 DEVINET_SYSCTL_RW_ENTRY(SEND_REDIRECTS, "send_redirects"),
2110 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_SOURCE_ROUTE,
2111 "accept_source_route"),
Patrick McHardy8153a102009-12-03 01:25:58 +00002112 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_LOCAL, "accept_local"),
Jamal Hadi Salim28f6aee2009-12-25 17:30:22 -08002113 DEVINET_SYSCTL_RW_ENTRY(SRC_VMARK, "src_valid_mark"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002114 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP, "proxy_arp"),
2115 DEVINET_SYSCTL_RW_ENTRY(MEDIUM_ID, "medium_id"),
2116 DEVINET_SYSCTL_RW_ENTRY(BOOTP_RELAY, "bootp_relay"),
2117 DEVINET_SYSCTL_RW_ENTRY(LOG_MARTIANS, "log_martians"),
2118 DEVINET_SYSCTL_RW_ENTRY(TAG, "tag"),
2119 DEVINET_SYSCTL_RW_ENTRY(ARPFILTER, "arp_filter"),
2120 DEVINET_SYSCTL_RW_ENTRY(ARP_ANNOUNCE, "arp_announce"),
2121 DEVINET_SYSCTL_RW_ENTRY(ARP_IGNORE, "arp_ignore"),
2122 DEVINET_SYSCTL_RW_ENTRY(ARP_ACCEPT, "arp_accept"),
Stephen Hemmingereefef1c2009-02-01 01:04:33 -08002123 DEVINET_SYSCTL_RW_ENTRY(ARP_NOTIFY, "arp_notify"),
Jesper Dangaard Brouer65324142010-01-05 05:50:47 +00002124 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP_PVLAN, "proxy_arp_pvlan"),
William Manley5c6fe012013-08-06 19:03:14 +01002125 DEVINET_SYSCTL_RW_ENTRY(FORCE_IGMP_VERSION,
2126 "force_igmp_version"),
William Manley26900482013-08-06 19:03:15 +01002127 DEVINET_SYSCTL_RW_ENTRY(IGMPV2_UNSOLICITED_REPORT_INTERVAL,
2128 "igmpv2_unsolicited_report_interval"),
2129 DEVINET_SYSCTL_RW_ENTRY(IGMPV3_UNSOLICITED_REPORT_INTERVAL,
2130 "igmpv3_unsolicited_report_interval"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002131
2132 DEVINET_SYSCTL_FLUSHING_ENTRY(NOXFRM, "disable_xfrm"),
2133 DEVINET_SYSCTL_FLUSHING_ENTRY(NOPOLICY, "disable_policy"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002134 DEVINET_SYSCTL_FLUSHING_ENTRY(PROMOTE_SECONDARIES,
2135 "promote_secondaries"),
Thomas Grafd0daebc32012-06-12 00:44:01 +00002136 DEVINET_SYSCTL_FLUSHING_ENTRY(ROUTE_LOCALNET,
2137 "route_localnet"),
Linus Torvalds1da177e2005-04-16 15:20:36 -07002138 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07002139};
2140
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002141static int __devinet_sysctl_register(struct net *net, char *dev_name,
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002142 struct ipv4_devconf *p)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002143{
2144 int i;
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002145 struct devinet_sysctl_table *t;
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002146 char path[sizeof("net/ipv4/conf/") + IFNAMSIZ];
Pavel Emelyanovbfada692007-12-02 00:57:08 +11002147
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002148 t = kmemdup(&devinet_sysctl, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002149 if (!t)
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002150 goto out;
2151
Linus Torvalds1da177e2005-04-16 15:20:36 -07002152 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) {
2153 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf;
Herbert Xu31be3082007-06-04 23:35:37 -07002154 t->devinet_vars[i].extra1 = p;
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002155 t->devinet_vars[i].extra2 = net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002156 }
2157
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002158 snprintf(path, sizeof(path), "net/ipv4/conf/%s", dev_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002159
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002160 t->sysctl_header = register_net_sysctl(net, path, t->devinet_vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002161 if (!t->sysctl_header)
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002162 goto free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002163
2164 p->sysctl = t;
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002165 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002166
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002167free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07002168 kfree(t);
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002169out:
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002170 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002171}
2172
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002173static void __devinet_sysctl_unregister(struct ipv4_devconf *cnf)
2174{
2175 struct devinet_sysctl_table *t = cnf->sysctl;
2176
2177 if (t == NULL)
2178 return;
2179
2180 cnf->sysctl = NULL;
Lucian Adrian Grijincuff538812011-05-01 01:44:01 +00002181 unregister_net_sysctl_table(t->sysctl_header);
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002182 kfree(t);
2183}
2184
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11002185static void devinet_sysctl_register(struct in_device *idev)
2186{
Jiri Pirko73af6142013-12-07 19:26:55 +01002187 neigh_sysctl_register(idev->dev, idev->arp_parms, NULL);
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002188 __devinet_sysctl_register(dev_net(idev->dev), idev->dev->name,
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002189 &idev->cnf);
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11002190}
2191
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002192static void devinet_sysctl_unregister(struct in_device *idev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002193{
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002194 __devinet_sysctl_unregister(&idev->cnf);
2195 neigh_sysctl_unregister(idev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002196}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002197
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002198static struct ctl_table ctl_forward_entry[] = {
2199 {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002200 .procname = "ip_forward",
2201 .data = &ipv4_devconf.data[
Eric W. Biederman02291682010-02-14 03:25:51 +00002202 IPV4_DEVCONF_FORWARDING - 1],
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002203 .maxlen = sizeof(int),
2204 .mode = 0644,
2205 .proc_handler = devinet_sysctl_forward,
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002206 .extra1 = &ipv4_devconf,
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002207 .extra2 = &init_net,
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002208 },
2209 { },
2210};
Eric Dumazet2a75de02008-01-05 23:08:49 -08002211#endif
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002212
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002213static __net_init int devinet_init_net(struct net *net)
2214{
2215 int err;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002216 struct ipv4_devconf *all, *dflt;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002217#ifdef CONFIG_SYSCTL
2218 struct ctl_table *tbl = ctl_forward_entry;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002219 struct ctl_table_header *forw_hdr;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002220#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002221
2222 err = -ENOMEM;
2223 all = &ipv4_devconf;
2224 dflt = &ipv4_devconf_dflt;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002225
Octavian Purdila09ad9bc2009-11-25 15:14:13 -08002226 if (!net_eq(net, &init_net)) {
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002227 all = kmemdup(all, sizeof(ipv4_devconf), GFP_KERNEL);
2228 if (all == NULL)
2229 goto err_alloc_all;
2230
2231 dflt = kmemdup(dflt, sizeof(ipv4_devconf_dflt), GFP_KERNEL);
2232 if (dflt == NULL)
2233 goto err_alloc_dflt;
2234
Eric Dumazet2a75de02008-01-05 23:08:49 -08002235#ifdef CONFIG_SYSCTL
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002236 tbl = kmemdup(tbl, sizeof(ctl_forward_entry), GFP_KERNEL);
2237 if (tbl == NULL)
2238 goto err_alloc_ctl;
2239
Eric W. Biederman02291682010-02-14 03:25:51 +00002240 tbl[0].data = &all->data[IPV4_DEVCONF_FORWARDING - 1];
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002241 tbl[0].extra1 = all;
2242 tbl[0].extra2 = net;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002243#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002244 }
2245
2246#ifdef CONFIG_SYSCTL
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002247 err = __devinet_sysctl_register(net, "all", all);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002248 if (err < 0)
2249 goto err_reg_all;
2250
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002251 err = __devinet_sysctl_register(net, "default", dflt);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002252 if (err < 0)
2253 goto err_reg_dflt;
2254
2255 err = -ENOMEM;
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002256 forw_hdr = register_net_sysctl(net, "net/ipv4", tbl);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002257 if (forw_hdr == NULL)
2258 goto err_reg_ctl;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002259 net->ipv4.forw_hdr = forw_hdr;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002260#endif
2261
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002262 net->ipv4.devconf_all = all;
2263 net->ipv4.devconf_dflt = dflt;
2264 return 0;
2265
2266#ifdef CONFIG_SYSCTL
2267err_reg_ctl:
2268 __devinet_sysctl_unregister(dflt);
2269err_reg_dflt:
2270 __devinet_sysctl_unregister(all);
2271err_reg_all:
2272 if (tbl != ctl_forward_entry)
2273 kfree(tbl);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002274err_alloc_ctl:
Eric Dumazet2a75de02008-01-05 23:08:49 -08002275#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002276 if (dflt != &ipv4_devconf_dflt)
2277 kfree(dflt);
2278err_alloc_dflt:
2279 if (all != &ipv4_devconf)
2280 kfree(all);
2281err_alloc_all:
2282 return err;
2283}
2284
2285static __net_exit void devinet_exit_net(struct net *net)
2286{
Eric Dumazet2a75de02008-01-05 23:08:49 -08002287#ifdef CONFIG_SYSCTL
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002288 struct ctl_table *tbl;
2289
2290 tbl = net->ipv4.forw_hdr->ctl_table_arg;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002291 unregister_net_sysctl_table(net->ipv4.forw_hdr);
2292 __devinet_sysctl_unregister(net->ipv4.devconf_dflt);
2293 __devinet_sysctl_unregister(net->ipv4.devconf_all);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002294 kfree(tbl);
Eric Dumazet2a75de02008-01-05 23:08:49 -08002295#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002296 kfree(net->ipv4.devconf_dflt);
2297 kfree(net->ipv4.devconf_all);
2298}
2299
2300static __net_initdata struct pernet_operations devinet_ops = {
2301 .init = devinet_init_net,
2302 .exit = devinet_exit_net,
2303};
2304
Thomas Graf9f0f7272010-11-16 04:32:48 +00002305static struct rtnl_af_ops inet_af_ops = {
2306 .family = AF_INET,
2307 .fill_link_af = inet_fill_link_af,
2308 .get_link_af_size = inet_get_link_af_size,
Thomas Grafcf7afbf2010-11-22 01:31:54 +00002309 .validate_link_af = inet_validate_link_af,
2310 .set_link_af = inet_set_link_af,
Thomas Graf9f0f7272010-11-16 04:32:48 +00002311};
2312
Linus Torvalds1da177e2005-04-16 15:20:36 -07002313void __init devinet_init(void)
2314{
David S. Millerfd23c3b2011-02-18 12:42:28 -08002315 int i;
2316
2317 for (i = 0; i < IN4_ADDR_HSIZE; i++)
2318 INIT_HLIST_HEAD(&inet_addr_lst[i]);
2319
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002320 register_pernet_subsys(&devinet_ops);
2321
Linus Torvalds1da177e2005-04-16 15:20:36 -07002322 register_gifconf(PF_INET, inet_gifconf);
2323 register_netdevice_notifier(&ip_netdev_notifier);
Thomas Graf63f34442007-03-22 11:55:17 -07002324
viresh kumar906e0732014-01-22 12:23:32 +05302325 queue_delayed_work(system_power_efficient_wq, &check_lifetime_work, 0);
Jiri Pirko5c766d62013-01-24 09:41:41 +00002326
Thomas Graf9f0f7272010-11-16 04:32:48 +00002327 rtnl_af_register(&inet_af_ops);
2328
Greg Rosec7ac8672011-06-10 01:27:09 +00002329 rtnl_register(PF_INET, RTM_NEWADDR, inet_rtm_newaddr, NULL, NULL);
2330 rtnl_register(PF_INET, RTM_DELADDR, inet_rtm_deladdr, NULL, NULL);
2331 rtnl_register(PF_INET, RTM_GETADDR, NULL, inet_dump_ifaddr, NULL);
Nicolas Dichtel9e551112012-10-25 22:28:53 +00002332 rtnl_register(PF_INET, RTM_GETNETCONF, inet_netconf_get_devconf,
Nicolas Dichtel7a674202013-03-05 23:42:06 +00002333 inet_netconf_dump_devconf, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002334}
2335