blob: 43065be363010b3f9bd2c6bb0f65454931a32949 [file] [log] [blame]
/*
 *	NET3	IP device support routines.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 *	Derived from the IP parts of dev.c 1.0.19
 *		Authors:	Ross Biro
 *				Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
 *				Mark Evans, <evansmp@uhura.aston.ac.uk>
 *
 *	Additional Authors:
 *		Alan Cox, <gw4pts@gw4pts.ampr.org>
 *		Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 *	Changes:
 *		Alexey Kuznetsov:	pa_* fields are replaced with ifaddr
 *					lists.
 *		Cyrus Durgin:		updated for kmod
 *		Matthias Andree:	in devinet_ioctl, compare label and
 *					address (4.4BSD alias style support),
 *					fall back to comparing just the label
 *					if no match found.
 */
27
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29#include <asm/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/bitops.h>
Randy Dunlap4fc268d2006-01-11 12:17:47 -080031#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/module.h>
33#include <linux/types.h>
34#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/string.h>
36#include <linux/mm.h>
37#include <linux/socket.h>
38#include <linux/sockios.h>
39#include <linux/in.h>
40#include <linux/errno.h>
41#include <linux/interrupt.h>
Thomas Graf18237302006-08-04 23:04:54 -070042#include <linux/if_addr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#include <linux/if_ether.h>
44#include <linux/inet.h>
45#include <linux/netdevice.h>
46#include <linux/etherdevice.h>
47#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070048#include <linux/init.h>
49#include <linux/notifier.h>
50#include <linux/inetdevice.h>
51#include <linux/igmp.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090052#include <linux/slab.h>
David S. Millerfd23c3b2011-02-18 12:42:28 -080053#include <linux/hash.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070054#ifdef CONFIG_SYSCTL
55#include <linux/sysctl.h>
56#endif
57#include <linux/kmod.h>
Nicolas Dichteledc9e742012-10-25 22:28:52 +000058#include <linux/netconf.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070059
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020060#include <net/arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070061#include <net/ip.h>
62#include <net/route.h>
63#include <net/ip_fib.h>
Thomas Graf63f34442007-03-22 11:55:17 -070064#include <net/rtnetlink.h>
Pavel Emelyanov752d14d2007-12-16 13:31:47 -080065#include <net/net_namespace.h>
Jiri Pirko5c766d62013-01-24 09:41:41 +000066#include <net/addrconf.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
David S. Miller406b6f92011-03-22 21:56:23 -070068#include "fib_lookup.h"
69
Adrian Bunk0027ba82008-01-31 17:17:31 -080070static struct ipv4_devconf ipv4_devconf = {
Herbert Xu42f811b2007-06-04 23:34:44 -070071 .data = {
Eric W. Biederman02291682010-02-14 03:25:51 +000072 [IPV4_DEVCONF_ACCEPT_REDIRECTS - 1] = 1,
73 [IPV4_DEVCONF_SEND_REDIRECTS - 1] = 1,
74 [IPV4_DEVCONF_SECURE_REDIRECTS - 1] = 1,
75 [IPV4_DEVCONF_SHARED_MEDIA - 1] = 1,
William Manley26900482013-08-06 19:03:15 +010076 [IPV4_DEVCONF_IGMPV2_UNSOLICITED_REPORT_INTERVAL - 1] = 10000 /*ms*/,
77 [IPV4_DEVCONF_IGMPV3_UNSOLICITED_REPORT_INTERVAL - 1] = 1000 /*ms*/,
Herbert Xu42f811b2007-06-04 23:34:44 -070078 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070079};
80
81static struct ipv4_devconf ipv4_devconf_dflt = {
Herbert Xu42f811b2007-06-04 23:34:44 -070082 .data = {
Eric W. Biederman02291682010-02-14 03:25:51 +000083 [IPV4_DEVCONF_ACCEPT_REDIRECTS - 1] = 1,
84 [IPV4_DEVCONF_SEND_REDIRECTS - 1] = 1,
85 [IPV4_DEVCONF_SECURE_REDIRECTS - 1] = 1,
86 [IPV4_DEVCONF_SHARED_MEDIA - 1] = 1,
87 [IPV4_DEVCONF_ACCEPT_SOURCE_ROUTE - 1] = 1,
William Manley26900482013-08-06 19:03:15 +010088 [IPV4_DEVCONF_IGMPV2_UNSOLICITED_REPORT_INTERVAL - 1] = 10000 /*ms*/,
89 [IPV4_DEVCONF_IGMPV3_UNSOLICITED_REPORT_INTERVAL - 1] = 1000 /*ms*/,
Herbert Xu42f811b2007-06-04 23:34:44 -070090 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070091};
92
/*
 * Apply IPV4_DEVCONF() for attribute @attr to the configuration block that
 * @net->ipv4.devconf_dflt points to.
 *
 * @net is parenthesised in the expansion so that any pointer-valued
 * expression (e.g. "p + 1" or "cond ? a : b") can be passed, not only a
 * plain identifier.
 */
#define IPV4_DEVCONF_DFLT(net, attr) \
	IPV4_DEVCONF((*(net)->ipv4.devconf_dflt), attr)
Herbert Xu42f811b2007-06-04 23:34:44 -070095
Patrick McHardyef7c79e2007-06-05 12:38:30 -070096static const struct nla_policy ifa_ipv4_policy[IFA_MAX+1] = {
Thomas Graf5c753972006-08-04 23:03:53 -070097 [IFA_LOCAL] = { .type = NLA_U32 },
98 [IFA_ADDRESS] = { .type = NLA_U32 },
99 [IFA_BROADCAST] = { .type = NLA_U32 },
Thomas Graf5176f912006-08-26 20:13:18 -0700100 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 },
Jiri Pirko5c766d62013-01-24 09:41:41 +0000101 [IFA_CACHEINFO] = { .len = sizeof(struct ifa_cacheinfo) },
Thomas Graf5c753972006-08-04 23:03:53 -0700102};
103
Eric Dumazet40384992012-08-03 21:06:50 +0000104#define IN4_ADDR_HSIZE_SHIFT 8
105#define IN4_ADDR_HSIZE (1U << IN4_ADDR_HSIZE_SHIFT)
106
David S. Millerfd23c3b2011-02-18 12:42:28 -0800107static struct hlist_head inet_addr_lst[IN4_ADDR_HSIZE];
108static DEFINE_SPINLOCK(inet_addr_hash_lock);
109
Eric Dumazet40384992012-08-03 21:06:50 +0000110static u32 inet_addr_hash(struct net *net, __be32 addr)
David S. Millerfd23c3b2011-02-18 12:42:28 -0800111{
Eric Dumazet40384992012-08-03 21:06:50 +0000112 u32 val = (__force u32) addr ^ net_hash_mix(net);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800113
Eric Dumazet40384992012-08-03 21:06:50 +0000114 return hash_32(val, IN4_ADDR_HSIZE_SHIFT);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800115}
116
117static void inet_hash_insert(struct net *net, struct in_ifaddr *ifa)
118{
Eric Dumazet40384992012-08-03 21:06:50 +0000119 u32 hash = inet_addr_hash(net, ifa->ifa_local);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800120
121 spin_lock(&inet_addr_hash_lock);
122 hlist_add_head_rcu(&ifa->hash, &inet_addr_lst[hash]);
123 spin_unlock(&inet_addr_hash_lock);
124}
125
126static void inet_hash_remove(struct in_ifaddr *ifa)
127{
128 spin_lock(&inet_addr_hash_lock);
129 hlist_del_init_rcu(&ifa->hash);
130 spin_unlock(&inet_addr_hash_lock);
131}
132
David S. Miller9435eb12011-02-18 12:43:09 -0800133/**
134 * __ip_dev_find - find the first device with a given source address.
135 * @net: the net namespace
136 * @addr: the source address
137 * @devref: if true, take a reference on the found device
138 *
139 * If a caller uses devref=false, it should be protected by RCU, or RTNL
140 */
141struct net_device *__ip_dev_find(struct net *net, __be32 addr, bool devref)
142{
Eric Dumazet40384992012-08-03 21:06:50 +0000143 u32 hash = inet_addr_hash(net, addr);
David S. Miller9435eb12011-02-18 12:43:09 -0800144 struct net_device *result = NULL;
145 struct in_ifaddr *ifa;
David S. Miller9435eb12011-02-18 12:43:09 -0800146
147 rcu_read_lock();
Sasha Levinb67bfe02013-02-27 17:06:00 -0800148 hlist_for_each_entry_rcu(ifa, &inet_addr_lst[hash], hash) {
David S. Millere0660082011-03-03 11:24:19 -0800149 if (ifa->ifa_local == addr) {
Eric Dumazet40384992012-08-03 21:06:50 +0000150 struct net_device *dev = ifa->ifa_dev->dev;
151
152 if (!net_eq(dev_net(dev), net))
153 continue;
David S. Miller9435eb12011-02-18 12:43:09 -0800154 result = dev;
155 break;
156 }
157 }
David S. Miller406b6f92011-03-22 21:56:23 -0700158 if (!result) {
159 struct flowi4 fl4 = { .daddr = addr };
160 struct fib_result res = { 0 };
161 struct fib_table *local;
162
163 /* Fallback to FIB local table so that communication
164 * over loopback subnets work.
165 */
166 local = fib_get_table(net, RT_TABLE_LOCAL);
167 if (local &&
168 !fib_table_lookup(local, &fl4, &res, FIB_LOOKUP_NOREF) &&
169 res.type == RTN_LOCAL)
170 result = FIB_RES_DEV(res);
171 }
David S. Miller9435eb12011-02-18 12:43:09 -0800172 if (result && devref)
173 dev_hold(result);
174 rcu_read_unlock();
175 return result;
176}
177EXPORT_SYMBOL(__ip_dev_find);
178
Thomas Grafd6062cb2006-08-15 00:33:59 -0700179static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180
Alan Sterne041c682006-03-27 01:16:30 -0800181static BLOCKING_NOTIFIER_HEAD(inetaddr_chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700182static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
183 int destroy);
184#ifdef CONFIG_SYSCTL
Pavel Emelyanov66f27a52007-12-02 00:55:54 +1100185static void devinet_sysctl_register(struct in_device *idev);
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800186static void devinet_sysctl_unregister(struct in_device *idev);
187#else
Eric Dumazet40384992012-08-03 21:06:50 +0000188static void devinet_sysctl_register(struct in_device *idev)
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800189{
190}
Eric Dumazet40384992012-08-03 21:06:50 +0000191static void devinet_sysctl_unregister(struct in_device *idev)
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800192{
193}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194#endif
195
196/* Locks all the inet devices. */
197
198static struct in_ifaddr *inet_alloc_ifa(void)
199{
Alexey Dobriyan93adcc82008-10-28 13:25:09 -0700200 return kzalloc(sizeof(struct in_ifaddr), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700201}
202
203static void inet_rcu_free_ifa(struct rcu_head *head)
204{
205 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head);
206 if (ifa->ifa_dev)
207 in_dev_put(ifa->ifa_dev);
208 kfree(ifa);
209}
210
Eric Dumazet40384992012-08-03 21:06:50 +0000211static void inet_free_ifa(struct in_ifaddr *ifa)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700212{
213 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa);
214}
215
216void in_dev_finish_destroy(struct in_device *idev)
217{
218 struct net_device *dev = idev->dev;
219
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700220 WARN_ON(idev->ifa_list);
221 WARN_ON(idev->mc_list);
Eric Dumazete9897072013-06-07 08:48:57 -0700222 kfree(rcu_dereference_protected(idev->mc_hash, 1));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223#ifdef NET_REFCNT_DEBUG
Joe Perches91df42b2012-05-15 14:11:54 +0000224 pr_debug("%s: %p=%s\n", __func__, idev, dev ? dev->name : "NIL");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700225#endif
226 dev_put(dev);
227 if (!idev->dead)
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800228 pr_err("Freeing alive in_device %p\n", idev);
229 else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230 kfree(idev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231}
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800232EXPORT_SYMBOL(in_dev_finish_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233
Herbert Xu71e27da2007-06-04 23:36:06 -0700234static struct in_device *inetdev_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235{
236 struct in_device *in_dev;
237
238 ASSERT_RTNL();
239
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700240 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241 if (!in_dev)
242 goto out;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900243 memcpy(&in_dev->cnf, dev_net(dev)->ipv4.devconf_dflt,
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -0800244 sizeof(in_dev->cnf));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 in_dev->cnf.sysctl = NULL;
246 in_dev->dev = dev;
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800247 in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl);
248 if (!in_dev->arp_parms)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 goto out_kfree;
Ben Hutchings0187bdf2008-06-19 16:15:47 -0700250 if (IPV4_DEVCONF(in_dev->cnf, FORWARDING))
251 dev_disable_lro(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252 /* Reference in_dev->dev */
253 dev_hold(dev);
David L Stevens30c4cf52007-01-04 12:31:14 -0800254 /* Account for reference dev->ip_ptr (below) */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 in_dev_hold(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256
Pavel Emelyanov66f27a52007-12-02 00:55:54 +1100257 devinet_sysctl_register(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258 ip_mc_init_dev(in_dev);
259 if (dev->flags & IFF_UP)
260 ip_mc_up(in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800261
David L Stevens30c4cf52007-01-04 12:31:14 -0800262 /* we can receive as soon as ip_ptr is set -- do this last */
Eric Dumazetcf778b02012-01-12 04:41:32 +0000263 rcu_assign_pointer(dev->ip_ptr, in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800264out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265 return in_dev;
266out_kfree:
267 kfree(in_dev);
268 in_dev = NULL;
269 goto out;
270}
271
272static void in_dev_rcu_put(struct rcu_head *head)
273{
274 struct in_device *idev = container_of(head, struct in_device, rcu_head);
275 in_dev_put(idev);
276}
277
278static void inetdev_destroy(struct in_device *in_dev)
279{
280 struct in_ifaddr *ifa;
281 struct net_device *dev;
282
283 ASSERT_RTNL();
284
285 dev = in_dev->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286
287 in_dev->dead = 1;
288
289 ip_mc_destroy_dev(in_dev);
290
291 while ((ifa = in_dev->ifa_list) != NULL) {
292 inet_del_ifa(in_dev, &in_dev->ifa_list, 0);
293 inet_free_ifa(ifa);
294 }
295
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +0000296 RCU_INIT_POINTER(dev->ip_ptr, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800298 devinet_sysctl_unregister(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299 neigh_parms_release(&arp_tbl, in_dev->arp_parms);
300 arp_ifdown(dev);
301
302 call_rcu(&in_dev->rcu_head, in_dev_rcu_put);
303}
304
Al Viroff428d72006-09-26 22:13:35 -0700305int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306{
307 rcu_read_lock();
308 for_primary_ifa(in_dev) {
309 if (inet_ifa_match(a, ifa)) {
310 if (!b || inet_ifa_match(b, ifa)) {
311 rcu_read_unlock();
312 return 1;
313 }
314 }
315 } endfor_ifa(in_dev);
316 rcu_read_unlock();
317 return 0;
318}
319
Thomas Grafd6062cb2006-08-15 00:33:59 -0700320static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
Eric W. Biederman15e47302012-09-07 20:12:54 +0000321 int destroy, struct nlmsghdr *nlh, u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322{
Harald Welte8f937c62005-05-29 20:23:46 -0700323 struct in_ifaddr *promote = NULL;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800324 struct in_ifaddr *ifa, *ifa1 = *ifap;
325 struct in_ifaddr *last_prim = in_dev->ifa_list;
326 struct in_ifaddr *prev_prom = NULL;
327 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328
329 ASSERT_RTNL();
330
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900331 /* 1. Deleting primary ifaddr forces deletion all secondaries
Harald Welte8f937c62005-05-29 20:23:46 -0700332 * unless alias promotion is set
333 **/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334
335 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336 struct in_ifaddr **ifap1 = &ifa1->ifa_next;
337
338 while ((ifa = *ifap1) != NULL) {
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900339 if (!(ifa->ifa_flags & IFA_F_SECONDARY) &&
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800340 ifa1->ifa_scope <= ifa->ifa_scope)
341 last_prim = ifa;
342
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343 if (!(ifa->ifa_flags & IFA_F_SECONDARY) ||
344 ifa1->ifa_mask != ifa->ifa_mask ||
345 !inet_ifa_match(ifa1->ifa_address, ifa)) {
346 ifap1 = &ifa->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800347 prev_prom = ifa;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348 continue;
349 }
350
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800351 if (!do_promote) {
David S. Millerfd23c3b2011-02-18 12:42:28 -0800352 inet_hash_remove(ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700353 *ifap1 = ifa->ifa_next;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354
Eric W. Biederman15e47302012-09-07 20:12:54 +0000355 rtmsg_ifa(RTM_DELADDR, ifa, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800356 blocking_notifier_call_chain(&inetaddr_chain,
357 NETDEV_DOWN, ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700358 inet_free_ifa(ifa);
359 } else {
360 promote = ifa;
361 break;
362 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363 }
364 }
365
Julian Anastasov2d230e22011-03-19 12:13:52 +0000366 /* On promotion all secondaries from subnet are changing
367 * the primary IP, we must remove all their routes silently
368 * and later to add them back with new prefsrc. Do this
369 * while all addresses are on the device list.
370 */
371 for (ifa = promote; ifa; ifa = ifa->ifa_next) {
372 if (ifa1->ifa_mask == ifa->ifa_mask &&
373 inet_ifa_match(ifa1->ifa_address, ifa))
374 fib_del_ifaddr(ifa, ifa1);
375 }
376
Linus Torvalds1da177e2005-04-16 15:20:36 -0700377 /* 2. Unlink it */
378
379 *ifap = ifa1->ifa_next;
David S. Millerfd23c3b2011-02-18 12:42:28 -0800380 inet_hash_remove(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381
382 /* 3. Announce address deletion */
383
384 /* Send message first, then call notifier.
385 At first sight, FIB update triggered by notifier
386 will refer to already deleted ifaddr, that could confuse
387 netlink listeners. It is not true: look, gated sees
388 that route deleted and if it still thinks that ifaddr
389 is valid, it will try to restore deleted routes... Grr.
390 So that, this order is correct.
391 */
Eric W. Biederman15e47302012-09-07 20:12:54 +0000392 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800393 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1);
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800394
395 if (promote) {
Julian Anastasov04024b92011-03-19 12:13:54 +0000396 struct in_ifaddr *next_sec = promote->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800397
398 if (prev_prom) {
399 prev_prom->ifa_next = promote->ifa_next;
400 promote->ifa_next = last_prim->ifa_next;
401 last_prim->ifa_next = promote;
402 }
403
404 promote->ifa_flags &= ~IFA_F_SECONDARY;
Eric W. Biederman15e47302012-09-07 20:12:54 +0000405 rtmsg_ifa(RTM_NEWADDR, promote, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800406 blocking_notifier_call_chain(&inetaddr_chain,
407 NETDEV_UP, promote);
Julian Anastasov04024b92011-03-19 12:13:54 +0000408 for (ifa = next_sec; ifa; ifa = ifa->ifa_next) {
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800409 if (ifa1->ifa_mask != ifa->ifa_mask ||
410 !inet_ifa_match(ifa1->ifa_address, ifa))
411 continue;
412 fib_add_ifaddr(ifa);
413 }
414
415 }
Herbert Xu63630972007-06-07 18:35:38 -0700416 if (destroy)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 inet_free_ifa(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700418}
419
Thomas Grafd6062cb2006-08-15 00:33:59 -0700420static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
421 int destroy)
422{
423 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0);
424}
425
/* Address lifetime checker, defined further down in this file. */
static void check_lifetime(struct work_struct *work);

/* Delayed work item that runs check_lifetime(). */
static DECLARE_DELAYED_WORK(check_lifetime_work, check_lifetime);
429
Thomas Grafd6062cb2006-08-15 00:33:59 -0700430static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh,
Eric W. Biederman15e47302012-09-07 20:12:54 +0000431 u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432{
433 struct in_device *in_dev = ifa->ifa_dev;
434 struct in_ifaddr *ifa1, **ifap, **last_primary;
435
436 ASSERT_RTNL();
437
438 if (!ifa->ifa_local) {
439 inet_free_ifa(ifa);
440 return 0;
441 }
442
443 ifa->ifa_flags &= ~IFA_F_SECONDARY;
444 last_primary = &in_dev->ifa_list;
445
446 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
447 ifap = &ifa1->ifa_next) {
448 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) &&
449 ifa->ifa_scope <= ifa1->ifa_scope)
450 last_primary = &ifa1->ifa_next;
451 if (ifa1->ifa_mask == ifa->ifa_mask &&
452 inet_ifa_match(ifa1->ifa_address, ifa)) {
453 if (ifa1->ifa_local == ifa->ifa_local) {
454 inet_free_ifa(ifa);
455 return -EEXIST;
456 }
457 if (ifa1->ifa_scope != ifa->ifa_scope) {
458 inet_free_ifa(ifa);
459 return -EINVAL;
460 }
461 ifa->ifa_flags |= IFA_F_SECONDARY;
462 }
463 }
464
465 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) {
466 net_srandom(ifa->ifa_local);
467 ifap = last_primary;
468 }
469
470 ifa->ifa_next = *ifap;
471 *ifap = ifa;
472
David S. Millerfd23c3b2011-02-18 12:42:28 -0800473 inet_hash_insert(dev_net(in_dev->dev), ifa);
474
Jiri Pirko5c766d62013-01-24 09:41:41 +0000475 cancel_delayed_work(&check_lifetime_work);
476 schedule_delayed_work(&check_lifetime_work, 0);
477
Linus Torvalds1da177e2005-04-16 15:20:36 -0700478 /* Send message first, then call notifier.
479 Notifier will trigger FIB update, so that
480 listeners of netlink will know about new ifaddr */
Eric W. Biederman15e47302012-09-07 20:12:54 +0000481 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800482 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700483
484 return 0;
485}
486
Thomas Grafd6062cb2006-08-15 00:33:59 -0700487static int inet_insert_ifa(struct in_ifaddr *ifa)
488{
489 return __inet_insert_ifa(ifa, NULL, 0);
490}
491
Linus Torvalds1da177e2005-04-16 15:20:36 -0700492static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa)
493{
Herbert Xue5ed6392005-10-03 14:35:55 -0700494 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700495
496 ASSERT_RTNL();
497
498 if (!in_dev) {
Herbert Xu71e27da2007-06-04 23:36:06 -0700499 inet_free_ifa(ifa);
500 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501 }
Herbert Xu71e27da2007-06-04 23:36:06 -0700502 ipv4_devconf_setall(in_dev);
Jiri Pirko1d4c8c22013-12-07 19:26:56 +0100503 neigh_parms_data_state_setall(in_dev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700504 if (ifa->ifa_dev != in_dev) {
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700505 WARN_ON(ifa->ifa_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700506 in_dev_hold(in_dev);
507 ifa->ifa_dev = in_dev;
508 }
Joe Perchesf97c1e02007-12-16 13:45:43 -0800509 if (ipv4_is_loopback(ifa->ifa_local))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510 ifa->ifa_scope = RT_SCOPE_HOST;
511 return inet_insert_ifa(ifa);
512}
513
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000514/* Caller must hold RCU or RTNL :
515 * We dont take a reference on found in_device
516 */
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800517struct in_device *inetdev_by_index(struct net *net, int ifindex)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700518{
519 struct net_device *dev;
520 struct in_device *in_dev = NULL;
Eric Dumazetc148fc22009-11-01 19:23:04 +0000521
522 rcu_read_lock();
523 dev = dev_get_by_index_rcu(net, ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 if (dev)
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000525 in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Eric Dumazetc148fc22009-11-01 19:23:04 +0000526 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700527 return in_dev;
528}
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800529EXPORT_SYMBOL(inetdev_by_index);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700530
531/* Called only from RTNL semaphored context. No locks. */
532
Al Viro60cad5d2006-09-26 22:17:09 -0700533struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix,
534 __be32 mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700535{
536 ASSERT_RTNL();
537
538 for_primary_ifa(in_dev) {
539 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa))
540 return ifa;
541 } endfor_ifa(in_dev);
542 return NULL;
543}
544
Thomas Graf661d2962013-03-21 07:45:29 +0000545static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700546{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900547 struct net *net = sock_net(skb->sk);
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700548 struct nlattr *tb[IFA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700549 struct in_device *in_dev;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700550 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700551 struct in_ifaddr *ifa, **ifap;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700552 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700553
554 ASSERT_RTNL();
555
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700556 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
557 if (err < 0)
558 goto errout;
559
560 ifm = nlmsg_data(nlh);
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800561 in_dev = inetdev_by_index(net, ifm->ifa_index);
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700562 if (in_dev == NULL) {
563 err = -ENODEV;
564 goto errout;
565 }
566
Linus Torvalds1da177e2005-04-16 15:20:36 -0700567 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
568 ifap = &ifa->ifa_next) {
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700569 if (tb[IFA_LOCAL] &&
Al Viroa7a628c2006-09-26 22:16:43 -0700570 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL]))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571 continue;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700572
573 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label))
574 continue;
575
576 if (tb[IFA_ADDRESS] &&
577 (ifm->ifa_prefixlen != ifa->ifa_prefixlen ||
Al Viroa7a628c2006-09-26 22:16:43 -0700578 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa)))
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700579 continue;
580
Eric W. Biederman15e47302012-09-07 20:12:54 +0000581 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).portid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700582 return 0;
583 }
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700584
585 err = -EADDRNOTAVAIL;
586errout:
587 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588}
589
Jiri Pirko5c766d62013-01-24 09:41:41 +0000590#define INFINITY_LIFE_TIME 0xFFFFFFFF
591
592static void check_lifetime(struct work_struct *work)
593{
594 unsigned long now, next, next_sec, next_sched;
595 struct in_ifaddr *ifa;
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000596 struct hlist_node *n;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000597 int i;
598
599 now = jiffies;
600 next = round_jiffies_up(now + ADDR_CHECK_FREQUENCY);
601
Jiri Pirko5c766d62013-01-24 09:41:41 +0000602 for (i = 0; i < IN4_ADDR_HSIZE; i++) {
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000603 bool change_needed = false;
604
605 rcu_read_lock();
Sasha Levinb67bfe02013-02-27 17:06:00 -0800606 hlist_for_each_entry_rcu(ifa, &inet_addr_lst[i], hash) {
Jiri Pirko5c766d62013-01-24 09:41:41 +0000607 unsigned long age;
608
609 if (ifa->ifa_flags & IFA_F_PERMANENT)
610 continue;
611
612 /* We try to batch several events at once. */
613 age = (now - ifa->ifa_tstamp +
614 ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
615
616 if (ifa->ifa_valid_lft != INFINITY_LIFE_TIME &&
617 age >= ifa->ifa_valid_lft) {
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000618 change_needed = true;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000619 } else if (ifa->ifa_preferred_lft ==
620 INFINITY_LIFE_TIME) {
621 continue;
622 } else if (age >= ifa->ifa_preferred_lft) {
623 if (time_before(ifa->ifa_tstamp +
624 ifa->ifa_valid_lft * HZ, next))
625 next = ifa->ifa_tstamp +
626 ifa->ifa_valid_lft * HZ;
627
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000628 if (!(ifa->ifa_flags & IFA_F_DEPRECATED))
629 change_needed = true;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000630 } else if (time_before(ifa->ifa_tstamp +
631 ifa->ifa_preferred_lft * HZ,
632 next)) {
633 next = ifa->ifa_tstamp +
634 ifa->ifa_preferred_lft * HZ;
635 }
636 }
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000637 rcu_read_unlock();
638 if (!change_needed)
639 continue;
640 rtnl_lock();
641 hlist_for_each_entry_safe(ifa, n, &inet_addr_lst[i], hash) {
642 unsigned long age;
643
644 if (ifa->ifa_flags & IFA_F_PERMANENT)
645 continue;
646
647 /* We try to batch several events at once. */
648 age = (now - ifa->ifa_tstamp +
649 ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
650
651 if (ifa->ifa_valid_lft != INFINITY_LIFE_TIME &&
652 age >= ifa->ifa_valid_lft) {
653 struct in_ifaddr **ifap;
654
655 for (ifap = &ifa->ifa_dev->ifa_list;
656 *ifap != NULL; ifap = &(*ifap)->ifa_next) {
657 if (*ifap == ifa) {
658 inet_del_ifa(ifa->ifa_dev,
659 ifap, 1);
660 break;
661 }
662 }
663 } else if (ifa->ifa_preferred_lft !=
664 INFINITY_LIFE_TIME &&
665 age >= ifa->ifa_preferred_lft &&
666 !(ifa->ifa_flags & IFA_F_DEPRECATED)) {
667 ifa->ifa_flags |= IFA_F_DEPRECATED;
668 rtmsg_ifa(RTM_NEWADDR, ifa, NULL, 0);
669 }
670 }
671 rtnl_unlock();
Jiri Pirko5c766d62013-01-24 09:41:41 +0000672 }
Jiri Pirko5c766d62013-01-24 09:41:41 +0000673
674 next_sec = round_jiffies_up(next);
675 next_sched = next;
676
677 /* If rounded timeout is accurate enough, accept it. */
678 if (time_before(next_sec, next + ADDRCONF_TIMER_FUZZ))
679 next_sched = next_sec;
680
681 now = jiffies;
682 /* And minimum interval is ADDRCONF_TIMER_FUZZ_MAX. */
683 if (time_before(next_sched, now + ADDRCONF_TIMER_FUZZ_MAX))
684 next_sched = now + ADDRCONF_TIMER_FUZZ_MAX;
685
686 schedule_delayed_work(&check_lifetime_work, next_sched - now);
687}
688
689static void set_ifa_lifetime(struct in_ifaddr *ifa, __u32 valid_lft,
690 __u32 prefered_lft)
691{
692 unsigned long timeout;
693
694 ifa->ifa_flags &= ~(IFA_F_PERMANENT | IFA_F_DEPRECATED);
695
696 timeout = addrconf_timeout_fixup(valid_lft, HZ);
697 if (addrconf_finite_timeout(timeout))
698 ifa->ifa_valid_lft = timeout;
699 else
700 ifa->ifa_flags |= IFA_F_PERMANENT;
701
702 timeout = addrconf_timeout_fixup(prefered_lft, HZ);
703 if (addrconf_finite_timeout(timeout)) {
704 if (timeout == 0)
705 ifa->ifa_flags |= IFA_F_DEPRECATED;
706 ifa->ifa_preferred_lft = timeout;
707 }
708 ifa->ifa_tstamp = jiffies;
709 if (!ifa->ifa_cstamp)
710 ifa->ifa_cstamp = ifa->ifa_tstamp;
711}
712
713static struct in_ifaddr *rtm_to_ifaddr(struct net *net, struct nlmsghdr *nlh,
714 __u32 *pvalid_lft, __u32 *pprefered_lft)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715{
Thomas Graf5c753972006-08-04 23:03:53 -0700716 struct nlattr *tb[IFA_MAX+1];
717 struct in_ifaddr *ifa;
718 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700719 struct net_device *dev;
720 struct in_device *in_dev;
Denis V. Lunev7b218572008-01-31 18:47:00 -0800721 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700722
Thomas Graf5c753972006-08-04 23:03:53 -0700723 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
724 if (err < 0)
725 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726
Thomas Graf5c753972006-08-04 23:03:53 -0700727 ifm = nlmsg_data(nlh);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800728 err = -EINVAL;
729 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700730 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -0800732 dev = __dev_get_by_index(net, ifm->ifa_index);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800733 err = -ENODEV;
734 if (dev == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700735 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700736
Thomas Graf5c753972006-08-04 23:03:53 -0700737 in_dev = __in_dev_get_rtnl(dev);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800738 err = -ENOBUFS;
739 if (in_dev == NULL)
Herbert Xu71e27da2007-06-04 23:36:06 -0700740 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741
Thomas Graf5c753972006-08-04 23:03:53 -0700742 ifa = inet_alloc_ifa();
Denis V. Lunev7b218572008-01-31 18:47:00 -0800743 if (ifa == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700744 /*
745 * A potential indev allocation can be left alive, it stays
746 * assigned to its device and is destroy with it.
747 */
Thomas Graf5c753972006-08-04 23:03:53 -0700748 goto errout;
Thomas Graf5c753972006-08-04 23:03:53 -0700749
Pavel Emelyanova4e65d32007-12-07 23:55:43 -0800750 ipv4_devconf_setall(in_dev);
Jiri Pirko1d4c8c22013-12-07 19:26:56 +0100751 neigh_parms_data_state_setall(in_dev->arp_parms);
Thomas Graf5c753972006-08-04 23:03:53 -0700752 in_dev_hold(in_dev);
753
754 if (tb[IFA_ADDRESS] == NULL)
755 tb[IFA_ADDRESS] = tb[IFA_LOCAL];
756
David S. Millerfd23c3b2011-02-18 12:42:28 -0800757 INIT_HLIST_NODE(&ifa->hash);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758 ifa->ifa_prefixlen = ifm->ifa_prefixlen;
759 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700760 ifa->ifa_flags = ifm->ifa_flags;
761 ifa->ifa_scope = ifm->ifa_scope;
Thomas Graf5c753972006-08-04 23:03:53 -0700762 ifa->ifa_dev = in_dev;
763
Al Viroa7a628c2006-09-26 22:16:43 -0700764 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]);
765 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]);
Thomas Graf5c753972006-08-04 23:03:53 -0700766
767 if (tb[IFA_BROADCAST])
Al Viroa7a628c2006-09-26 22:16:43 -0700768 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]);
Thomas Graf5c753972006-08-04 23:03:53 -0700769
Thomas Graf5c753972006-08-04 23:03:53 -0700770 if (tb[IFA_LABEL])
771 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772 else
773 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
774
Jiri Pirko5c766d62013-01-24 09:41:41 +0000775 if (tb[IFA_CACHEINFO]) {
776 struct ifa_cacheinfo *ci;
777
778 ci = nla_data(tb[IFA_CACHEINFO]);
779 if (!ci->ifa_valid || ci->ifa_prefered > ci->ifa_valid) {
780 err = -EINVAL;
Daniel Borkmann446266b2013-08-02 11:32:43 +0200781 goto errout_free;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000782 }
783 *pvalid_lft = ci->ifa_valid;
784 *pprefered_lft = ci->ifa_prefered;
785 }
786
Thomas Graf5c753972006-08-04 23:03:53 -0700787 return ifa;
788
Daniel Borkmann446266b2013-08-02 11:32:43 +0200789errout_free:
790 inet_free_ifa(ifa);
Thomas Graf5c753972006-08-04 23:03:53 -0700791errout:
792 return ERR_PTR(err);
793}
794
Jiri Pirko5c766d62013-01-24 09:41:41 +0000795static struct in_ifaddr *find_matching_ifa(struct in_ifaddr *ifa)
796{
797 struct in_device *in_dev = ifa->ifa_dev;
798 struct in_ifaddr *ifa1, **ifap;
799
800 if (!ifa->ifa_local)
801 return NULL;
802
803 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
804 ifap = &ifa1->ifa_next) {
805 if (ifa1->ifa_mask == ifa->ifa_mask &&
806 inet_ifa_match(ifa1->ifa_address, ifa) &&
807 ifa1->ifa_local == ifa->ifa_local)
808 return ifa1;
809 }
810 return NULL;
811}
812
Thomas Graf661d2962013-03-21 07:45:29 +0000813static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh)
Thomas Graf5c753972006-08-04 23:03:53 -0700814{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900815 struct net *net = sock_net(skb->sk);
Thomas Graf5c753972006-08-04 23:03:53 -0700816 struct in_ifaddr *ifa;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000817 struct in_ifaddr *ifa_existing;
818 __u32 valid_lft = INFINITY_LIFE_TIME;
819 __u32 prefered_lft = INFINITY_LIFE_TIME;
Thomas Graf5c753972006-08-04 23:03:53 -0700820
821 ASSERT_RTNL();
822
Jiri Pirko5c766d62013-01-24 09:41:41 +0000823 ifa = rtm_to_ifaddr(net, nlh, &valid_lft, &prefered_lft);
Thomas Graf5c753972006-08-04 23:03:53 -0700824 if (IS_ERR(ifa))
825 return PTR_ERR(ifa);
826
Jiri Pirko5c766d62013-01-24 09:41:41 +0000827 ifa_existing = find_matching_ifa(ifa);
828 if (!ifa_existing) {
829 /* It would be best to check for !NLM_F_CREATE here but
830 * userspace alreay relies on not having to provide this.
831 */
832 set_ifa_lifetime(ifa, valid_lft, prefered_lft);
833 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).portid);
834 } else {
835 inet_free_ifa(ifa);
836
837 if (nlh->nlmsg_flags & NLM_F_EXCL ||
838 !(nlh->nlmsg_flags & NLM_F_REPLACE))
839 return -EEXIST;
Jiri Pirko34e2ed32013-04-04 08:33:00 +0000840 ifa = ifa_existing;
841 set_ifa_lifetime(ifa, valid_lft, prefered_lft);
Jiri Pirko05a324b2013-04-04 23:39:38 +0000842 cancel_delayed_work(&check_lifetime_work);
843 schedule_delayed_work(&check_lifetime_work, 0);
Jiri Pirko34e2ed32013-04-04 08:33:00 +0000844 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, NETLINK_CB(skb).portid);
845 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Jiri Pirko5c766d62013-01-24 09:41:41 +0000846 }
847 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700848}
849
850/*
851 * Determine a default network mask, based on the IP address.
852 */
853
Eric Dumazet40384992012-08-03 21:06:50 +0000854static int inet_abc_len(__be32 addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700855{
856 int rc = -1; /* Something else, probably a multicast. */
857
Joe Perchesf97c1e02007-12-16 13:45:43 -0800858 if (ipv4_is_zeronet(addr))
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900859 rc = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700860 else {
Al Viro714e85b2006-11-14 20:51:49 -0800861 __u32 haddr = ntohl(addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700862
Al Viro714e85b2006-11-14 20:51:49 -0800863 if (IN_CLASSA(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700864 rc = 8;
Al Viro714e85b2006-11-14 20:51:49 -0800865 else if (IN_CLASSB(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700866 rc = 16;
Al Viro714e85b2006-11-14 20:51:49 -0800867 else if (IN_CLASSC(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700868 rc = 24;
869 }
870
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900871 return rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700872}
873
874
/*
 * Handle the IPv4 per-interface address ioctls: SIOCGIF{ADDR,BRDADDR,DSTADDR,
 * NETMASK}, SIOCSIF{ADDR,BRDADDR,DSTADDR,NETMASK} and SIOCSIFFLAGS.
 *
 * @net: namespace in which the interface name is looked up
 * @cmd: ioctl number; anything not listed above yields -EINVAL
 * @arg: user pointer to a struct ifreq (read on entry, written back for the
 *       "get" commands)
 *
 * The interface name may carry an alias suffix ("name:suffix"); the part
 * before the colon selects the device, the full string selects the address
 * by label.  The "set" commands and SIOCSIFFLAGS require CAP_NET_ADMIN in
 * net->user_ns.
 *
 * Returns 0 on success or a negative errno (-EFAULT, -EPERM, -EINVAL,
 * -ENODEV, -EADDRNOTAVAIL, -ENOBUFS, or whatever dev_change_flags() /
 * inet_set_ifa() return).
 */
int devinet_ioctl(struct net *net, unsigned int cmd, void __user *arg)
{
	struct ifreq ifr;
	struct sockaddr_in sin_orig;
	struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr;
	struct in_device *in_dev;
	struct in_ifaddr **ifap = NULL;
	struct in_ifaddr *ifa = NULL;
	struct net_device *dev;
	char *colon;
	int ret = -EFAULT;
	int tryaddrmatch = 0;

	/*
	 *	Fetch the caller's info block into kernel space
	 */

	if (copy_from_user(&ifr, arg, sizeof(struct ifreq)))
		goto out;
	/* Force termination: the name comes straight from user space. */
	ifr.ifr_name[IFNAMSIZ - 1] = 0;

	/* save original address for comparison */
	memcpy(&sin_orig, sin, sizeof(*sin));

	/* Temporarily cut an alias label at the colon so that only the base
	 * device name is used for dev_load() and the device lookup below.
	 */
	colon = strchr(ifr.ifr_name, ':');
	if (colon)
		*colon = 0;

	dev_load(net, ifr.ifr_name);

	/* First pass over cmd: permission and argument checks, done before
	 * RTNL is taken.
	 */
	switch (cmd) {
	case SIOCGIFADDR:	/* Get interface address */
	case SIOCGIFBRDADDR:	/* Get the broadcast address */
	case SIOCGIFDSTADDR:	/* Get the destination address */
	case SIOCGIFNETMASK:	/* Get the netmask for the interface */
		/* Note that these ioctls will not sleep,
		   so that we do not impose a lock.
		   One day we will be forced to put shlock here (I mean SMP)
		 */
		/* Only attempt label+address matching when the caller passed
		 * an AF_INET address; the reply buffer is then reset.
		 */
		tryaddrmatch = (sin_orig.sin_family == AF_INET);
		memset(sin, 0, sizeof(*sin));
		sin->sin_family = AF_INET;
		break;

	case SIOCSIFFLAGS:
		ret = -EPERM;
		if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
			goto out;
		break;
	case SIOCSIFADDR:	/* Set interface address (and family) */
	case SIOCSIFBRDADDR:	/* Set the broadcast address */
	case SIOCSIFDSTADDR:	/* Set the destination address */
	case SIOCSIFNETMASK: 	/* Set the netmask for the interface */
		ret = -EPERM;
		if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
			goto out;
		ret = -EINVAL;
		if (sin->sin_family != AF_INET)
			goto out;
		break;
	default:
		ret = -EINVAL;
		goto out;
	}

	rtnl_lock();

	ret = -ENODEV;
	dev = __dev_get_by_name(net, ifr.ifr_name);
	if (!dev)
		goto done;

	/* Restore the full label for the per-address comparisons below. */
	if (colon)
		*colon = ':';

	in_dev = __in_dev_get_rtnl(dev);
	if (in_dev) {
		if (tryaddrmatch) {
			/* Matthias Andree */
			/* compare label and address (4.4BSD style) */
			/* note: we only do this for a limited set of ioctls
			   and only if the original address family was AF_INET.
			   This is checked above. */
			for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
			     ifap = &ifa->ifa_next) {
				if (!strcmp(ifr.ifr_name, ifa->ifa_label) &&
				    sin_orig.sin_addr.s_addr ==
							ifa->ifa_local) {
					break; /* found */
				}
			}
		}
		/* we didn't get a match, maybe the application is
		   4.3BSD-style and passed in junk so we fall back to
		   comparing just the label */
		if (!ifa) {
			for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
			     ifap = &ifa->ifa_next)
				if (!strcmp(ifr.ifr_name, ifa->ifa_label))
					break;
		}
	}

	/* Every command except SIOCSIFADDR and SIOCSIFFLAGS needs an
	 * existing address to operate on.
	 */
	ret = -EADDRNOTAVAIL;
	if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS)
		goto done;

	/* Second pass over cmd: perform the operation under RTNL.  The "get"
	 * cases leave through rarok, which copies ifr back to user space.
	 */
	switch (cmd) {
	case SIOCGIFADDR:	/* Get interface address */
		sin->sin_addr.s_addr = ifa->ifa_local;
		goto rarok;

	case SIOCGIFBRDADDR:	/* Get the broadcast address */
		sin->sin_addr.s_addr = ifa->ifa_broadcast;
		goto rarok;

	case SIOCGIFDSTADDR:	/* Get the destination address */
		sin->sin_addr.s_addr = ifa->ifa_address;
		goto rarok;

	case SIOCGIFNETMASK:	/* Get the netmask for the interface */
		sin->sin_addr.s_addr = ifa->ifa_mask;
		goto rarok;

	case SIOCSIFFLAGS:
		if (colon) {
			/* Flags on an alias label: clearing IFF_UP deletes
			 * that address; the device flags are not touched.
			 */
			ret = -EADDRNOTAVAIL;
			if (!ifa)
				break;
			ret = 0;
			if (!(ifr.ifr_flags & IFF_UP))
				inet_del_ifa(in_dev, ifap, 1);
			break;
		}
		ret = dev_change_flags(dev, ifr.ifr_flags);
		break;

	case SIOCSIFADDR:	/* Set interface address (and family) */
		/* Addresses without a classful default mask are rejected. */
		ret = -EINVAL;
		if (inet_abc_len(sin->sin_addr.s_addr) < 0)
			break;

		if (!ifa) {
			/* No address under this label yet: allocate one. */
			ret = -ENOBUFS;
			ifa = inet_alloc_ifa();
			if (!ifa)
				break;
			INIT_HLIST_NODE(&ifa->hash);
			if (colon)
				memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ);
			else
				memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
		} else {
			/* Same address already set: nothing to do.  Otherwise
			 * unlink the entry (third argument 0) so it can be
			 * modified and handed to inet_set_ifa() below.
			 */
			ret = 0;
			if (ifa->ifa_local == sin->sin_addr.s_addr)
				break;
			inet_del_ifa(in_dev, ifap, 0);
			ifa->ifa_broadcast = 0;
			ifa->ifa_scope = 0;
		}

		ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr;

		/* Derive prefix, mask and broadcast from the address class,
		 * or use a /32 on point-to-point devices.
		 */
		if (!(dev->flags & IFF_POINTOPOINT)) {
			ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address);
			ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen);
			if ((dev->flags & IFF_BROADCAST) &&
			    ifa->ifa_prefixlen < 31)
				ifa->ifa_broadcast = ifa->ifa_address |
						     ~ifa->ifa_mask;
		} else {
			ifa->ifa_prefixlen = 32;
			ifa->ifa_mask = inet_make_mask(32);
		}
		set_ifa_lifetime(ifa, INFINITY_LIFE_TIME, INFINITY_LIFE_TIME);
		ret = inet_set_ifa(dev, ifa);
		break;

	case SIOCSIFBRDADDR:	/* Set the broadcast address */
		/* Unlink, modify and re-insert only when the value changes. */
		ret = 0;
		if (ifa->ifa_broadcast != sin->sin_addr.s_addr) {
			inet_del_ifa(in_dev, ifap, 0);
			ifa->ifa_broadcast = sin->sin_addr.s_addr;
			inet_insert_ifa(ifa);
		}
		break;

	case SIOCSIFDSTADDR:	/* Set the destination address */
		ret = 0;
		if (ifa->ifa_address == sin->sin_addr.s_addr)
			break;
		ret = -EINVAL;
		if (inet_abc_len(sin->sin_addr.s_addr) < 0)
			break;
		ret = 0;
		inet_del_ifa(in_dev, ifap, 0);
		ifa->ifa_address = sin->sin_addr.s_addr;
		inet_insert_ifa(ifa);
		break;

	case SIOCSIFNETMASK: 	/* Set the netmask for the interface */

		/*
		 *	The mask we set must be legal.
		 */
		ret = -EINVAL;
		if (bad_mask(sin->sin_addr.s_addr, 0))
			break;
		ret = 0;
		if (ifa->ifa_mask != sin->sin_addr.s_addr) {
			__be32 old_mask = ifa->ifa_mask;
			inet_del_ifa(in_dev, ifap, 0);
			ifa->ifa_mask = sin->sin_addr.s_addr;
			ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask);

			/* See if current broadcast address matches
			 * with current netmask, then recalculate
			 * the broadcast address. Otherwise it's a
			 * funny address, so don't touch it since
			 * the user seems to know what (s)he's doing...
			 */
			if ((dev->flags & IFF_BROADCAST) &&
			    (ifa->ifa_prefixlen < 31) &&
			    (ifa->ifa_broadcast ==
			     (ifa->ifa_local|~old_mask))) {
				ifa->ifa_broadcast = (ifa->ifa_local |
						      ~sin->sin_addr.s_addr);
			}
			inet_insert_ifa(ifa);
		}
		break;
	}
done:
	rtnl_unlock();
out:
	return ret;
rarok:
	/* "Get" path: drop RTNL first, then copy the reply to user space. */
	rtnl_unlock();
	ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0;
	goto out;
}
1116
1117static int inet_gifconf(struct net_device *dev, char __user *buf, int len)
1118{
Herbert Xue5ed6392005-10-03 14:35:55 -07001119 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001120 struct in_ifaddr *ifa;
1121 struct ifreq ifr;
1122 int done = 0;
1123
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001124 if (!in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001125 goto out;
1126
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001127 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001128 if (!buf) {
1129 done += sizeof(ifr);
1130 continue;
1131 }
1132 if (len < (int) sizeof(ifr))
1133 break;
1134 memset(&ifr, 0, sizeof(struct ifreq));
Dan Carpenter4299c8a2013-07-29 22:15:19 +03001135 strcpy(ifr.ifr_name, ifa->ifa_label);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001136
1137 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET;
1138 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr =
1139 ifa->ifa_local;
1140
1141 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) {
1142 done = -EFAULT;
1143 break;
1144 }
1145 buf += sizeof(struct ifreq);
1146 len -= sizeof(struct ifreq);
1147 done += sizeof(struct ifreq);
1148 }
1149out:
1150 return done;
1151}
1152
Al Viroa61ced52006-09-26 21:27:54 -07001153__be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001154{
Al Viroa61ced52006-09-26 21:27:54 -07001155 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001156 struct in_device *in_dev;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001157 struct net *net = dev_net(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001158
1159 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -07001160 in_dev = __in_dev_get_rcu(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001161 if (!in_dev)
1162 goto no_in_dev;
1163
1164 for_primary_ifa(in_dev) {
1165 if (ifa->ifa_scope > scope)
1166 continue;
1167 if (!dst || inet_ifa_match(dst, ifa)) {
1168 addr = ifa->ifa_local;
1169 break;
1170 }
1171 if (!addr)
1172 addr = ifa->ifa_local;
1173 } endfor_ifa(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001174
1175 if (addr)
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001176 goto out_unlock;
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001177no_in_dev:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001178
1179 /* Not loopback addresses on loopback should be preferred
1180 in this case. It is importnat that lo is the first interface
1181 in dev_base list.
1182 */
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001183 for_each_netdev_rcu(net, dev) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001184 in_dev = __in_dev_get_rcu(dev);
1185 if (!in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001186 continue;
1187
1188 for_primary_ifa(in_dev) {
1189 if (ifa->ifa_scope != RT_SCOPE_LINK &&
1190 ifa->ifa_scope <= scope) {
1191 addr = ifa->ifa_local;
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001192 goto out_unlock;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001193 }
1194 } endfor_ifa(in_dev);
1195 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001196out_unlock:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001197 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001198 return addr;
1199}
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001200EXPORT_SYMBOL(inet_select_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201
/*
 * Per-device worker for inet_confirm_addr().
 *
 * Walks the addresses of @in_dev tracking two things:
 *   addr - the first ifa_local that equals @local (or any, when @local is 0)
 *          and whose scope is <= @scope;
 *   same - whether some address's subnet matches @local (if non-zero) and
 *          @dst (if non-zero), as judged by inet_ifa_match().
 *
 * Returns addr when a matching subnet was found, otherwise 0.
 */
static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst,
				 __be32 local, int scope)
{
	int same = 0;
	__be32 addr = 0;

	for_ifa(in_dev) {
		/* Latch the first acceptable local address. */
		if (!addr &&
		    (local == ifa->ifa_local || !local) &&
		    ifa->ifa_scope <= scope) {
			addr = ifa->ifa_local;
			/* Subnet already confirmed earlier: both found. */
			if (same)
				break;
		}
		if (!same) {
			same = (!local || inet_ifa_match(local, ifa)) &&
				(!dst || inet_ifa_match(dst, ifa));
			if (same && addr) {
				/* Explicit local, or no dst constraint:
				 * the current addr is good enough.
				 */
				if (local || !dst)
					break;
				/* Is the selected addr into dst subnet? */
				if (inet_ifa_match(addr, ifa))
					break;
				/* No, then can we use new local src? */
				if (ifa->ifa_scope <= scope) {
					addr = ifa->ifa_local;
					break;
				}
				/* search for large dst subnet for addr */
				same = 0;
			}
		}
	} endfor_ifa(in_dev);

	return same ? addr : 0;
}
1238
1239/*
1240 * Confirm that local IP address exists using wildcards:
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001241 * - in_dev: only on this interface, 0=any interface
Linus Torvalds1da177e2005-04-16 15:20:36 -07001242 * - dst: only in the same subnet as dst, 0=any dst
1243 * - local: address, 0=autoselect the local address
1244 * - scope: maximum allowed scope value for the local address
1245 */
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001246__be32 inet_confirm_addr(struct in_device *in_dev,
1247 __be32 dst, __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001248{
Al Viro60cad5d2006-09-26 22:17:09 -07001249 __be32 addr = 0;
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001250 struct net_device *dev;
Denis V. Lunev39a6d062008-01-14 23:06:19 -08001251 struct net *net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001252
Denis V. Lunev39a6d062008-01-14 23:06:19 -08001253 if (scope != RT_SCOPE_LINK)
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001254 return confirm_addr_indev(in_dev, dst, local, scope);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001255
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001256 net = dev_net(in_dev->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001257 rcu_read_lock();
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001258 for_each_netdev_rcu(net, dev) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001259 in_dev = __in_dev_get_rcu(dev);
1260 if (in_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001261 addr = confirm_addr_indev(in_dev, dst, local, scope);
1262 if (addr)
1263 break;
1264 }
1265 }
1266 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001267
1268 return addr;
1269}
Andy Gospodarekeaddcd72012-03-22 16:14:29 +00001270EXPORT_SYMBOL(inet_confirm_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001271
1272/*
1273 * Device notifier
1274 */
1275
/*
 * Add @nb to the blocking notifier chain inetaddr_chain.
 * Returns whatever blocking_notifier_chain_register() returns.
 */
int register_inetaddr_notifier(struct notifier_block *nb)
{
	return blocking_notifier_chain_register(&inetaddr_chain, nb);
}
EXPORT_SYMBOL(register_inetaddr_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001281
/*
 * Remove @nb from the blocking notifier chain inetaddr_chain.
 * Returns whatever blocking_notifier_chain_unregister() returns.
 */
int unregister_inetaddr_notifier(struct notifier_block *nb)
{
	return blocking_notifier_chain_unregister(&inetaddr_chain, nb);
}
EXPORT_SYMBOL(unregister_inetaddr_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001288/* Rename ifa_labels for a device name change. Make some effort to preserve
1289 * existing alias numbering and to create unique labels if possible.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001290*/
1291static void inetdev_changename(struct net_device *dev, struct in_device *in_dev)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001292{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293 struct in_ifaddr *ifa;
1294 int named = 0;
1295
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001296 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
1297 char old[IFNAMSIZ], *dot;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001298
1299 memcpy(old, ifa->ifa_label, IFNAMSIZ);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001300 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001301 if (named++ == 0)
Thomas Graf573bf472008-06-10 15:40:04 -07001302 goto skip;
Mark McLoughlin44344b22008-01-04 00:56:25 -08001303 dot = strchr(old, ':');
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001304 if (dot == NULL) {
1305 sprintf(old, ":%d", named);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001306 dot = old;
1307 }
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001308 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001309 strcat(ifa->ifa_label, dot);
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001310 else
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001311 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot);
Thomas Graf573bf472008-06-10 15:40:04 -07001312skip:
1313 rtmsg_ifa(RTM_NEWADDR, ifa, NULL, 0);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001314 }
1315}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001316
/*
 * Tell whether @mtu is large enough to run IPv4 on a device.
 * The threshold is 68 bytes (the minimum datagram size every IPv4 host
 * must be able to handle per RFC 791).
 */
static bool inetdev_valid_mtu(unsigned int mtu)
{
	if (mtu < 68)
		return false;

	return true;
}
1321
Ian Campbelld11327ad2011-02-11 07:44:16 +00001322static void inetdev_send_gratuitous_arp(struct net_device *dev,
1323 struct in_device *in_dev)
1324
1325{
Zoltan Kissb76d0782011-07-24 13:09:30 +00001326 struct in_ifaddr *ifa;
Ian Campbelld11327ad2011-02-11 07:44:16 +00001327
Zoltan Kissb76d0782011-07-24 13:09:30 +00001328 for (ifa = in_dev->ifa_list; ifa;
1329 ifa = ifa->ifa_next) {
1330 arp_send(ARPOP_REQUEST, ETH_P_ARP,
1331 ifa->ifa_local, dev,
1332 ifa->ifa_local, NULL,
1333 dev->dev_addr, NULL);
1334 }
Ian Campbelld11327ad2011-02-11 07:44:16 +00001335}
1336
/* Called only under RTNL semaphore */

/*
 * Netdevice notifier callback: keeps the per-device IPv4 state (in_device)
 * in step with device events.
 *
 * @this:  the notifier block (unused here)
 * @event: NETDEV_* event code
 * @ptr:   notifier info from which the net_device is extracted
 *
 * Returns NOTIFY_DONE, except when creating the in_device on
 * NETDEV_REGISTER fails, in which case notifier_from_errno(-ENOMEM) is
 * returned.
 */
static int inetdev_event(struct notifier_block *this, unsigned long event,
			 void *ptr)
{
	struct net_device *dev = netdev_notifier_info_to_dev(ptr);
	struct in_device *in_dev = __in_dev_get_rtnl(dev);

	ASSERT_RTNL();

	/* No IPv4 state yet: only REGISTER, or CHANGEMTU to a valid MTU,
	 * creates it; every other event is ignored.
	 */
	if (!in_dev) {
		if (event == NETDEV_REGISTER) {
			in_dev = inetdev_init(dev);
			if (!in_dev)
				return notifier_from_errno(-ENOMEM);
			if (dev->flags & IFF_LOOPBACK) {
				IN_DEV_CONF_SET(in_dev, NOXFRM, 1);
				IN_DEV_CONF_SET(in_dev, NOPOLICY, 1);
			}
		} else if (event == NETDEV_CHANGEMTU) {
			/* Re-enabling IP */
			if (inetdev_valid_mtu(dev->mtu))
				in_dev = inetdev_init(dev);
		}
		goto out;
	}

	switch (event) {
	case NETDEV_REGISTER:
		/* An in_device already existing at registration time is
		 * unexpected: log it and clear the device's ip_ptr.
		 */
		pr_debug("%s: bug\n", __func__);
		RCU_INIT_POINTER(dev->ip_ptr, NULL);
		break;
	case NETDEV_UP:
		if (!inetdev_valid_mtu(dev->mtu))
			break;
		/* Loopback devices get 127.0.0.1/8 (INADDR_LOOPBACK, host
		 * scope, infinite lifetime) when they come up.  An
		 * allocation failure is silently tolerated.
		 */
		if (dev->flags & IFF_LOOPBACK) {
			struct in_ifaddr *ifa = inet_alloc_ifa();

			if (ifa) {
				INIT_HLIST_NODE(&ifa->hash);
				ifa->ifa_local =
				  ifa->ifa_address = htonl(INADDR_LOOPBACK);
				ifa->ifa_prefixlen = 8;
				ifa->ifa_mask = inet_make_mask(8);
				in_dev_hold(in_dev);
				ifa->ifa_dev = in_dev;
				ifa->ifa_scope = RT_SCOPE_HOST;
				memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
				set_ifa_lifetime(ifa, INFINITY_LIFE_TIME,
						 INFINITY_LIFE_TIME);
				inet_insert_ifa(ifa);
			}
		}
		ip_mc_up(in_dev);
		/* fall through */
	case NETDEV_CHANGEADDR:
		/* UP and CHANGEADDR announce themselves only when the
		 * ARP_NOTIFY setting is enabled for this in_device.
		 */
		if (!IN_DEV_ARP_NOTIFY(in_dev))
			break;
		/* fall through */
	case NETDEV_NOTIFY_PEERS:
		/* Send gratuitous ARP to notify of link change */
		inetdev_send_gratuitous_arp(dev, in_dev);
		break;
	case NETDEV_DOWN:
		ip_mc_down(in_dev);
		break;
	case NETDEV_PRE_TYPE_CHANGE:
		ip_mc_unmap(in_dev);
		break;
	case NETDEV_POST_TYPE_CHANGE:
		ip_mc_remap(in_dev);
		break;
	case NETDEV_CHANGEMTU:
		if (inetdev_valid_mtu(dev->mtu))
			break;
		/* disable IP when MTU is not enough */
		/* (falls through to the UNREGISTER teardown) */
	case NETDEV_UNREGISTER:
		inetdev_destroy(in_dev);
		break;
	case NETDEV_CHANGENAME:
		/* Do not notify about label change, this event is
		 * not interesting to applications using netlink.
		 */
		/* NOTE(review): inetdev_changename() in this file does call
		 * rtmsg_ifa(RTM_NEWADDR, ...) for each address, so the
		 * statement above looks out of date; confirm.
		 */
		inetdev_changename(dev, in_dev);

		/* Re-register the sysctl entries after the name change. */
		devinet_sysctl_unregister(in_dev);
		devinet_sysctl_register(in_dev);
		break;
	}
out:
	return NOTIFY_DONE;
}
1429
/* Notifier block whose callback is inetdev_event(). */
static struct notifier_block ip_netdev_notifier = {
	.notifier_call = inetdev_event,
};
1433
Eric Dumazet40384992012-08-03 21:06:50 +00001434static size_t inet_nlmsg_size(void)
Thomas Graf339bf982006-11-10 14:10:15 -08001435{
1436 return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
1437 + nla_total_size(4) /* IFA_ADDRESS */
1438 + nla_total_size(4) /* IFA_LOCAL */
1439 + nla_total_size(4) /* IFA_BROADCAST */
Thomas Graf339bf982006-11-10 14:10:15 -08001440 + nla_total_size(IFNAMSIZ); /* IFA_LABEL */
1441}
1442
Jiri Pirko5c766d62013-01-24 09:41:41 +00001443static inline u32 cstamp_delta(unsigned long cstamp)
1444{
1445 return (cstamp - INITIAL_JIFFIES) * 100UL / HZ;
1446}
1447
1448static int put_cacheinfo(struct sk_buff *skb, unsigned long cstamp,
1449 unsigned long tstamp, u32 preferred, u32 valid)
1450{
1451 struct ifa_cacheinfo ci;
1452
1453 ci.cstamp = cstamp_delta(cstamp);
1454 ci.tstamp = cstamp_delta(tstamp);
1455 ci.ifa_prefered = preferred;
1456 ci.ifa_valid = valid;
1457
1458 return nla_put(skb, IFA_CACHEINFO, sizeof(ci), &ci);
1459}
1460
Linus Torvalds1da177e2005-04-16 15:20:36 -07001461static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001462 u32 portid, u32 seq, int event, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001463{
1464 struct ifaddrmsg *ifm;
1465 struct nlmsghdr *nlh;
Jiri Pirko5c766d62013-01-24 09:41:41 +00001466 u32 preferred, valid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001467
Eric W. Biederman15e47302012-09-07 20:12:54 +00001468 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*ifm), flags);
Thomas Graf47f68512006-08-04 23:04:36 -07001469 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001470 return -EMSGSIZE;
Thomas Graf47f68512006-08-04 23:04:36 -07001471
1472 ifm = nlmsg_data(nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001473 ifm->ifa_family = AF_INET;
1474 ifm->ifa_prefixlen = ifa->ifa_prefixlen;
Jiri Pirko5c766d62013-01-24 09:41:41 +00001475 ifm->ifa_flags = ifa->ifa_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001476 ifm->ifa_scope = ifa->ifa_scope;
1477 ifm->ifa_index = ifa->ifa_dev->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001478
Jiri Pirko5c766d62013-01-24 09:41:41 +00001479 if (!(ifm->ifa_flags & IFA_F_PERMANENT)) {
1480 preferred = ifa->ifa_preferred_lft;
1481 valid = ifa->ifa_valid_lft;
1482 if (preferred != INFINITY_LIFE_TIME) {
1483 long tval = (jiffies - ifa->ifa_tstamp) / HZ;
1484
1485 if (preferred > tval)
1486 preferred -= tval;
1487 else
1488 preferred = 0;
1489 if (valid != INFINITY_LIFE_TIME) {
1490 if (valid > tval)
1491 valid -= tval;
1492 else
1493 valid = 0;
1494 }
1495 }
1496 } else {
1497 preferred = INFINITY_LIFE_TIME;
1498 valid = INFINITY_LIFE_TIME;
1499 }
David S. Millerf3756b72012-04-01 20:39:02 -04001500 if ((ifa->ifa_address &&
1501 nla_put_be32(skb, IFA_ADDRESS, ifa->ifa_address)) ||
1502 (ifa->ifa_local &&
1503 nla_put_be32(skb, IFA_LOCAL, ifa->ifa_local)) ||
1504 (ifa->ifa_broadcast &&
1505 nla_put_be32(skb, IFA_BROADCAST, ifa->ifa_broadcast)) ||
1506 (ifa->ifa_label[0] &&
Jiri Pirko5c766d62013-01-24 09:41:41 +00001507 nla_put_string(skb, IFA_LABEL, ifa->ifa_label)) ||
1508 put_cacheinfo(skb, ifa->ifa_cstamp, ifa->ifa_tstamp,
1509 preferred, valid))
David S. Millerf3756b72012-04-01 20:39:02 -04001510 goto nla_put_failure;
Thomas Graf47f68512006-08-04 23:04:36 -07001511
1512 return nlmsg_end(skb, nlh);
1513
1514nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08001515 nlmsg_cancel(skb, nlh);
1516 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001517}
1518
/*
 * Netlink dump callback: emit one RTM_NEWADDR message (NLM_F_MULTI) per
 * IPv4 address of every device in the socket's namespace.
 *
 * The dump is resumable.  The position is kept in cb->args[]:
 *   args[0] - hash bucket in net->dev_index_head[]
 *   args[1] - index of the device within that bucket
 *   args[2] - index of the address within that device
 * When inet_fill_ifaddr() reports a non-positive result, the current
 * position is saved and the function returns so that a later call can
 * continue from there.
 *
 * Returns skb->len.
 */
static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
{
	struct net *net = sock_net(skb->sk);
	int h, s_h;
	int idx, s_idx;
	int ip_idx, s_ip_idx;
	struct net_device *dev;
	struct in_device *in_dev;
	struct in_ifaddr *ifa;
	struct hlist_head *head;

	/* Restore the position saved by the previous invocation. */
	s_h = cb->args[0];
	s_idx = idx = cb->args[1];
	s_ip_idx = ip_idx = cb->args[2];

	/* s_idx only applies to the first bucket visited; it is reset to 0
	 * for every following bucket.
	 */
	for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
		idx = 0;
		head = &net->dev_index_head[h];
		rcu_read_lock();
		/* Sequence value combining the address and device generation
		 * counters; used by nl_dump_check_consistent() below.
		 */
		cb->seq = atomic_read(&net->ipv4.dev_addr_genid) ^
			  net->dev_base_seq;
		hlist_for_each_entry_rcu(dev, head, index_hlist) {
			/* Skip devices already dumped. */
			if (idx < s_idx)
				goto cont;
			/* Past the resume device: start at its first address. */
			if (h > s_h || idx > s_idx)
				s_ip_idx = 0;
			in_dev = __in_dev_get_rcu(dev);
			if (!in_dev)
				goto cont;

			for (ifa = in_dev->ifa_list, ip_idx = 0; ifa;
			     ifa = ifa->ifa_next, ip_idx++) {
				/* Skip addresses already dumped. */
				if (ip_idx < s_ip_idx)
					continue;
				if (inet_fill_ifaddr(skb, ifa,
					     NETLINK_CB(cb->skb).portid,
					     cb->nlh->nlmsg_seq,
					     RTM_NEWADDR, NLM_F_MULTI) <= 0) {
					rcu_read_unlock();
					goto done;
				}
				nl_dump_check_consistent(cb, nlmsg_hdr(skb));
			}
cont:
			idx++;
		}
		rcu_read_unlock();
	}

done:
	/* Save the position for the next invocation. */
	cb->args[0] = h;
	cb->args[1] = idx;
	cb->args[2] = ip_idx;

	return skb->len;
}
1575
Jianjun Kong539afed2008-11-03 02:48:48 -08001576static void rtmsg_ifa(int event, struct in_ifaddr *ifa, struct nlmsghdr *nlh,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001577 u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001578{
Thomas Graf47f68512006-08-04 23:04:36 -07001579 struct sk_buff *skb;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001580 u32 seq = nlh ? nlh->nlmsg_seq : 0;
1581 int err = -ENOBUFS;
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -08001582 struct net *net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001583
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001584 net = dev_net(ifa->ifa_dev->dev);
Thomas Graf339bf982006-11-10 14:10:15 -08001585 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL);
Thomas Graf47f68512006-08-04 23:04:36 -07001586 if (skb == NULL)
Thomas Grafd6062cb2006-08-15 00:33:59 -07001587 goto errout;
1588
Eric W. Biederman15e47302012-09-07 20:12:54 +00001589 err = inet_fill_ifaddr(skb, ifa, portid, seq, event, 0);
Patrick McHardy26932562007-01-31 23:16:40 -08001590 if (err < 0) {
1591 /* -EMSGSIZE implies BUG in inet_nlmsg_size() */
1592 WARN_ON(err == -EMSGSIZE);
1593 kfree_skb(skb);
1594 goto errout;
1595 }
Eric W. Biederman15e47302012-09-07 20:12:54 +00001596 rtnl_notify(skb, net, portid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL);
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08001597 return;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001598errout:
1599 if (err < 0)
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -08001600 rtnl_set_sk_err(net, RTNLGRP_IPV4_IFADDR, err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001601}
1602
Thomas Graf9f0f7272010-11-16 04:32:48 +00001603static size_t inet_get_link_af_size(const struct net_device *dev)
1604{
Eric Dumazet1fc19af2011-05-09 20:55:03 -07001605 struct in_device *in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Thomas Graf9f0f7272010-11-16 04:32:48 +00001606
1607 if (!in_dev)
1608 return 0;
1609
1610 return nla_total_size(IPV4_DEVCONF_MAX * 4); /* IFLA_INET_CONF */
1611}
1612
1613static int inet_fill_link_af(struct sk_buff *skb, const struct net_device *dev)
1614{
Eric Dumazet1fc19af2011-05-09 20:55:03 -07001615 struct in_device *in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Thomas Graf9f0f7272010-11-16 04:32:48 +00001616 struct nlattr *nla;
1617 int i;
1618
1619 if (!in_dev)
1620 return -ENODATA;
1621
1622 nla = nla_reserve(skb, IFLA_INET_CONF, IPV4_DEVCONF_MAX * 4);
1623 if (nla == NULL)
1624 return -EMSGSIZE;
1625
1626 for (i = 0; i < IPV4_DEVCONF_MAX; i++)
1627 ((u32 *) nla_data(nla))[i] = in_dev->cnf.data[i];
1628
1629 return 0;
1630}
1631
1632static const struct nla_policy inet_af_policy[IFLA_INET_MAX+1] = {
1633 [IFLA_INET_CONF] = { .type = NLA_NESTED },
1634};
1635
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001636static int inet_validate_link_af(const struct net_device *dev,
1637 const struct nlattr *nla)
Thomas Graf9f0f7272010-11-16 04:32:48 +00001638{
Thomas Graf9f0f7272010-11-16 04:32:48 +00001639 struct nlattr *a, *tb[IFLA_INET_MAX+1];
1640 int err, rem;
1641
Eric Dumazetf7fce742010-12-01 06:03:06 +00001642 if (dev && !__in_dev_get_rtnl(dev))
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001643 return -EAFNOSUPPORT;
Thomas Graf9f0f7272010-11-16 04:32:48 +00001644
1645 err = nla_parse_nested(tb, IFLA_INET_MAX, nla, inet_af_policy);
1646 if (err < 0)
1647 return err;
1648
1649 if (tb[IFLA_INET_CONF]) {
1650 nla_for_each_nested(a, tb[IFLA_INET_CONF], rem) {
1651 int cfgid = nla_type(a);
1652
1653 if (nla_len(a) < 4)
1654 return -EINVAL;
1655
1656 if (cfgid <= 0 || cfgid > IPV4_DEVCONF_MAX)
1657 return -EINVAL;
1658 }
1659 }
1660
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001661 return 0;
1662}
1663
1664static int inet_set_link_af(struct net_device *dev, const struct nlattr *nla)
1665{
Eric Dumazetf7fce742010-12-01 06:03:06 +00001666 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001667 struct nlattr *a, *tb[IFLA_INET_MAX+1];
1668 int rem;
1669
1670 if (!in_dev)
1671 return -EAFNOSUPPORT;
1672
1673 if (nla_parse_nested(tb, IFLA_INET_MAX, nla, NULL) < 0)
1674 BUG();
1675
Thomas Graf9f0f7272010-11-16 04:32:48 +00001676 if (tb[IFLA_INET_CONF]) {
1677 nla_for_each_nested(a, tb[IFLA_INET_CONF], rem)
1678 ipv4_devconf_set(in_dev, nla_type(a), nla_get_u32(a));
1679 }
1680
1681 return 0;
1682}
1683
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001684static int inet_netconf_msgsize_devconf(int type)
1685{
1686 int size = NLMSG_ALIGN(sizeof(struct netconfmsg))
1687 + nla_total_size(4); /* NETCONFA_IFINDEX */
1688
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001689 /* type -1 is used for ALL */
1690 if (type == -1 || type == NETCONFA_FORWARDING)
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001691 size += nla_total_size(4);
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001692 if (type == -1 || type == NETCONFA_RP_FILTER)
1693 size += nla_total_size(4);
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001694 if (type == -1 || type == NETCONFA_MC_FORWARDING)
1695 size += nla_total_size(4);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001696
1697 return size;
1698}
1699
1700static int inet_netconf_fill_devconf(struct sk_buff *skb, int ifindex,
1701 struct ipv4_devconf *devconf, u32 portid,
1702 u32 seq, int event, unsigned int flags,
1703 int type)
1704{
1705 struct nlmsghdr *nlh;
1706 struct netconfmsg *ncm;
1707
1708 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct netconfmsg),
1709 flags);
1710 if (nlh == NULL)
1711 return -EMSGSIZE;
1712
1713 ncm = nlmsg_data(nlh);
1714 ncm->ncm_family = AF_INET;
1715
1716 if (nla_put_s32(skb, NETCONFA_IFINDEX, ifindex) < 0)
1717 goto nla_put_failure;
1718
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001719 /* type -1 is used for ALL */
1720 if ((type == -1 || type == NETCONFA_FORWARDING) &&
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001721 nla_put_s32(skb, NETCONFA_FORWARDING,
1722 IPV4_DEVCONF(*devconf, FORWARDING)) < 0)
1723 goto nla_put_failure;
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001724 if ((type == -1 || type == NETCONFA_RP_FILTER) &&
1725 nla_put_s32(skb, NETCONFA_RP_FILTER,
1726 IPV4_DEVCONF(*devconf, RP_FILTER)) < 0)
1727 goto nla_put_failure;
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001728 if ((type == -1 || type == NETCONFA_MC_FORWARDING) &&
1729 nla_put_s32(skb, NETCONFA_MC_FORWARDING,
1730 IPV4_DEVCONF(*devconf, MC_FORWARDING)) < 0)
1731 goto nla_put_failure;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001732
1733 return nlmsg_end(skb, nlh);
1734
1735nla_put_failure:
1736 nlmsg_cancel(skb, nlh);
1737 return -EMSGSIZE;
1738}
1739
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001740void inet_netconf_notify_devconf(struct net *net, int type, int ifindex,
1741 struct ipv4_devconf *devconf)
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001742{
1743 struct sk_buff *skb;
1744 int err = -ENOBUFS;
1745
1746 skb = nlmsg_new(inet_netconf_msgsize_devconf(type), GFP_ATOMIC);
1747 if (skb == NULL)
1748 goto errout;
1749
1750 err = inet_netconf_fill_devconf(skb, ifindex, devconf, 0, 0,
1751 RTM_NEWNETCONF, 0, type);
1752 if (err < 0) {
1753 /* -EMSGSIZE implies BUG in inet_netconf_msgsize_devconf() */
1754 WARN_ON(err == -EMSGSIZE);
1755 kfree_skb(skb);
1756 goto errout;
1757 }
1758 rtnl_notify(skb, net, 0, RTNLGRP_IPV4_NETCONF, NULL, GFP_ATOMIC);
1759 return;
1760errout:
1761 if (err < 0)
1762 rtnl_set_sk_err(net, RTNLGRP_IPV4_NETCONF, err);
1763}
1764
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001765static const struct nla_policy devconf_ipv4_policy[NETCONFA_MAX+1] = {
1766 [NETCONFA_IFINDEX] = { .len = sizeof(int) },
1767 [NETCONFA_FORWARDING] = { .len = sizeof(int) },
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001768 [NETCONFA_RP_FILTER] = { .len = sizeof(int) },
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001769};
1770
1771static int inet_netconf_get_devconf(struct sk_buff *in_skb,
Thomas Graf661d2962013-03-21 07:45:29 +00001772 struct nlmsghdr *nlh)
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001773{
1774 struct net *net = sock_net(in_skb->sk);
1775 struct nlattr *tb[NETCONFA_MAX+1];
1776 struct netconfmsg *ncm;
1777 struct sk_buff *skb;
1778 struct ipv4_devconf *devconf;
1779 struct in_device *in_dev;
1780 struct net_device *dev;
1781 int ifindex;
1782 int err;
1783
1784 err = nlmsg_parse(nlh, sizeof(*ncm), tb, NETCONFA_MAX,
1785 devconf_ipv4_policy);
1786 if (err < 0)
1787 goto errout;
1788
1789 err = EINVAL;
1790 if (!tb[NETCONFA_IFINDEX])
1791 goto errout;
1792
1793 ifindex = nla_get_s32(tb[NETCONFA_IFINDEX]);
1794 switch (ifindex) {
1795 case NETCONFA_IFINDEX_ALL:
1796 devconf = net->ipv4.devconf_all;
1797 break;
1798 case NETCONFA_IFINDEX_DEFAULT:
1799 devconf = net->ipv4.devconf_dflt;
1800 break;
1801 default:
1802 dev = __dev_get_by_index(net, ifindex);
1803 if (dev == NULL)
1804 goto errout;
1805 in_dev = __in_dev_get_rtnl(dev);
1806 if (in_dev == NULL)
1807 goto errout;
1808 devconf = &in_dev->cnf;
1809 break;
1810 }
1811
1812 err = -ENOBUFS;
1813 skb = nlmsg_new(inet_netconf_msgsize_devconf(-1), GFP_ATOMIC);
1814 if (skb == NULL)
1815 goto errout;
1816
1817 err = inet_netconf_fill_devconf(skb, ifindex, devconf,
1818 NETLINK_CB(in_skb).portid,
1819 nlh->nlmsg_seq, RTM_NEWNETCONF, 0,
1820 -1);
1821 if (err < 0) {
1822 /* -EMSGSIZE implies BUG in inet_netconf_msgsize_devconf() */
1823 WARN_ON(err == -EMSGSIZE);
1824 kfree_skb(skb);
1825 goto errout;
1826 }
1827 err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid);
1828errout:
1829 return err;
1830}
1831
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001832static int inet_netconf_dump_devconf(struct sk_buff *skb,
1833 struct netlink_callback *cb)
1834{
1835 struct net *net = sock_net(skb->sk);
1836 int h, s_h;
1837 int idx, s_idx;
1838 struct net_device *dev;
1839 struct in_device *in_dev;
1840 struct hlist_head *head;
1841
1842 s_h = cb->args[0];
1843 s_idx = idx = cb->args[1];
1844
1845 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
1846 idx = 0;
1847 head = &net->dev_index_head[h];
1848 rcu_read_lock();
Nicolas Dichtel04652772013-03-22 06:28:42 +00001849 cb->seq = atomic_read(&net->ipv4.dev_addr_genid) ^
1850 net->dev_base_seq;
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001851 hlist_for_each_entry_rcu(dev, head, index_hlist) {
1852 if (idx < s_idx)
1853 goto cont;
1854 in_dev = __in_dev_get_rcu(dev);
1855 if (!in_dev)
1856 goto cont;
1857
1858 if (inet_netconf_fill_devconf(skb, dev->ifindex,
1859 &in_dev->cnf,
1860 NETLINK_CB(cb->skb).portid,
1861 cb->nlh->nlmsg_seq,
1862 RTM_NEWNETCONF,
1863 NLM_F_MULTI,
1864 -1) <= 0) {
1865 rcu_read_unlock();
1866 goto done;
1867 }
Nicolas Dichtel04652772013-03-22 06:28:42 +00001868 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001869cont:
1870 idx++;
1871 }
1872 rcu_read_unlock();
1873 }
1874 if (h == NETDEV_HASHENTRIES) {
1875 if (inet_netconf_fill_devconf(skb, NETCONFA_IFINDEX_ALL,
1876 net->ipv4.devconf_all,
1877 NETLINK_CB(cb->skb).portid,
1878 cb->nlh->nlmsg_seq,
1879 RTM_NEWNETCONF, NLM_F_MULTI,
1880 -1) <= 0)
1881 goto done;
1882 else
1883 h++;
1884 }
1885 if (h == NETDEV_HASHENTRIES + 1) {
1886 if (inet_netconf_fill_devconf(skb, NETCONFA_IFINDEX_DEFAULT,
1887 net->ipv4.devconf_dflt,
1888 NETLINK_CB(cb->skb).portid,
1889 cb->nlh->nlmsg_seq,
1890 RTM_NEWNETCONF, NLM_F_MULTI,
1891 -1) <= 0)
1892 goto done;
1893 else
1894 h++;
1895 }
1896done:
1897 cb->args[0] = h;
1898 cb->args[1] = idx;
1899
1900 return skb->len;
1901}
1902
Linus Torvalds1da177e2005-04-16 15:20:36 -07001903#ifdef CONFIG_SYSCTL
1904
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001905static void devinet_copy_dflt_conf(struct net *net, int i)
Herbert Xu31be3082007-06-04 23:35:37 -07001906{
1907 struct net_device *dev;
1908
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001909 rcu_read_lock();
1910 for_each_netdev_rcu(net, dev) {
Herbert Xu31be3082007-06-04 23:35:37 -07001911 struct in_device *in_dev;
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001912
Herbert Xu31be3082007-06-04 23:35:37 -07001913 in_dev = __in_dev_get_rcu(dev);
1914 if (in_dev && !test_bit(i, in_dev->cnf.state))
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001915 in_dev->cnf.data[i] = net->ipv4.devconf_dflt->data[i];
Herbert Xu31be3082007-06-04 23:35:37 -07001916 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001917 rcu_read_unlock();
Herbert Xu31be3082007-06-04 23:35:37 -07001918}
1919
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001920/* called with RTNL locked */
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001921static void inet_forward_change(struct net *net)
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001922{
1923 struct net_device *dev;
Pavel Emelyanov586f1212007-12-16 13:32:48 -08001924 int on = IPV4_DEVCONF_ALL(net, FORWARDING);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001925
Pavel Emelyanov586f1212007-12-16 13:32:48 -08001926 IPV4_DEVCONF_ALL(net, ACCEPT_REDIRECTS) = !on;
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001927 IPV4_DEVCONF_DFLT(net, FORWARDING) = on;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001928 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1929 NETCONFA_IFINDEX_ALL,
1930 net->ipv4.devconf_all);
1931 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1932 NETCONFA_IFINDEX_DEFAULT,
1933 net->ipv4.devconf_dflt);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001934
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001935 for_each_netdev(net, dev) {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001936 struct in_device *in_dev;
Ben Hutchings0187bdf2008-06-19 16:15:47 -07001937 if (on)
1938 dev_disable_lro(dev);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001939 rcu_read_lock();
1940 in_dev = __in_dev_get_rcu(dev);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001941 if (in_dev) {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001942 IN_DEV_CONF_SET(in_dev, FORWARDING, on);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001943 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1944 dev->ifindex, &in_dev->cnf);
1945 }
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001946 rcu_read_unlock();
1947 }
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001948}
1949
Joe Perchesfe2c6332013-06-11 23:04:25 -07001950static int devinet_conf_proc(struct ctl_table *ctl, int write,
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001951 void __user *buffer,
Herbert Xu31be3082007-06-04 23:35:37 -07001952 size_t *lenp, loff_t *ppos)
1953{
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001954 int old_value = *(int *)ctl->data;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001955 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001956 int new_value = *(int *)ctl->data;
Herbert Xu31be3082007-06-04 23:35:37 -07001957
1958 if (write) {
1959 struct ipv4_devconf *cnf = ctl->extra1;
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001960 struct net *net = ctl->extra2;
Herbert Xu31be3082007-06-04 23:35:37 -07001961 int i = (int *)ctl->data - cnf->data;
1962
1963 set_bit(i, cnf->state);
1964
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001965 if (cnf == net->ipv4.devconf_dflt)
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001966 devinet_copy_dflt_conf(net, i);
Thomas Grafd0daebc32012-06-12 00:44:01 +00001967 if (i == IPV4_DEVCONF_ACCEPT_LOCAL - 1 ||
1968 i == IPV4_DEVCONF_ROUTE_LOCALNET - 1)
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001969 if ((new_value == 0) && (old_value != 0))
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00001970 rt_cache_flush(net);
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001971 if (i == IPV4_DEVCONF_RP_FILTER - 1 &&
1972 new_value != old_value) {
1973 int ifindex;
1974
1975 if (cnf == net->ipv4.devconf_dflt)
1976 ifindex = NETCONFA_IFINDEX_DEFAULT;
1977 else if (cnf == net->ipv4.devconf_all)
1978 ifindex = NETCONFA_IFINDEX_ALL;
1979 else {
1980 struct in_device *idev =
1981 container_of(cnf, struct in_device,
1982 cnf);
1983 ifindex = idev->dev->ifindex;
1984 }
1985 inet_netconf_notify_devconf(net, NETCONFA_RP_FILTER,
1986 ifindex, cnf);
1987 }
Herbert Xu31be3082007-06-04 23:35:37 -07001988 }
1989
1990 return ret;
1991}
1992
Joe Perchesfe2c6332013-06-11 23:04:25 -07001993static int devinet_sysctl_forward(struct ctl_table *ctl, int write,
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001994 void __user *buffer,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001995 size_t *lenp, loff_t *ppos)
1996{
1997 int *valp = ctl->data;
1998 int val = *valp;
Eric W. Biederman88af1822010-02-19 13:22:59 +00001999 loff_t pos = *ppos;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002000 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002001
2002 if (write && *valp != val) {
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002003 struct net *net = ctl->extra2;
2004
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002005 if (valp != &IPV4_DEVCONF_DFLT(net, FORWARDING)) {
Eric W. Biederman88af1822010-02-19 13:22:59 +00002006 if (!rtnl_trylock()) {
2007 /* Restore the original values before restarting */
2008 *valp = val;
2009 *ppos = pos;
Eric W. Biederman9b8adb52009-05-13 16:59:21 +00002010 return restart_syscall();
Eric W. Biederman88af1822010-02-19 13:22:59 +00002011 }
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002012 if (valp == &IPV4_DEVCONF_ALL(net, FORWARDING)) {
2013 inet_forward_change(net);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002014 } else {
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002015 struct ipv4_devconf *cnf = ctl->extra1;
2016 struct in_device *idev =
2017 container_of(cnf, struct in_device, cnf);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002018 if (*valp)
2019 dev_disable_lro(idev->dev);
2020 inet_netconf_notify_devconf(net,
2021 NETCONFA_FORWARDING,
2022 idev->dev->ifindex,
2023 cnf);
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002024 }
2025 rtnl_unlock();
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002026 rt_cache_flush(net);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002027 } else
2028 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
2029 NETCONFA_IFINDEX_DEFAULT,
2030 net->ipv4.devconf_dflt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002031 }
2032
2033 return ret;
2034}
2035
Joe Perchesfe2c6332013-06-11 23:04:25 -07002036static int ipv4_doint_and_flush(struct ctl_table *ctl, int write,
David S. Miller323e1262010-12-12 21:55:08 -08002037 void __user *buffer,
2038 size_t *lenp, loff_t *ppos)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002039{
2040 int *valp = ctl->data;
2041 int val = *valp;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002042 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Denis V. Lunev76e6ebf2008-07-05 19:00:44 -07002043 struct net *net = ctl->extra2;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002044
2045 if (write && *valp != val)
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002046 rt_cache_flush(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002047
2048 return ret;
2049}
2050
/*
 * Template for one ctl_table entry backed by slot IPV4_DEVCONF_<attr> - 1
 * of ipv4_devconf.data[], with file name @name, mode @mval and handler
 * @proc.
 */
#define DEVINET_SYSCTL_ENTRY(attr, name, mval, proc) \
	{ \
		.procname	= name, \
		.data		= &ipv4_devconf.data[ \
					IPV4_DEVCONF_ ## attr - 1], \
		.maxlen		= sizeof(int), \
		.mode		= mval, \
		.proc_handler	= proc, \
		.extra1		= &ipv4_devconf, \
	}

/* Mode 0644 entry handled by devinet_conf_proc(). */
#define DEVINET_SYSCTL_RW_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, devinet_conf_proc)

/* Mode 0444 entry handled by devinet_conf_proc(). */
#define DEVINET_SYSCTL_RO_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0444, devinet_conf_proc)

/* Mode 0644 entry with a caller-supplied handler. */
#define DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, proc) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, proc)

/* Mode 0644 entry handled by ipv4_doint_and_flush(). */
#define DEVINET_SYSCTL_FLUSHING_ENTRY(attr, name) \
	DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, ipv4_doint_and_flush)
Herbert Xu42f811b2007-06-04 23:34:44 -07002073
Linus Torvalds1da177e2005-04-16 15:20:36 -07002074static struct devinet_sysctl_table {
2075 struct ctl_table_header *sysctl_header;
Eric W. Biederman02291682010-02-14 03:25:51 +00002076 struct ctl_table devinet_vars[__IPV4_DEVCONF_MAX];
Linus Torvalds1da177e2005-04-16 15:20:36 -07002077} devinet_sysctl = {
2078 .devinet_vars = {
Herbert Xu42f811b2007-06-04 23:34:44 -07002079 DEVINET_SYSCTL_COMPLEX_ENTRY(FORWARDING, "forwarding",
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002080 devinet_sysctl_forward),
Herbert Xu42f811b2007-06-04 23:34:44 -07002081 DEVINET_SYSCTL_RO_ENTRY(MC_FORWARDING, "mc_forwarding"),
2082
2083 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_REDIRECTS, "accept_redirects"),
2084 DEVINET_SYSCTL_RW_ENTRY(SECURE_REDIRECTS, "secure_redirects"),
2085 DEVINET_SYSCTL_RW_ENTRY(SHARED_MEDIA, "shared_media"),
2086 DEVINET_SYSCTL_RW_ENTRY(RP_FILTER, "rp_filter"),
2087 DEVINET_SYSCTL_RW_ENTRY(SEND_REDIRECTS, "send_redirects"),
2088 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_SOURCE_ROUTE,
2089 "accept_source_route"),
Patrick McHardy8153a102009-12-03 01:25:58 +00002090 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_LOCAL, "accept_local"),
Jamal Hadi Salim28f6aee2009-12-25 17:30:22 -08002091 DEVINET_SYSCTL_RW_ENTRY(SRC_VMARK, "src_valid_mark"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002092 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP, "proxy_arp"),
2093 DEVINET_SYSCTL_RW_ENTRY(MEDIUM_ID, "medium_id"),
2094 DEVINET_SYSCTL_RW_ENTRY(BOOTP_RELAY, "bootp_relay"),
2095 DEVINET_SYSCTL_RW_ENTRY(LOG_MARTIANS, "log_martians"),
2096 DEVINET_SYSCTL_RW_ENTRY(TAG, "tag"),
2097 DEVINET_SYSCTL_RW_ENTRY(ARPFILTER, "arp_filter"),
2098 DEVINET_SYSCTL_RW_ENTRY(ARP_ANNOUNCE, "arp_announce"),
2099 DEVINET_SYSCTL_RW_ENTRY(ARP_IGNORE, "arp_ignore"),
2100 DEVINET_SYSCTL_RW_ENTRY(ARP_ACCEPT, "arp_accept"),
Stephen Hemmingereefef1c2009-02-01 01:04:33 -08002101 DEVINET_SYSCTL_RW_ENTRY(ARP_NOTIFY, "arp_notify"),
Jesper Dangaard Brouer65324142010-01-05 05:50:47 +00002102 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP_PVLAN, "proxy_arp_pvlan"),
William Manley5c6fe012013-08-06 19:03:14 +01002103 DEVINET_SYSCTL_RW_ENTRY(FORCE_IGMP_VERSION,
2104 "force_igmp_version"),
William Manley26900482013-08-06 19:03:15 +01002105 DEVINET_SYSCTL_RW_ENTRY(IGMPV2_UNSOLICITED_REPORT_INTERVAL,
2106 "igmpv2_unsolicited_report_interval"),
2107 DEVINET_SYSCTL_RW_ENTRY(IGMPV3_UNSOLICITED_REPORT_INTERVAL,
2108 "igmpv3_unsolicited_report_interval"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002109
2110 DEVINET_SYSCTL_FLUSHING_ENTRY(NOXFRM, "disable_xfrm"),
2111 DEVINET_SYSCTL_FLUSHING_ENTRY(NOPOLICY, "disable_policy"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002112 DEVINET_SYSCTL_FLUSHING_ENTRY(PROMOTE_SECONDARIES,
2113 "promote_secondaries"),
Thomas Grafd0daebc32012-06-12 00:44:01 +00002114 DEVINET_SYSCTL_FLUSHING_ENTRY(ROUTE_LOCALNET,
2115 "route_localnet"),
Linus Torvalds1da177e2005-04-16 15:20:36 -07002116 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07002117};
2118
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002119static int __devinet_sysctl_register(struct net *net, char *dev_name,
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002120 struct ipv4_devconf *p)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002121{
2122 int i;
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002123 struct devinet_sysctl_table *t;
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002124 char path[sizeof("net/ipv4/conf/") + IFNAMSIZ];
Pavel Emelyanovbfada692007-12-02 00:57:08 +11002125
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002126 t = kmemdup(&devinet_sysctl, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002127 if (!t)
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002128 goto out;
2129
Linus Torvalds1da177e2005-04-16 15:20:36 -07002130 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) {
2131 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf;
Herbert Xu31be3082007-06-04 23:35:37 -07002132 t->devinet_vars[i].extra1 = p;
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002133 t->devinet_vars[i].extra2 = net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002134 }
2135
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002136 snprintf(path, sizeof(path), "net/ipv4/conf/%s", dev_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002137
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002138 t->sysctl_header = register_net_sysctl(net, path, t->devinet_vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002139 if (!t->sysctl_header)
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002140 goto free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002141
2142 p->sysctl = t;
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002143 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002144
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002145free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07002146 kfree(t);
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002147out:
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002148 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002149}
2150
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002151static void __devinet_sysctl_unregister(struct ipv4_devconf *cnf)
2152{
2153 struct devinet_sysctl_table *t = cnf->sysctl;
2154
2155 if (t == NULL)
2156 return;
2157
2158 cnf->sysctl = NULL;
Lucian Adrian Grijincuff538812011-05-01 01:44:01 +00002159 unregister_net_sysctl_table(t->sysctl_header);
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002160 kfree(t);
2161}
2162
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11002163static void devinet_sysctl_register(struct in_device *idev)
2164{
Jiri Pirko73af6142013-12-07 19:26:55 +01002165 neigh_sysctl_register(idev->dev, idev->arp_parms, NULL);
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002166 __devinet_sysctl_register(dev_net(idev->dev), idev->dev->name,
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002167 &idev->cnf);
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11002168}
2169
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002170static void devinet_sysctl_unregister(struct in_device *idev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002171{
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002172 __devinet_sysctl_unregister(&idev->cnf);
2173 neigh_sysctl_unregister(idev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002174}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002175
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002176static struct ctl_table ctl_forward_entry[] = {
2177 {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002178 .procname = "ip_forward",
2179 .data = &ipv4_devconf.data[
Eric W. Biederman02291682010-02-14 03:25:51 +00002180 IPV4_DEVCONF_FORWARDING - 1],
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002181 .maxlen = sizeof(int),
2182 .mode = 0644,
2183 .proc_handler = devinet_sysctl_forward,
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002184 .extra1 = &ipv4_devconf,
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002185 .extra2 = &init_net,
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002186 },
2187 { },
2188};
Eric Dumazet2a75de02008-01-05 23:08:49 -08002189#endif
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002190
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002191static __net_init int devinet_init_net(struct net *net)
2192{
2193 int err;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002194 struct ipv4_devconf *all, *dflt;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002195#ifdef CONFIG_SYSCTL
2196 struct ctl_table *tbl = ctl_forward_entry;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002197 struct ctl_table_header *forw_hdr;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002198#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002199
2200 err = -ENOMEM;
2201 all = &ipv4_devconf;
2202 dflt = &ipv4_devconf_dflt;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002203
Octavian Purdila09ad9bc2009-11-25 15:14:13 -08002204 if (!net_eq(net, &init_net)) {
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002205 all = kmemdup(all, sizeof(ipv4_devconf), GFP_KERNEL);
2206 if (all == NULL)
2207 goto err_alloc_all;
2208
2209 dflt = kmemdup(dflt, sizeof(ipv4_devconf_dflt), GFP_KERNEL);
2210 if (dflt == NULL)
2211 goto err_alloc_dflt;
2212
Eric Dumazet2a75de02008-01-05 23:08:49 -08002213#ifdef CONFIG_SYSCTL
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002214 tbl = kmemdup(tbl, sizeof(ctl_forward_entry), GFP_KERNEL);
2215 if (tbl == NULL)
2216 goto err_alloc_ctl;
2217
Eric W. Biederman02291682010-02-14 03:25:51 +00002218 tbl[0].data = &all->data[IPV4_DEVCONF_FORWARDING - 1];
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002219 tbl[0].extra1 = all;
2220 tbl[0].extra2 = net;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002221#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002222 }
2223
2224#ifdef CONFIG_SYSCTL
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002225 err = __devinet_sysctl_register(net, "all", all);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002226 if (err < 0)
2227 goto err_reg_all;
2228
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002229 err = __devinet_sysctl_register(net, "default", dflt);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002230 if (err < 0)
2231 goto err_reg_dflt;
2232
2233 err = -ENOMEM;
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002234 forw_hdr = register_net_sysctl(net, "net/ipv4", tbl);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002235 if (forw_hdr == NULL)
2236 goto err_reg_ctl;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002237 net->ipv4.forw_hdr = forw_hdr;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002238#endif
2239
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002240 net->ipv4.devconf_all = all;
2241 net->ipv4.devconf_dflt = dflt;
2242 return 0;
2243
2244#ifdef CONFIG_SYSCTL
2245err_reg_ctl:
2246 __devinet_sysctl_unregister(dflt);
2247err_reg_dflt:
2248 __devinet_sysctl_unregister(all);
2249err_reg_all:
2250 if (tbl != ctl_forward_entry)
2251 kfree(tbl);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002252err_alloc_ctl:
Eric Dumazet2a75de02008-01-05 23:08:49 -08002253#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002254 if (dflt != &ipv4_devconf_dflt)
2255 kfree(dflt);
2256err_alloc_dflt:
2257 if (all != &ipv4_devconf)
2258 kfree(all);
2259err_alloc_all:
2260 return err;
2261}
2262
2263static __net_exit void devinet_exit_net(struct net *net)
2264{
Eric Dumazet2a75de02008-01-05 23:08:49 -08002265#ifdef CONFIG_SYSCTL
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002266 struct ctl_table *tbl;
2267
2268 tbl = net->ipv4.forw_hdr->ctl_table_arg;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002269 unregister_net_sysctl_table(net->ipv4.forw_hdr);
2270 __devinet_sysctl_unregister(net->ipv4.devconf_dflt);
2271 __devinet_sysctl_unregister(net->ipv4.devconf_all);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002272 kfree(tbl);
Eric Dumazet2a75de02008-01-05 23:08:49 -08002273#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002274 kfree(net->ipv4.devconf_dflt);
2275 kfree(net->ipv4.devconf_all);
2276}
2277
2278static __net_initdata struct pernet_operations devinet_ops = {
2279 .init = devinet_init_net,
2280 .exit = devinet_exit_net,
2281};
2282
Thomas Graf9f0f7272010-11-16 04:32:48 +00002283static struct rtnl_af_ops inet_af_ops = {
2284 .family = AF_INET,
2285 .fill_link_af = inet_fill_link_af,
2286 .get_link_af_size = inet_get_link_af_size,
Thomas Grafcf7afbf2010-11-22 01:31:54 +00002287 .validate_link_af = inet_validate_link_af,
2288 .set_link_af = inet_set_link_af,
Thomas Graf9f0f7272010-11-16 04:32:48 +00002289};
2290
Linus Torvalds1da177e2005-04-16 15:20:36 -07002291void __init devinet_init(void)
2292{
David S. Millerfd23c3b2011-02-18 12:42:28 -08002293 int i;
2294
2295 for (i = 0; i < IN4_ADDR_HSIZE; i++)
2296 INIT_HLIST_HEAD(&inet_addr_lst[i]);
2297
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002298 register_pernet_subsys(&devinet_ops);
2299
Linus Torvalds1da177e2005-04-16 15:20:36 -07002300 register_gifconf(PF_INET, inet_gifconf);
2301 register_netdevice_notifier(&ip_netdev_notifier);
Thomas Graf63f34442007-03-22 11:55:17 -07002302
Jiri Pirko5c766d62013-01-24 09:41:41 +00002303 schedule_delayed_work(&check_lifetime_work, 0);
2304
Thomas Graf9f0f7272010-11-16 04:32:48 +00002305 rtnl_af_register(&inet_af_ops);
2306
Greg Rosec7ac8672011-06-10 01:27:09 +00002307 rtnl_register(PF_INET, RTM_NEWADDR, inet_rtm_newaddr, NULL, NULL);
2308 rtnl_register(PF_INET, RTM_DELADDR, inet_rtm_deladdr, NULL, NULL);
2309 rtnl_register(PF_INET, RTM_GETADDR, NULL, inet_dump_ifaddr, NULL);
Nicolas Dichtel9e551112012-10-25 22:28:53 +00002310 rtnl_register(PF_INET, RTM_GETNETCONF, inet_netconf_get_devconf,
Nicolas Dichtel7a674202013-03-05 23:42:06 +00002311 inet_netconf_dump_devconf, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002312}
2313