blob: 9a2f24078a542864ef42142d24574ffcd9cf9f05 [file] [log] [blame]
Daniel Borkmannc675e062019-02-08 13:55:31 +01001/* Copyright (c) 2014 Mahesh Bandewar <maheshb@google.com>
2 *
3 * This program is free software; you can redistribute it and/or
4 * modify it under the terms of the GNU General Public License as
5 * published by the Free Software Foundation; either version 2 of
6 * the License, or (at your option) any later version.
7 */
8
9#include "ipvlan.h"
10
11static unsigned int ipvlan_netid __read_mostly;
12
13struct ipvlan_netns {
14 unsigned int ipvl_nf_hook_refcnt;
15};
16
17static struct ipvl_addr *ipvlan_skb_to_addr(struct sk_buff *skb,
18 struct net_device *dev)
19{
20 struct ipvl_addr *addr = NULL;
21 struct ipvl_port *port;
22 int addr_type;
23 void *lyr3h;
24
25 if (!dev || !netif_is_ipvlan_port(dev))
26 goto out;
27
28 port = ipvlan_port_get_rcu(dev);
29 if (!port || port->mode != IPVLAN_MODE_L3S)
30 goto out;
31
32 lyr3h = ipvlan_get_L3_hdr(port, skb, &addr_type);
33 if (!lyr3h)
34 goto out;
35
36 addr = ipvlan_addr_lookup(port, lyr3h, addr_type, true);
37out:
38 return addr;
39}
40
41static struct sk_buff *ipvlan_l3_rcv(struct net_device *dev,
42 struct sk_buff *skb, u16 proto)
43{
44 struct ipvl_addr *addr;
45 struct net_device *sdev;
46
47 addr = ipvlan_skb_to_addr(skb, dev);
48 if (!addr)
49 goto out;
50
51 sdev = addr->master->dev;
52 switch (proto) {
53 case AF_INET:
54 {
55 struct iphdr *ip4h = ip_hdr(skb);
56 int err;
57
58 err = ip_route_input_noref(skb, ip4h->daddr, ip4h->saddr,
59 ip4h->tos, sdev);
60 if (unlikely(err))
61 goto out;
62 break;
63 }
64#if IS_ENABLED(CONFIG_IPV6)
65 case AF_INET6:
66 {
67 struct dst_entry *dst;
68 struct ipv6hdr *ip6h = ipv6_hdr(skb);
69 int flags = RT6_LOOKUP_F_HAS_SADDR;
70 struct flowi6 fl6 = {
71 .flowi6_iif = sdev->ifindex,
72 .daddr = ip6h->daddr,
73 .saddr = ip6h->saddr,
74 .flowlabel = ip6_flowinfo(ip6h),
75 .flowi6_mark = skb->mark,
76 .flowi6_proto = ip6h->nexthdr,
77 };
78
79 skb_dst_drop(skb);
80 dst = ip6_route_input_lookup(dev_net(sdev), sdev, &fl6,
81 skb, flags);
82 skb_dst_set(skb, dst);
83 break;
84 }
85#endif
86 default:
87 break;
88 }
89out:
90 return skb;
91}
92
93static const struct l3mdev_ops ipvl_l3mdev_ops = {
94 .l3mdev_l3_rcv = ipvlan_l3_rcv,
95};
96
97static unsigned int ipvlan_nf_input(void *priv, struct sk_buff *skb,
98 const struct nf_hook_state *state)
99{
100 struct ipvl_addr *addr;
101 unsigned int len;
102
103 addr = ipvlan_skb_to_addr(skb, skb->dev);
104 if (!addr)
105 goto out;
106
107 skb->dev = addr->master->dev;
108 len = skb->len + ETH_HLEN;
109 ipvlan_count_rx(addr->master, len, true, false);
110out:
111 return NF_ACCEPT;
112}
113
114static const struct nf_hook_ops ipvl_nfops[] = {
115 {
116 .hook = ipvlan_nf_input,
117 .pf = NFPROTO_IPV4,
118 .hooknum = NF_INET_LOCAL_IN,
119 .priority = INT_MAX,
120 },
121#if IS_ENABLED(CONFIG_IPV6)
122 {
123 .hook = ipvlan_nf_input,
124 .pf = NFPROTO_IPV6,
125 .hooknum = NF_INET_LOCAL_IN,
126 .priority = INT_MAX,
127 },
128#endif
129};
130
131static int ipvlan_register_nf_hook(struct net *net)
132{
133 struct ipvlan_netns *vnet = net_generic(net, ipvlan_netid);
134 int err = 0;
135
136 if (!vnet->ipvl_nf_hook_refcnt) {
137 err = nf_register_net_hooks(net, ipvl_nfops,
138 ARRAY_SIZE(ipvl_nfops));
139 if (!err)
140 vnet->ipvl_nf_hook_refcnt = 1;
141 } else {
142 vnet->ipvl_nf_hook_refcnt++;
143 }
144
145 return err;
146}
147
148static void ipvlan_unregister_nf_hook(struct net *net)
149{
150 struct ipvlan_netns *vnet = net_generic(net, ipvlan_netid);
151
152 if (WARN_ON(!vnet->ipvl_nf_hook_refcnt))
153 return;
154
155 vnet->ipvl_nf_hook_refcnt--;
156 if (!vnet->ipvl_nf_hook_refcnt)
157 nf_unregister_net_hooks(net, ipvl_nfops,
158 ARRAY_SIZE(ipvl_nfops));
159}
160
161void ipvlan_migrate_l3s_hook(struct net *oldnet, struct net *newnet)
162{
163 struct ipvlan_netns *old_vnet;
164
165 ASSERT_RTNL();
166
167 old_vnet = net_generic(oldnet, ipvlan_netid);
168 if (!old_vnet->ipvl_nf_hook_refcnt)
169 return;
170
171 ipvlan_register_nf_hook(newnet);
172 ipvlan_unregister_nf_hook(oldnet);
173}
174
175static void ipvlan_ns_exit(struct net *net)
176{
177 struct ipvlan_netns *vnet = net_generic(net, ipvlan_netid);
178
179 if (WARN_ON_ONCE(vnet->ipvl_nf_hook_refcnt)) {
180 vnet->ipvl_nf_hook_refcnt = 0;
181 nf_unregister_net_hooks(net, ipvl_nfops,
182 ARRAY_SIZE(ipvl_nfops));
183 }
184}
185
186static struct pernet_operations ipvlan_net_ops = {
187 .id = &ipvlan_netid,
188 .size = sizeof(struct ipvlan_netns),
189 .exit = ipvlan_ns_exit,
190};
191
192int ipvlan_l3s_init(void)
193{
194 return register_pernet_subsys(&ipvlan_net_ops);
195}
196
197void ipvlan_l3s_cleanup(void)
198{
199 unregister_pernet_subsys(&ipvlan_net_ops);
200}
201
202int ipvlan_l3s_register(struct ipvl_port *port)
203{
204 struct net_device *dev = port->dev;
205 int ret;
206
207 ASSERT_RTNL();
208
209 ret = ipvlan_register_nf_hook(read_pnet(&port->pnet));
210 if (!ret) {
211 dev->l3mdev_ops = &ipvl_l3mdev_ops;
212 dev->priv_flags |= IFF_L3MDEV_MASTER;
213 }
214
215 return ret;
216}
217
218void ipvlan_l3s_unregister(struct ipvl_port *port)
219{
220 struct net_device *dev = port->dev;
221
222 ASSERT_RTNL();
223
224 dev->priv_flags &= ~IFF_L3MDEV_MASTER;
225 ipvlan_unregister_nf_hook(read_pnet(&port->pnet));
226 dev->l3mdev_ops = NULL;
227}