blob: 14f1cbd3b96faf5876427a6189f5e28eac31556a [file] [log] [blame]
/* Copyright (c) 2014 Mahesh Bandewar <maheshb@google.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation; either version 2 of
 * the License, or (at your option) any later version.
 *
 */
9
10#include "ipvlan.h"
11
Florian Westphal31338222017-04-20 18:08:15 +020012static unsigned int ipvlan_netid __read_mostly;
13
/* Per network-namespace state kept by this driver. */
struct ipvlan_netns {
	/* Number of users of the ipvl_nfops hooks in this namespace. */
	unsigned int ipvl_nf_hook_refcnt;
};
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070017
Florian Westphal591bb272017-07-26 11:40:52 +020018static const struct nf_hook_ops ipvl_nfops[] = {
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070019 {
20 .hook = ipvlan_nf_input,
21 .pf = NFPROTO_IPV4,
22 .hooknum = NF_INET_LOCAL_IN,
23 .priority = INT_MAX,
24 },
Matteo Croce94333fa2018-02-21 01:31:13 +010025#if IS_ENABLED(CONFIG_IPV6)
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070026 {
27 .hook = ipvlan_nf_input,
28 .pf = NFPROTO_IPV6,
29 .hooknum = NF_INET_LOCAL_IN,
30 .priority = INT_MAX,
31 },
Matteo Croce94333fa2018-02-21 01:31:13 +010032#endif
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070033};
34
Julia Lawallab530f62016-10-15 17:40:30 +020035static const struct l3mdev_ops ipvl_l3mdev_ops = {
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070036 .l3mdev_l3_rcv = ipvlan_l3_rcv,
37};
38
Mahesh Bandewarab5b7012016-02-20 19:31:41 -080039static void ipvlan_adjust_mtu(struct ipvl_dev *ipvlan, struct net_device *dev)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -080040{
Gao Feng8f679ed2016-11-30 08:48:44 +080041 ipvlan->dev->mtu = dev->mtu;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -080042}
43
Florian Westphal31338222017-04-20 18:08:15 +020044static int ipvlan_register_nf_hook(struct net *net)
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070045{
Florian Westphal31338222017-04-20 18:08:15 +020046 struct ipvlan_netns *vnet = net_generic(net, ipvlan_netid);
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070047 int err = 0;
48
Florian Westphal31338222017-04-20 18:08:15 +020049 if (!vnet->ipvl_nf_hook_refcnt) {
50 err = nf_register_net_hooks(net, ipvl_nfops,
51 ARRAY_SIZE(ipvl_nfops));
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070052 if (!err)
Florian Westphal31338222017-04-20 18:08:15 +020053 vnet->ipvl_nf_hook_refcnt = 1;
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070054 } else {
Florian Westphal31338222017-04-20 18:08:15 +020055 vnet->ipvl_nf_hook_refcnt++;
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070056 }
57
58 return err;
59}
60
Florian Westphal31338222017-04-20 18:08:15 +020061static void ipvlan_unregister_nf_hook(struct net *net)
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070062{
Florian Westphal31338222017-04-20 18:08:15 +020063 struct ipvlan_netns *vnet = net_generic(net, ipvlan_netid);
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070064
Florian Westphal31338222017-04-20 18:08:15 +020065 if (WARN_ON(!vnet->ipvl_nf_hook_refcnt))
66 return;
67
68 vnet->ipvl_nf_hook_refcnt--;
69 if (!vnet->ipvl_nf_hook_refcnt)
70 nf_unregister_net_hooks(net, ipvl_nfops,
71 ARRAY_SIZE(ipvl_nfops));
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070072}
73
Petr Machatacf7686a2018-12-06 17:05:40 +000074static int ipvlan_set_port_mode(struct ipvl_port *port, u16 nval,
75 struct netlink_ext_ack *extack)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -080076{
77 struct ipvl_dev *ipvlan;
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070078 struct net_device *mdev = port->dev;
Hangbin Liu5dc2d392018-07-01 16:21:21 +080079 unsigned int flags;
80 int err;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -080081
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070082 ASSERT_RTNL();
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -080083 if (port->mode != nval) {
Hangbin Liu5dc2d392018-07-01 16:21:21 +080084 list_for_each_entry(ipvlan, &port->ipvlans, pnode) {
85 flags = ipvlan->dev->flags;
86 if (nval == IPVLAN_MODE_L3 || nval == IPVLAN_MODE_L3S) {
87 err = dev_change_flags(ipvlan->dev,
88 flags | IFF_NOARP);
89 } else {
90 err = dev_change_flags(ipvlan->dev,
91 flags & ~IFF_NOARP);
92 }
93 if (unlikely(err))
94 goto fail;
95 }
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070096 if (nval == IPVLAN_MODE_L3S) {
97 /* New mode is L3S */
Florian Westphal31338222017-04-20 18:08:15 +020098 err = ipvlan_register_nf_hook(read_pnet(&port->pnet));
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -070099 if (!err) {
100 mdev->l3mdev_ops = &ipvl_l3mdev_ops;
101 mdev->priv_flags |= IFF_L3MDEV_MASTER;
102 } else
Hangbin Liu5dc2d392018-07-01 16:21:21 +0800103 goto fail;
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -0700104 } else if (port->mode == IPVLAN_MODE_L3S) {
105 /* Old mode was L3S */
106 mdev->priv_flags &= ~IFF_L3MDEV_MASTER;
Florian Westphal31338222017-04-20 18:08:15 +0200107 ipvlan_unregister_nf_hook(read_pnet(&port->pnet));
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -0700108 mdev->l3mdev_ops = NULL;
109 }
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800110 port->mode = nval;
111 }
Hangbin Liu5dc2d392018-07-01 16:21:21 +0800112 return 0;
113
114fail:
115 /* Undo the flags changes that have been done so far. */
116 list_for_each_entry_continue_reverse(ipvlan, &port->ipvlans, pnode) {
117 flags = ipvlan->dev->flags;
118 if (port->mode == IPVLAN_MODE_L3 ||
119 port->mode == IPVLAN_MODE_L3S)
120 dev_change_flags(ipvlan->dev, flags | IFF_NOARP);
121 else
122 dev_change_flags(ipvlan->dev, flags & ~IFF_NOARP);
123 }
124
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -0700125 return err;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800126}
127
128static int ipvlan_port_create(struct net_device *dev)
129{
130 struct ipvl_port *port;
131 int err, idx;
132
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800133 port = kzalloc(sizeof(struct ipvl_port), GFP_KERNEL);
134 if (!port)
135 return -ENOMEM;
136
Florian Westphal31338222017-04-20 18:08:15 +0200137 write_pnet(&port->pnet, dev_net(dev));
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800138 port->dev = dev;
139 port->mode = IPVLAN_MODE_L3;
140 INIT_LIST_HEAD(&port->ipvlans);
141 for (idx = 0; idx < IPVLAN_HASH_SIZE; idx++)
142 INIT_HLIST_HEAD(&port->hlhead[idx]);
143
Mahesh Bandewarba35f852015-05-04 17:06:03 -0700144 skb_queue_head_init(&port->backlog);
145 INIT_WORK(&port->wq, ipvlan_process_multicast);
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800146 ida_init(&port->ida);
Mahesh Bandewarda36e132017-01-09 15:05:54 -0800147 port->dev_id_start = 1;
Mahesh Bandewarba35f852015-05-04 17:06:03 -0700148
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800149 err = netdev_rx_handler_register(dev, ipvlan_handle_frame, port);
150 if (err)
151 goto err;
152
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800153 return 0;
154
155err:
Gao Feng48140a22016-12-07 08:44:47 +0800156 kfree(port);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800157 return err;
158}
159
160static void ipvlan_port_destroy(struct net_device *dev)
161{
162 struct ipvl_port *port = ipvlan_port_get_rtnl(dev);
Eric Dumazetb1227d02016-12-21 18:00:24 -0800163 struct sk_buff *skb;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800164
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -0700165 if (port->mode == IPVLAN_MODE_L3S) {
166 dev->priv_flags &= ~IFF_L3MDEV_MASTER;
Florian Westphal31338222017-04-20 18:08:15 +0200167 ipvlan_unregister_nf_hook(dev_net(dev));
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -0700168 dev->l3mdev_ops = NULL;
169 }
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800170 netdev_rx_handler_unregister(dev);
Mahesh Bandewarba35f852015-05-04 17:06:03 -0700171 cancel_work_sync(&port->wq);
Eric Dumazetb1227d02016-12-21 18:00:24 -0800172 while ((skb = __skb_dequeue(&port->backlog)) != NULL) {
173 if (skb->dev)
174 dev_put(skb->dev);
175 kfree_skb(skb);
176 }
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800177 ida_destroy(&port->ida);
Gao Feng48140a22016-12-07 08:44:47 +0800178 kfree(port);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800179}
180
/* Feature bits a slave may inherit from its master (see ipvlan_init()). */
#define IPVLAN_FEATURES						\
	(NETIF_F_SG | NETIF_F_HW_CSUM | NETIF_F_HIGHDMA |	\
	 NETIF_F_FRAGLIST | NETIF_F_GSO | NETIF_F_TSO |		\
	 NETIF_F_GSO_ROBUST | NETIF_F_TSO_ECN | NETIF_F_TSO6 |	\
	 NETIF_F_GRO | NETIF_F_RXCSUM |				\
	 NETIF_F_HW_VLAN_CTAG_FILTER | NETIF_F_HW_VLAN_STAG_FILTER)
186
/* Link-state bits a slave copies from its master (see ipvlan_init()). */
#define IPVLAN_STATE_MASK \
	((1 << __LINK_STATE_NOCARRIER) | (1 << __LINK_STATE_DORMANT))
189
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800190static int ipvlan_init(struct net_device *dev)
191{
192 struct ipvl_dev *ipvlan = netdev_priv(dev);
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800193 struct net_device *phy_dev = ipvlan->phy_dev;
194 struct ipvl_port *port;
195 int err;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800196
197 dev->state = (dev->state & ~IPVLAN_STATE_MASK) |
198 (phy_dev->state & IPVLAN_STATE_MASK);
199 dev->features = phy_dev->features & IPVLAN_FEATURES;
Paolo Abeni3518e402018-03-02 16:03:32 +0100200 dev->features |= NETIF_F_LLTX | NETIF_F_VLAN_CHALLENGED;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800201 dev->gso_max_size = phy_dev->gso_max_size;
Eric Dumazetf6773c52016-03-16 21:59:49 -0700202 dev->gso_max_segs = phy_dev->gso_max_segs;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800203 dev->hard_header_len = phy_dev->hard_header_len;
204
Eric Dumazet0d7dd792016-06-09 07:45:15 -0700205 netdev_lockdep_set_classes(dev);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800206
Florian Fainelli87173cd2017-08-01 12:11:13 -0700207 ipvlan->pcpu_stats = netdev_alloc_pcpu_stats(struct ipvl_pcpu_stats);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800208 if (!ipvlan->pcpu_stats)
209 return -ENOMEM;
210
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800211 if (!netif_is_ipvlan_port(phy_dev)) {
212 err = ipvlan_port_create(phy_dev);
213 if (err < 0) {
214 free_percpu(ipvlan->pcpu_stats);
215 return err;
216 }
217 }
218 port = ipvlan_port_get_rtnl(phy_dev);
Mahesh Bandewar494e8482016-04-27 14:59:27 -0700219 port->count += 1;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800220 return 0;
221}
222
223static void ipvlan_uninit(struct net_device *dev)
224{
225 struct ipvl_dev *ipvlan = netdev_priv(dev);
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800226 struct net_device *phy_dev = ipvlan->phy_dev;
227 struct ipvl_port *port;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800228
Markus Elfring04901ce2014-11-29 16:23:20 +0100229 free_percpu(ipvlan->pcpu_stats);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800230
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800231 port = ipvlan_port_get_rtnl(phy_dev);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800232 port->count -= 1;
233 if (!port->count)
234 ipvlan_port_destroy(port->dev);
235}
236
237static int ipvlan_open(struct net_device *dev)
238{
239 struct ipvl_dev *ipvlan = netdev_priv(dev);
240 struct net_device *phy_dev = ipvlan->phy_dev;
241 struct ipvl_addr *addr;
242
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -0700243 if (ipvlan->port->mode == IPVLAN_MODE_L3 ||
244 ipvlan->port->mode == IPVLAN_MODE_L3S)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800245 dev->flags |= IFF_NOARP;
246 else
247 dev->flags &= ~IFF_NOARP;
248
Paolo Abeni82308192018-02-28 10:59:27 +0100249 rcu_read_lock();
250 list_for_each_entry_rcu(addr, &ipvlan->addrs, anode)
Konstantin Khlebnikov515866f2015-07-14 16:35:50 +0300251 ipvlan_ht_addr_add(ipvlan, addr);
Paolo Abeni82308192018-02-28 10:59:27 +0100252 rcu_read_unlock();
Konstantin Khlebnikov515866f2015-07-14 16:35:50 +0300253
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800254 return dev_uc_add(phy_dev, phy_dev->dev_addr);
255}
256
257static int ipvlan_stop(struct net_device *dev)
258{
259 struct ipvl_dev *ipvlan = netdev_priv(dev);
260 struct net_device *phy_dev = ipvlan->phy_dev;
261 struct ipvl_addr *addr;
262
263 dev_uc_unsync(phy_dev, dev);
264 dev_mc_unsync(phy_dev, dev);
265
266 dev_uc_del(phy_dev, phy_dev->dev_addr);
267
Paolo Abeni82308192018-02-28 10:59:27 +0100268 rcu_read_lock();
269 list_for_each_entry_rcu(addr, &ipvlan->addrs, anode)
Konstantin Khlebnikov6640e672015-07-14 16:35:53 +0300270 ipvlan_ht_addr_del(addr);
Paolo Abeni82308192018-02-28 10:59:27 +0100271 rcu_read_unlock();
Konstantin Khlebnikov515866f2015-07-14 16:35:50 +0300272
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800273 return 0;
274}
275
Mahesh Bandewar92c7b0d2014-11-25 21:24:43 -0800276static netdev_tx_t ipvlan_start_xmit(struct sk_buff *skb,
277 struct net_device *dev)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800278{
279 const struct ipvl_dev *ipvlan = netdev_priv(dev);
280 int skblen = skb->len;
281 int ret;
282
283 ret = ipvlan_queue_xmit(skb, dev);
284 if (likely(ret == NET_XMIT_SUCCESS || ret == NET_XMIT_CN)) {
285 struct ipvl_pcpu_stats *pcptr;
286
287 pcptr = this_cpu_ptr(ipvlan->pcpu_stats);
288
289 u64_stats_update_begin(&pcptr->syncp);
290 pcptr->tx_pkts++;
291 pcptr->tx_bytes += skblen;
292 u64_stats_update_end(&pcptr->syncp);
293 } else {
294 this_cpu_inc(ipvlan->pcpu_stats->tx_drps);
295 }
296 return ret;
297}
298
299static netdev_features_t ipvlan_fix_features(struct net_device *dev,
300 netdev_features_t features)
301{
302 struct ipvl_dev *ipvlan = netdev_priv(dev);
303
304 return features & (ipvlan->sfeatures | ~IPVLAN_FEATURES);
305}
306
307static void ipvlan_change_rx_flags(struct net_device *dev, int change)
308{
309 struct ipvl_dev *ipvlan = netdev_priv(dev);
310 struct net_device *phy_dev = ipvlan->phy_dev;
311
312 if (change & IFF_ALLMULTI)
313 dev_set_allmulti(phy_dev, dev->flags & IFF_ALLMULTI? 1 : -1);
314}
315
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800316static void ipvlan_set_multicast_mac_filter(struct net_device *dev)
317{
318 struct ipvl_dev *ipvlan = netdev_priv(dev);
319
320 if (dev->flags & (IFF_PROMISC | IFF_ALLMULTI)) {
321 bitmap_fill(ipvlan->mac_filters, IPVLAN_MAC_FILTER_SIZE);
322 } else {
323 struct netdev_hw_addr *ha;
324 DECLARE_BITMAP(mc_filters, IPVLAN_MAC_FILTER_SIZE);
325
326 bitmap_zero(mc_filters, IPVLAN_MAC_FILTER_SIZE);
327 netdev_for_each_mc_addr(ha, dev)
328 __set_bit(ipvlan_mac_hash(ha->addr), mc_filters);
329
Mahesh Bandewarf631c442015-05-04 17:06:11 -0700330 /* Turn-on broadcast bit irrespective of address family,
331 * since broadcast is deferred to a work-queue, hence no
332 * impact on fast-path processing.
333 */
334 __set_bit(ipvlan_mac_hash(dev->broadcast), mc_filters);
335
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800336 bitmap_copy(ipvlan->mac_filters, mc_filters,
337 IPVLAN_MAC_FILTER_SIZE);
338 }
339 dev_uc_sync(ipvlan->phy_dev, dev);
340 dev_mc_sync(ipvlan->phy_dev, dev);
341}
342
stephen hemmingerbc1f4472017-01-06 19:12:52 -0800343static void ipvlan_get_stats64(struct net_device *dev,
344 struct rtnl_link_stats64 *s)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800345{
346 struct ipvl_dev *ipvlan = netdev_priv(dev);
347
348 if (ipvlan->pcpu_stats) {
349 struct ipvl_pcpu_stats *pcptr;
350 u64 rx_pkts, rx_bytes, rx_mcast, tx_pkts, tx_bytes;
351 u32 rx_errs = 0, tx_drps = 0;
352 u32 strt;
353 int idx;
354
355 for_each_possible_cpu(idx) {
356 pcptr = per_cpu_ptr(ipvlan->pcpu_stats, idx);
357 do {
358 strt= u64_stats_fetch_begin_irq(&pcptr->syncp);
359 rx_pkts = pcptr->rx_pkts;
360 rx_bytes = pcptr->rx_bytes;
361 rx_mcast = pcptr->rx_mcast;
362 tx_pkts = pcptr->tx_pkts;
363 tx_bytes = pcptr->tx_bytes;
364 } while (u64_stats_fetch_retry_irq(&pcptr->syncp,
365 strt));
366
367 s->rx_packets += rx_pkts;
368 s->rx_bytes += rx_bytes;
369 s->multicast += rx_mcast;
370 s->tx_packets += tx_pkts;
371 s->tx_bytes += tx_bytes;
372
373 /* u32 values are updated without syncp protection. */
374 rx_errs += pcptr->rx_errs;
375 tx_drps += pcptr->tx_drps;
376 }
377 s->rx_errors = rx_errs;
378 s->rx_dropped = rx_errs;
379 s->tx_dropped = tx_drps;
380 }
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800381}
382
383static int ipvlan_vlan_rx_add_vid(struct net_device *dev, __be16 proto, u16 vid)
384{
385 struct ipvl_dev *ipvlan = netdev_priv(dev);
386 struct net_device *phy_dev = ipvlan->phy_dev;
387
388 return vlan_vid_add(phy_dev, proto, vid);
389}
390
391static int ipvlan_vlan_rx_kill_vid(struct net_device *dev, __be16 proto,
392 u16 vid)
393{
394 struct ipvl_dev *ipvlan = netdev_priv(dev);
395 struct net_device *phy_dev = ipvlan->phy_dev;
396
397 vlan_vid_del(phy_dev, proto, vid);
398 return 0;
399}
400
Nicolas Dichtel7c411652015-04-02 17:07:06 +0200401static int ipvlan_get_iflink(const struct net_device *dev)
402{
403 struct ipvl_dev *ipvlan = netdev_priv(dev);
404
405 return ipvlan->phy_dev->ifindex;
406}
407
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800408static const struct net_device_ops ipvlan_netdev_ops = {
409 .ndo_init = ipvlan_init,
410 .ndo_uninit = ipvlan_uninit,
411 .ndo_open = ipvlan_open,
412 .ndo_stop = ipvlan_stop,
413 .ndo_start_xmit = ipvlan_start_xmit,
414 .ndo_fix_features = ipvlan_fix_features,
415 .ndo_change_rx_flags = ipvlan_change_rx_flags,
416 .ndo_set_rx_mode = ipvlan_set_multicast_mac_filter,
417 .ndo_get_stats64 = ipvlan_get_stats64,
418 .ndo_vlan_rx_add_vid = ipvlan_vlan_rx_add_vid,
419 .ndo_vlan_rx_kill_vid = ipvlan_vlan_rx_kill_vid,
Nicolas Dichtel7c411652015-04-02 17:07:06 +0200420 .ndo_get_iflink = ipvlan_get_iflink,
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800421};
422
423static int ipvlan_hard_header(struct sk_buff *skb, struct net_device *dev,
424 unsigned short type, const void *daddr,
425 const void *saddr, unsigned len)
426{
427 const struct ipvl_dev *ipvlan = netdev_priv(dev);
428 struct net_device *phy_dev = ipvlan->phy_dev;
429
430 /* TODO Probably use a different field than dev_addr so that the
431 * mac-address on the virtual device is portable and can be carried
432 * while the packets use the mac-addr on the physical device.
433 */
434 return dev_hard_header(skb, phy_dev, type, daddr,
Mahesh Bandewar32c10bb2017-10-11 17:16:26 -0700435 saddr ? : phy_dev->dev_addr, len);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800436}
437
438static const struct header_ops ipvlan_header_ops = {
439 .create = ipvlan_hard_header,
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800440 .parse = eth_header_parse,
441 .cache = eth_header_cache,
442 .cache_update = eth_header_cache_update,
443};
444
Paolo Abeni1ec54cb2018-03-06 10:56:31 +0100445static bool netif_is_ipvlan(const struct net_device *dev)
446{
447 /* both ipvlan and ipvtap devices use the same netdev_ops */
448 return dev->netdev_ops == &ipvlan_netdev_ops;
449}
450
David Decotigny314d10d2016-02-24 10:58:03 -0800451static int ipvlan_ethtool_get_link_ksettings(struct net_device *dev,
452 struct ethtool_link_ksettings *cmd)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800453{
454 const struct ipvl_dev *ipvlan = netdev_priv(dev);
455
David Decotigny314d10d2016-02-24 10:58:03 -0800456 return __ethtool_get_link_ksettings(ipvlan->phy_dev, cmd);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800457}
458
459static void ipvlan_ethtool_get_drvinfo(struct net_device *dev,
460 struct ethtool_drvinfo *drvinfo)
461{
462 strlcpy(drvinfo->driver, IPVLAN_DRV, sizeof(drvinfo->driver));
463 strlcpy(drvinfo->version, IPV_DRV_VER, sizeof(drvinfo->version));
464}
465
466static u32 ipvlan_ethtool_get_msglevel(struct net_device *dev)
467{
468 const struct ipvl_dev *ipvlan = netdev_priv(dev);
469
470 return ipvlan->msg_enable;
471}
472
473static void ipvlan_ethtool_set_msglevel(struct net_device *dev, u32 value)
474{
475 struct ipvl_dev *ipvlan = netdev_priv(dev);
476
477 ipvlan->msg_enable = value;
478}
479
480static const struct ethtool_ops ipvlan_ethtool_ops = {
481 .get_link = ethtool_op_get_link,
David Decotigny314d10d2016-02-24 10:58:03 -0800482 .get_link_ksettings = ipvlan_ethtool_get_link_ksettings,
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800483 .get_drvinfo = ipvlan_ethtool_get_drvinfo,
484 .get_msglevel = ipvlan_ethtool_get_msglevel,
485 .set_msglevel = ipvlan_ethtool_set_msglevel,
486};
487
488static int ipvlan_nl_changelink(struct net_device *dev,
Matthias Schifferad744b22017-06-25 23:56:00 +0200489 struct nlattr *tb[], struct nlattr *data[],
490 struct netlink_ext_ack *extack)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800491{
492 struct ipvl_dev *ipvlan = netdev_priv(dev);
493 struct ipvl_port *port = ipvlan_port_get_rtnl(ipvlan->phy_dev);
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -0700494 int err = 0;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800495
Mahesh Bandewara190d042017-10-26 15:09:21 -0700496 if (!data)
497 return 0;
498
499 if (data[IFLA_IPVLAN_MODE]) {
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800500 u16 nmode = nla_get_u16(data[IFLA_IPVLAN_MODE]);
501
Petr Machatacf7686a2018-12-06 17:05:40 +0000502 err = ipvlan_set_port_mode(port, nmode, extack);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800503 }
Mahesh Bandewara190d042017-10-26 15:09:21 -0700504
505 if (!err && data[IFLA_IPVLAN_FLAGS]) {
506 u16 flags = nla_get_u16(data[IFLA_IPVLAN_FLAGS]);
507
508 if (flags & IPVLAN_F_PRIVATE)
509 ipvlan_mark_private(port);
510 else
511 ipvlan_clear_private(port);
Mahesh Bandewarfe89aa62017-10-26 15:09:25 -0700512
513 if (flags & IPVLAN_F_VEPA)
514 ipvlan_mark_vepa(port);
515 else
516 ipvlan_clear_vepa(port);
Mahesh Bandewara190d042017-10-26 15:09:21 -0700517 }
518
Mahesh Bandewar4fbae7d2016-09-16 12:59:19 -0700519 return err;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800520}
521
522static size_t ipvlan_nl_getsize(const struct net_device *dev)
523{
524 return (0
525 + nla_total_size(2) /* IFLA_IPVLAN_MODE */
Mahesh Bandewara190d042017-10-26 15:09:21 -0700526 + nla_total_size(2) /* IFLA_IPVLAN_FLAGS */
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800527 );
528}
529
Matthias Schiffera8b8a8892017-06-25 23:56:01 +0200530static int ipvlan_nl_validate(struct nlattr *tb[], struct nlattr *data[],
531 struct netlink_ext_ack *extack)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800532{
Mahesh Bandewara190d042017-10-26 15:09:21 -0700533 if (!data)
534 return 0;
535
536 if (data[IFLA_IPVLAN_MODE]) {
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800537 u16 mode = nla_get_u16(data[IFLA_IPVLAN_MODE]);
538
539 if (mode < IPVLAN_MODE_L2 || mode >= IPVLAN_MODE_MAX)
540 return -EINVAL;
541 }
Mahesh Bandewara190d042017-10-26 15:09:21 -0700542 if (data[IFLA_IPVLAN_FLAGS]) {
543 u16 flags = nla_get_u16(data[IFLA_IPVLAN_FLAGS]);
544
Mahesh Bandewarfe89aa62017-10-26 15:09:25 -0700545 /* Only two bits are used at this moment. */
546 if (flags & ~(IPVLAN_F_PRIVATE | IPVLAN_F_VEPA))
547 return -EINVAL;
548 /* Also both flags can't be active at the same time. */
549 if ((flags & (IPVLAN_F_PRIVATE | IPVLAN_F_VEPA)) ==
550 (IPVLAN_F_PRIVATE | IPVLAN_F_VEPA))
Mahesh Bandewara190d042017-10-26 15:09:21 -0700551 return -EINVAL;
552 }
553
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800554 return 0;
555}
556
557static int ipvlan_nl_fillinfo(struct sk_buff *skb,
558 const struct net_device *dev)
559{
560 struct ipvl_dev *ipvlan = netdev_priv(dev);
561 struct ipvl_port *port = ipvlan_port_get_rtnl(ipvlan->phy_dev);
562 int ret = -EINVAL;
563
564 if (!port)
565 goto err;
566
567 ret = -EMSGSIZE;
568 if (nla_put_u16(skb, IFLA_IPVLAN_MODE, port->mode))
569 goto err;
Mahesh Bandewara190d042017-10-26 15:09:21 -0700570 if (nla_put_u16(skb, IFLA_IPVLAN_FLAGS, port->flags))
571 goto err;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800572
573 return 0;
574
575err:
576 return ret;
577}
578
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800579int ipvlan_link_new(struct net *src_net, struct net_device *dev,
Matthias Schiffer7a3f4a12017-06-25 23:55:59 +0200580 struct nlattr *tb[], struct nlattr *data[],
581 struct netlink_ext_ack *extack)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800582{
583 struct ipvl_dev *ipvlan = netdev_priv(dev);
584 struct ipvl_port *port;
585 struct net_device *phy_dev;
586 int err;
Mahesh Bandeware93fbc52016-02-20 19:31:36 -0800587 u16 mode = IPVLAN_MODE_L3;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800588
589 if (!tb[IFLA_LINK])
590 return -EINVAL;
591
592 phy_dev = __dev_get_by_index(src_net, nla_get_u32(tb[IFLA_LINK]));
593 if (!phy_dev)
594 return -ENODEV;
595
Mahesh Bandewar5933fea2014-12-06 15:53:33 -0800596 if (netif_is_ipvlan(phy_dev)) {
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800597 struct ipvl_dev *tmp = netdev_priv(phy_dev);
598
599 phy_dev = tmp->phy_dev;
Mahesh Bandewar5933fea2014-12-06 15:53:33 -0800600 } else if (!netif_is_ipvlan_port(phy_dev)) {
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800601 /* Exit early if the underlying link is invalid or busy */
602 if (phy_dev->type != ARPHRD_ETHER ||
603 phy_dev->flags & IFF_LOOPBACK) {
604 netdev_err(phy_dev,
605 "Master is either lo or non-ether device\n");
606 return -EINVAL;
607 }
608
609 if (netdev_is_rx_handler_busy(phy_dev)) {
610 netdev_err(phy_dev, "Device is already in use.\n");
611 return -EBUSY;
612 }
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800613 }
614
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800615 ipvlan->phy_dev = phy_dev;
616 ipvlan->dev = dev;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800617 ipvlan->sfeatures = IPVLAN_FEATURES;
Xin Long30877962018-06-21 12:56:04 +0800618 if (!tb[IFLA_MTU])
619 ipvlan_adjust_mtu(ipvlan, phy_dev);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800620 INIT_LIST_HEAD(&ipvlan->addrs);
Paolo Abeni82308192018-02-28 10:59:27 +0100621 spin_lock_init(&ipvlan->addrs_lock);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800622
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800623 /* TODO Probably put random address here to be presented to the
624 * world but keep using the physical-dev address for the outgoing
625 * packets.
Mahesh Bandewara190d042017-10-26 15:09:21 -0700626 */
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800627 memcpy(dev->dev_addr, phy_dev->dev_addr, ETH_ALEN);
628
Paolo Abenif54262502018-03-09 10:39:24 +0100629 dev->priv_flags |= IFF_NO_RX_HANDLER;
630
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800631 err = register_netdevice(dev);
632 if (err < 0)
633 return err;
634
635 /* ipvlan_init() would have created the port, if required */
636 port = ipvlan_port_get_rtnl(phy_dev);
637 ipvlan->port = port;
Mahesh Bandewara190d042017-10-26 15:09:21 -0700638
Mahesh Bandewarda36e132017-01-09 15:05:54 -0800639 /* If the port-id base is at the MAX value, then wrap it around and
640 * begin from 0x1 again. This may be due to a busy system where lots
641 * of slaves are getting created and deleted.
642 */
643 if (port->dev_id_start == 0xFFFE)
644 port->dev_id_start = 0x1;
645
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800646 /* Since L2 address is shared among all IPvlan slaves including
647 * master, use unique 16 bit dev-ids to diffentiate among them.
648 * Assign IDs between 0x1 and 0xFFFE (used by the master) to each
649 * slave link [see addrconf_ifid_eui48()].
650 */
Mahesh Bandewarda36e132017-01-09 15:05:54 -0800651 err = ida_simple_get(&port->ida, port->dev_id_start, 0xFFFE,
652 GFP_KERNEL);
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800653 if (err < 0)
Mahesh Bandewar019ec002017-01-13 15:48:30 -0800654 err = ida_simple_get(&port->ida, 0x1, port->dev_id_start,
655 GFP_KERNEL);
656 if (err < 0)
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800657 goto unregister_netdev;
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800658 dev->dev_id = err;
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800659
Mahesh Bandewarda36e132017-01-09 15:05:54 -0800660 /* Increment id-base to the next slot for the future assignment */
661 port->dev_id_start = err + 1;
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800662
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800663 err = netdev_upper_dev_link(phy_dev, dev, extack);
664 if (err)
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800665 goto remove_ida;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800666
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800667 /* Flags are per port and latest update overrides. User has
668 * to be consistent in setting it just like the mode attribute.
669 */
670 if (data && data[IFLA_IPVLAN_FLAGS])
671 port->flags = nla_get_u16(data[IFLA_IPVLAN_FLAGS]);
672
673 if (data && data[IFLA_IPVLAN_MODE])
674 mode = nla_get_u16(data[IFLA_IPVLAN_MODE]);
675
Petr Machatacf7686a2018-12-06 17:05:40 +0000676 err = ipvlan_set_port_mode(port, mode, extack);
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800677 if (err)
Gao Feng1a31cc82016-12-08 11:16:58 +0800678 goto unlink_netdev;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800679
680 list_add_tail_rcu(&ipvlan->pnode, &port->ipvlans);
681 netif_stacked_transfer_operstate(phy_dev, dev);
682 return 0;
Gao Feng147fd282016-11-24 23:39:59 +0800683
Gao Feng1a31cc82016-12-08 11:16:58 +0800684unlink_netdev:
685 netdev_upper_dev_unlink(phy_dev, dev);
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800686remove_ida:
687 ida_simple_remove(&port->ida, dev->dev_id);
Girish Moodalbailfe18da62017-11-16 23:16:17 -0800688unregister_netdev:
689 unregister_netdevice(dev);
Gao Feng147fd282016-11-24 23:39:59 +0800690 return err;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800691}
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800692EXPORT_SYMBOL_GPL(ipvlan_link_new);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800693
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800694void ipvlan_link_delete(struct net_device *dev, struct list_head *head)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800695{
696 struct ipvl_dev *ipvlan = netdev_priv(dev);
697 struct ipvl_addr *addr, *next;
698
Paolo Abeni82308192018-02-28 10:59:27 +0100699 spin_lock_bh(&ipvlan->addrs_lock);
Konstantin Khlebnikov515866f2015-07-14 16:35:50 +0300700 list_for_each_entry_safe(addr, next, &ipvlan->addrs, anode) {
Konstantin Khlebnikov6640e672015-07-14 16:35:53 +0300701 ipvlan_ht_addr_del(addr);
Paolo Abeni82308192018-02-28 10:59:27 +0100702 list_del_rcu(&addr->anode);
Konstantin Khlebnikov6a725492015-07-14 16:35:51 +0300703 kfree_rcu(addr, rcu);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800704 }
Paolo Abeni82308192018-02-28 10:59:27 +0100705 spin_unlock_bh(&ipvlan->addrs_lock);
Konstantin Khlebnikov515866f2015-07-14 16:35:50 +0300706
Mahesh Bandewar009146d2017-01-03 12:47:16 -0800707 ida_simple_remove(&ipvlan->port->ida, dev->dev_id);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800708 list_del_rcu(&ipvlan->pnode);
709 unregister_netdevice_queue(dev, head);
710 netdev_upper_dev_unlink(ipvlan->phy_dev, dev);
711}
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800712EXPORT_SYMBOL_GPL(ipvlan_link_delete);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800713
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800714void ipvlan_link_setup(struct net_device *dev)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800715{
716 ether_setup(dev);
717
Xin Long548feb32018-06-18 16:15:57 +0800718 dev->max_mtu = ETH_MAX_MTU;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800719 dev->priv_flags &= ~(IFF_XMIT_DST_RELEASE | IFF_TX_SKB_SHARING);
Phil Sutterbf485bc2015-08-18 10:30:40 +0200720 dev->priv_flags |= IFF_UNICAST_FLT | IFF_NO_QUEUE;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800721 dev->netdev_ops = &ipvlan_netdev_ops;
David S. Millercf124db2017-05-08 12:52:56 -0400722 dev->needs_free_netdev = true;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800723 dev->header_ops = &ipvlan_header_ops;
724 dev->ethtool_ops = &ipvlan_ethtool_ops;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800725}
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800726EXPORT_SYMBOL_GPL(ipvlan_link_setup);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800727
728static const struct nla_policy ipvlan_nl_policy[IFLA_IPVLAN_MAX + 1] =
729{
730 [IFLA_IPVLAN_MODE] = { .type = NLA_U16 },
Mahesh Bandewara190d042017-10-26 15:09:21 -0700731 [IFLA_IPVLAN_FLAGS] = { .type = NLA_U16 },
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800732};
733
734static struct rtnl_link_ops ipvlan_link_ops = {
735 .kind = "ipvlan",
736 .priv_size = sizeof(struct ipvl_dev),
737
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800738 .setup = ipvlan_link_setup,
739 .newlink = ipvlan_link_new,
740 .dellink = ipvlan_link_delete,
741};
742
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800743int ipvlan_link_register(struct rtnl_link_ops *ops)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800744{
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800745 ops->get_size = ipvlan_nl_getsize;
746 ops->policy = ipvlan_nl_policy;
747 ops->validate = ipvlan_nl_validate;
748 ops->fill_info = ipvlan_nl_fillinfo;
749 ops->changelink = ipvlan_nl_changelink;
750 ops->maxtype = IFLA_IPVLAN_MAX;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800751 return rtnl_link_register(ops);
752}
Sainath Grandhi235a9d82017-02-10 16:03:52 -0800753EXPORT_SYMBOL_GPL(ipvlan_link_register);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800754
755static int ipvlan_device_event(struct notifier_block *unused,
756 unsigned long event, void *ptr)
757{
758 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
759 struct ipvl_dev *ipvlan, *next;
760 struct ipvl_port *port;
761 LIST_HEAD(lst_kill);
762
Mahesh Bandewar5933fea2014-12-06 15:53:33 -0800763 if (!netif_is_ipvlan_port(dev))
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800764 return NOTIFY_DONE;
765
766 port = ipvlan_port_get_rtnl(dev);
767
768 switch (event) {
769 case NETDEV_CHANGE:
770 list_for_each_entry(ipvlan, &port->ipvlans, pnode)
771 netif_stacked_transfer_operstate(ipvlan->phy_dev,
772 ipvlan->dev);
773 break;
774
Florian Westphal31338222017-04-20 18:08:15 +0200775 case NETDEV_REGISTER: {
776 struct net *oldnet, *newnet = dev_net(dev);
777 struct ipvlan_netns *old_vnet;
778
779 oldnet = read_pnet(&port->pnet);
780 if (net_eq(newnet, oldnet))
781 break;
782
783 write_pnet(&port->pnet, newnet);
784
785 old_vnet = net_generic(oldnet, ipvlan_netid);
786 if (!old_vnet->ipvl_nf_hook_refcnt)
787 break;
788
789 ipvlan_register_nf_hook(newnet);
790 ipvlan_unregister_nf_hook(oldnet);
791 break;
792 }
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800793 case NETDEV_UNREGISTER:
794 if (dev->reg_state != NETREG_UNREGISTERING)
795 break;
796
Paolo Abeni82308192018-02-28 10:59:27 +0100797 list_for_each_entry_safe(ipvlan, next, &port->ipvlans, pnode)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800798 ipvlan->dev->rtnl_link_ops->dellink(ipvlan->dev,
799 &lst_kill);
800 unregister_netdevice_many(&lst_kill);
801 break;
802
803 case NETDEV_FEAT_CHANGE:
804 list_for_each_entry(ipvlan, &port->ipvlans, pnode) {
805 ipvlan->dev->features = dev->features & IPVLAN_FEATURES;
806 ipvlan->dev->gso_max_size = dev->gso_max_size;
Eric Dumazetf6773c52016-03-16 21:59:49 -0700807 ipvlan->dev->gso_max_segs = dev->gso_max_segs;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800808 netdev_features_change(ipvlan->dev);
809 }
810 break;
811
812 case NETDEV_CHANGEMTU:
813 list_for_each_entry(ipvlan, &port->ipvlans, pnode)
814 ipvlan_adjust_mtu(ipvlan, dev);
815 break;
816
Mahesh Bandewar32c10bb2017-10-11 17:16:26 -0700817 case NETDEV_CHANGEADDR:
Keefe Liuab452c32018-05-14 19:38:09 +0800818 list_for_each_entry(ipvlan, &port->ipvlans, pnode) {
Mahesh Bandewar32c10bb2017-10-11 17:16:26 -0700819 ether_addr_copy(ipvlan->dev->dev_addr, dev->dev_addr);
Keefe Liuab452c32018-05-14 19:38:09 +0800820 call_netdevice_notifiers(NETDEV_CHANGEADDR, ipvlan->dev);
821 }
Mahesh Bandewar32c10bb2017-10-11 17:16:26 -0700822 break;
823
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800824 case NETDEV_PRE_TYPE_CHANGE:
825 /* Forbid underlying device to change its type. */
826 return NOTIFY_BAD;
827 }
828 return NOTIFY_DONE;
829}
830
Paolo Abeni82308192018-02-28 10:59:27 +0100831/* the caller must held the addrs lock */
Gao Feng86673982016-12-28 16:46:51 +0800832static int ipvlan_add_addr(struct ipvl_dev *ipvlan, void *iaddr, bool is_v6)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800833{
834 struct ipvl_addr *addr;
835
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800836 addr = kzalloc(sizeof(struct ipvl_addr), GFP_ATOMIC);
837 if (!addr)
838 return -ENOMEM;
839
840 addr->master = ipvlan;
Matteo Croce94333fa2018-02-21 01:31:13 +0100841 if (!is_v6) {
Gao Feng86673982016-12-28 16:46:51 +0800842 memcpy(&addr->ip4addr, iaddr, sizeof(struct in_addr));
843 addr->atype = IPVL_IPV4;
Matteo Croce94333fa2018-02-21 01:31:13 +0100844#if IS_ENABLED(CONFIG_IPV6)
845 } else {
846 memcpy(&addr->ip6addr, iaddr, sizeof(struct in6_addr));
847 addr->atype = IPVL_IPV6;
848#endif
Gao Feng86673982016-12-28 16:46:51 +0800849 }
Paolo Abeni82308192018-02-28 10:59:27 +0100850
851 list_add_tail_rcu(&addr->anode, &ipvlan->addrs);
Konstantin Khlebnikov515866f2015-07-14 16:35:50 +0300852
Jiri Benc27705f72015-03-28 19:13:22 +0100853 /* If the interface is not up, the address will be added to the hash
854 * list by ipvlan_open.
855 */
856 if (netif_running(ipvlan->dev))
857 ipvlan_ht_addr_add(ipvlan, addr);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800858
859 return 0;
860}
861
Gao Feng86673982016-12-28 16:46:51 +0800862static void ipvlan_del_addr(struct ipvl_dev *ipvlan, void *iaddr, bool is_v6)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800863{
864 struct ipvl_addr *addr;
865
Paolo Abeni82308192018-02-28 10:59:27 +0100866 spin_lock_bh(&ipvlan->addrs_lock);
Gao Feng86673982016-12-28 16:46:51 +0800867 addr = ipvlan_find_addr(ipvlan, iaddr, is_v6);
Paolo Abeni82308192018-02-28 10:59:27 +0100868 if (!addr) {
869 spin_unlock_bh(&ipvlan->addrs_lock);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800870 return;
Paolo Abeni82308192018-02-28 10:59:27 +0100871 }
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800872
Konstantin Khlebnikov6640e672015-07-14 16:35:53 +0300873 ipvlan_ht_addr_del(addr);
Paolo Abeni82308192018-02-28 10:59:27 +0100874 list_del_rcu(&addr->anode);
875 spin_unlock_bh(&ipvlan->addrs_lock);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800876 kfree_rcu(addr, rcu);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800877}
878
Matteo Croce94333fa2018-02-21 01:31:13 +0100879static bool ipvlan_is_valid_dev(const struct net_device *dev)
880{
881 struct ipvl_dev *ipvlan = netdev_priv(dev);
882
883 if (!netif_is_ipvlan(dev))
884 return false;
885
886 if (!ipvlan || !ipvlan->port)
887 return false;
888
889 return true;
890}
891
892#if IS_ENABLED(CONFIG_IPV6)
Gao Feng86673982016-12-28 16:46:51 +0800893static int ipvlan_add_addr6(struct ipvl_dev *ipvlan, struct in6_addr *ip6_addr)
894{
Paolo Abeni82308192018-02-28 10:59:27 +0100895 int ret = -EINVAL;
896
897 spin_lock_bh(&ipvlan->addrs_lock);
898 if (ipvlan_addr_busy(ipvlan->port, ip6_addr, true))
Gao Feng86673982016-12-28 16:46:51 +0800899 netif_err(ipvlan, ifup, ipvlan->dev,
900 "Failed to add IPv6=%pI6c addr for %s intf\n",
901 ip6_addr, ipvlan->dev->name);
Paolo Abeni82308192018-02-28 10:59:27 +0100902 else
903 ret = ipvlan_add_addr(ipvlan, ip6_addr, true);
904 spin_unlock_bh(&ipvlan->addrs_lock);
905 return ret;
Gao Feng86673982016-12-28 16:46:51 +0800906}
907
908static void ipvlan_del_addr6(struct ipvl_dev *ipvlan, struct in6_addr *ip6_addr)
909{
910 return ipvlan_del_addr(ipvlan, ip6_addr, true);
911}
912
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800913static int ipvlan_addr6_event(struct notifier_block *unused,
914 unsigned long event, void *ptr)
915{
916 struct inet6_ifaddr *if6 = (struct inet6_ifaddr *)ptr;
917 struct net_device *dev = (struct net_device *)if6->idev->dev;
918 struct ipvl_dev *ipvlan = netdev_priv(dev);
919
Gao Feng5e51fe62017-12-01 16:33:03 +0800920 if (!ipvlan_is_valid_dev(dev))
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800921 return NOTIFY_DONE;
922
923 switch (event) {
924 case NETDEV_UP:
925 if (ipvlan_add_addr6(ipvlan, &if6->addr))
926 return NOTIFY_BAD;
927 break;
928
929 case NETDEV_DOWN:
930 ipvlan_del_addr6(ipvlan, &if6->addr);
931 break;
932 }
933
934 return NOTIFY_OK;
935}
936
Krister Johansen3ad7d242017-06-08 13:12:14 -0700937static int ipvlan_addr6_validator_event(struct notifier_block *unused,
938 unsigned long event, void *ptr)
939{
940 struct in6_validator_info *i6vi = (struct in6_validator_info *)ptr;
941 struct net_device *dev = (struct net_device *)i6vi->i6vi_dev->dev;
942 struct ipvl_dev *ipvlan = netdev_priv(dev);
943
Gao Feng5e51fe62017-12-01 16:33:03 +0800944 if (!ipvlan_is_valid_dev(dev))
Krister Johansen3ad7d242017-06-08 13:12:14 -0700945 return NOTIFY_DONE;
946
947 switch (event) {
948 case NETDEV_UP:
David Ahernde95e042017-10-18 09:56:54 -0700949 if (ipvlan_addr_busy(ipvlan->port, &i6vi->i6vi_addr, true)) {
950 NL_SET_ERR_MSG(i6vi->extack,
951 "Address already assigned to an ipvlan device");
Krister Johansen3ad7d242017-06-08 13:12:14 -0700952 return notifier_from_errno(-EADDRINUSE);
David Ahernde95e042017-10-18 09:56:54 -0700953 }
Krister Johansen3ad7d242017-06-08 13:12:14 -0700954 break;
955 }
956
957 return NOTIFY_OK;
958}
Matteo Croce94333fa2018-02-21 01:31:13 +0100959#endif
Krister Johansen3ad7d242017-06-08 13:12:14 -0700960
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800961static int ipvlan_add_addr4(struct ipvl_dev *ipvlan, struct in_addr *ip4_addr)
962{
Paolo Abeni82308192018-02-28 10:59:27 +0100963 int ret = -EINVAL;
964
965 spin_lock_bh(&ipvlan->addrs_lock);
966 if (ipvlan_addr_busy(ipvlan->port, ip4_addr, false))
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800967 netif_err(ipvlan, ifup, ipvlan->dev,
968 "Failed to add IPv4=%pI4 on %s intf.\n",
969 ip4_addr, ipvlan->dev->name);
Paolo Abeni82308192018-02-28 10:59:27 +0100970 else
971 ret = ipvlan_add_addr(ipvlan, ip4_addr, false);
972 spin_unlock_bh(&ipvlan->addrs_lock);
973 return ret;
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800974}
975
976static void ipvlan_del_addr4(struct ipvl_dev *ipvlan, struct in_addr *ip4_addr)
977{
Gao Feng86673982016-12-28 16:46:51 +0800978 return ipvlan_del_addr(ipvlan, ip4_addr, false);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800979}
980
981static int ipvlan_addr4_event(struct notifier_block *unused,
982 unsigned long event, void *ptr)
983{
984 struct in_ifaddr *if4 = (struct in_ifaddr *)ptr;
985 struct net_device *dev = (struct net_device *)if4->ifa_dev->dev;
986 struct ipvl_dev *ipvlan = netdev_priv(dev);
987 struct in_addr ip4_addr;
988
Gao Feng5e51fe62017-12-01 16:33:03 +0800989 if (!ipvlan_is_valid_dev(dev))
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -0800990 return NOTIFY_DONE;
991
992 switch (event) {
993 case NETDEV_UP:
994 ip4_addr.s_addr = if4->ifa_address;
995 if (ipvlan_add_addr4(ipvlan, &ip4_addr))
996 return NOTIFY_BAD;
997 break;
998
999 case NETDEV_DOWN:
1000 ip4_addr.s_addr = if4->ifa_address;
1001 ipvlan_del_addr4(ipvlan, &ip4_addr);
1002 break;
1003 }
1004
1005 return NOTIFY_OK;
1006}
1007
Krister Johansen3ad7d242017-06-08 13:12:14 -07001008static int ipvlan_addr4_validator_event(struct notifier_block *unused,
1009 unsigned long event, void *ptr)
1010{
1011 struct in_validator_info *ivi = (struct in_validator_info *)ptr;
1012 struct net_device *dev = (struct net_device *)ivi->ivi_dev->dev;
1013 struct ipvl_dev *ipvlan = netdev_priv(dev);
1014
Gao Feng5e51fe62017-12-01 16:33:03 +08001015 if (!ipvlan_is_valid_dev(dev))
Krister Johansen3ad7d242017-06-08 13:12:14 -07001016 return NOTIFY_DONE;
1017
1018 switch (event) {
1019 case NETDEV_UP:
David Ahernde95e042017-10-18 09:56:54 -07001020 if (ipvlan_addr_busy(ipvlan->port, &ivi->ivi_addr, false)) {
1021 NL_SET_ERR_MSG(ivi->extack,
1022 "Address already assigned to an ipvlan device");
Krister Johansen3ad7d242017-06-08 13:12:14 -07001023 return notifier_from_errno(-EADDRINUSE);
David Ahernde95e042017-10-18 09:56:54 -07001024 }
Krister Johansen3ad7d242017-06-08 13:12:14 -07001025 break;
1026 }
1027
1028 return NOTIFY_OK;
1029}
1030
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001031static struct notifier_block ipvlan_addr4_notifier_block __read_mostly = {
1032 .notifier_call = ipvlan_addr4_event,
1033};
1034
Krister Johansen3ad7d242017-06-08 13:12:14 -07001035static struct notifier_block ipvlan_addr4_vtor_notifier_block __read_mostly = {
1036 .notifier_call = ipvlan_addr4_validator_event,
1037};
1038
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001039static struct notifier_block ipvlan_notifier_block __read_mostly = {
1040 .notifier_call = ipvlan_device_event,
1041};
1042
Matteo Croce94333fa2018-02-21 01:31:13 +01001043#if IS_ENABLED(CONFIG_IPV6)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001044static struct notifier_block ipvlan_addr6_notifier_block __read_mostly = {
1045 .notifier_call = ipvlan_addr6_event,
1046};
1047
Krister Johansen3ad7d242017-06-08 13:12:14 -07001048static struct notifier_block ipvlan_addr6_vtor_notifier_block __read_mostly = {
1049 .notifier_call = ipvlan_addr6_validator_event,
1050};
Matteo Croce94333fa2018-02-21 01:31:13 +01001051#endif
Krister Johansen3ad7d242017-06-08 13:12:14 -07001052
Florian Westphal31338222017-04-20 18:08:15 +02001053static void ipvlan_ns_exit(struct net *net)
1054{
1055 struct ipvlan_netns *vnet = net_generic(net, ipvlan_netid);
1056
1057 if (WARN_ON_ONCE(vnet->ipvl_nf_hook_refcnt)) {
1058 vnet->ipvl_nf_hook_refcnt = 0;
1059 nf_unregister_net_hooks(net, ipvl_nfops,
1060 ARRAY_SIZE(ipvl_nfops));
1061 }
1062}
1063
1064static struct pernet_operations ipvlan_net_ops = {
1065 .id = &ipvlan_netid,
1066 .size = sizeof(struct ipvlan_netns),
1067 .exit = ipvlan_ns_exit,
1068};
1069
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001070static int __init ipvlan_init_module(void)
1071{
1072 int err;
1073
1074 ipvlan_init_secret();
1075 register_netdevice_notifier(&ipvlan_notifier_block);
Matteo Croce94333fa2018-02-21 01:31:13 +01001076#if IS_ENABLED(CONFIG_IPV6)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001077 register_inet6addr_notifier(&ipvlan_addr6_notifier_block);
Krister Johansen3ad7d242017-06-08 13:12:14 -07001078 register_inet6addr_validator_notifier(
1079 &ipvlan_addr6_vtor_notifier_block);
Matteo Croce94333fa2018-02-21 01:31:13 +01001080#endif
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001081 register_inetaddr_notifier(&ipvlan_addr4_notifier_block);
Krister Johansen3ad7d242017-06-08 13:12:14 -07001082 register_inetaddr_validator_notifier(&ipvlan_addr4_vtor_notifier_block);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001083
Florian Westphal31338222017-04-20 18:08:15 +02001084 err = register_pernet_subsys(&ipvlan_net_ops);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001085 if (err < 0)
1086 goto error;
1087
Florian Westphal31338222017-04-20 18:08:15 +02001088 err = ipvlan_link_register(&ipvlan_link_ops);
1089 if (err < 0) {
1090 unregister_pernet_subsys(&ipvlan_net_ops);
1091 goto error;
1092 }
1093
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001094 return 0;
1095error:
1096 unregister_inetaddr_notifier(&ipvlan_addr4_notifier_block);
Krister Johansen3ad7d242017-06-08 13:12:14 -07001097 unregister_inetaddr_validator_notifier(
1098 &ipvlan_addr4_vtor_notifier_block);
Matteo Croce94333fa2018-02-21 01:31:13 +01001099#if IS_ENABLED(CONFIG_IPV6)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001100 unregister_inet6addr_notifier(&ipvlan_addr6_notifier_block);
Krister Johansen3ad7d242017-06-08 13:12:14 -07001101 unregister_inet6addr_validator_notifier(
1102 &ipvlan_addr6_vtor_notifier_block);
Matteo Croce94333fa2018-02-21 01:31:13 +01001103#endif
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001104 unregister_netdevice_notifier(&ipvlan_notifier_block);
1105 return err;
1106}
1107
1108static void __exit ipvlan_cleanup_module(void)
1109{
1110 rtnl_link_unregister(&ipvlan_link_ops);
Florian Westphal31338222017-04-20 18:08:15 +02001111 unregister_pernet_subsys(&ipvlan_net_ops);
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001112 unregister_netdevice_notifier(&ipvlan_notifier_block);
1113 unregister_inetaddr_notifier(&ipvlan_addr4_notifier_block);
Krister Johansen3ad7d242017-06-08 13:12:14 -07001114 unregister_inetaddr_validator_notifier(
1115 &ipvlan_addr4_vtor_notifier_block);
Matteo Croce94333fa2018-02-21 01:31:13 +01001116#if IS_ENABLED(CONFIG_IPV6)
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001117 unregister_inet6addr_notifier(&ipvlan_addr6_notifier_block);
Krister Johansen3ad7d242017-06-08 13:12:14 -07001118 unregister_inet6addr_validator_notifier(
1119 &ipvlan_addr6_vtor_notifier_block);
Matteo Croce94333fa2018-02-21 01:31:13 +01001120#endif
Mahesh Bandewar2ad7bf32014-11-23 23:07:46 -08001121}
1122
1123module_init(ipvlan_init_module);
1124module_exit(ipvlan_cleanup_module);
1125
1126MODULE_LICENSE("GPL");
1127MODULE_AUTHOR("Mahesh Bandewar <maheshb@google.com>");
1128MODULE_DESCRIPTION("Driver for L3 (IPv6/IPv4) based VLANs");
1129MODULE_ALIAS_RTNL_LINK("ipvlan");