Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* |
| 2 | * Anycast support for IPv6 |
YOSHIFUJI Hideaki | 1ab1457 | 2007-02-09 23:24:49 +0900 | [diff] [blame] | 3 | * Linux INET6 implementation |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 4 | * |
| 5 | * Authors: |
| 6 | * David L Stevens (dlstevens@us.ibm.com) |
| 7 | * |
| 8 | * based heavily on net/ipv6/mcast.c |
| 9 | * |
| 10 | * This program is free software; you can redistribute it and/or |
| 11 | * modify it under the terms of the GNU General Public License |
| 12 | * as published by the Free Software Foundation; either version |
| 13 | * 2 of the License, or (at your option) any later version. |
| 14 | */ |
| 15 | |
Randy Dunlap | 4fc268d | 2006-01-11 12:17:47 -0800 | [diff] [blame] | 16 | #include <linux/capability.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 17 | #include <linux/module.h> |
| 18 | #include <linux/errno.h> |
| 19 | #include <linux/types.h> |
| 20 | #include <linux/random.h> |
| 21 | #include <linux/string.h> |
| 22 | #include <linux/socket.h> |
| 23 | #include <linux/sockios.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 24 | #include <linux/net.h> |
| 25 | #include <linux/in6.h> |
| 26 | #include <linux/netdevice.h> |
| 27 | #include <linux/if_arp.h> |
| 28 | #include <linux/route.h> |
| 29 | #include <linux/init.h> |
| 30 | #include <linux/proc_fs.h> |
| 31 | #include <linux/seq_file.h> |
Tejun Heo | 5a0e3ad | 2010-03-24 17:04:11 +0900 | [diff] [blame] | 32 | #include <linux/slab.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 33 | |
Eric W. Biederman | 457c4cb | 2007-09-12 12:01:34 +0200 | [diff] [blame] | 34 | #include <net/net_namespace.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 35 | #include <net/sock.h> |
| 36 | #include <net/snmp.h> |
| 37 | |
| 38 | #include <net/ipv6.h> |
| 39 | #include <net/protocol.h> |
| 40 | #include <net/if_inet6.h> |
| 41 | #include <net/ndisc.h> |
| 42 | #include <net/addrconf.h> |
| 43 | #include <net/ip6_route.h> |
| 44 | |
| 45 | #include <net/checksum.h> |
| 46 | |
/* Global anycast address hash table.
 *
 * The table has BIT(IN6_ADDR_HSIZE_SHIFT) buckets; the bucket index is
 * produced by inet6_acaddr_hash(). Entries are added and removed under
 * acaddr_hash_lock using the RCU hlist helpers.
 */
#define IN6_ADDR_HSIZE_SHIFT	8
#define IN6_ADDR_HSIZE		BIT(IN6_ADDR_HSIZE_SHIFT)
static struct hlist_head inet6_acaddr_lst[IN6_ADDR_HSIZE];
static DEFINE_SPINLOCK(acaddr_hash_lock);

/* Forward declaration: used by the socket-level drop/close paths. */
static int ipv6_dev_ac_dec(struct net_device *dev, const struct in6_addr *addr);
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 55 | |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 56 | static u32 inet6_acaddr_hash(struct net *net, const struct in6_addr *addr) |
| 57 | { |
| 58 | u32 val = ipv6_addr_hash(addr) ^ net_hash_mix(net); |
| 59 | |
| 60 | return hash_32(val, IN6_ADDR_HSIZE_SHIFT); |
| 61 | } |
| 62 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 63 | /* |
| 64 | * socket join an anycast group |
| 65 | */ |
| 66 | |
Eric Dumazet | b71d1d4 | 2011-04-22 04:53:02 +0000 | [diff] [blame] | 67 | int ipv6_sock_ac_join(struct sock *sk, int ifindex, const struct in6_addr *addr) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 68 | { |
| 69 | struct ipv6_pinfo *np = inet6_sk(sk); |
| 70 | struct net_device *dev = NULL; |
| 71 | struct inet6_dev *idev; |
| 72 | struct ipv6_ac_socklist *pac; |
Daniel Lezcano | 6ab57e7 | 2008-03-26 16:52:32 -0700 | [diff] [blame] | 73 | struct net *net = sock_net(sk); |
YOSHIFUJI Hideaki | 53b7997 | 2008-07-19 22:35:03 -0700 | [diff] [blame] | 74 | int ishost = !net->ipv6.devconf_all->forwarding; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 75 | int err = 0; |
| 76 | |
Marcelo Ricardo Leitner | c4a6853 | 2015-03-20 11:37:17 -0300 | [diff] [blame] | 77 | ASSERT_RTNL(); |
| 78 | |
Eric W. Biederman | af31f41 | 2012-11-16 03:03:06 +0000 | [diff] [blame] | 79 | if (!ns_capable(net->user_ns, CAP_NET_ADMIN)) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 80 | return -EPERM; |
| 81 | if (ipv6_addr_is_multicast(addr)) |
| 82 | return -EINVAL; |
David Ahern | 232378e | 2018-03-13 08:29:37 -0700 | [diff] [blame] | 83 | |
| 84 | if (ifindex) |
| 85 | dev = __dev_get_by_index(net, ifindex); |
| 86 | |
| 87 | if (ipv6_chk_addr_and_flags(net, addr, dev, true, 0, IFA_F_TENTATIVE)) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 88 | return -EINVAL; |
| 89 | |
| 90 | pac = sock_kmalloc(sk, sizeof(struct ipv6_ac_socklist), GFP_KERNEL); |
Ian Morris | 63159f2 | 2015-03-29 14:00:04 +0100 | [diff] [blame] | 91 | if (!pac) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 92 | return -ENOMEM; |
| 93 | pac->acl_next = NULL; |
Alexey Dobriyan | 4e3fd7a | 2011-11-21 03:39:03 +0000 | [diff] [blame] | 94 | pac->acl_addr = *addr; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 95 | |
| 96 | if (ifindex == 0) { |
| 97 | struct rt6_info *rt; |
| 98 | |
David Ahern | b75cc8f | 2018-03-02 08:32:17 -0800 | [diff] [blame] | 99 | rt = rt6_lookup(net, addr, NULL, 0, NULL, 0); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 100 | if (rt) { |
David S. Miller | d191854 | 2011-12-28 20:19:20 -0500 | [diff] [blame] | 101 | dev = rt->dst.dev; |
Amerigo Wang | 94e187c | 2012-10-29 00:13:19 +0000 | [diff] [blame] | 102 | ip6_rt_put(rt); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 103 | } else if (ishost) { |
| 104 | err = -EADDRNOTAVAIL; |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 105 | goto error; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 106 | } else { |
| 107 | /* router, no matching interface: just pick one */ |
WANG Cong | 6c55549 | 2014-09-11 15:35:09 -0700 | [diff] [blame] | 108 | dev = __dev_get_by_flags(net, IFF_UP, |
| 109 | IFF_UP | IFF_LOOPBACK); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 110 | } |
David Ahern | 232378e | 2018-03-13 08:29:37 -0700 | [diff] [blame] | 111 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 112 | |
Ian Morris | 63159f2 | 2015-03-29 14:00:04 +0100 | [diff] [blame] | 113 | if (!dev) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 114 | err = -ENODEV; |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 115 | goto error; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 116 | } |
| 117 | |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 118 | idev = __in6_dev_get(dev); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 119 | if (!idev) { |
| 120 | if (ifindex) |
| 121 | err = -ENODEV; |
| 122 | else |
| 123 | err = -EADDRNOTAVAIL; |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 124 | goto error; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 125 | } |
| 126 | /* reset ishost, now that we have a specific device */ |
| 127 | ishost = !idev->cnf.forwarding; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 128 | |
| 129 | pac->acl_ifindex = dev->ifindex; |
| 130 | |
| 131 | /* XXX |
| 132 | * For hosts, allow link-local or matching prefix anycasts. |
| 133 | * This obviates the need for propagating anycast routes while |
| 134 | * still allowing some non-router anycast participation. |
| 135 | */ |
YOSHIFUJI Hideaki | 52eeeb8 | 2008-03-15 22:54:23 -0400 | [diff] [blame] | 136 | if (!ipv6_chk_prefix(addr, dev)) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 137 | if (ishost) |
| 138 | err = -EADDRNOTAVAIL; |
| 139 | if (err) |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 140 | goto error; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 141 | } |
| 142 | |
WANG Cong | 013b4d9 | 2014-09-11 15:35:11 -0700 | [diff] [blame] | 143 | err = __ipv6_dev_ac_inc(idev, addr); |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 144 | if (!err) { |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 145 | pac->acl_next = np->ipv6_ac_list; |
| 146 | np->ipv6_ac_list = pac; |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 147 | pac = NULL; |
| 148 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 149 | |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 150 | error: |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 151 | if (pac) |
| 152 | sock_kfree_s(sk, pac, sizeof(*pac)); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 153 | return err; |
| 154 | } |
| 155 | |
| 156 | /* |
| 157 | * socket leave an anycast group |
| 158 | */ |
Eric Dumazet | b71d1d4 | 2011-04-22 04:53:02 +0000 | [diff] [blame] | 159 | int ipv6_sock_ac_drop(struct sock *sk, int ifindex, const struct in6_addr *addr) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 160 | { |
| 161 | struct ipv6_pinfo *np = inet6_sk(sk); |
| 162 | struct net_device *dev; |
| 163 | struct ipv6_ac_socklist *pac, *prev_pac; |
Daniel Lezcano | 6ab57e7 | 2008-03-26 16:52:32 -0700 | [diff] [blame] | 164 | struct net *net = sock_net(sk); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 165 | |
Marcelo Ricardo Leitner | c4a6853 | 2015-03-20 11:37:17 -0300 | [diff] [blame] | 166 | ASSERT_RTNL(); |
| 167 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 168 | prev_pac = NULL; |
| 169 | for (pac = np->ipv6_ac_list; pac; pac = pac->acl_next) { |
| 170 | if ((ifindex == 0 || pac->acl_ifindex == ifindex) && |
| 171 | ipv6_addr_equal(&pac->acl_addr, addr)) |
| 172 | break; |
| 173 | prev_pac = pac; |
| 174 | } |
Marcelo Ricardo Leitner | c4a6853 | 2015-03-20 11:37:17 -0300 | [diff] [blame] | 175 | if (!pac) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 176 | return -ENOENT; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 177 | if (prev_pac) |
| 178 | prev_pac->acl_next = pac->acl_next; |
| 179 | else |
| 180 | np->ipv6_ac_list = pac->acl_next; |
| 181 | |
WANG Cong | 6c55549 | 2014-09-11 15:35:09 -0700 | [diff] [blame] | 182 | dev = __dev_get_by_index(net, pac->acl_ifindex); |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 183 | if (dev) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 184 | ipv6_dev_ac_dec(dev, &pac->acl_addr); |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 185 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 186 | sock_kfree_s(sk, pac, sizeof(*pac)); |
| 187 | return 0; |
| 188 | } |
| 189 | |
| 190 | void ipv6_sock_ac_close(struct sock *sk) |
| 191 | { |
| 192 | struct ipv6_pinfo *np = inet6_sk(sk); |
| 193 | struct net_device *dev = NULL; |
| 194 | struct ipv6_ac_socklist *pac; |
Daniel Lezcano | 6ab57e7 | 2008-03-26 16:52:32 -0700 | [diff] [blame] | 195 | struct net *net = sock_net(sk); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 196 | int prev_index; |
| 197 | |
Eric Dumazet | 0e1efe9 | 2012-12-05 09:18:10 +0000 | [diff] [blame] | 198 | if (!np->ipv6_ac_list) |
| 199 | return; |
| 200 | |
WANG Cong | b03a9c0 | 2014-09-11 15:35:10 -0700 | [diff] [blame] | 201 | rtnl_lock(); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 202 | pac = np->ipv6_ac_list; |
| 203 | np->ipv6_ac_list = NULL; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 204 | |
| 205 | prev_index = 0; |
| 206 | while (pac) { |
| 207 | struct ipv6_ac_socklist *next = pac->acl_next; |
| 208 | |
| 209 | if (pac->acl_ifindex != prev_index) { |
WANG Cong | 6c55549 | 2014-09-11 15:35:09 -0700 | [diff] [blame] | 210 | dev = __dev_get_by_index(net, pac->acl_ifindex); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 211 | prev_index = pac->acl_ifindex; |
| 212 | } |
| 213 | if (dev) |
| 214 | ipv6_dev_ac_dec(dev, &pac->acl_addr); |
| 215 | sock_kfree_s(sk, pac, sizeof(*pac)); |
| 216 | pac = next; |
| 217 | } |
Sabrina Dubroca | a9ed4a2 | 2014-09-02 10:29:29 +0200 | [diff] [blame] | 218 | rtnl_unlock(); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 219 | } |
| 220 | |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 221 | static void ipv6_add_acaddr_hash(struct net *net, struct ifacaddr6 *aca) |
| 222 | { |
| 223 | unsigned int hash = inet6_acaddr_hash(net, &aca->aca_addr); |
| 224 | |
| 225 | spin_lock(&acaddr_hash_lock); |
| 226 | hlist_add_head_rcu(&aca->aca_addr_lst, &inet6_acaddr_lst[hash]); |
| 227 | spin_unlock(&acaddr_hash_lock); |
| 228 | } |
| 229 | |
/* Unlink @aca from the global anycast hash table, under acaddr_hash_lock. */
static void ipv6_del_acaddr_hash(struct ifacaddr6 *aca)
{
	spin_lock(&acaddr_hash_lock);
	hlist_del_init_rcu(&aca->aca_addr_lst);
	spin_unlock(&acaddr_hash_lock);
}
| 236 | |
/* Take an additional reference on @aca. */
static void aca_get(struct ifacaddr6 *aca)
{
	refcount_inc(&aca->aca_refcnt);
}
| 241 | |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 242 | static void aca_free_rcu(struct rcu_head *h) |
| 243 | { |
| 244 | struct ifacaddr6 *aca = container_of(h, struct ifacaddr6, rcu); |
| 245 | |
| 246 | fib6_info_release(aca->aca_rt); |
| 247 | kfree(aca); |
| 248 | } |
| 249 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 250 | static void aca_put(struct ifacaddr6 *ac) |
| 251 | { |
Reshetova, Elena | affa78b | 2017-07-04 09:34:58 +0300 | [diff] [blame] | 252 | if (refcount_dec_and_test(&ac->aca_refcnt)) { |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 253 | call_rcu(&ac->rcu, aca_free_rcu); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 254 | } |
| 255 | } |
| 256 | |
David Ahern | 93c2fb2 | 2018-04-18 15:38:59 -0700 | [diff] [blame] | 257 | static struct ifacaddr6 *aca_alloc(struct fib6_info *f6i, |
WANG Cong | 83aa29e | 2014-09-11 15:35:12 -0700 | [diff] [blame] | 258 | const struct in6_addr *addr) |
| 259 | { |
WANG Cong | 83aa29e | 2014-09-11 15:35:12 -0700 | [diff] [blame] | 260 | struct ifacaddr6 *aca; |
| 261 | |
| 262 | aca = kzalloc(sizeof(*aca), GFP_ATOMIC); |
Ian Morris | 63159f2 | 2015-03-29 14:00:04 +0100 | [diff] [blame] | 263 | if (!aca) |
WANG Cong | 83aa29e | 2014-09-11 15:35:12 -0700 | [diff] [blame] | 264 | return NULL; |
| 265 | |
| 266 | aca->aca_addr = *addr; |
David Ahern | 93c2fb2 | 2018-04-18 15:38:59 -0700 | [diff] [blame] | 267 | fib6_info_hold(f6i); |
| 268 | aca->aca_rt = f6i; |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 269 | INIT_HLIST_NODE(&aca->aca_addr_lst); |
WANG Cong | 83aa29e | 2014-09-11 15:35:12 -0700 | [diff] [blame] | 270 | aca->aca_users = 1; |
| 271 | /* aca_tstamp should be updated upon changes */ |
| 272 | aca->aca_cstamp = aca->aca_tstamp = jiffies; |
Reshetova, Elena | affa78b | 2017-07-04 09:34:58 +0300 | [diff] [blame] | 273 | refcount_set(&aca->aca_refcnt, 1); |
WANG Cong | 83aa29e | 2014-09-11 15:35:12 -0700 | [diff] [blame] | 274 | |
| 275 | return aca; |
| 276 | } |
| 277 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 278 | /* |
| 279 | * device anycast group inc (add if not found) |
| 280 | */ |
WANG Cong | 013b4d9 | 2014-09-11 15:35:11 -0700 | [diff] [blame] | 281 | int __ipv6_dev_ac_inc(struct inet6_dev *idev, const struct in6_addr *addr) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 282 | { |
| 283 | struct ifacaddr6 *aca; |
David Ahern | 360a988 | 2018-04-18 15:39:00 -0700 | [diff] [blame] | 284 | struct fib6_info *f6i; |
David Ahern | afb1d4b5 | 2018-04-17 17:33:11 -0700 | [diff] [blame] | 285 | struct net *net; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 286 | int err; |
| 287 | |
Sabrina Dubroca | a9ed4a2 | 2014-09-02 10:29:29 +0200 | [diff] [blame] | 288 | ASSERT_RTNL(); |
| 289 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 290 | write_lock_bh(&idev->lock); |
| 291 | if (idev->dead) { |
| 292 | err = -ENODEV; |
| 293 | goto out; |
| 294 | } |
| 295 | |
| 296 | for (aca = idev->ac_list; aca; aca = aca->aca_next) { |
| 297 | if (ipv6_addr_equal(&aca->aca_addr, addr)) { |
| 298 | aca->aca_users++; |
| 299 | err = 0; |
| 300 | goto out; |
| 301 | } |
| 302 | } |
| 303 | |
David Ahern | afb1d4b5 | 2018-04-17 17:33:11 -0700 | [diff] [blame] | 304 | net = dev_net(idev->dev); |
David Ahern | 360a988 | 2018-04-18 15:39:00 -0700 | [diff] [blame] | 305 | f6i = addrconf_f6i_alloc(net, idev, addr, true, GFP_ATOMIC); |
| 306 | if (IS_ERR(f6i)) { |
| 307 | err = PTR_ERR(f6i); |
WANG Cong | 83aa29e | 2014-09-11 15:35:12 -0700 | [diff] [blame] | 308 | goto out; |
| 309 | } |
David Ahern | 360a988 | 2018-04-18 15:39:00 -0700 | [diff] [blame] | 310 | aca = aca_alloc(f6i, addr); |
Ian Morris | 63159f2 | 2015-03-29 14:00:04 +0100 | [diff] [blame] | 311 | if (!aca) { |
David Ahern | 360a988 | 2018-04-18 15:39:00 -0700 | [diff] [blame] | 312 | fib6_info_release(f6i); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 313 | err = -ENOMEM; |
| 314 | goto out; |
| 315 | } |
| 316 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 317 | aca->aca_next = idev->ac_list; |
| 318 | idev->ac_list = aca; |
WANG Cong | 83aa29e | 2014-09-11 15:35:12 -0700 | [diff] [blame] | 319 | |
| 320 | /* Hold this for addrconf_join_solict() below before we unlock, |
| 321 | * it is already exposed via idev->ac_list. |
| 322 | */ |
| 323 | aca_get(aca); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 324 | write_unlock_bh(&idev->lock); |
| 325 | |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 326 | ipv6_add_acaddr_hash(net, aca); |
| 327 | |
David Ahern | 360a988 | 2018-04-18 15:39:00 -0700 | [diff] [blame] | 328 | ip6_ins_rt(net, f6i); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 329 | |
WANG Cong | 013b4d9 | 2014-09-11 15:35:11 -0700 | [diff] [blame] | 330 | addrconf_join_solict(idev->dev, &aca->aca_addr); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 331 | |
| 332 | aca_put(aca); |
| 333 | return 0; |
| 334 | out: |
| 335 | write_unlock_bh(&idev->lock); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 336 | return err; |
| 337 | } |
| 338 | |
| 339 | /* |
| 340 | * device anycast group decrement |
| 341 | */ |
Eric Dumazet | b71d1d4 | 2011-04-22 04:53:02 +0000 | [diff] [blame] | 342 | int __ipv6_dev_ac_dec(struct inet6_dev *idev, const struct in6_addr *addr) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 343 | { |
| 344 | struct ifacaddr6 *aca, *prev_aca; |
| 345 | |
Sabrina Dubroca | a9ed4a2 | 2014-09-02 10:29:29 +0200 | [diff] [blame] | 346 | ASSERT_RTNL(); |
| 347 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 348 | write_lock_bh(&idev->lock); |
| 349 | prev_aca = NULL; |
| 350 | for (aca = idev->ac_list; aca; aca = aca->aca_next) { |
| 351 | if (ipv6_addr_equal(&aca->aca_addr, addr)) |
| 352 | break; |
| 353 | prev_aca = aca; |
| 354 | } |
| 355 | if (!aca) { |
| 356 | write_unlock_bh(&idev->lock); |
| 357 | return -ENOENT; |
| 358 | } |
| 359 | if (--aca->aca_users > 0) { |
| 360 | write_unlock_bh(&idev->lock); |
| 361 | return 0; |
| 362 | } |
| 363 | if (prev_aca) |
| 364 | prev_aca->aca_next = aca->aca_next; |
| 365 | else |
| 366 | idev->ac_list = aca->aca_next; |
| 367 | write_unlock_bh(&idev->lock); |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 368 | ipv6_del_acaddr_hash(aca); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 369 | addrconf_leave_solict(idev, &aca->aca_addr); |
| 370 | |
David Ahern | afb1d4b5 | 2018-04-17 17:33:11 -0700 | [diff] [blame] | 371 | ip6_del_rt(dev_net(idev->dev), aca->aca_rt); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 372 | |
| 373 | aca_put(aca); |
| 374 | return 0; |
| 375 | } |
| 376 | |
WANG Cong | 6c55549 | 2014-09-11 15:35:09 -0700 | [diff] [blame] | 377 | /* called with rtnl_lock() */ |
Eric Dumazet | b71d1d4 | 2011-04-22 04:53:02 +0000 | [diff] [blame] | 378 | static int ipv6_dev_ac_dec(struct net_device *dev, const struct in6_addr *addr) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 379 | { |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 380 | struct inet6_dev *idev = __in6_dev_get(dev); |
| 381 | |
Ian Morris | 63159f2 | 2015-03-29 14:00:04 +0100 | [diff] [blame] | 382 | if (!idev) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 383 | return -ENODEV; |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 384 | return __ipv6_dev_ac_dec(idev, addr); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 385 | } |
YOSHIFUJI Hideaki | 1ab1457 | 2007-02-09 23:24:49 +0900 | [diff] [blame] | 386 | |
Sabrina Dubroca | 381f4dc | 2014-09-10 23:23:02 +0200 | [diff] [blame] | 387 | void ipv6_ac_destroy_dev(struct inet6_dev *idev) |
| 388 | { |
| 389 | struct ifacaddr6 *aca; |
| 390 | |
| 391 | write_lock_bh(&idev->lock); |
| 392 | while ((aca = idev->ac_list) != NULL) { |
| 393 | idev->ac_list = aca->aca_next; |
| 394 | write_unlock_bh(&idev->lock); |
| 395 | |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 396 | ipv6_del_acaddr_hash(aca); |
| 397 | |
Sabrina Dubroca | 381f4dc | 2014-09-10 23:23:02 +0200 | [diff] [blame] | 398 | addrconf_leave_solict(idev, &aca->aca_addr); |
| 399 | |
David Ahern | afb1d4b5 | 2018-04-17 17:33:11 -0700 | [diff] [blame] | 400 | ip6_del_rt(dev_net(idev->dev), aca->aca_rt); |
Sabrina Dubroca | 381f4dc | 2014-09-10 23:23:02 +0200 | [diff] [blame] | 401 | |
| 402 | aca_put(aca); |
| 403 | |
| 404 | write_lock_bh(&idev->lock); |
| 405 | } |
| 406 | write_unlock_bh(&idev->lock); |
| 407 | } |
| 408 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 409 | /* |
| 410 | * check if the interface has this anycast address |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 411 | * called with rcu_read_lock() |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 412 | */ |
Eric Dumazet | a50feda | 2012-05-18 18:57:34 +0000 | [diff] [blame] | 413 | static bool ipv6_chk_acast_dev(struct net_device *dev, const struct in6_addr *addr) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 414 | { |
| 415 | struct inet6_dev *idev; |
| 416 | struct ifacaddr6 *aca; |
| 417 | |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 418 | idev = __in6_dev_get(dev); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 419 | if (idev) { |
| 420 | read_lock_bh(&idev->lock); |
| 421 | for (aca = idev->ac_list; aca; aca = aca->aca_next) |
| 422 | if (ipv6_addr_equal(&aca->aca_addr, addr)) |
| 423 | break; |
| 424 | read_unlock_bh(&idev->lock); |
Stephen Hemminger | cfcabdc | 2007-10-09 01:59:42 -0700 | [diff] [blame] | 425 | return aca != NULL; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 426 | } |
Eric Dumazet | a50feda | 2012-05-18 18:57:34 +0000 | [diff] [blame] | 427 | return false; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 428 | } |
| 429 | |
| 430 | /* |
| 431 | * check if given interface (or any, if dev==0) has this anycast address |
| 432 | */ |
Eric Dumazet | a50feda | 2012-05-18 18:57:34 +0000 | [diff] [blame] | 433 | bool ipv6_chk_acast_addr(struct net *net, struct net_device *dev, |
| 434 | const struct in6_addr *addr) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 435 | { |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 436 | unsigned int hash = inet6_acaddr_hash(net, addr); |
| 437 | struct net_device *nh_dev; |
| 438 | struct ifacaddr6 *aca; |
Eric Dumazet | a50feda | 2012-05-18 18:57:34 +0000 | [diff] [blame] | 439 | bool found = false; |
Pavel Emelianov | 7562f87 | 2007-05-03 15:13:45 -0700 | [diff] [blame] | 440 | |
Eric Dumazet | c6d14c8 | 2009-11-04 05:43:23 -0800 | [diff] [blame] | 441 | rcu_read_lock(); |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 442 | if (dev) |
| 443 | found = ipv6_chk_acast_dev(dev, addr); |
| 444 | else |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 445 | hlist_for_each_entry_rcu(aca, &inet6_acaddr_lst[hash], |
| 446 | aca_addr_lst) { |
| 447 | nh_dev = fib6_info_nh_dev(aca->aca_rt); |
| 448 | if (!nh_dev || !net_eq(dev_net(nh_dev), net)) |
| 449 | continue; |
| 450 | if (ipv6_addr_equal(&aca->aca_addr, addr)) { |
Eric Dumazet | a50feda | 2012-05-18 18:57:34 +0000 | [diff] [blame] | 451 | found = true; |
Eric Dumazet | bb69ae0 | 2010-06-07 11:42:13 +0000 | [diff] [blame] | 452 | break; |
| 453 | } |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 454 | } |
Eric Dumazet | c6d14c8 | 2009-11-04 05:43:23 -0800 | [diff] [blame] | 455 | rcu_read_unlock(); |
Pavel Emelianov | 7562f87 | 2007-05-03 15:13:45 -0700 | [diff] [blame] | 456 | return found; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 457 | } |
| 458 | |
FX Le Bail | 7c90cc2 | 2014-01-22 07:42:37 +0100 | [diff] [blame] | 459 | /* check if this anycast address is link-local on given interface or |
| 460 | * is global |
| 461 | */ |
| 462 | bool ipv6_chk_acast_addr_src(struct net *net, struct net_device *dev, |
| 463 | const struct in6_addr *addr) |
| 464 | { |
| 465 | return ipv6_chk_acast_addr(net, |
| 466 | (ipv6_addr_type(addr) & IPV6_ADDR_LINKLOCAL ? |
| 467 | dev : NULL), |
| 468 | addr); |
| 469 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 470 | |
| 471 | #ifdef CONFIG_PROC_FS |
/* Iterator state for the "anycast6" seq_file. */
struct ac6_iter_state {
	struct seq_net_private p;
	/* device currently being walked */
	struct net_device *dev;
	/* inet6_dev whose lock the iterator currently read-holds, or NULL */
	struct inet6_dev *idev;
};

/* Fetch the iterator state stored in a seq_file's private pointer. */
#define ac6_seq_private(seq)	((struct ac6_iter_state *)(seq)->private)
| 479 | |
| 480 | static inline struct ifacaddr6 *ac6_get_first(struct seq_file *seq) |
| 481 | { |
| 482 | struct ifacaddr6 *im = NULL; |
| 483 | struct ac6_iter_state *state = ac6_seq_private(seq); |
Daniel Lezcano | 6ab57e7 | 2008-03-26 16:52:32 -0700 | [diff] [blame] | 484 | struct net *net = seq_file_net(seq); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 485 | |
Pavel Emelianov | 7562f87 | 2007-05-03 15:13:45 -0700 | [diff] [blame] | 486 | state->idev = NULL; |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 487 | for_each_netdev_rcu(net, state->dev) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 488 | struct inet6_dev *idev; |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 489 | idev = __in6_dev_get(state->dev); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 490 | if (!idev) |
| 491 | continue; |
| 492 | read_lock_bh(&idev->lock); |
| 493 | im = idev->ac_list; |
| 494 | if (im) { |
| 495 | state->idev = idev; |
| 496 | break; |
| 497 | } |
| 498 | read_unlock_bh(&idev->lock); |
| 499 | } |
| 500 | return im; |
| 501 | } |
| 502 | |
| 503 | static struct ifacaddr6 *ac6_get_next(struct seq_file *seq, struct ifacaddr6 *im) |
| 504 | { |
| 505 | struct ac6_iter_state *state = ac6_seq_private(seq); |
| 506 | |
| 507 | im = im->aca_next; |
| 508 | while (!im) { |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 509 | if (likely(state->idev != NULL)) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 510 | read_unlock_bh(&state->idev->lock); |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 511 | |
| 512 | state->dev = next_net_device_rcu(state->dev); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 513 | if (!state->dev) { |
| 514 | state->idev = NULL; |
| 515 | break; |
| 516 | } |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 517 | state->idev = __in6_dev_get(state->dev); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 518 | if (!state->idev) |
| 519 | continue; |
| 520 | read_lock_bh(&state->idev->lock); |
| 521 | im = state->idev->ac_list; |
| 522 | } |
| 523 | return im; |
| 524 | } |
| 525 | |
| 526 | static struct ifacaddr6 *ac6_get_idx(struct seq_file *seq, loff_t pos) |
| 527 | { |
| 528 | struct ifacaddr6 *im = ac6_get_first(seq); |
| 529 | if (im) |
| 530 | while (pos && (im = ac6_get_next(seq, im)) != NULL) |
| 531 | --pos; |
| 532 | return pos ? NULL : im; |
| 533 | } |
| 534 | |
| 535 | static void *ac6_seq_start(struct seq_file *seq, loff_t *pos) |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 536 | __acquires(RCU) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 537 | { |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 538 | rcu_read_lock(); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 539 | return ac6_get_idx(seq, *pos); |
| 540 | } |
| 541 | |
| 542 | static void *ac6_seq_next(struct seq_file *seq, void *v, loff_t *pos) |
| 543 | { |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 544 | struct ifacaddr6 *im = ac6_get_next(seq, v); |
| 545 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 546 | ++*pos; |
| 547 | return im; |
| 548 | } |
| 549 | |
| 550 | static void ac6_seq_stop(struct seq_file *seq, void *v) |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 551 | __releases(RCU) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 552 | { |
| 553 | struct ac6_iter_state *state = ac6_seq_private(seq); |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 554 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 555 | if (likely(state->idev != NULL)) { |
| 556 | read_unlock_bh(&state->idev->lock); |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 557 | state->idev = NULL; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 558 | } |
Eric Dumazet | ce81b76 | 2009-11-11 17:34:30 +0000 | [diff] [blame] | 559 | rcu_read_unlock(); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 560 | } |
| 561 | |
| 562 | static int ac6_seq_show(struct seq_file *seq, void *v) |
| 563 | { |
| 564 | struct ifacaddr6 *im = (struct ifacaddr6 *)v; |
| 565 | struct ac6_iter_state *state = ac6_seq_private(seq); |
| 566 | |
Harvey Harrison | 4b7a427 | 2008-10-29 12:50:24 -0700 | [diff] [blame] | 567 | seq_printf(seq, "%-4d %-15s %pi6 %5d\n", |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 568 | state->dev->ifindex, state->dev->name, |
Harvey Harrison | b071195 | 2008-10-28 16:05:40 -0700 | [diff] [blame] | 569 | &im->aca_addr, im->aca_users); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 570 | return 0; |
| 571 | } |
| 572 | |
/* seq_file callbacks backing the "anycast6" proc entry. */
static const struct seq_operations ac6_seq_ops = {
	.start	=	ac6_seq_start,
	.next	=	ac6_seq_next,
	.stop	=	ac6_seq_stop,
	.show	=	ac6_seq_show,
};
| 579 | |
Alexey Dobriyan | 2c8c1e7 | 2010-01-17 03:35:32 +0000 | [diff] [blame] | 580 | int __net_init ac6_proc_init(struct net *net) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 581 | { |
Christoph Hellwig | c350637 | 2018-04-10 19:42:55 +0200 | [diff] [blame] | 582 | if (!proc_create_net("anycast6", 0444, net->proc_net, &ac6_seq_ops, |
| 583 | sizeof(struct ac6_iter_state))) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 584 | return -ENOMEM; |
| 585 | |
| 586 | return 0; |
| 587 | } |
| 588 | |
Daniel Lezcano | 6ab57e7 | 2008-03-26 16:52:32 -0700 | [diff] [blame] | 589 | void ac6_proc_exit(struct net *net) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 590 | { |
Gao feng | ece31ff | 2013-02-18 01:34:56 +0000 | [diff] [blame] | 591 | remove_proc_entry("anycast6", net->proc_net); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 592 | } |
Jeff Barnhill | 2384d02 | 2018-11-02 20:23:57 +0000 | [diff] [blame^] | 593 | |
| 594 | /* Init / cleanup code |
| 595 | */ |
| 596 | int __init ipv6_anycast_init(void) |
| 597 | { |
| 598 | int i; |
| 599 | |
| 600 | for (i = 0; i < IN6_ADDR_HSIZE; i++) |
| 601 | INIT_HLIST_HEAD(&inet6_acaddr_lst[i]); |
| 602 | return 0; |
| 603 | } |
| 604 | |
| 605 | void ipv6_anycast_cleanup(void) |
| 606 | { |
| 607 | int i; |
| 608 | |
| 609 | spin_lock(&acaddr_hash_lock); |
| 610 | for (i = 0; i < IN6_ADDR_HSIZE; i++) |
| 611 | WARN_ON(!hlist_empty(&inet6_acaddr_lst[i])); |
| 612 | spin_unlock(&acaddr_hash_lock); |
| 613 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 614 | #endif |