IPv6: Remove local ULA if there is an external one
[project/netifd.git] / interface-ip.c
index 6699d2e..d18fa74 100644 (file)
@@ -1,6 +1,7 @@
 /*
  * netifd - network interface daemon
  * Copyright (C) 2012 Felix Fietkau <nbd@openwrt.org>
+ * Copyright (C) 2012 Steven Barth <steven@midlink.org>
  *
  * This program is free software; you can redistribute it and/or modify
  * it under the terms of the GNU General Public License version 2
@@ -33,6 +34,8 @@ enum {
        ROUTE_GATEWAY,
        ROUTE_METRIC,
        ROUTE_MTU,
+       ROUTE_VALID,
+       ROUTE_TABLE,
        __ROUTE_MAX
 };
 
@@ -43,6 +46,8 @@ static const struct blobmsg_policy route_attr[__ROUTE_MAX] = {
        [ROUTE_GATEWAY] = { .name = "gateway", .type = BLOBMSG_TYPE_STRING },
        [ROUTE_METRIC] = { .name = "metric", .type = BLOBMSG_TYPE_INT32 },
        [ROUTE_MTU] = { .name = "mtu", .type = BLOBMSG_TYPE_INT32 },
+       [ROUTE_TABLE] = { .name = "table", .type = BLOBMSG_TYPE_STRING },
+       [ROUTE_VALID] = { .name = "valid", .type = BLOBMSG_TYPE_INT32 },
 };
 
 const struct config_param_list route_attr_list = {
@@ -50,6 +55,12 @@ const struct config_param_list route_attr_list = {
        .params = route_attr,
 };
 
+
+struct list_head prefixes = LIST_HEAD_INIT(prefixes);
+static struct device_prefix *ula_prefix = NULL;
+static struct uloop_timeout valid_until_timeout;
+
+
 static void
 clear_if_addr(union if_addr *a, int mask)
 {
@@ -116,6 +127,9 @@ __find_ip_route_target(struct interface_ip_settings *ip, union if_addr *a,
                if (!match_if_addr(&route->addr, a, route->mask))
                        continue;
 
+               if (route->flags & DEVROUTE_TABLE)
+                       continue;
+
                if (!*res || route->mask < (*res)->mask)
                        *res = route;
        }
@@ -141,6 +155,8 @@ interface_ip_add_target_route(union if_addr *addr, bool v6)
 {
        struct interface *iface;
        struct device_route *route, *r_next = NULL;
+       bool defaultroute_target = false;
+       int addrsize = v6 ? sizeof(addr->in6) : sizeof(addr->in);
 
        route = calloc(1, sizeof(*route));
        if (!route)
@@ -148,7 +164,10 @@ interface_ip_add_target_route(union if_addr *addr, bool v6)
 
        route->flags = v6 ? DEVADDR_INET6 : DEVADDR_INET4;
        route->mask = v6 ? 128 : 32;
-       memcpy(&route->addr, addr, v6 ? sizeof(addr->in6) : sizeof(addr->in));
+       if (memcmp(&route->addr, addr, addrsize) == 0)
+               defaultroute_target = true;
+       else
+               memcpy(&route->addr, addr, addrsize);
 
        vlist_for_each_element(&interfaces, iface, node) {
                /* look for locally addressable target first */
@@ -172,7 +191,10 @@ interface_ip_add_target_route(union if_addr *addr, bool v6)
 
 done:
        route->iface = iface;
-       vlist_add(&iface->host_routes, &route->node, &route->flags);
+       if (defaultroute_target)
+               free(route);
+       else
+               vlist_add(&iface->host_routes, &route->node, route);
        return iface;
 }
 
@@ -212,7 +234,7 @@ interface_ip_add_route(struct interface *iface, struct blob_attr *attr, bool v6)
        }
 
        if ((cur = tb[ROUTE_TARGET]) != NULL) {
-               if (!inet_pton(af, blobmsg_data(cur), &route->addr)) {
+               if (!parse_ip_and_netmask(af, blobmsg_data(cur), &route->addr, &route->mask)) {
                        DPRINTF("Failed to parse route target: %s\n", (char *) blobmsg_data(cur));
                        goto error;
                }
@@ -230,10 +252,25 @@ interface_ip_add_route(struct interface *iface, struct blob_attr *attr, bool v6)
                route->flags |= DEVROUTE_METRIC;
        }
 
-       if ((cur = tb[ROUTE_MTU]) != NULL)
+       if ((cur = tb[ROUTE_MTU]) != NULL) {
                route->mtu = blobmsg_get_u32(cur);
+               route->flags |= DEVROUTE_MTU;
+       }
+
+       if ((cur = tb[ROUTE_TABLE]) != NULL) {
+               if (!system_resolve_rt_table(blobmsg_data(cur), &route->table)) {
+                       DPRINTF("Failed to resolve routing table: %s\n", (char *) blobmsg_data(cur));
+                       goto error;
+               }
 
-       vlist_add(&ip->route, &route->node, &route->flags);
+               if (route->table)
+                       route->flags |= DEVROUTE_TABLE;
+       }
+
+       if ((cur = tb[ROUTE_VALID]) != NULL)
+               route->valid_until = system_get_rtime() + blobmsg_get_u32(cur);
+
+       vlist_add(&ip->route, &route->node, route);
        return;
 
 error:
@@ -250,8 +287,25 @@ addr_cmp(const void *k1, const void *k2, void *ptr)
 static int
 route_cmp(const void *k1, const void *k2, void *ptr)
 {
-       return memcmp(k1, k2, sizeof(struct device_route) -
-                     offsetof(struct device_route, flags));
+       const struct device_route *r1 = k1, *r2 = k2;
+
+       if (r1->mask != r2->mask)
+               return r2->mask - r1->mask;
+
+       if (r1->metric != r2->metric)
+               return r1->metric - r2->metric;
+
+       if (r1->flags != r2->flags)
+               return r2->flags - r1->flags;
+
+       return memcmp(&r1->addr, &r2->addr, sizeof(r1->addr));
+}
+
+static int
+prefix_cmp(const void *k1, const void *k2, void *ptr)
+{
+       return memcmp(k1, k2, sizeof(struct device_prefix) -
+                       offsetof(struct device_prefix, addr));
 }
 
 static void
@@ -260,6 +314,7 @@ interface_handle_subnet_route(struct interface *iface, struct device_addr *addr,
        struct device *dev = iface->l3_dev.dev;
        struct device_route route;
 
+       memset(&route, 0, sizeof(route));
        route.iface = iface;
        route.flags = addr->flags;
        route.mask = addr->mask;
@@ -270,11 +325,14 @@ interface_handle_subnet_route(struct interface *iface, struct device_addr *addr,
                route.flags |= DEVADDR_KERNEL;
                system_del_route(dev, &route);
 
-               route.flags &= ~DEVADDR_KERNEL;
-               route.metric = iface->metric;
-               system_add_route(dev, &route);
+               if (!(addr->flags & DEVADDR_OFFLINK)) {
+                       route.flags &= ~DEVADDR_KERNEL;
+                       route.metric = iface->metric;
+                       system_add_route(dev, &route);
+               }
        } else {
-               system_del_route(dev, &route);
+               if (!(addr->flags & DEVADDR_OFFLINK))
+                       system_del_route(dev, &route);
        }
 }
 
@@ -313,7 +371,9 @@ interface_update_proto_addr(struct vlist_tree *tree,
        if (a_new && a_old) {
                keep = true;
 
-               if (a_old->flags != a_new->flags)
+               if (a_old->flags != a_new->flags ||
+                               a_old->valid_until != a_new->valid_until ||
+                               a_old->preferred_until != a_new->preferred_until)
                        keep = false;
 
                if ((a_new->flags & DEVADDR_FAMILY) == DEVADDR_INET4 &&
@@ -333,7 +393,7 @@ interface_update_proto_addr(struct vlist_tree *tree,
                a_new->enabled = true;
                if (!(a_new->flags & DEVADDR_EXTERNAL) && !keep) {
                        system_add_address(dev, a_new);
-                       if (iface->metric)
+                       if ((a_new->flags & DEVADDR_OFFLINK) || iface->metric)
                                interface_handle_subnet_route(iface, a_new, true);
                }
        }
@@ -413,12 +473,313 @@ interface_update_host_route(struct vlist_tree *tree,
                system_add_route(dev, route_new);
 }
 
+
+static void
+interface_set_prefix_address(struct device_prefix_assignment *assignment,
+               const struct device_prefix *prefix, struct interface *iface, bool add);
+
+static void interface_trigger_ula_prefix(struct interface *iface,
+               const struct device_prefix *prefix, bool enable)
+{
+       if (prefix == ula_prefix || (prefix->addr.s6_addr[0] & 0xfe) != 0xfc)
+               return;
+
+       bool external_ula = false;
+       struct device_prefix_assignment *ula_assign = NULL;
+       struct device_prefix *c;
+       list_for_each_entry(c, &prefixes, head) {
+               if (c != ula_prefix && (c->addr.s6_addr[0] & 0xfe) != 0xfc)
+                       continue;
+
+               struct device_prefix_assignment *a;
+               list_for_each_entry(a, &c->assignments, head) {
+                       if (!strcmp(a->name, iface->name)) {
+                               if (c == ula_prefix)
+                                       ula_assign = a;
+                               else if (a->enabled)
+                                       external_ula = true;
+                       }
+               }
+
+       }
+
+       // Remove ULA assignment if there is an externally managed ULA and vice versa
+       if (ula_assign && ((enable && !external_ula) || (!enable && external_ula)))
+               interface_set_prefix_address(ula_assign, ula_prefix, iface, enable);
+}
+
+
+static void
+interface_set_prefix_address(struct device_prefix_assignment *assignment,
+               const struct device_prefix *prefix, struct interface *iface, bool add)
+{
+       const struct interface *uplink = prefix->iface;
+       if (!iface->l3_dev.dev)
+               return;
+
+       struct device *l3_downlink = iface->l3_dev.dev;
+
+       struct device_addr addr;
+       memset(&addr, 0, sizeof(addr));
+       addr.addr.in6 = prefix->addr;
+       addr.addr.in6.s6_addr32[1] |= htonl(assignment->assigned);
+       addr.addr.in6.s6_addr[15] += 1;
+       addr.mask = assignment->length;
+       addr.flags = DEVADDR_INET6;
+       addr.preferred_until = prefix->preferred_until;
+       addr.valid_until = prefix->valid_until;
+
+       if (!add && assignment->enabled) {
+               time_t now = system_get_rtime();
+               addr.preferred_until = now;
+               if (!addr.valid_until || addr.valid_until - now > 7200)
+                       addr.valid_until = now + 7200;
+               system_add_address(l3_downlink, &addr);
+               assignment->enabled = false;
+
+               interface_trigger_ula_prefix(iface, prefix, true);
+       } else if (add && (iface->state == IFS_UP || iface->state == IFS_SETUP)) {
+               system_add_address(l3_downlink, &addr);
+               if (uplink && uplink->l3_dev.dev) {
+                       int mtu = system_update_ipv6_mtu(
+                                       uplink->l3_dev.dev, 0);
+                       if (mtu > 0)
+                               system_update_ipv6_mtu(l3_downlink, mtu);
+               }
+               assignment->enabled = true;
+
+               interface_trigger_ula_prefix(iface, prefix, false);
+       }
+}
+
+static bool interface_prefix_assign(struct list_head *list,
+               struct device_prefix_assignment *assign)
+{
+       int32_t current = 0, asize = (1 << (64 - assign->length)) - 1;
+       struct device_prefix_assignment *c;
+       list_for_each_entry(c, list, head) {
+               if (assign->assigned != -1) {
+                       if (assign->assigned > current && assign->assigned + asize < c->assigned) {
+                               list_add_tail(&assign->head, &c->head);
+                               return true;
+                       }
+               } else if (assign->assigned == -1) {
+                       current = (current + asize) & (~asize);
+                       if (current + asize < c->assigned) {
+                               assign->assigned = current;
+                               list_add_tail(&assign->head, &c->head);
+                               return true;
+                       }
+               }
+               current = (c->assigned + (1 << (64 - c->length)));
+       }
+       return false;
+}
+
+static void interface_update_prefix_assignments(struct device_prefix *prefix, bool setup)
+{
+       struct device_prefix_assignment *c;
+       struct interface *iface;
+
+       // Delete all assignments
+       while (!list_empty(&prefix->assignments)) {
+               c = list_first_entry(&prefix->assignments,
+                               struct device_prefix_assignment, head);
+               if ((iface = vlist_find(&interfaces, c->name, iface, node)))
+                       interface_set_prefix_address(c, prefix, iface, false);
+               list_del(&c->head);
+               free(c);
+       }
+
+       if (!setup)
+               return;
+
+       // End-of-assignment sentinel
+       c = malloc(sizeof(*c) + 1);
+       c->assigned = 1 << (64 - prefix->length);
+       c->length = 64;
+       c->name[0] = 0;
+       list_add(&c->head, &prefix->assignments);
+
+       // Excluded prefix
+       if (prefix->excl_length > 0) {
+               const char name[] = "!excluded";
+               c = malloc(sizeof(*c) + sizeof(name));
+               c->assigned = ntohl(prefix->excl_addr.s6_addr32[1]) &
+                               ((1 << (64 - prefix->length)) - 1);
+               c->length = prefix->excl_length;
+               memcpy(c->name, name, sizeof(name));
+               list_add(&c->head, &prefix->assignments);
+       }
+
+       struct list_head assign_later = LIST_HEAD_INIT(assign_later);
+       vlist_for_each_element(&interfaces, iface, node) {
+               if (iface->config_ip.assignment_length < 48 ||
+                               iface->config_ip.assignment_length > 64)
+                       continue;
+
+               size_t namelen = strlen(iface->name) + 1;
+               c = malloc(sizeof(*c) + namelen);
+               c->length = iface->config_ip.assignment_length;
+               c->assigned = iface->config_ip.assignment_hint;
+               c->enabled = false;
+               memcpy(c->name, iface->name, namelen);
+
+               // First process all custom assignments, put all others in later-list
+               if (c->assigned == -1 || !interface_prefix_assign(&prefix->assignments, c)) {
+                       if (c->assigned != -1) {
+                               c->assigned = -1;
+                               netifd_log_message(L_WARNING, "Failed to assign requested subprefix "
+                                               "of size %hhu for %s, trying other\n", c->length, c->name);
+                       }
+                       list_add_tail(&c->head, &assign_later);
+               }
+       }
+
+       // Then try to assign all other + failed custom assignments
+       while (!list_empty(&assign_later)) {
+               c = list_first_entry(&assign_later, struct device_prefix_assignment, head);
+               list_del(&c->head);
+               if (!interface_prefix_assign(&prefix->assignments, c)) {
+                       netifd_log_message(L_WARNING, "Failed to assign subprefix "
+                                       "of size %hhu for %s\n", c->length, c->name);
+                       free(c);
+               }
+       }
+
+       list_for_each_entry(c, &prefix->assignments, head)
+               if ((iface = vlist_find(&interfaces, c->name, iface, node)))
+                       interface_set_prefix_address(c, prefix, iface, true);
+}
+
+
+void interface_refresh_assignments(bool hint)
+{
+       static bool refresh = false;
+       if (!hint && refresh) {
+               struct device_prefix *p;
+               list_for_each_entry(p, &prefixes, head)
+                       interface_update_prefix_assignments(p, true);
+       }
+       refresh = hint;
+}
+
+
+static void
+interface_update_prefix(struct vlist_tree *tree,
+                            struct vlist_node *node_new,
+                            struct vlist_node *node_old)
+{
+       struct device_prefix *prefix_old, *prefix_new;
+       prefix_old = container_of(node_old, struct device_prefix, node);
+       prefix_new = container_of(node_new, struct device_prefix, node);
+
+       struct device_route route;
+       memset(&route, 0, sizeof(route));
+       route.flags = DEVADDR_INET6;
+       route.metric = INT32_MAX;
+       route.mask = (node_new) ? prefix_new->length : prefix_old->length;
+       route.addr.in6 = (node_new) ? prefix_new->addr : prefix_old->addr;
+
+       struct device_prefix_assignment *c;
+       struct interface *iface;
+
+       if (node_old && node_new) {
+               // Move assignments and refresh addresses to update valid times
+               list_splice(&prefix_old->assignments, &prefix_new->assignments);
+
+               list_for_each_entry(c, &prefix_new->assignments, head)
+                       if ((iface = vlist_find(&interfaces, c->name, iface, node)))
+                               interface_set_prefix_address(c, prefix_new, iface, true);
+       } else if (node_new) {
+               // Set null-route to avoid routing loops
+               system_add_route(NULL, &route);
+
+               interface_update_prefix_assignments(prefix_new, true);
+       } else if (node_old) {
+               interface_update_prefix_assignments(prefix_old, false);
+
+               // Remove null-route
+               system_del_route(NULL, &route);
+       }
+
+       if (node_old) {
+               list_del(&prefix_old->head);
+               free(prefix_old);
+       }
+
+       if (node_new)
+               list_add(&prefix_new->head, &prefixes);
+
+}
+
+struct device_prefix*
+interface_ip_add_device_prefix(struct interface *iface, struct in6_addr *addr,
+               uint8_t length, time_t valid_until, time_t preferred_until,
+               struct in6_addr *excl_addr, uint8_t excl_length)
+{
+       struct device_prefix *prefix = calloc(1, sizeof(*prefix));
+       prefix->length = length;
+       prefix->addr = *addr;
+       prefix->preferred_until = preferred_until;
+       prefix->valid_until = valid_until;
+       prefix->iface = iface;
+       INIT_LIST_HEAD(&prefix->assignments);
+
+       if (excl_addr) {
+               prefix->excl_addr = *excl_addr;
+               prefix->excl_length = excl_length;
+       }
+
+       if (iface)
+               vlist_add(&iface->proto_ip.prefix, &prefix->node, &prefix->addr);
+       else
+               interface_update_prefix(NULL, &prefix->node, NULL);
+
+       return prefix;
+}
+
+void
+interface_ip_set_ula_prefix(const char *prefix)
+{
+       char buf[INET6_ADDRSTRLEN + 4] = {0}, *saveptr;
+       if (prefix)
+               strncpy(buf, prefix, sizeof(buf) - 1);
+       char *prefixaddr = strtok_r(buf, "/", &saveptr);
+
+       struct in6_addr addr;
+       if (!prefixaddr || inet_pton(AF_INET6, prefixaddr, &addr) < 1) {
+               if (ula_prefix) {
+                       interface_update_prefix(NULL, NULL, &ula_prefix->node);
+                       ula_prefix = NULL;
+               }
+               return;
+       }
+
+       int length;
+       char *prefixlen = strtok_r(NULL, ",", &saveptr);
+       if (!prefixlen || (length = atoi(prefixlen)) < 1 || length > 64)
+               return;
+
+       if (!ula_prefix || !IN6_ARE_ADDR_EQUAL(&addr, &ula_prefix->addr) ||
+                       ula_prefix->length != length) {
+               if (ula_prefix)
+                       interface_update_prefix(NULL, NULL, &ula_prefix->node);
+
+               ula_prefix = interface_ip_add_device_prefix(NULL, &addr, length,
+                               0, 0, NULL, 0);
+       }
+}
+
 void
 interface_add_dns_server(struct interface_ip_settings *ip, const char *str)
 {
        struct dns_server *s;
 
        s = calloc(1, sizeof(*s));
+       if (!s)
+               return;
+
        s->af = AF_INET;
        if (inet_pton(s->af, str, &s->addr.in))
                goto add;
@@ -491,7 +852,7 @@ write_resolv_conf_entries(FILE *f, struct interface_ip_settings *ip)
        struct dns_server *s;
        struct dns_search_domain *d;
        const char *str;
-       char buf[32];
+       char buf[INET6_ADDRSTRLEN];
 
        vlist_simple_for_each_element(&ip->dns_servers, s, node) {
                str = inet_ntop(s->af, &s->addr, buf, sizeof(buf));
@@ -512,10 +873,11 @@ interface_write_resolv_conf(void)
        struct interface *iface;
        char *path = alloca(strlen(resolv_conf) + 5);
        FILE *f;
+       uint32_t crcold, crcnew;
 
        sprintf(path, "%s.tmp", resolv_conf);
        unlink(path);
-       f = fopen(path, "w");
+       f = fopen(path, "w+");
        if (!f) {
                D(INTERFACE, "Failed to open %s for writing\n", path);
                return;
@@ -536,8 +898,21 @@ interface_write_resolv_conf(void)
                if (!iface->proto_ip.no_dns)
                        write_resolv_conf_entries(f, &iface->proto_ip);
        }
+       fflush(f);
+       rewind(f);
+       crcnew = crc32_file(f);
        fclose(f);
-       if (rename(path, resolv_conf) < 0) {
+
+       crcold = crcnew + 1;
+       f = fopen(resolv_conf, "r");
+       if (f) {
+               crcold = crc32_file(f);
+               fclose(f);
+       }
+
+       if (crcold == crcnew) {
+               unlink(path);
+       } else if (rename(path, resolv_conf) < 0) {
                D(INTERFACE, "Failed to replace %s\n", resolv_conf);
                unlink(path);
        }
@@ -583,6 +958,13 @@ void interface_ip_set_enabled(struct interface_ip_settings *ip, bool enabled)
                        system_del_route(dev, route);
                route->enabled = _enabled;
        }
+
+       struct device_prefix *c;
+       struct device_prefix_assignment *a;
+       list_for_each_entry(c, &prefixes, head)
+               list_for_each_entry(a, &c->assignments, head)
+                       if (!strcmp(a->name, ip->iface->name))
+                               interface_set_prefix_address(a, c, ip->iface, enabled);
 }
 
 void
@@ -594,6 +976,7 @@ interface_ip_update_start(struct interface_ip_settings *ip)
        }
        vlist_update(&ip->route);
        vlist_update(&ip->addr);
+       vlist_update(&ip->prefix);
 }
 
 void
@@ -603,6 +986,8 @@ interface_ip_update_complete(struct interface_ip_settings *ip)
        vlist_simple_flush(&ip->dns_search);
        vlist_flush(&ip->route);
        vlist_flush(&ip->addr);
+       vlist_flush(&ip->prefix);
+       interface_write_resolv_conf();
 }
 
 void
@@ -614,6 +999,7 @@ interface_ip_flush(struct interface_ip_settings *ip)
        vlist_simple_flush_all(&ip->dns_search);
        vlist_flush_all(&ip->route);
        vlist_flush_all(&ip->addr);
+       vlist_flush_all(&ip->prefix);
 }
 
 static void
@@ -625,6 +1011,7 @@ __interface_ip_init(struct interface_ip_settings *ip, struct interface *iface)
        vlist_simple_init(&ip->dns_servers, struct dns_server, node);
        vlist_init(&ip->route, route_cmp, interface_update_proto_route);
        vlist_init(&ip->addr, addr_cmp, interface_update_proto_addr);
+       vlist_init(&ip->prefix, prefix_cmp, interface_update_prefix);
 }
 
 void
@@ -633,4 +1020,42 @@ interface_ip_init(struct interface *iface)
        __interface_ip_init(&iface->proto_ip, iface);
        __interface_ip_init(&iface->config_ip, iface);
        vlist_init(&iface->host_routes, route_cmp, interface_update_host_route);
+
+}
+
+static void
+interface_ip_valid_until_handler(struct uloop_timeout *t)
+{
+       time_t now = system_get_rtime();
+       struct interface *iface;
+       vlist_for_each_element(&interfaces, iface, node) {
+               if (iface->state != IFS_UP)
+                       continue;
+
+               struct device_addr *addr, *addrp;
+               struct device_route *route, *routep;
+               struct device_prefix *pref, *prefp;
+
+               vlist_for_each_element_safe(&iface->proto_ip.addr, addr, node, addrp)
+                       if (addr->valid_until && addr->valid_until < now)
+                               vlist_delete(&iface->proto_ip.addr, &addr->node);
+
+               vlist_for_each_element_safe(&iface->proto_ip.route, route, node, routep)
+                       if (route->valid_until && route->valid_until < now)
+                               vlist_delete(&iface->proto_ip.route, &route->node);
+
+               vlist_for_each_element_safe(&iface->proto_ip.prefix, pref, node, prefp)
+                       if (pref->valid_until && pref->valid_until < now)
+                               vlist_delete(&iface->proto_ip.prefix, &pref->node);
+
+       }
+
+       uloop_timeout_set(t, 1000);
+}
+
+static void __init
+interface_ip_init_worker(void)
+{
+       valid_until_timeout.cb = interface_ip_valid_until_handler;
+       uloop_timeout_set(&valid_until_timeout, 1000);
 }